-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathmain.py
204 lines (167 loc) · 6.09 KB
/
main.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
import requests
from PIL import Image
from io import BytesIO
from bs4 import BeautifulSoup
from captcha_ocr import get_ocr_res
import os
from dotenv import load_dotenv
load_dotenv()
# Base URLs used by the login flow.
# Captcha image request URL.
RandCodeUrl = "http://zhjw.qfnu.edu.cn/verifycode.servlet"
# Login request URL.
loginUrl = "http://zhjw.qfnu.edu.cn/Logon.do?method=logonLdap"
# Initial-data request URL; its response text is the input used to build
# the `encoded` login field.
dataStrUrl = "http://zhjw.qfnu.edu.cn/Logon.do?method=logon&flag=sess"
def get_initial_session():
    """
    Open a new HTTP session and fetch the initial data string.

    Returns:
        A 3-tuple ``(session, cookies, data_str)``: the ``requests`` session,
        a plain-dict snapshot of the session cookies taken after the first
        request, and the body text of the response from ``dataStrUrl``.
    """
    http = requests.session()
    first_reply = http.get(dataStrUrl, timeout=1000)
    # The cookie snapshot is taken after the GET so it includes whatever
    # the server set on that first response.
    return http, http.cookies.get_dict(), first_reply.text
def handle_captcha(session, cookies):
    """
    Download the captcha image and run OCR on it.

    Args:
        session: The ``requests`` session used for the login flow.
        cookies: Cookies to send with the captcha request.

    Returns:
        The value returned by ``get_ocr_res`` for the downloaded image, or
        ``None`` when the server does not answer with HTTP 200 or the
        response body cannot be opened as an image.
    """
    # Every other request in this file is bounded by timeout=1000; without
    # one, requests waits indefinitely on an unresponsive server.
    response = session.get(RandCodeUrl, cookies=cookies, timeout=1000)
    if response.status_code != 200:
        print(f"请求验证码失败,状态码: {response.status_code}")
        return None
    try:
        image = Image.open(BytesIO(response.content))
    except Exception as e:
        # Deliberately broad: any failure to decode the payload is reported
        # and turned into a "no captcha" result for the caller.
        print(f"无法识别图像文件: {e}")
        return None
    return get_ocr_res(image)
def generate_encoded_string(data_str, user_account, user_password):
    """
    Build the ``encoded`` login field from the initial data string.

    ``data_str`` is split on ``#`` into ``code`` and ``sxh``. The credentials
    are joined as ``"<account>%%%<password>"``. Walking positions
    ``0 .. len(code) - 1``:

    * for a position below 20, the credential character at that position is
      emitted, followed by the next ``int(sxh[pos])`` unused characters of
      ``code``;
    * at position 20 the rest of the credential string is appended unchanged
      and the walk stops.

    The walk also stops as soon as the credential string is exhausted, so
    short credentials no longer raise ``IndexError``. If ``sxh`` asks for
    more characters than ``code`` has left, only the remaining ones are
    emitted.

    Args:
        data_str: Initial data string of the form ``"<code>#<sxh>"``.
        user_account: Account name.
        user_password: Account password.

    Returns:
        The encoded string.

    Raises:
        IndexError: If ``data_str`` contains no ``#``, or ``sxh`` is shorter
            than the number of positions walked.
        ValueError: If a consulted ``sxh`` character is not a digit.
    """
    parts = data_str.split("#")
    code, sxh = parts[0], parts[1]
    data = f"{user_account}%%%{user_password}"

    pieces = []
    taken = 0  # how many characters of `code` have been consumed so far
    for pos in range(len(code)):
        if pos >= len(data):
            # Credentials are shorter than the walk: nothing left to emit.
            break
        if pos >= 20:
            pieces.append(data[pos:])
            break
        count = int(sxh[pos])
        pieces.append(data[pos])
        pieces.append(code[taken:taken + count])
        taken += count
    return "".join(pieces)
def login(session, cookies, user_account, user_password, random_code, encoded):
    """
    Submit the login form and return the server's response.

    Args:
        session: The ``requests`` session used for the login flow.
        cookies: Cookies to send with the request.
        user_account: Account name, sent as ``userAccount``.
        user_password: Password, sent as ``userPassword``.
        random_code: Captcha text, sent as ``RANDOMCODE``.
        encoded: Value for the ``encoded`` form field.

    Returns:
        The response object returned by ``session.post``.
    """
    form_fields = {
        "userAccount": user_account,
        "userPassword": user_password,
        "RANDOMCODE": random_code,
        "encoded": encoded,
    }
    # Browser-like request headers sent along with the form.
    request_headers = {
        "Accept": "text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.9",
        "Content-Type": "application/x-www-form-urlencoded",
        "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/83.0.4103.116 Safari/537.36",
        "Origin": "http://zhjw.qfnu.edu.cn",
        "Referer": "http://zhjw.qfnu.edu.cn/",
        "Upgrade-Insecure-Requests": "1",
    }
    reply = session.post(
        loginUrl,
        headers=request_headers,
        data=form_fields,
        cookies=cookies,
        timeout=1000,
    )
    return reply
def get_user_credentials():
    """
    Read the account name and password from the environment.

    Reads ``USER_ACCOUNT`` and ``USER_PASSWORD`` with ``os.getenv`` and
    echoes the account name. The password is never written to stdout: a
    fixed-width mask is printed when it is set, so neither its value nor its
    length ends up in terminal scrollback or redirected logs.

    Returns:
        ``(user_account, user_password)``; an element is ``None`` when the
        corresponding variable is not set.
    """
    user_account = os.getenv("USER_ACCOUNT")
    user_password = os.getenv("USER_PASSWORD")
    print(f"用户名: {user_account}\n")
    # Show only whether a password is present; an unset/empty value is
    # printed as-is so a missing setting is still visible.
    shown_password = "********" if user_password else user_password
    print(f"密码: {shown_password}\n")
    return user_account, user_password
def simulate_login(user_account, user_password):
    """
    Log in, retrying when the captcha is missing or rejected.

    Creates the initial session, then makes up to three attempts. Each
    attempt fetches and OCRs a new captcha and posts the login form. An
    attempt is retried when no captcha could be obtained or when the
    response text contains the captcha-error marker.

    Args:
        user_account: Account name.
        user_password: Account password.

    Returns:
        ``(session, cookies)`` once a 200 response contains neither the
        captcha-error nor the password-error marker.

    Raises:
        Exception: If the login response status is not 200, if the response
            reports a wrong password, or if all three attempts fail on the
            captcha.
    """
    session, cookies, data_str = get_initial_session()
    # The encoded field depends only on data_str and the credentials, so it
    # is built once instead of once per attempt.
    encoded = generate_encoded_string(data_str, user_account, user_password)

    for attempt in range(3):  # three attempts in total
        random_code = handle_captcha(session, cookies)
        print(f"验证码: {random_code}\n")
        if random_code is None:
            # handle_captcha already printed the reason. There is no captcha
            # value to submit, so skip the login request for this attempt.
            print(f"验证码识别错误,重试第 {attempt + 1} 次\n")
            continue

        response = login(
            session, cookies, user_account, user_password, random_code, encoded
        )
        if response.status_code != 200:
            raise Exception("登录失败")
        if "验证码错误!!" in response.text:
            print(f"验证码识别错误,重试第 {attempt + 1} 次\n")
            continue
        if "密码错误" in response.text:
            raise Exception("用户名或密码错误")
        print("登录成功,cookies已返回\n")
        return session, cookies

    raise Exception("验证码识别错误,请重试")
def get_xls_file(session, cookies, user_account, semester):
    """
    Download the xls export for a semester and save it in the working directory.

    Args:
        session: Logged-in ``requests`` session.
        cookies: Cookies to send with the request.
        user_account: Account name; used as the first part of the file name.
        semester: Semester identifier, passed as the ``xnxq01id`` query value
            and used as the second part of the file name.

    Returns:
        The file name ``"<user_account>-<semester>.xls"`` after the response
        body has been written, or ``None`` when the response status is not
        200 (the status and body text are printed in that case).
    """
    reply = session.get(
        f"http://zhjw.qfnu.edu.cn/jsxsd/xskb/xskb_print.do?xnxq01id={semester}",
        cookies=cookies,
        timeout=1000,
    )
    if reply.status_code == 200:
        with open(f"{user_account}-{semester}.xls", "wb") as out:
            out.write(reply.content)
        return f"{user_account}-{semester}.xls"

    print(
        f"获取xls文件失败,状态码: {reply.status_code},错误信息: {reply.text}"
    )
    return None
def print_welcome():
    """Print a run of blank lines followed by the script banner and author links."""
    banner_parts = (
        "\n" * 30,
        f"\n{'*' * 10} 曲阜师范大学教务系统模拟登录脚本 {'*' * 10}\n",
        "By W1ndys",
        "https://github.com/W1ndys",
        "\n\n",
    )
    # One print call with a newline separator emits the same text as
    # printing each part on its own.
    print(*banner_parts, sep="\n")
def main():
    """
    Run the whole flow: banner, credentials, login, semester prompt, download.

    When either credential is missing, a message is printed and a ``.env``
    template is created, but only if no ``.env`` exists yet, so an existing
    (possibly partially filled) file is never overwritten. Exceptions raised
    by ``simulate_login`` are not caught here.
    """
    print_welcome()

    # Credentials come from the environment (loaded from .env at import time).
    user_account, user_password = get_user_credentials()
    if not user_account or not user_password:
        print("请在.env文件中设置USER_ACCOUNT和USER_PASSWORD环境变量\n")
        try:
            # Mode "x" fails instead of truncating when the file exists.
            with open(".env", "x", encoding="utf-8") as f:
                f.write("USER_ACCOUNT=\nUSER_PASSWORD=")
        except FileExistsError:
            # Keep the user's existing .env untouched.
            pass
        return

    # Log in and obtain the session.
    session, cookies = simulate_login(user_account, user_password)
    if not session or not cookies:
        print("无法建立会话,请检查网络连接或教务系统的可用性。")
        return

    # Ask the user which semester to download.
    semester = input("请输入学期(例如:2024-2025-1): \n")
    xls_file = get_xls_file(session, cookies, user_account, semester)
    if xls_file:
        print(f"已成功获取 {xls_file} 文件")
    else:
        print("获取xls文件失败,请检查网络连接或教务系统的可用性。")
# Run the interactive flow only when executed as a script, not on import.
if __name__ == "__main__":
    main()