-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathfunc.py
217 lines (187 loc) · 7.25 KB
/
func.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
# -*- coding: utf-8 -*-
from PIL import Image
from bs4 import BeautifulSoup
from keras.models import *
import urllib
import urllib.request
import http.cookiejar
import shutil
import string
import os
import cv2
import numpy as np
import shutil
import tempfile

# Scratch directory that holds the downloaded captcha image.
# The Windows %TMP% variable is preferred, exactly as before; when it is unset
# or empty the platform temp directory is used instead, so importing this
# module no longer raises KeyError on systems without TMP.
# The '\\' separator is kept so the value is unchanged wherever TMP is set.
temp_dir = (os.environ.get("TMP") or tempfile.gettempdir()) + '\\scoreTemp'
def getCheckCode():
    """Download a fresh captcha image and return the path it was saved to.

    A cookie-aware opener is built and installed as the process-wide default
    opener, so later ``urllib.request.urlopen`` calls share the cookie jar
    that received the cookies sent with the captcha response.

    Returns:
        str: path of ``captcha.gif`` inside ``temp_dir``.
    """
    captcha_url = "http://jwgls.jmu.edu.cn/Common/CheckCode.aspx"
    captcha_path = temp_dir + '\\captcha.gif'

    # Fetch the captcha with a CookieJar attached and keep the cookies in it.
    cookie = http.cookiejar.CookieJar()
    opener = urllib.request.build_opener(
        urllib.request.HTTPCookieProcessor(cookie),
        urllib.request.HTTPHandler,
    )
    urllib.request.install_opener(opener)

    # Close the HTTP response deterministically once the bytes are read.
    with opener.open(captcha_url) as response:
        captcha = response.read()

    # The image used to be written to ./captcha.gif and deleted again, which
    # clobbered any file of that name in the working directory and required
    # the working directory to be writable. Only the temp copy is needed.
    os.makedirs(temp_dir, exist_ok=True)
    with open(captcha_path, 'wb') as captcha_file:
        captcha_file.write(captcha)
    return captcha_path
def predictCheckCode(captcha_path):
    """Recognise the digits in the captcha image stored at ``captcha_path``.

    The image is cropped, reduced to a single colour mask, cut into five
    12x16 tiles and fed to the Keras model loaded from
    ``jmu_jw_captcha_break_splited.h5`` (a path relative to the working
    directory). The predicted string is printed and returned.

    Args:
        captcha_path: path of the captcha image file to read.

    Returns:
        str: one digit character per tile, in left-to-right tile order.
    """
    tolerance = 50  # half-width of the accepted window on every channel

    def bgr_bounds(rgb):
        """Return (lower, upper) BGR bounds around an RGB colour, clipped to 0..255."""
        red, green, blue = rgb
        bgr = [blue, green, red]
        lower = np.clip([channel - tolerance for channel in bgr], 0, 255)
        upper = np.clip([channel + tolerance for channel in bgr], 0, 255)
        return lower, upper

    # Candidate text colours, given as RGB and tried in this order.
    palette = [
        bgr_bounds(rgb)
        for rgb in (
            [255, 0, 0],
            [153, 43, 51],
            [204, 43, 51],
            [0, 0, 153],
            [0, 0, 102],
            [0, 128, 153],
            [0, 170, 153],
            [255, 170, 0],
            [255, 128, 0],
            [0, 0, 0],
            [0, 128, 0],
            [0, 85, 0],
        )
    ]

    def split_glyphs(path):
        """Return the five 12x16 mask tiles cut from the captcha at ``path``."""
        cropped_rgb = Image.open(path).convert('RGB').crop((8, 5, 72, 21))
        bgr_image = cv2.cvtColor(np.array(cropped_rgb), cv2.COLOR_RGB2BGR)

        # Take the first colour window whose mask sums to more than 14000.
        # If none does, the mask of the last palette entry is what remains.
        for low, high in palette:
            low = np.array(low, dtype="uint8")    # lower colour bound
            high = np.array(high, dtype="uint8")  # upper colour bound
            mask = cv2.inRange(bgr_image, low, high)
            if np.sum(mask) > 14000:
                break

        tile_size = (12, 16)
        centres_x = (6, 18, 30, 42, 54)
        return [cv2.getRectSubPix(mask, tile_size, (cx, 8)) for cx in centres_x]

    alphabet = string.digits

    def decode(scores):
        """Map each row of ``scores`` to the digit at its arg-max position."""
        return ''.join(alphabet[best] for best in np.argmax(scores, axis=1))

    model = load_model('jmu_jw_captcha_break_splited.h5')

    tile_w, tile_h = 12, 16
    tiles = split_glyphs(captcha_path)
    batch = np.zeros((len(tiles), tile_h, tile_w, 1), dtype=np.uint8)
    for position, tile in enumerate(tiles):
        batch[position, :, :, 0] = tile

    predict_word = decode(model.predict(batch))
    print("Predict: "+predict_word)
    return predict_word
def userLogin(captcha, username, password):
    """Submit the login form and report whether the login succeeded.

    The login page is fetched first to read its ``__VIEWSTATE`` hidden field,
    which is posted back together with the credentials and the captcha text.
    The console is cleared with ``cls`` along the way and a status message is
    printed.

    Args:
        captcha: text to send in the ``TxtVerifCode`` field.
        username: text to send in the ``TxtUserName`` field.
        password: text to send in the ``TxtPassword`` field.

    Returns:
        int: 1 when the page returned by the POST has the expected title,
        otherwise 0.

    Raises:
        IndexError: if the login page has no ``__VIEWSTATE`` input.
    """
    home_url = "http://jwgls.jmu.edu.cn/Login.aspx"

    # Read the page inside ``with`` so the connection is closed promptly.
    with urllib.request.urlopen(home_url) as home_response:
        home_page = BeautifulSoup(home_response.read(), "html.parser", from_encoding="gb2312")
    get_viewstate = (home_page.find_all("input", id="__VIEWSTATE")[0])["value"]

    os.system('cls')
    post_data = urllib.parse.urlencode({
        '__VIEWSTATE': get_viewstate,
        'TxtUserName': username,
        'TxtPassword': password,
        'TxtVerifCode': captcha,
        'BtnLoginImage.x': '0',
        'BtnLoginImage.y': '0'
    })
    post_data = post_data.encode('utf-8')

    # No Accept-Encoding header is set here; the original comment states the
    # intent is to keep the response from being gzip-compressed.
    headers = {
        'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8',
        'Referer': 'http://jwgls.jmu.edu.cn/Login.aspx',
        'Connection': 'Keep-Alive'
    }

    # Build the request and simulate the login POST.
    login_request = urllib.request.Request(home_url, data=post_data, headers=headers)
    with urllib.request.urlopen(login_request) as login_response:
        login_status = login_response.read()

    # Parse the page returned by the POST and decide from its title.
    login_page = BeautifulSoup(login_status, "html.parser", from_encoding='utf-8')
    titles = login_page.find_all("title")
    # A reply without any <title> counts as a failed login, not a crash.
    get_title = str(titles[0].get_text(strip=True)) if titles else ""

    if get_title == "集美大学综合教务管理系统":
        os.system('cls')
        print("你已成功登录!")
        flag = 1
    else:
        print("登录失败。")
        print("请检查用户名密码或验证码是否正确后再次尝试。")
        flag = 0
    return flag
def getPage(href, term, viewstate):
    """POST a semester selection to ``href`` and return the parsed reply.

    Args:
        href: URL the form is posted to.
        term: value sent for ``ctl00$ContentPlaceHolder1$semesterList``.
        viewstate: value sent for the ``__VIEWSTATE`` field.

    Returns:
        BeautifulSoup: the response body parsed with ``html.parser``.
    """
    headers = {
        'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8',
        'Connection': 'Keep-Alive',
        'DNT': '1',
        'Origin': 'http://jwgls.jmu.edu.cn',
        'Referer': 'http://jwgls.jmu.edu.cn/Student/ScoreCourse/ScoreAll.aspx',
        'Upgrade-Insecure-Requests': '1'
    }
    get_data = urllib.parse.urlencode({
        'ctl00_ToolkitScriptManager1_HiddenField': '',
        '__EVENTTARGET': 'ctl00$ContentPlaceHolder1$semesterList',
        '__EVENTARGUMENT': '',
        '__VIEWSTATE': viewstate,
        'ctl00$ContentPlaceHolder1$semesterList': term,
        'ctl00$ContentPlaceHolder1$pageNumber': '20'
    }).encode('utf-8')

    ev_request = urllib.request.Request(href, data=get_data, headers=headers)
    # Read inside ``with`` so the HTTP response is closed even if reading fails.
    with urllib.request.urlopen(ev_request) as ev_response:
        ev_status = ev_response.read()
    return BeautifulSoup(ev_status, "html.parser")
def scoreRead(response):
    """Pull course names and scores out of a score-page document.

    Every ``<tr>`` of the parsed document is collected; the rows at index 4
    up to and including ``len(rows) - 3`` are read, so the first four rows
    and the last two are skipped. In each row read, the text of cell 2 is the
    course name and the text of cell 8 is the score.

    Args:
        response: markup handed to ``BeautifulSoup(..., "html.parser")``.

    Returns:
        tuple: ``(course_name, course_score)``, two lists of equal length.

    Raises:
        IndexError: if a row that is read has fewer than nine ``<td>`` cells.
    """
    rows = BeautifulSoup(response, "html.parser").find_all("tr")

    # NOTE(review): the original comment said the score rows begin at trs[3],
    # yet the loop has always started at index 4. Confirm against the page
    # whether row 3 is a header row.
    first_index = 4
    stop_index = len(rows) - 2  # exclusive bound

    cells_per_row = [row.find_all("td") for row in rows[first_index:stop_index]]
    course_name = [cells[2].text for cells in cells_per_row]
    course_score = [cells[8].text for cells in cells_per_row]
    return course_name, course_score
def getViewstate():
    """Fetch the score page and return the value of its ``__VIEWSTATE`` field.

    Returns:
        str: the ``value`` attribute of the first input whose id is
        ``__VIEWSTATE``.

    Raises:
        IndexError: if the page contains no such input.
    """
    url = 'http://jwgls.jmu.edu.cn/Student/ScoreCourse/ScoreAll.aspx'
    headers = {
        'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,*/*;q=0.8',
        'Connection': 'Keep-Alive',
        'DNT': '1',
        'Origin': 'http://jwgls.jmu.edu.cn',
        'Referer': 'http://jwgls.jmu.edu.cn/Student/ScoreCourse/ScoreAll.aspx',
        'Upgrade-Insecure-Requests': '1'
    }
    get_request = urllib.request.Request(url, headers=headers)
    # Read inside ``with`` so the HTTP response is closed even if reading fails.
    with urllib.request.urlopen(get_request) as raw_response:
        body = raw_response.read()
    get_response = BeautifulSoup(body, "html.parser", from_encoding='utf-8')
    viewstate = (get_response.find_all("input", id="__VIEWSTATE")[0])["value"]
    return viewstate
def cleanDir(dir_path):
    """Empty ``dir_path`` and remove it, on a best-effort basis.

    Regular files directly inside ``dir_path`` are deleted. Sub-directories
    are removed recursively, except those whose path ends in ``.svn``
    (case-insensitive), which are left in place. ``dir_path`` itself is
    removed only when nothing is left inside it; otherwise it is kept, since
    removing a non-empty directory would fail.

    Args:
        dir_path: directory to clean. A path that is not an existing
            directory is ignored.

    Returns:
        bool: always ``True``.
    """
    if not os.path.isdir(dir_path):
        return True

    for name in os.listdir(dir_path):
        file_path = os.path.join(dir_path, name)
        if os.path.isfile(file_path):
            try:
                os.remove(file_path)
            except OSError:
                # Deliberately best-effort: a file that cannot be removed is
                # skipped, and dir_path is then kept by the check below.
                pass
        elif os.path.isdir(file_path):
            if file_path.lower().endswith(".svn"):
                continue
            # ignore_errors=True keeps sub-directory removal best-effort too.
            shutil.rmtree(file_path, True)

    # A kept ".svn" directory or an undeletable file leaves dir_path
    # non-empty; calling os.rmdir unconditionally would raise in that case.
    if not os.listdir(dir_path):
        os.rmdir(dir_path)
    return True