|
10 | 10 |
|
11 | 11 | class GetCode: |
def __init__(self, path, url=None, headers=headers, origin='chaxun.heyuanedu.cn:88', threshold=185):
    """Store the configuration used by the other methods of this class.

    Args:
        path: File path where the captcha image is written and later read.
        url: Address that requests are sent to; may be supplied later.
        headers: Mapping of HTTP request headers. It is stored by
            reference, not copied, so the Cookie entry written by
            ``getSession`` also appears in the mapping passed in here
            (by default the module-level ``headers`` object).
        origin: Value handed to ``Request`` as its fourth positional
            argument when ``getReq`` builds a request.
        threshold: Per-channel cutoff; ``identify`` turns pixels black
            when all three of their channels are below this value.
    """
    # Plain attribute storage only; no I/O happens at construction time.
    self.path, self.url = path, url
    self.headers = headers
    self.origin, self.threshold = origin, threshold
18 | 18 |
|
def getReq(self, url=None, headers=None, origin=None):
    """Build a ``Request`` from the instance's URL, headers and origin.

    Every argument that is not ``None`` first replaces the attribute of
    the same name on the instance; ``None`` keeps the stored value.

    ``origin`` previously defaulted to the literal
    ``'chaxun.heyuanedu.cn:88'``, so a bare ``getReq()`` call overwrote
    whatever origin had been configured on the instance. It now defaults
    to ``None`` like the other arguments, so the stored origin is kept.

    Args:
        url: Replacement for ``self.url``, or ``None`` to keep it.
        headers: Replacement for ``self.headers``, or ``None`` to keep it.
        origin: Replacement for ``self.origin``, or ``None`` to keep it.

    Returns:
        ``Request(self.url, None, self.headers, self.origin)``. Assuming
        ``Request`` is ``urllib.request.Request`` (its import is outside
        this view), the positions are url, data, headers and
        origin_req_host.
    """
    if url is not None:
        self.url = url
    if headers is not None:
        self.headers = headers
    if origin is not None:
        self.origin = origin
    return Request(self.url, None, self.headers, self.origin)
24 | 24 |
|
def setting(self, path=None, url=None, headers=None, origin=None, threshold=None):
    """Update any subset of the instance's configuration attributes.

    Each argument that is not ``None`` replaces the attribute of the same
    name; arguments left as ``None`` leave the stored value untouched.
    Falsy values other than ``None`` (``0``, ``''``, ``{}``) are applied.

    Args:
        path: New image file path.
        url: New request URL.
        headers: New request header mapping.
        origin: New origin value passed to ``Request`` by ``getReq``.
        threshold: New per-channel cutoff used by ``identify``.
    """
    overrides = {
        'path': path,
        'url': url,
        'headers': headers,
        'origin': origin,
        'threshold': threshold,
    }
    for attribute, value in overrides.items():
        # Identity check: only None means "keep the current value".
        if value is not None:
            setattr(self, attribute, value)
31 | 31 |
|
def getSession(self, url=None, headers=None, origin=None):
    """Fetch a session cookie from the server and store it in the headers.

    Arguments that are not ``None`` first replace the matching instance
    attributes. A request is then sent, and the part of the response's
    ``Set-Cookie`` header before the first ``;`` is written to
    ``self.headers['Cookie']``.

    Limitations carried over from the original implementation:
      * Only a single ``Set-Cookie`` value is used; several cookies in
        one response are not handled.
      * Do not call this repeatedly on the same instance; the original
        author warns that doing so may cause unpredictable problems.
      * If the response has no ``Set-Cookie`` header the lookup
        presumably yields ``None`` and ``.split`` raises
        ``AttributeError`` (unchanged behaviour).

    Returns:
        ``self.headers``, the same mapping object, now containing the
        ``Cookie`` entry.
    """
    if url is not None:
        self.url = url
    if headers is not None:
        self.headers = headers
    if origin is not None:
        self.origin = origin
    # Close the HTTP response deterministically instead of leaking it.
    with urlopen(self.getReq()) as response:
        set_cookie = response.info()['Set-Cookie']
    # Keep only the leading "name=value" pair; attributes such as Path follow ';'.
    self.headers['Cookie'] = set_cookie.split(';')[0]
    return self.headers
38 | 38 |
|
def download(self, url=None, path=None, headers=None, origin=None):
    """Download the captcha image and save it to ``self.path``.

    Arguments that are not ``None`` first replace the matching instance
    attributes. The parent directory of the target file is created when
    it does not exist yet.

    Fixes relative to the previous implementation:
      * The parent directory is taken with ``os.path.dirname``. Slicing
        at ``rfind(os.sep)`` cut the last character off the file name
        when the path had no separator and created a bogus directory.
      * ``os.makedirs`` creates nested missing directories and tolerates
        an existing one.
      * The image is fetched before the file is opened, so a failed
        request no longer leaves an empty file behind, and the HTTP
        response is closed.

    Returns:
        The number of bytes written, as reported by ``file.write``.
    """
    if url is not None:
        self.url = url
    if path is not None:
        self.path = path
    if headers is not None:
        self.headers = headers
    if origin is not None:
        self.origin = origin

    parent_dir = os.path.dirname(self.path)
    if parent_dir:  # empty when the path is a bare file name in the cwd
        os.makedirs(parent_dir, exist_ok=True)

    with urlopen(self.getReq()) as response:
        image_bytes = response.read()

    with open(self.path, 'wb') as image_file:
        return image_file.write(image_bytes)
49 | 49 |
|
50 | 50 | def identify(self, path=None, threshold=None): # 识别验证码 |
51 | | - self.path = path if path != None else self.path |
| 51 | + self.path = path if path != None else self.path # 赋值变量 |
52 | 52 | self.threshold = threshold if threshold != None else self.threshold |
53 | | - image = Image.open(self.path) |
54 | | - pixdata = image.load() |
55 | | - w, h = image.size |
56 | | - for y in range(h): # 处理多余色彩 |
| 53 | + image = Image.open(self.path) # PIL 打开图片 |
| 54 | + pixdata = image.load() # 载入图片到变量 |
| 55 | + w, h = image.size # 获取宽高 |
| 56 | + for y in range(h): # 处理色彩 |
57 | 57 | for x in range(w): |
58 | 58 | if pixdata[x, y][0] < self.threshold and pixdata[x, y][1] < self.threshold and pixdata[x, y][2] < self.threshold: |
59 | 59 | pixdata[x, y] = (0, 0, 0) |
|
0 commit comments