forked from dyy747169800/bjjj-python
-
Notifications
You must be signed in to change notification settings - Fork 0
/
loadpaper.py
51 lines (45 loc) · 1.35 KB
/
loadpaper.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
#!/usr/bin/python
# encoding: utf-8
"""
@auth: zhaopan
@time: 2017/11/6 09:21
"""
import requests
from bs4 import BeautifulSoup
# Bare host name and full origin (scheme + host) of the target service.
domain = 'enterbj.zhongchebaolian.com'
host = 'https://enterbj.zhongchebaolian.com'

# Common request headers shared by the calls in this module.
headers = {
    'Host': domain,
    'Origin': host,
    'Accept': '*/*',
    'Accept-Encoding': 'gzip, deflate',
    'Accept-Language': 'zh-CN',
    'Connection': 'keep-alive',
    'User-Agent': 'Mozilla/5.0 (Linux; Android 4.4.2; E6883 Build/KOT49H) AppleWebKit/537.36 (KHTML, like Gecko) Version/4.0 Chrome/30.0.0.0 Mobile Safari/537.36',
    'X-Requested-With': 'XMLHttpRequest',
    'Content-Type': 'application/x-www-form-urlencoded; charset=UTF-8',
}

# Path of the home page (used as the Referer for requests).
page_index = '/enterbj/jsp/enterbj/index.html'

# Path of the loadpaper endpoint.
page_loadpaper = '/enterbj/platform/enterbj/loadpaper'
def loadPaper(applyid, timeout=None):
    """POST an application id to the loadpaper endpoint and return the body.

    Args:
        applyid: Value sent as the ``applyid`` form field.
        timeout: Optional timeout in seconds forwarded to ``requests.post``.
            The default ``None`` keeps the previous behaviour (no timeout).

    Returns:
        The raw response body (``res.content``) when the status code is
        200 or 201, otherwise ``None``.
    """
    url = host + page_loadpaper
    data = [('applyid', applyid)]
    # Work on a copy: assigning Referer on the shared module-level ``headers``
    # dict would leak this value into every later user of that template.
    head = dict(headers)
    head['Referer'] = host + page_index
    # NOTE(review): verify=False disables TLS certificate verification. It is
    # kept as in the original; confirm it is still required for this host.
    res = requests.post(
        url,
        data=data,
        headers=head,
        allow_redirects=False,
        verify=False,
        timeout=timeout,
    )
    if res.status_code in (200, 201):
        return res.content
    return None
def getPaperImage(html):
    """Return the text of the first ``<p class="Nop">`` element in a page.

    Args:
        html: Page markup to parse, or ``None``.

    Returns:
        The matched element's text, or ``None`` when ``html`` is ``None`` or
        empty, or when the page contains no matching element.
    """
    # loadPaper returns None for any status other than 200/201; parsing that
    # would raise instead of reporting "nothing found".
    if not html:
        return None
    soup = BeautifulSoup(html, 'html.parser', from_encoding='utf-8')
    tag = soup.find('p', class_='Nop')
    # find() yields None when nothing matches; calling get_text() on it
    # would raise AttributeError.
    if tag is None:
        return None
    return tag.get_text()
# Application id sent to the endpoint (empty string here; presumably a
# placeholder to be replaced with a real id; confirm before running).
applyid = ''

# Fetch the page for that id, then pull the target paragraph text out of it.
paper_html = loadPaper(applyid)
res = getPaperImage(paper_html)
print(res)