-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy path爬,都可以爬.py
64 lines (56 loc) · 2.29 KB
/
爬,都可以爬.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
from types import BuiltinMethodType
import requests
import re
def esu(searchid,page):
url = "https://findcumt.libsp.com/find/unify/search"
payload ={"docCode":[None],"searchFieldContent":searchid,"searchField":"keyWord","matchMode":"2","resourceType":[],"subject":[],"discode1":[],"publisher":[],"libCode":[],"locationId":[],"eCollectionIds":[],"curLocationId":[],"campusId":[],"kindNo":[],"collectionName":[],"author":[],"langCode":[],"countryCode":[],"publishBegin":None,"publishEnd":None,"coreInclude":[],"ddType":[],"verifyStatus":[],"group":[],"sortField":"relevance","sortClause":"asc","page":page,"rows":10,"onlyOnShelf":None,"indexSearch":1,"searchItems":None}
headers = {
'Content-Type': 'application/json;charset=UTF-8',
'groupCode': '200069',
'Host': 'findcumt.libsp.com',
'Referer': 'https://findcumt.libsp.com/',
'Cookie': 'SameSite=None; SameSite=None'
}
response = requests.request("POST", url, headers=headers, json=payload )
return response.text
def introduction(result):
introduction=re.findall('"adstract":(".+?"|null),"dd',result)
return introduction
def simplify_bookid(result):
recordid=re.findall('"recordId":([0-9]*?),"fa',result)
return recordid
def simplify_name(result):
name=re.findall('"title": (".+?"),"co',result)
return name
def simplify_author(result):
author=re.findall('"author":(".+?"|null)',result)
return author
def simplify_publisher(result):
publisher=re.findall('"publisher":(".+?"|null),"is',result)
return publisher
def simplify_isbn(result):
isbn=re.findall('"isbn":(".+?"|null),"isbns',result)
return isbn
print("请输入‘搜索目标 页数’" )
INPUT=input().split()
searchid=INPUT[0]
page=INPUT[1]
result=esu(searchid,page)
recordid=simplify_bookid(result)
author=simplify_author(result)
publisher=simplify_publisher(result)
brief=introduction(result)
isbn=simplify_isbn(result)
sum=[]
N=len(recordid)
for i in range(N):
temporary={"bookid":recordid[i],"author":author[i],"出版社":publisher[i],"isbn":isbn[i],"简介":brief[i],"第几本书":i+1}
sum.append(temporary)
print(sum)
print("本页记录数")
print(len(sum))
print("page")
print(page)
print("想具体看哪本书,输入一个数字")
check=int(input())
print(sum[check-1])