import requests, os
from bs4 import BeautifulSoup
# Input file with one author per line in the form "Surname, Given".
# A raw string keeps the Windows backslashes literal; the earlier literal
# contained "\x" followed by a backslash, which Python rejects as a
# truncated \xXX escape.
directory = os.path.normpath(r"C:\Users\x\Desktop\names.txt")

# Read everything up front so the file handle is closed before any
# network request is made.
with open(directory, 'r', encoding='utf8') as f:
    x = f.readlines()

for line in x:
    fields = line.split(",")
    if len(fields) < 2:
        # Blank line or a line without a comma: nothing to look up.
        continue

    # replace(" ", "") only removes spaces; every line except possibly the
    # last also ends in "\n", which used to leak into the query string and
    # break the search for all but the final name. strip() removes it.
    s = fields[0].replace(" ", "").strip()
    n = fields[1].replace(" ", "").strip()
    print(s + " " + n)

    # s is sent as st1 / AUTH--LAST--NAME and n as st2 / AUTH--FIRST.
    # The stray space that followed "?" in the query string is removed.
    url = (
        'http://www.scopus.com/results/authorNamesList.uri?origin=searchauthorlookup&src=al&edit=&poppUp=&basicTab=&affiliationTab=&advancedTab=&st1=' + s
        + '&st2=' + n
        + '&institute=&orcidId=&authSubject=LFSC&_authSubject=on&authSubject=HLSC&_authSubject=on&authSubject=PHSC&_authSubject=on&authSubject=SOSC&_authSubject=on&s=AUTH--LAST--NAME%28' + s
        + '%29+AND+AUTH--FIRST%28' + n
        + '%29&sdt=al&sot=al&searchId=81BECD653C7453F7BFBBB1CD8D8E5B04.wsnAw8kcdt7IPYLO0V48gA%3A220&exactSearch=off&sid=81BECD653C7453F7BFBBB1CD8D8E5B04.wsnAw8kcdt7IPYLO0V48gA%3A220'
    )
    res = requests.get(url)
    content = res.content

    soup = BeautifulSoup(content, 'lxml').find_all('div', {'class': 'dataCol2'})
    # Only the first matching result div is reported for each name.
    for item in soup:
        print(item.text)
        break
BeautifulSoup(content, 'lxml').find_all(...)은 x의 마지막 줄에서만 작동합니다. 어떻게 해결할 수 있습니까?
예상대로 작동합니다.
import requests, os
from bs4 import BeautifulSoup
# Sample author names, each written as "<surname>, <given-name initial>".
x = ["Aaroe, L", "Abbas, Z", "Abbott, G"]

# Scopus author-lookup URL; {last} and {first} are each substituted twice
# (st1 / AUTH--LAST--NAME and st2 / AUTH--FIRST respectively).
SEARCH_URL = (
    'http://www.scopus.com/results/authorNamesList.uri?origin=searchauthorlookup&src=al&edit=&poppUp=&basicTab=&affiliationTab=&advancedTab=&st1={last}'
    '&st2={first}'
    '&institute=&orcidId=&authSubject=LFSC&_authSubject=on&authSubject=HLSC&_authSubject=on&authSubject=PHSC&_authSubject=on&authSubject=SOSC&_authSubject=on&s=AUTH--LAST--NAME%28{last}'
    '%29+AND+AUTH--FIRST%28{first}'
    '%29&sdt=al&sot=al&searchId=81BECD653C7453F7BFBBB1CD8D8E5B04.wsnAw8kcdt7IPYLO0V48gA%3A220&exactSearch=off&sid=81BECD653C7453F7BFBBB1CD8D8E5B04.wsnAw8kcdt7IPYLO0V48gA%3A220'
)

for entry in x:
    fields = entry.split(',')
    # strip() drops surrounding whitespace (including any newline).
    before_comma = fields[0].strip()
    after_comma = fields[1].strip()

    print("------------------------------------")
    # NOTE(review): the "FirstName" label is attached to the text before
    # the comma, which the URL sends as AUTH--LAST--NAME; the labels look
    # swapped but are kept as-is so the printed output does not change.
    print(f"FirstName: {before_comma}, Last Name: {after_comma}")

    response = requests.get(
        SEARCH_URL.format(last=before_comma, first=after_comma)
    )
    page = BeautifulSoup(response.content, 'lxml')
    matches = page.find_all('div', {'class': 'dataCol2'})

    # Report only the first matching result div, if there is one.
    first_match = next(iter(matches), None)
    if first_match is not None:
        print(first_match.text.strip())
출력:
------------------------------------
FirstName: Aaroe, Last Name: L
Aarøe, Lene
Aaroe, Lene
------------------------------------
FirstName: Abbas, Last Name: Z
Abbas, Zaigham
Abbas, Z.
ABBAS, ZAIGHAM
------------------------------------
FirstName: Abbott, Last Name: G
Abbott, Albert Glenn
Abbott, A. G.
Abbott, Albert G.
Abbott, A.
이 기사는 인터넷에서 수집됩니다. 재 인쇄 할 때 출처를 알려주십시오.
침해가 발생한 경우 [email protected]로 연락 주시면 삭제하겠습니다.
몇 마디 만하겠습니다