import requests
from bs4 import BeautifulSoup


class Spider:
    """Fetch a page and extract the first link of its "relatedWorks" box.

    Attributes are plain and public:
        url:  the page address passed to the constructor.
        soup: the parsed document; ``None`` until :meth:`scrap` has run.
    """

    # Browser-like user agent sent with every request.
    REQUEST_HEADERS = {
        'user-agent': "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 "
                      "(KHTML, like Gecko) Chrome/74.0.3729.169 Safari/537.36"
    }

    # Seconds to wait for the server; without a timeout ``requests.get``
    # can block forever on an unresponsive host.
    REQUEST_TIMEOUT = 10

    # CSS path to the anchor(s) inside the box whose id starts with
    # "relatedWorks".
    SEE_MORE_SELECTOR = (
        'body > div.content > div.mainContentContainer > div.mainContent > '
        'div.mainContentFloat > div.rightContainer > div[id^=relatedWorks] > div > '
        'div.bigBoxBody > div > a'
    )

    def __init__(self, url):
        """Remember *url*; nothing is downloaded until :meth:`scrap` is called."""
        self.url = url
        self.soup = None

    def scrap(self):
        """Download ``self.url``, parse it, and print the "see more" link.

        The parsed document is stored on ``self.soup``. The ``href`` of the
        first anchor matched by ``SEE_MORE_SELECTOR`` is printed and also
        returned so callers can use it programmatically.

        Returns:
            The ``href`` attribute of the first matching anchor (``None`` if
            that anchor has no ``href``).

        Raises:
            IndexError: if no element on the page matches the selector.
            requests.exceptions.RequestException: on network failure or
                timeout.
        """
        response = requests.get(
            self.url,
            headers=self.REQUEST_HEADERS,
            timeout=self.REQUEST_TIMEOUT,
        )
        self.soup = BeautifulSoup(response.text, 'lxml')

        anchors = self.soup.select(self.SEE_MORE_SELECTOR)
        if not anchors:
            # Same exception type as indexing an empty list, but with a
            # message that says what was actually missing.
            raise IndexError(
                "no 'relatedWorks' link found on page: {}".format(self.url)
            )

        see_more_link = anchors[0].get("href")
        print(see_more_link)
        return see_more_link