import sys

import requests
from bs4 import BeautifulSoup
# For every matrix ID listed (one per line) in the ID file, fetch the matching
# JASPAR matrix page and write one "<id>\t<text>" row to the result file, where
# <text> is the second cell of the third row of the page's profile table
# (kept in `class_txt`; presumably the "Class" field -- confirm against the site).
ID_LIST_PATH = "D:/群晖NAS/Desktop/MEME网站结果/JASPAR.id.txt"
RESULT_PATH = "D:/群晖NAS/Desktop/MEME网站结果/JASPAR.爬虫结果.txt"
REQUEST_TIMEOUT = 30  # seconds; without a timeout a stalled connection blocks forever

# Both files live in one `with`, so they are closed (and the rows already
# written are flushed) even if an unexpected error aborts the loop.
# The output is written as UTF-8 explicitly: it holds scraped web text, which
# the platform's default locale encoding is not guaranteed to be able to encode.
with open(RESULT_PATH, "w", encoding="utf-8") as file_out, \
        open(ID_LIST_PATH, "r") as file_id:
    for line in file_id:
        matrix_id = line.strip()
        if not matrix_id:
            # Blank lines would otherwise request the bare ".../matrix//" URL.
            continue

        # Build the URL of the page to scrape.
        url = 'https://jaspar.elixir.no/matrix/' + matrix_id + '/'
        print(url)

        # Send the GET request; an HTTP error status is treated like a network
        # failure so that an error page is never parsed as a matrix page.
        try:
            response = requests.get(url, timeout=REQUEST_TIMEOUT)
            response.raise_for_status()
        except requests.RequestException as err:
            print("skipped {}: request failed ({})".format(matrix_id, err),
                  file=sys.stderr)
            continue

        soup = BeautifulSoup(response.text, 'html.parser')
        profile = soup.find('table', class_='table table-hover')
        if profile is None:
            # find() returns None when the page has no such table.
            print("skipped {}: profile table not found".format(matrix_id),
                  file=sys.stderr)
            continue

        tr_tags = profile.find_all("tr")
        # The wanted value sits in the third row, second cell; guard both
        # indexes so one unexpected page layout does not abort the whole run.
        td_tags = tr_tags[2].find_all('td') if len(tr_tags) > 2 else []
        if len(td_tags) < 2:
            print("skipped {}: unexpected profile table layout".format(matrix_id),
                  file=sys.stderr)
            continue

        class_txt = td_tags[1].get_text()
        file_out.write(matrix_id + "\t" + class_txt + "\n")
Previous
![代谢物鉴定函数](/blog/img/cover/rfunction.png)
一个函数解决所有问题......
2024-06-12
Next
![Rstudio-Server安装igraph报错解决](/blog/img/cover/rstudioerror.png)
......
2024-03-07