Python爬取CST信号通路图片
按研究分类
CST信号通路 网站为https://www.cellsignal.cn/pathways/
爬取前要先查看 robots.txt,遵守爬虫协议,避免违规爬取。
输入网址https://www.cellsignal.cn/robots.txt
查看后可知,/pathways 目录不在 Disallow 列表中,可以爬取;robots.txt 的具体内容见文末。
爬取结果展示:爬取73份PDF,耗时 13min15.2s (增加了休眠,防止反爬)
合并后
爬取单个PDF
采用ipynb方式运行
代码如下:
精简版:
import requests
import re
import time
import random
from bs4 import BeautifulSoup
from urllib.request import urlopen
# Listing page that groups every CST pathway by research area.
url = r"https://www.cellsignal.cn/pathways/by-research-area"
# Prefix under which the individual pathway pages live.
url_root = r"https://www.cellsignal.cn/pathways/"

# Seconds to wait for a single HTTP response before giving up, so one
# stalled connection cannot hang the whole crawl.
REQUEST_TIMEOUT = 30

# Browser-like headers used when fetching a pathway page.
PAGE_HEADERS = {
    "User-Agent": "Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/55.0.2883.87 Safari/537.36"}

# Browser-like headers used when downloading the PDF itself.
DOWNLOAD_HEADERS = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/96.0.4664.45 Safari/537.36'
}


def extract_pathway_urls(listing_html, root=url_root):
    """Return the pathway page URLs linked from the listing markup.

    Args:
        listing_html: Markup (as text) of the ``accordionGroup`` blocks.
        root: Prefix prepended to the last path segment of every link.

    Returns:
        Page URLs in first-seen order, without duplicates.  The same
        pathway is listed under several research areas, so duplicates are
        dropped to avoid fetching and downloading it more than once.
    """
    links = re.findall('<li><a href="(.*?)">(.*?)</a></li>', listing_html, re.S)
    pages = (root + str(href.split('/')[-1]) for href, _label in links)
    return list(dict.fromkeys(pages))


def find_pdf_links(page_html):
    """Return the href of every "view PDF" anchor found in a pathway page.

    The href is matched up to its closing quote and any further attributes
    of the anchor are skipped, so anchors that carry extra ``data-en-*``
    attributes still yield a clean URL.
    """
    return re.findall(
        '<a target="_blank" id="pathway_pdf" href="([^"]*)"[^>]*>查看 PDF 文件</a>',
        page_html,
    )


def pdf_filename(link):
    """Return the local file name for a PDF link (its last URL segment)."""
    return link.split('/')[-1]


def main():
    """Crawl the listing page and save every linked pathway PDF.

    Files are written to the current working directory.  Pages without a
    PDF link are skipped, and a PDF that was already saved in this run is
    not downloaded again.
    """
    # Fetch and parse the listing page; stop early if it cannot be loaded.
    response = requests.get(url, timeout=REQUEST_TIMEOUT)
    response.raise_for_status()
    soup = BeautifulSoup(response.content, 'html.parser')
    # The pathway links live inside the "accordionGroup" div elements.
    target_divs = soup.find_all('div', attrs={'class': 'accordionGroup'})

    downloaded = set()
    for page_url in extract_pathway_urls(str(target_divs)):
        # Look up the PDF link on the pathway page.
        try:
            req = requests.get(url=page_url, headers=PAGE_HEADERS, timeout=REQUEST_TIMEOUT)
        except requests.RequestException as err:
            print(f"Skipping {page_url}: {err}")
            continue
        req.encoding = 'utf-8'
        results = find_pdf_links(req.text)
        print(results)
        if not results:
            continue
        link = results[0]
        if link in downloaded:
            continue

        # Download the PDF; never save an error response as a .pdf file.
        try:
            r = requests.get(link, headers=DOWNLOAD_HEADERS, timeout=REQUEST_TIMEOUT)
            r.raise_for_status()
        except requests.RequestException as err:
            print(f"Download failed for {link}: {err}")
        else:
            # Save into the current working directory.
            with open(pdf_filename(link), mode="wb") as f:
                f.write(r.content)  # write the PDF bytes to disk
            downloaded.add(link)

        # Pause 1 to 4 seconds (both ends inclusive) between downloads to
        # stay polite towards the server.
        time.sleep(random.randint(1, 4))


if __name__ == "__main__":
    main()
合并PDF
采用文件运行方式
import os
from PyPDF2 import PdfMerger
# Directory that holds the downloaded single-page PDF files.
pdf_directory = r'E:\Coding\python_gzlab_docu\pachong_gz_vs\cst-signaling'
# Name of the merged PDF; a relative name is written to the current
# working directory.
output_filename = '合并后的 PDF 文件名称.pdf'


def creation_time(path):
    """Return the creation timestamp of *path* as reported by ``os.stat``.

    ``st_birthtime`` is used where the platform provides it; otherwise the
    function falls back to ``st_ctime``, which is what the original script
    sorted by.
    """
    info = os.stat(path)
    birth = getattr(info, "st_birthtime", None)
    return info.st_ctime if birth is None else birth


def collect_pdf_files(directory, exclude=None):
    """Return the PDF paths in *directory*, oldest first.

    Args:
        directory: Folder to scan (not recursive).
        exclude: Optional path to leave out, typically the merged output,
            so that a re-run does not merge the previous result again.

    Returns:
        Paths joined with *directory*, sorted by ``creation_time``.
    """
    skip = None
    if exclude is not None:
        skip = os.path.normcase(os.path.abspath(exclude))
    candidates = [
        os.path.join(directory, filename)
        for filename in os.listdir(directory)
        if filename.lower().endswith('.pdf')
    ]
    kept = [
        path for path in candidates
        if os.path.normcase(os.path.abspath(path)) != skip
    ]
    return sorted(kept, key=creation_time)


def main():
    """Merge every PDF in ``pdf_directory`` into ``output_filename``."""
    sorted_pdf_files = collect_pdf_files(pdf_directory, exclude=output_filename)
    if not sorted_pdf_files:
        print(f"No PDF files found in {pdf_directory}; nothing to merge.")
        return

    merger = PdfMerger()
    try:
        # Append the files one by one, then write the merged document.
        for pdf_file in sorted_pdf_files:
            merger.append(pdf_file)
        merger.write(output_filename)
    finally:
        # Release the open file handles even when a PDF fails to load.
        merger.close()
    print(f"已成功将单页 PDF 文件按创建时间顺序合并为 {output_filename}。")


if __name__ == "__main__":
    main()
注:
爬虫协议
User-agent: *
Disallow: /account
Disallow: /order
Disallow: /product/include
Disallow: /product/protocol.jsp
Disallow: /ajax
Disallow: /checkout/include
Disallow: /include
Disallow: /product/include
Disallow: /product/productDetail.jsp
Disallow: /product-comparison
Disallow: /compare-products.jsp
Disallow: /search/include
Disallow: /punchout
Disallow: /test
Disallow: /*?country=
Disallow: /productsitemap-tp.xml
Sitemap: https://www.cellsignal.cn/sitemap.xml
User-agent: AspiegelBot
Disallow: /
User-agent: cognitiveseo
Disallow: /
User-agent: Dotbot
Disallow: /
User-agent: JamesBOT
Disallow: /
User-agent: Metauri
Disallow: /
User-agent: MauiBot
Disallow: /
User-agent: MJ12Bot
Disallow: /
User-agent: Petalbot
Disallow: /
User-agent: SplitSignalBot
Disallow: /
User-agent: spyfu
Disallow: /
User-agent: WinHTTrack
Disallow: /
爬虫全部代码
全部代码:含注释
import requests
import re
import time
import random
from bs4 import BeautifulSoup
from urllib.request import urlopen
import requests
from bs4 import BeautifulSoup
import sys  # present in the original script; not used by the code in this section

# Listing page that groups every CST pathway by research area.
url = r"https://www.cellsignal.cn/pathways/by-research-area"
# Only the "https://www.cellsignal.cn/pathways/" prefix of the listing URL is
# kept; the individual pathway pages live directly underneath it.
url_root = r"https://www.cellsignal.cn/pathways/"

# Seconds to wait for a single HTTP response before giving up, so one
# stalled connection cannot hang the whole crawl.
REQUEST_TIMEOUT = 30

# Browser-like headers used when fetching a pathway page.
PAGE_HEADERS = {
    "User-Agent": "Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/55.0.2883.87 Safari/537.36"}

# Browser-like headers used when downloading the PDF itself.
DOWNLOAD_HEADERS = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/96.0.4664.45 Safari/537.36'
}


def extract_pathway_urls(listing_html, root=url_root):
    """Return the pathway page URLs linked from the listing markup.

    A listing entry looks like
    ``<li><a href="/pathways/adherens-junction-dynamics-pathway">...</a></li>``.
    The text after the last slash of the href is appended to *root*, giving
    e.g. ``https://www.cellsignal.cn/pathways/adherens-junction-dynamics-pathway``.

    Args:
        listing_html: Markup (as text) of the ``accordionGroup`` blocks.
        root: Prefix prepended to the last path segment of every link.

    Returns:
        Page URLs in first-seen order, without duplicates.  The same
        pathway is listed under several research areas, so duplicates are
        dropped to avoid fetching and downloading it more than once.
    """
    links = re.findall('<li><a href="(.*?)">(.*?)</a></li>', listing_html, re.S)
    pages = (root + str(href.split('/')[-1]) for href, _label in links)
    return list(dict.fromkeys(pages))


def find_pdf_links(page_html):
    """Return the href of every "view PDF" anchor found in a pathway page.

    Two anchor shapes are handled:

    * ``<a target="_blank" id="pathway_pdf" href="...">查看 PDF 文件</a>``
    * the same anchor with extra ``data-en-label`` / ``data-en-action`` /
      ``data-en-category`` attributes after the href.

    The href is matched up to its closing quote and any further attributes
    are skipped, so both shapes yield a clean URL.
    """
    return re.findall(
        '<a target="_blank" id="pathway_pdf" href="([^"]*)"[^>]*>查看 PDF 文件</a>',
        page_html,
    )


def pdf_filename(link):
    """Return the local file name for a PDF link (its last URL segment)."""
    return link.split('/')[-1]


def main():
    """Crawl the listing page and save every linked pathway PDF.

    Files are written to the current working directory.  Pages without a
    PDF link are skipped, and a PDF that was already saved in this run is
    not downloaded again.
    """
    # Fetch and parse the listing page; stop early if it cannot be loaded.
    response = requests.get(url, timeout=REQUEST_TIMEOUT)
    response.raise_for_status()
    soup = BeautifulSoup(response.content, 'html.parser')
    # The pathway links live inside the "accordionGroup" div elements.
    target_divs = soup.find_all('div', attrs={'class': 'accordionGroup'})

    downloaded = set()
    for page_url in extract_pathway_urls(str(target_divs)):
        # Look up the PDF link on the pathway page.
        try:
            req = requests.get(url=page_url, headers=PAGE_HEADERS, timeout=REQUEST_TIMEOUT)
        except requests.RequestException as err:
            print(f"Skipping {page_url}: {err}")
            continue
        req.encoding = 'utf-8'
        results = find_pdf_links(req.text)
        print(results)
        if not results:
            continue
        link = results[0]
        name = pdf_filename(link)
        print(link)
        print(name)
        if link in downloaded:
            continue

        # Download the PDF; never save an error response as a .pdf file.
        try:
            r = requests.get(link, headers=DOWNLOAD_HEADERS, timeout=REQUEST_TIMEOUT)
            r.raise_for_status()
        except requests.RequestException as err:
            print(f"Download failed for {link}: {err}")
        else:
            # Save into the current working directory.
            with open(name, mode="wb") as f:
                f.write(r.content)  # write the PDF bytes to disk
            downloaded.add(link)

        # Pause 1 to 4 seconds (both ends inclusive) between downloads to
        # stay polite towards the server.
        time.sleep(random.randint(1, 4))


if __name__ == "__main__":
    main()
运行日志
[]
['https://media.cellsignal.cn/www/pdfs/science/pathways/Adherens_Junction.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Adherens_Junction.pdf
Adherens_Junction.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Contribution_of_Extracellular_Matrix_to_EMT.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Contribution_of_Extracellular_Matrix_to_EMT.pdf
Contribution_of_Extracellular_Matrix_to_EMT.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Contribution_of_Soluble_Factors_to_EMT.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Contribution_of_Soluble_Factors_to_EMT.pdf
Contribution_of_Soluble_Factors_to_EMT.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Tumor_Angiogenesis.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Tumor_Angiogenesis.pdf
Tumor_Angiogenesis.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/fibrosis-signaling.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/fibrosis-signaling.pdf
fibrosis-signaling.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Regulation_Actin.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Regulation_Actin.pdf
Regulation_Actin.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Regulation_Microtubule.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Regulation_Microtubule.pdf
Regulation_Microtubule.pdf
[]
['https://media.cellsignal.cn/www/pdfs/science/pathways/DNA-Damage-Response.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/DNA-Damage-Response.pdf
DNA-Damage-Response.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Cell_Cycle_G2M_DNA.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Cell_Cycle_G2M_DNA.pdf
Cell_Cycle_G2M_DNA.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Cell_Cycle_G1S.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Cell_Cycle_G1S.pdf
Cell_Cycle_G1S.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/senescence-signaling.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/senescence-signaling.pdf
senescence-signaling.pdf
[]
['https://media.cellsignal.cn/www/pdfs/science/pathways/Apoptosis_Overview.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Apoptosis_Overview.pdf
Apoptosis_Overview.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Death_Receptor.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Death_Receptor.pdf
Death_Receptor.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Apoptosis_Mitochondrial.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Apoptosis_Mitochondrial.pdf
Apoptosis_Mitochondrial.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Apoptosis_Inhibition.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Apoptosis_Inhibition.pdf
Apoptosis_Inhibition.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/necrotic-cell-death.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/necrotic-cell-death.pdf
necrotic-cell-death.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Autophagy.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Autophagy.pdf
Autophagy.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/senescence-signaling.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/senescence-signaling.pdf
senescence-signaling.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Autophagy.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Autophagy.pdf
Autophagy.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Insulin_Receptor.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Insulin_Receptor.pdf
Insulin_Receptor.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Warburg_Effect.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Warburg_Effect.pdf
Warburg_Effect.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Hypoxia.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Hypoxia.pdf
Hypoxia.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/glutamine-metabolism.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/glutamine-metabolism.pdf
glutamine-metabolism.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/mTor.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/mTor.pdf
mTor.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/AMPK.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/AMPK.pdf
AMPK.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/senescence-signaling.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/senescence-signaling.pdf
senescence-signaling.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/fibrosis-signaling.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/fibrosis-signaling.pdf
fibrosis-signaling.pdf
[]
['https://media.cellsignal.cn/www/pdfs/science/pathways/Wnt_beta_Catenin.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Wnt_beta_Catenin.pdf
Wnt_beta_Catenin.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/TGF_beta.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/TGF_beta.pdf
TGF_beta.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Hedgehog.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Hedgehog.pdf
Hedgehog.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Notch.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Notch.pdf
Notch.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Hippo_Signaling.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Hippo_Signaling.pdf
Hippo_Signaling.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Angiogenesis.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Angiogenesis.pdf
Angiogenesis.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/esc_pluripotency.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/esc_pluripotency.pdf
esc_pluripotency.pdf
[]
['https://media.cellsignal.cn/www/pdfs/science/pathways/DNA_Methylation.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/DNA_Methylation.pdf
DNA_Methylation.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Histone_Methylation.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Histone_Methylation.pdf
Histone_Methylation.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Protein_Acetylation.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Protein_Acetylation.pdf
Protein_Acetylation.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Crosstalk_PostTrans.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Crosstalk_PostTrans.pdf
Crosstalk_PostTrans.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Epigenetic-Histone-H2A-H2B-H4.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Epigenetic-Histone-H2A-H2B-H4.pdf
Epigenetic-Histone-H2A-H2B-H4.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Epigenetic-Histone-H3.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Epigenetic-Histone-H3.pdf
Epigenetic-Histone-H3.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/atp-dependent-chromatin-remodeling-complexes.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/atp-dependent-chromatin-remodeling-complexes.pdf
atp-dependent-chromatin-remodeling-complexes.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Nuclear_Receptor.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Nuclear_Receptor.pdf
Nuclear_Receptor.pdf
[]
['https://media.cellsignal.cn/www/pdfs/science/pathways/Protein_Kinase.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Protein_Kinase.pdf
Protein_Kinase.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Phospholipase.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Phospholipase.pdf
Phospholipase.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/gpcr-overview.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/gpcr-overview.pdf
gpcr-overview.pdf
[]
['https://media.cellsignal.cn/www/pdfs/science/pathways/Toll_Like.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Toll_Like.pdf
Toll_Like.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Jak_Stat_IL_6.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Jak_Stat_IL_6.pdf
Jak_Stat_IL_6.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/T_Cell_Receptor.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/T_Cell_Receptor.pdf
T_Cell_Receptor.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/NF_kappaB.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/NF_kappaB.pdf
NF_kappaB.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Cell-Intrinsic-Innate-Immunity-Signaling.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Cell-Intrinsic-Innate-Immunity-Signaling.pdf
Cell-Intrinsic-Innate-Immunity-Signaling.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/B_Cell_Antigen.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/B_Cell_Antigen.pdf
B_Cell_Antigen.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/inflammasome.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/inflammasome.pdf
inflammasome.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Immune-Cell-Markers-Human.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Immune-Cell-Markers-Human.pdf
Immune-Cell-Markers-Human.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Immune-Cell-Markers-Mouse.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Immune-Cell-Markers-Mouse.pdf
Immune-Cell-Markers-Mouse.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Immune-Checkpoint.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Immune-Checkpoint.pdf
Immune-Checkpoint.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/fibrosis-signaling.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/fibrosis-signaling.pdf
fibrosis-signaling.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/car-signaling-networks.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/car-signaling-networks.pdf
car-signaling-networks.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/rheumatoid-arthritis.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/rheumatoid-arthritis.pdf
rheumatoid-arthritis.pdf
[]
['https://media.cellsignal.cn/www/pdfs/science/pathways/ErbB_HER.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/ErbB_HER.pdf
ErbB_HER.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/SAPK_JNK.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/SAPK_JNK.pdf
SAPK_JNK.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/MAPK_ERK_Growth.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/MAPK_ERK_Growth.pdf
MAPK_ERK_Growth.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/gpcr-overview.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/gpcr-overview.pdf
gpcr-overview.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/MAPK_p38.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/MAPK_p38.pdf
MAPK_p38.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/AMPK.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/AMPK.pdf
AMPK.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/mTor.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/mTor.pdf
mTor.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Akt_PKB.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Akt_PKB.pdf
Akt_PKB.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/phosphoinositide-lipid-signaling.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/phosphoinositide-lipid-signaling.pdf
phosphoinositide-lipid-signaling.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Protein_Kinase.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Protein_Kinase.pdf
Protein_Kinase.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Insulin_Receptor.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Insulin_Receptor.pdf
Insulin_Receptor.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Translation_eIF_4.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Translation_eIF_4.pdf
Translation_eIF_4.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Jak_Stat_IL_6.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Jak_Stat_IL_6.pdf
Jak_Stat_IL_6.pdf
[]
['https://media.cellsignal.cn/www/pdfs/science/pathways/gpcr-overview.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/gpcr-overview.pdf
gpcr-overview.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/trem2-signaling.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/trem2-signaling.pdf
trem2-signaling.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Vesicle_Trafficking.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Vesicle_Trafficking.pdf
Vesicle_Trafficking.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Molecular_and_Cellular_Biology_of_Alzheimers_Disease.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Molecular_and_Cellular_Biology_of_Alzheimers_Disease.pdf
Molecular_and_Cellular_Biology_of_Alzheimers_Disease.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Genetics-of-AD_web-handout.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Genetics-of-AD_web-handout.pdf
Genetics-of-AD_web-handout.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Dopamine_Parkinsons.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Dopamine_Parkinsons.pdf
Dopamine_Parkinsons.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Neuronal_Markers.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Neuronal_Markers.pdf
Neuronal_Markers.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/post-synaptic-signaling.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/post-synaptic-signaling.pdf
post-synaptic-signaling.pdf
[]
['https://media.cellsignal.cn/www/pdfs/science/pathways/Akt_PKB.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Akt_PKB.pdf
Akt_PKB.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/phosphoinositide-lipid-signaling.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/phosphoinositide-lipid-signaling.pdf
phosphoinositide-lipid-signaling.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/MAPK_ERK_Growth.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/MAPK_ERK_Growth.pdf
MAPK_ERK_Growth.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/MAPK_p38.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/MAPK_p38.pdf
MAPK_p38.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/gpcr-overview.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/gpcr-overview.pdf
gpcr-overview.pdf
[]
['https://media.cellsignal.cn/www/pdfs/science/pathways/m6a-rna.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/m6a-rna.pdf
m6a-rna.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/rna-lifecycle.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/rna-lifecycle.pdf
rna-lifecycle.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Translation_eIF_4.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Translation_eIF_4.pdf
Translation_eIF_4.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Translation_eIF_2.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Translation_eIF_2.pdf
Translation_eIF_2.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Stress-Granule-PWHO-11x16.5.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Stress-Granule-PWHO-11x16.5.pdf
Stress-Granule-PWHO-11x16.5.pdf
['https://media.cellsignal.cn/www/pdfs/science/pathways/Translation_Overview.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Translation_Overview.pdf
Translation_Overview.pdf
[]
[]
[]
['https://media.cellsignal.cn/www/pdfs/science/pathways/Ubiquitin_Proteasome.pdf']
https://media.cellsignal.cn/www/pdfs/science/pathways/Ubiquitin_Proteasome.pdf
Ubiquitin_Proteasome.pdf
更新,改进
2024.10.25-01:28
可以在文件名前加上index方便排序
重新运行耗时 5m1.2s,共 91 份 PDF(加上序号后,出现在多个研究分类下的同名 PDF 不再互相覆盖,所以比之前的 73 份多)。
# Excerpt from the body of the download loop: skip pages on which no PDF link was found.
if not results:
continue
# Running counter of pages that yielded a PDF link; used as a file-name prefix.
# NOTE(review): `index` must be initialised before the loop (presumably index = 0);
# that line is not part of this excerpt.
index = index + 1
link = results[0]
# Prefix the PDF's own file name (last URL segment) with the counter,
# e.g. "1-Adherens_Junction.pdf" if the counter starts at 0.
name = str(index) + "-" + results[0].split('/')[-1]