#file-name: pdf_download.py
import os
import requests
from bs4 import BeautifulSoup
def download_file(url, index, timeout=60):
    """Download ``url`` into the current working directory.

    The local file name is the last ``/``-separated segment of ``url`` with
    every ``%20`` replaced by ``_``.

    Args:
        url: Address of the file to fetch.
        index: Unused. It was once meant as a file-name prefix and is kept
            so existing callers keep working.
        timeout: Timeout in seconds handed to ``requests.get`` so a stalled
            server cannot block the script forever.

    Returns:
        The name of the file that was written.

    Raises:
        requests.HTTPError: If the server answers with an error status.
        requests.RequestException: For other request failures raised by
            ``requests`` (connection problems, timeouts).
    """
    local_filename = url.split('/')[-1].replace('%20', '_')
    # stream=True avoids loading the whole body into memory; the with-block
    # releases the connection even when writing the file fails.
    with requests.get(url, stream=True, timeout=timeout) as r:
        # Check the status before creating the file so that an error page
        # is never saved under the target name.
        r.raise_for_status()
        with open(local_filename, 'wb') as f:
            for chunk in r.iter_content(chunk_size=8192):
                if chunk:  # filter out keep-alive new chunks
                    f.write(chunk)
    return local_filename


root_link = "https://rockchip.fr/"
# Sections of the site to mirror. Each one is fetched from root_link + name
# and stored in a local directory of the same name, with spaces turned
# into underscores.
sub = ["ampak", "chipspark", "firefly", "geekbox", "marsboard", "radxa",
       "RK312X TRM", "RK3288 TRM"]

for i in sub:
    directory = i.replace(" ", "_")
    # An existing directory is taken to mean the section was handled by an
    # earlier run. Test the same name that is created below, otherwise
    # sections containing a space would hit os.mkdir on an existing path.
    if os.path.exists(directory):
        continue

    section_url = root_link + i
    print(section_url)
    r = requests.get(section_url, timeout=60)
    if r.status_code != 200:
        print("errors occur.")
        # Abort with a failing exit status. The directory has not been
        # created yet, so a later run will retry this section.
        raise SystemExit(1)

    os.mkdir(directory)
    # download_file writes into the current working directory.
    os.chdir(directory)
    try:
        # Name the parser explicitly so the result does not depend on which
        # optional parser packages happen to be installed.
        soup = BeautifulSoup(r.text, "html.parser")
        index = 1
        for link in soup.find_all('a'):
            href = link.get('href')
            if not href:
                # Anchors without an href have nothing to download.
                continue
            new_link = section_url + '/' + href
            # The suffix match is case-sensitive.
            if not new_link.endswith((".pdf", ".DSN", ".apk")):
                continue
            try:
                file_path = download_file(new_link, str(index))
            except requests.RequestException as err:
                # One broken link should not abort the rest of the section.
                print("download failed:" + new_link + " (" + str(err) + ")")
                continue
            print("downloading:" + new_link + " -> " + file_path)
            index += 1
    finally:
        # Always return to the parent directory, even after an error.
        os.chdir("..")
    print(i + " download finished")

print("all download finished")

  

最新文章

  1. 慕课网__css_ float
  2. Eclipse和PyDev搭建完美Python开发环境(Windows篇)
  3. django 架构点点滴滴
  4. Linux脚本执行过程重定向
  5. C# Enum Type
  6. hive-安装0.13.1(hadoop2.2.0)
  7. NPOI的版本查看
  8. 修改LiteIDE 编辑窗口的主题
  9. Cracking the coding interview
  10. C# 内存管理优化畅想----前言
  11. 1. Git 克隆代码
  12. R语言 决策树算法
  13. 现代3D图形编程学习--opengl使用不同的缓存对象(译者添加)
  14. 【读书笔记】【深入理解ES6】#5-解构:使数据访问更便捷
  15. iphone开发笔记目录
  16. java基础之修饰符和内部类
  17. 同时使用n和nvm踩到的坑
  18. Linux tmpwatch命令详解
  19. 转载 - java中接口的向上转型。和多态性
  20. Pytest+Allure环境的搭建

热门文章

  1. [编程基础] Python日志记录库logging总结
  2. CSP-S2022 游记
  3. Spark详解(09) - Spark调优
  4. python之路39 前端开始 各种标签
  5. 琐碎的想法(五)for 的前世今生
  6. pytorch 配置详细过程
  7. 「HNOI2019」校园旅行
  8. 前端基础知识-react(一)个人学习记录 _
  9. RA-Depth: Resolution Adaptive Self-Supervised Monocular Depth Estimation
  10. 12月22日内容总结——django中间件的三个了解要求的方法、基于django中间件的功能设计、cookie与session