新学习了selenium,爬一下腾讯招聘
 from lxml import etree
from selenium import webdriver
import pymysql
def Geturl(fullurl):
    """Collect the detail-page URLs of the postings listed on one page.

    Loads ``fullurl`` in the module-level ``browser``, parses the page
    source the browser reports with lxml, and reads the ``href`` of every
    link found in the ``#position`` table.

    Args:
        fullurl: URL of the listing page to load.

    Returns:
        A list of strings, each ``'https://hr.tencent.com/'`` followed by one
        extracted ``href`` value, in the order the XPath query returned them.
    """
    browser.get(fullurl)
    listing_tree = etree.HTML(browser.page_source)
    # The hrefs are prefixed with the site root below to form full URLs.
    hrefs = listing_tree.xpath(
        '//*[@id="position"]/div[1]/table/tbody/tr/td/a/@href'
    )
    return ['https://hr.tencent.com/' + href for href in hrefs]
def Getinfo(zp_url_list):
    """Scrape every posting page and store its fields in MySQL.

    For each URL the page is loaded in the module-level ``browser``, parsed
    with lxml, and five fields (title, location, type, headcount and the
    requirement bullet list) are read via XPath. Each posting is inserted
    into the ``txzp_info`` table, committed, and echoed to stdout.

    A single database connection is shared by the whole batch instead of
    being opened and closed once per posting; it is always closed on exit,
    including when a page fails to parse.

    Args:
        zp_url_list: Posting detail-page URLs to visit.

    Raises:
        IndexError: If a page lacks the title, location, type or headcount
            element (the first XPath match is taken unconditionally).
    """
    if not zp_url_list:
        # Nothing to scrape: do not open a database connection at all.
        return

    sql = (
        "INSERT INTO `txzp_info` (`title`, `location`,`type`,`num`,`need`) "
        "VALUES (%s,%s,%s,%s, %s)"
    )
    connection = pymysql.connect(host='localhost', user='root', password='', db='txzp', )
    try:
        for zp_url in zp_url_list:
            browser.get(zp_url)
            zp_ele = etree.HTML(browser.page_source)

            zp_info_title = str(zp_ele.xpath('//*[@id="sharetitle"]/text()')[0])
            zp_info_location = str(zp_ele.xpath('//*[@id="position_detail"]/div/table/tbody/tr[2]/td[1]/text()')[0])
            zp_info_type = str(zp_ele.xpath('//*[@id="position_detail"]/div/table/tbody/tr[2]/td[2]/text()')[0])
            zp_info_num = str(zp_ele.xpath('//*[@id="position_detail"]/div/table/tbody/tr[2]/td[3]/text()')[0])
            # NOTE: this stores the Python repr of the whole list of <li>
            # texts (e.g. "['a', 'b']"), not a joined string.
            zp_info_need = str(zp_ele.xpath('//*[@id="position_detail"]/div/table/tbody/tr[3]/td/ul/li/text()'))

            with connection.cursor() as cursor:
                cursor.execute(sql, (zp_info_title, zp_info_location, zp_info_type, zp_info_num, zp_info_need))
            # Commit per posting so rows already scraped survive a later failure.
            connection.commit()

            print(zp_info_title, zp_info_location, zp_info_type, zp_info_num, zp_info_need)
    finally:
        connection.close()
if __name__ == '__main__':
    # Script entry point: ask how many listing pages to scrape, then walk
    # them one by one, collecting posting links and storing each posting.
    #
    # ``browser`` is deliberately a module-level name: Geturl and Getinfo
    # read it as a global.
    browser = webdriver.Chrome()
    try:
        pags = int(input('需要几页?'))
        # Listing-page URL template; each page advances ``start`` by 10.
        url = 'https://hr.tencent.com/position.php?keywords=&tid=0&start={}'
        for i in range(0, pags):
            fullurl = url.format(str(i*10))
            zp_url_list = Geturl(fullurl)
            Getinfo(zp_url_list)
    finally:
        # quit() ends the whole WebDriver session; close() would only close
        # the current window. Running it in ``finally`` also cleans up when
        # the input is invalid or a page fails mid-scrape.
        browser.quit()

最新文章

  1. Android 滑动菜单框架--SwipeMenuListView框架完全解析
  2. C语言初级进阶1
  3. iOS-使用Xcode拉伸图片
  4. BZOJ3058 四叶草魔杖
  5. 弹出框、遮罩层demo
  6. Spring再学习
  7. fidder从基础到熟练
  8. iter迭代器的应用
  9. AHB/APB简介
  10. mycat使用之MySQL单库分表及均分数据
  11. CSS3效果:波浪效果
  12. android studio报Resolved versions for app (26.1.0) and test app (27.1.1)differ. 错误的解决办法
  13. JAVA中各种日期表示字母
  14. caffe SSD目标检测lmdb数据格式制作
  15. Day1-Python基础--数据类型
  16. Centos7 Nginx 开机启动
  17. 数据库连接池DBUtils使用
  18. PAT甲题题解-1077. Kuchiguse (20)-找相同后缀
  19. 【ElasticSearch】ES5新特性-keyword-text类型-查询区别
  20. windows7安装node

热门文章

  1. Access 64-bit HKLM\Software Registry by 32-bit C#.NET Application
  2. 通过CXF,开发soap协议接口
  3. VMware安装VMware tool后mount /dev/cdrom /mnt成功挂载含rpm包的镜像
  4. 在windows平台上构建自己的PHP(php5.3+)
  5. 代码大全读书笔记 Part 1
  6. LevelDB源码分析之:arena内存管理
  7. BZOJ2337:[HNOI2011]XOR和路径(高斯消元)
  8. UVA12034 Race
  9. rc.local 开机自启脚本无法启动
  10. ecshop 中如何禁用右键和F12