『姵来晓晓看娱乐』python3快速爬取房源信息,并存入mysql数据库,超详细( 二 )
文章图片
以下为完整代码:
"""Scrape second-hand housing listings from tianjin.anjuke.com into MySQL.

The script walks listing pages 1-10, pulls five kinds of fields out of each
page with regular expressions and inserts one row per listing into the
``shanghai_admin`` table of the local ``anjuke`` database.

The original article also sketched (commented out) a Selenium-driven variant
and a proxy-pool variant (``http://localhost:5555/random``); neither was
active, so they are not reproduced here.
"""
import re
from typing import List, Optional, Tuple

import pymysql
import requests
from bs4 import BeautifulSoup  # noqa: F401  (imported by the original script)

BASE_URL = 'https://tianjin.anjuke.com/sale/'
USER_AGENT = (
    'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 '
    '(KHTML, like Gecko) Chrome/79.0.3945.130 Safari/537.36'
)
FIRST_PAGE = 1
LAST_PAGE = 10
REQUEST_TIMEOUT = 10  # seconds; without a timeout requests.get can block forever

# NOTE(review): the HTML markup inside the original regular expressions was
# stripped when this article was extracted, so only the fragments below
# survive. They must be restored from the live page source before the script
# can produce meaningful rows. TODO: fill in the real patterns.
IMAGE_PATTERN: Optional[str] = r''             # listing image URL
TITLE_PATTERN: Optional[str] = r'(.*?)'        # listing description / title
# The details pattern is missing from the article entirely. The script reads
# five groups from each match; judging by the variable names they are room
# layout, area, floor, build year and location, in that order (unconfirmed).
DETAILS_PATTERN: Optional[str] = None
TOTAL_PRICE_PATTERN: Optional[str] = r'(.*?)'  # total price
UNIT_PRICE_PATTERN: Optional[str] = r'(.*?)'   # price per unit area

# Pattern values that are known extraction residue rather than real patterns.
_PLACEHOLDER_PATTERNS = ('', '(.*?)')

# Column order matches the original statement: image, description, location,
# total price, unit price, rooms, area, floor, build year.
INSERT_SQL = (
    'INSERT INTO shanghai_admin '
    'VALUES (%s, %s, %s, %s, %s, %s, %s, %s, %s)'
)

Row = Tuple[str, str, str, str, str, str, str, str, str]


def _check_patterns() -> None:
    """Raise RuntimeError while any extraction pattern is still a placeholder.

    An empty or bare ``(.*?)`` pattern matches at every position of the page,
    which would flood the table with empty rows, so the script refuses to run
    until the real patterns are restored.
    """
    patterns = {
        'IMAGE_PATTERN': IMAGE_PATTERN,
        'TITLE_PATTERN': TITLE_PATTERN,
        'DETAILS_PATTERN': DETAILS_PATTERN,
        'TOTAL_PRICE_PATTERN': TOTAL_PRICE_PATTERN,
        'UNIT_PRICE_PATTERN': UNIT_PRICE_PATTERN,
    }
    unrestored = [
        name
        for name, pattern in patterns.items()
        if pattern is None or pattern in _PLACEHOLDER_PATTERNS
    ]
    if unrestored:
        raise RuntimeError(
            'regex patterns not restored: ' + ', '.join(unrestored)
        )


def page_url(page: int) -> str:
    """Return the listing URL for *page* (page 1 has no ``pN`` suffix)."""
    if page == 1:
        return BASE_URL
    return '%sp%d/#filtersort' % (BASE_URL, page)


def fetch_page(page: int) -> str:
    """Download listing page *page* and return its decoded HTML text."""
    url = page_url(page)
    # The original sends the page's own URL as the referer on every page.
    headers = {'referer': url, 'user-agent': USER_AGENT}
    response = requests.get(url, headers=headers, timeout=REQUEST_TIMEOUT)
    return response.text


def parse_listings(html_text: str) -> List[Row]:
    """Extract one row per listing from *html_text*, in INSERT column order.

    The five field lists are combined with ``zip``, so a page on which the
    patterns match a different number of times yields only the complete
    listings instead of raising ``IndexError``.
    """
    images = re.findall(IMAGE_PATTERN, html_text)
    titles = re.findall(TITLE_PATTERN, html_text)
    details = re.findall(DETAILS_PATTERN, html_text)
    total_prices = re.findall(TOTAL_PRICE_PATTERN, html_text)
    unit_prices = re.findall(UNIT_PRICE_PATTERN, html_text)
    print(len(images))
    return [
        (image, title, location, total, unit, rooms, area, floor, built)
        for image, title, (rooms, area, floor, built, location), total, unit
        in zip(images, titles, details, total_prices, unit_prices)
    ]


def save_listings(db, rows: List[Row]) -> None:
    """Insert *rows* through connection *db* and commit once.

    Values are passed as query parameters so quotes in scraped text cannot
    break or inject into the statement.
    """
    if not rows:
        return
    with db.cursor() as cursor:
        cursor.executemany(INSERT_SQL, rows)
    db.commit()


def main() -> None:
    """Scrape pages FIRST_PAGE..LAST_PAGE and store every listing found."""
    _check_patterns()
    # Keyword arguments: PyMySQL 1.0+ no longer accepts these positionally.
    db = pymysql.connect(
        host='localhost', user='root', password='', database='anjuke'
    )
    try:
        for page in range(FIRST_PAGE, LAST_PAGE + 1):
            print('这是第' + str(page) + '页')
            save_listings(db, parse_listings(fetch_page(page)))
    finally:
        # Close the single shared connection even if a page fails.
        db.close()


if __name__ == '__main__':
    main()
- 豆豆看娱乐乐■阅读时间和文章长短有关,小金车系统定时任务50篇
- 「深扒娱乐圈圈」可拆卸式柔性保温套功不可没!,显著减少机器热损失
- [忧家娱乐]搭载i9-10980HK处理器,戴尔XPS15曝光
- 忧家娱乐▲Ace放弃挣扎价格跳水!,骁龙865版OPPO Reno Ace2曝光,Reno
- 忧家娱乐■魅族16T发布新版本?有阳光的地方就有电延长续航
- 忧家娱乐:很快上线,魅族:16T日光橙太阳能充电版
- #忧家娱乐#所见即所得!明基SW系列专业摄影修图显示器天猫家装节推荐
- 「忧家娱乐」5G版荣耀30S正式发布,荣耀20大米价提前砸场!,麒麟820
- 忧家娱乐▲荣耀20泪流满面加速降价!,麒麟820+四摄荣耀30S正式发布
- 「忧家娱乐」i9-10980HK+4K屏+64G内存,预计本月发布,戴尔XPS15曝光