# Python web-scraping example: scrape second-hand housing listings from 58.com and save them to a file
import requests
from lxml import etree
# Fetch the HTML of the listing page.
url = 'https://bj.58.com/ershoufang/pn1/'
# A timeout keeps the script from hanging forever on a stalled connection, and
# raise_for_status() aborts on an HTTP error instead of parsing an error page.
response = requests.get(url, timeout=10)
response.raise_for_status()
html = response.text

# Build an lxml element tree from the HTML so it can be queried with XPath.
etree_html = etree.HTML(html)

# Parse the page data: every <li> under the "house-list-wrap" list is handled
# as one listing.
house_list = etree_html.xpath('//ul[@class="house-list-wrap"]/li')
result = []
for house in house_list:
    title_nodes = house.xpath('.//h2[@class="title"]/a/text()')
    price_nodes = house.xpath('.//div[@class="price"]/p/text()')
    # An <li> without a title or price node (presumably an ad or placeholder
    # row -- verify against the live markup) would make [0] raise IndexError,
    # so skip it rather than abort the whole run.
    if not title_nodes or not price_nodes:
        continue
    # Strip surrounding whitespace so every listing stays on a single line
    # of the output file.
    result.append(title_nodes[0].strip() + ' ' + price_nodes[0].strip())

# Save the parsed results to a text file, one listing per line.
with open('house_info.txt', 'w', encoding='utf-8') as f:
    f.writelines(item + '\n' for item in result)
# Original source: https://www.cveoy.top/t/topic/f4pw -- copyright belongs to the author; do not repost or scrape.