课时28 在MongoDB中筛选房源

'''
from pymongo import MongoClient
from bs4 import BeautifulSoup
import requests

# Scrape listing titles and prices from three search-result pages, store each
# pair in MongoDB, then print every stored record priced at 500 or more.

host = 'localhost'
port = 27017

# Records are written to (and later read back from) the 'sheet' collection
# of the 'test' database on the MongoDB server at host:port.
client = MongoClient(host, port)
db = client['test']
sheet = db['sheet']

# One URL per search-result page, for page numbers 1 to 3.
urls = ['http://bj.xiaozhu.com/search-duanzufang-p{}-0/'.format(i) for i in range(1, 4)]
print(urls)

for url in urls:
    # A timeout keeps the script from blocking forever on an unresponsive
    # server; requests raises an exception instead of hanging.
    wb_data = requests.get(url, timeout=10)
    soup = BeautifulSoup(wb_data.text, 'lxml')
    titles = soup.select('#page_list > ul > li > div.result_btm_con.lodgeunitname > div > a > span')
    prices = soup.select('#page_list > ul > li > div.result_btm_con.lodgeunitname > span.result_price > i')

    # zip pairs the i-th title with the i-th price and stops at the shorter
    # of the two lists.
    for title, price in zip(titles, prices):
        data = {
            'title': title.get_text(),
            'price': price.get_text(),
        }

        # Print before inserting so the output shows only the scraped fields.
        print(data)
        sheet.insert_one(data)
print('----------------------------------------')
# Prices are stored as text, so each one is converted to an integer before
# being compared against the 500 threshold.
for record in sheet.find():
    try:
        price_value = int(record['price'])
    except (KeyError, TypeError, ValueError):
        # The collection may hold documents with a missing or non-numeric
        # price; skip them rather than aborting the whole report.
        continue
    if price_value >= 500:
        print(record)

'''

最后编辑于
©著作权归作者所有,转载或内容合作请联系作者
平台声明:文章内容(如有图片或视频亦包括在内)由作者上传并发布,文章内容仅代表作者本人观点,简书系信息发布平台,仅提供信息存储服务。

推荐阅读更多精彩内容