爬取人人贷网站

# -*- coding: UTF-8 -*- 
import bs4
import sys 
reload(sys) 
sys.setdefaultencoding("utf-8") 
import requests
from bs4 import BeautifulSoup
import json

url="https://www.renrendai.com/loan#page-1"
def gethtml(url):
    try:
        r=requests.get(url)
        r.raise_for_status()
        return r.text
    except:
        print "连接失败"

def parsehtml(html):
    soup=BeautifulSoup(html,"html.parser")
    a=soup(id="loan-list-rsp")
    mess=[]
    for i in a:   #type(i)=<class 'bs4.element.Tag'>
        b=str(i.string)
        htmllist=json.loads(b)["data"]["loans"]
        for j in htmllist:
            mess.append([j["loanId"],j["title"],j["amount"],j["interest"],j["months"],j["startTime"]])
    return mess

def showinfo(num,mess):
    tplt="{:^10}\t{:^10}\t{:^10}\t{:^10}\t{:^10}\t{:^10}"
    print (tplt.format("订单标的","借款标题","金额","利息","期限","募资时间"))  #括号不能遗漏,否则在下一步循环报错
    for i in range(num):
        cc=mess[i]
        print tplt.format(cc[0],cc[1],cc[2],cc[3],cc[4],cc[5])

def main():
    html=gethtml(url)
    mess=parsehtml(html)
    showinfo(20,mess)

main()
最后编辑于
©著作权归作者所有,转载或内容合作请联系作者
平台声明:文章内容(如有图片或视频亦包括在内)由作者上传并发布,文章内容仅代表作者本人观点,简书系信息发布平台,仅提供信息存储服务。

推荐阅读更多精彩内容