第二讲作业

# 酷狗歌曲榜单TOP500

import requests

# Request headers attached to every page fetch; the User-Agent value
# identifies the client as a desktop Chrome browser.
headers = {
  'User-Agent': (
    'Mozilla/5.0 (Windows NT 6.1; WOW64) '
    'AppleWebKit/537.36 (KHTML, like Gecko) '
    'Chrome/49.0.2623.87 Safari/537.36'
  ),
}

from lxml import etree

import xlwt


def get_info(url):
  """Fetch one Kugou ranking page and print rank, singer, song and duration.

  One line is printed per list entry found on the page. Entries that lack
  any of the expected nodes are skipped instead of raising IndexError.

  Args:
    url: Address of the ranking page to download.
  """
  # A timeout keeps one stalled connection from hanging the whole crawl.
  res = requests.get(url, headers=headers, timeout=10)
  html = etree.HTML(res.text)
  if html is None:
    # Guard in case the parser produced no root element for this response.
    return

  # The trailing space inside the class value is part of the attribute match.
  for info in html.xpath('//div[@class="pc_temp_songlist "]/ul/li'):
    rank_nodes = info.xpath('span[3]')
    titles = info.xpath('a/text()')
    durations = info.xpath('span[4]/span/text()')
    if not (rank_nodes and titles and durations):
      continue

    # string(.) flattens the rank span, including any nested tags, to text.
    rank = rank_nodes[0].xpath('string(.)').strip()
    title = titles[0]
    # Presumably titles look like "singer - song" (TODO confirm against the
    # live page). Prefer the spaced separator so hyphens inside a name are
    # kept, and split only once so the song title is never truncated.
    separator = ' - ' if ' - ' in title else '-'
    singer, _, song = title.partition(separator)
    # Named "duration" rather than "time" to avoid shadowing the stdlib module.
    duration = durations[0].strip()
    # With no separator at all, the whole title is printed as the singer and
    # the song is left empty.
    print(rank, singer.strip(), song.strip(), duration)

if __name__ == '__main__':
  # Walk ranking pages 1 through 23 in order, printing each page's entries.
  for page in range(1, 24):
    get_info('https://www.kugou.com/yy/rank/home/{}-8888.html'.format(page))

# 糗事百科24小时

import requests

# Headers sent with each request; the User-Agent string presents the
# client as a desktop Chrome browser.
headers = {
  'User-Agent': (
    'Mozilla/5.0 (Windows NT 6.1; WOW64) '
    'AppleWebKit/537.36 (KHTML, like Gecko) '
    'Chrome/49.0.2623.87 Safari/537.36'
  ),
}

from lxml import etree

def get_info(url):
  """Fetch one Qiushibaike listing page and print each post's fields.

  For every post container found, the name, content, laugh and comment
  queries are printed as the raw lists returned by XPath, so a post that
  lacks a field shows an empty list rather than raising.

  Args:
    url: Address of the listing page to download.
  """
  # A timeout keeps one stalled connection from hanging the whole crawl.
  res = requests.get(url, headers=headers, timeout=10)
  html = etree.HTML(res.text)
  if html is None:
    # Guard in case the parser produced no root element for this response.
    return

  for info in html.xpath('//div[@id="content-left"]/div'):
    name = info.xpath('div[1]/a[2]/h2/text()')
    laugh = info.xpath('div[2]/span[1]/i/text()')
    content = info.xpath('a[1]/div/span/text()')
    comment = info.xpath('div[2]/span[2]/a/i/text()')
    print(name, content, laugh, comment)


if __name__ == '__main__':
  # Walk listing pages 1 through 13 in order, printing each page's posts.
  for page in range(1, 14):
    get_info('https://www.qiushibaike.com/hot/page/{}/'.format(page))

©著作权归作者所有,转载或内容合作请联系作者
平台声明:文章内容(如有图片或视频亦包括在内)由作者上传并发布,文章内容仅代表作者本人观点,简书系信息发布平台,仅提供信息存储服务。

推荐阅读更多精彩内容

  • import requests from lxml import etree import xlwt all_inf...
    晴空万里_c4a9阅读 186评论 0 0
  • import requests from lxml import etree import xlwt all_in...
    包筱莺阅读 168评论 0 0
  • import requests from lxml import etree import xlwt #作业二 :...
    史_学语言阅读 260评论 0 0
  • 一个选择,往往要过了更久才能看到它于自己的影响。实际上所有的影响,也都是缓慢的、轻柔的、默默的、甚至毫无察觉的。而...
    梦蝶随记阅读 299评论 0 3
  • 《明娜》是卡尔·耶勒鲁普在1889年出版的代表作长篇小说,讲述着三个青年间的爱情故事。 故事的主角是理工学院的学生...
    乐播报阅读 2,748评论 0 5