本帖最后由 小檀 于 2018-8-1 13:15 编辑
- # coding=utf-8
- import requests
- from bs4 import BeautifulSoup
# Fetch an HTML document.
def get_html(url, timeout=10):
    """Return the body of ``url`` decoded as UTF-8 text.

    Args:
        url: Address of the page to download.
        timeout: Seconds to wait for the server before giving up. Without
            a timeout ``requests.get`` may block indefinitely on a stalled
            connection.

    Returns:
        The response body as text.

    Raises:
        requests.exceptions.RequestException: If the request fails,
            including when the timeout expires.
    """
    response = requests.get(url, timeout=timeout)
    # Decode as UTF-8 regardless of the encoding requests guessed.
    response.encoding = 'utf-8'
    return response.text
# Extract a joke from the page.
def get_certain_joke(html):
    """Return the text of the first ``div.content`` element in ``html``.

    Args:
        html: HTML markup to search.

    Returns:
        The text content of the first element matching the CSS selector
        ``div.content``.

    Raises:
        IndexError: If the document contains no ``div.content`` element.
    """
    soup = BeautifulSoup(html, 'lxml')
    matches = soup.select('div.content')
    if not matches:
        # Same exception type as the bare [0] lookup would raise, but with
        # a message that says what was actually missing.
        raise IndexError("no 'div.content' element found in the HTML document")
    return matches[0].get_text()
# Download the page at url_joke and print the first joke found on it.
url_joke = "https://www.qiushibaike.com"
html = get_html(url_joke)
joke_content = get_certain_joke(html)
# The parenthesized form is valid under both Python 2 and Python 3,
# unlike the Python 2-only print statement.
print(joke_content)
|
|