xxxx18一60岁hd中国/日韩女同互慰一区二区/西西人体扒开双腿无遮挡/日韩欧美黄色一级片 - 色护士精品影院www

  • 大小: 2.58KB
    文件類型: .rar
    金幣: 1
    下載: 0 次
    發布日期: 2024-05-08
  • 語言: Python
  • 標簽: 爬蟲 壁紙

資源簡介

彼岸花網壁紙爬蟲

資源截圖

代碼片段和文件信息

import random
import re
import time
from urllib.request import urlopen, urlretrieve

from bs4 import BeautifulSoup as bf
def get_page(url):
    """Download *url* and parse the response body as HTML.

    Args:
        url: Address of the page to fetch.

    Returns:
        The BeautifulSoup document built from the response body using the
        "html.parser" backend.
    """
    # The context manager closes the HTTP response once the body is read.
    with urlopen(url) as response:
        return bf(response.read(), "html.parser")

def GetImg_href(page):
    """Collect absolute URLs of the picture detail pages linked from *page*.

    Reads the ``href`` of every ``<a>`` tag in *page* and keeps only those
    of the form ``/tupian/<anything>.html``, prefixing each with
    ``http://pic.netbian.com``.

    Args:
        page: Parsed document exposing ``find_all(tag_name)``; each returned
            element must expose ``get(attribute_name)``.

    Returns:
        A list of absolute URL strings, in document order.
    """
    detail_pattern = re.compile(r"^\/tupian\/.*\.html$")
    img_href = []
    for anchor in page.find_all("a"):
        href = anchor.get("href")
        # Anchors without an href yield None, which re.search would reject
        # with a TypeError; skip anything that is not a string.
        if not isinstance(href, str):
            continue
        found = detail_pattern.search(href)
        if found is None:
            continue
        img_href.append("http://pic.netbian.com" + found.group())
    return img_href
def New_GetImg_href(page):
    """Collect the site-relative image paths referenced by *page*.

    Reads the ``src`` of every ``<img>`` tag in *page* and keeps only those
    of the form ``/uploads/<anything>.jpg``. The paths are returned exactly
    as they appear in the document (no host is prepended).

    Args:
        page: Parsed document exposing ``find_all(tag_name)``; each returned
            element must expose ``get(attribute_name)``.

    Returns:
        A list of matching ``src`` strings, in document order.
    """
    upload_pattern = re.compile(r"^\/uploads/.*\.jpg$")
    img_src = []
    for image in page.find_all("img"):
        src = image.get("src")
        # <img> tags without a src yield None, which re.search would reject
        # with a TypeError; skip anything that is not a string.
        if not isinstance(src, str):
            continue
        found = upload_pattern.search(src)
        if found is None:
            continue
        img_src.append(found.group())
    return img_src
def?img_down_load(abc):
????????‘‘‘
?????????@a:已經下載的數據塊?
????????@b

評論

共有 條評論