Python 爬虫笔记(三)
#用正则表达式爬取图片: #! /usr/bin/env python; #coding=utf-8; import urllib2; import re; from bs4 import BeautifulSoup; html=urllib2.urlopen("http://www.pythonscraping.com/pages/page3.html"); bsObj=BeautifulSoup(ht…
·
#用正则表达式爬取图片
#! /usr/bin/env python
#coding=utf-8
import urllib2
import re
from bs4 import BeautifulSoup
# Fetch the sample page and print the "src" attribute of every <img> tag
# whose path matches the gift-image pattern below.
html = urllib2.urlopen("http://www.pythonscraping.com/pages/page3.html")
try:
    # Name the parser explicitly so the parse tree does not depend on which
    # optional parsers (lxml, html5lib) happen to be installed, and so bs4
    # does not emit its "no parser was explicitly specified" warning.
    bsObj = BeautifulSoup(html, "html.parser")
finally:
    # BeautifulSoup has consumed the response by now; release the connection.
    html.close()

# Raw string: keeps the regex backslashes out of Python's own string-escape
# processing. The pattern matches relative paths of the form
# ../img/gifts/img<anything>.jpg
images = bsObj.findAll("img", {"src": re.compile(r"\.\.\/img\/gifts/img.*\.jpg")})

for image in images:
    print(image["src"])



所有评论(0)