代码如下:
#!/usr/bin/env python
# coding: utf-8
"""Look up a movie on Douban and print its links, title and summary.

This script targets Python 2: it relies on ``urllib.urlopen``,
``urllib.quote`` and ``raw_input``.
"""
import re
import sys
import urllib
from contextlib import closing

from bs4 import BeautifulSoup

# Search endpoint; the percent-encoded movie name is appended to it.
SEARCH_URL = "http://movie.douban.com/subject_search?search_text="

# NOTE(review): the original literals for the two patterns below were lost
# when HTML-like text was stripped from this listing. They are rebuilt from
# the expected URL shapes only -- verify both against the live page markup.
SUBJECT_LINK_RE = re.compile(
    r'href="(https?://movie\.douban\.com/subject/\d+/?)"')
IMDB_LINK_RE = re.compile(r'href="(https?://www\.imdb\.com/title/tt\d+/?)"')

TITLE_RE = re.compile(r'name="title" value="(.*?)"')
DESC_RE = re.compile(r'name="desc" value="(.*?)"')


def _fetch(url):
    """Return the raw body of *url*, closing the connection afterwards."""
    # Python 2 urlopen objects are not context managers, hence closing().
    with closing(urllib.urlopen(url)) as response:
        return response.read()


def _first(matches, default=""):
    """Return the first item of *matches*, or *default* when it is empty."""
    return matches[0] if matches else default


def hq_url(keyword=None):
    """Search Douban for a movie and print what was found.

    Prints the IMDb link(s), the Douban page URL, the title, the short
    description and the summary ``<span>`` elements of the first search hit.

    Args:
        keyword: Movie name to search for, as a byte string. When omitted,
            the module-level ``gjz`` assigned by the ``__main__`` block is
            used, so the zero-argument call keeps working.

    Returns:
        None. Results are written to stdout; if the search page contains no
        movie link, a message is written to stderr and nothing else is
        printed.
    """
    if keyword is None:
        keyword = gjz

    # Percent-encode the name so spaces and non-ASCII bytes yield a valid URL.
    data = _fetch(SEARCH_URL + urllib.quote(keyword))
    links = SUBJECT_LINK_RE.findall(data)
    if not links:
        sys.stderr.write("No Douban entry found for the given movie name.\n")
        return

    r_url = links[0]
    ymdata = _fetch(r_url)

    # Name the parser explicitly so the result does not depend on which
    # optional parsers happen to be installed.
    soup = BeautifulSoup(ymdata, "html.parser")
    wz = soup('span', {'property': 'v:summary'})
    title = TITLE_RE.findall(ymdata)
    zy = DESC_RE.findall(ymdata)
    imdb = IMDB_LINK_RE.findall(ymdata)

    # Single-argument print(...) behaves the same as the print statement.
    print(u"imdb电影网链接")
    print(imdb)
    print(u"豆瓣电影链接")
    print(r_url)
    print('*' * 70)
    # Fall back to an empty line rather than crashing on a missing field.
    print(_first(title))
    print(_first(zy))
    print("电影简介")
    print('*' * 70)
    print(wz)


if __name__ == '__main__':
    gjz = raw_input("请输入电影名: ").strip()
    hq_url(gjz)