我想获取源代码里的内容,总是返回none,这是为什么?。代码如下:
#coding:utf-8
import re, urllib2
from re import *
url = 'http://d.weibo.com/102803?feed_filter=102803_ctg1_99991_-_ctg1_99991&feed_sort=102803_ctg1_99991_-_ctg1_99991¤t_page=3&since_id=&page=1#feedtop'
hea = {
'Connection': 'Keep-Alive',
'Accept': 'Mozilla/5.0 (Windows NT 6.3; WOW64; rv:38.0) Gecko/20100101 Firefox/38.0',
'User-Agent': 'Mozilla/5.0 (Windows NT 6.3; WOW64; rv:38.0) Gecko/20100101 Firefox/38.0',
'Accept-Language': 'zh-CN,zh;q=0.8,en-US;q=0.5,en;q=0.3',
# 'Accept-Encoding': 'gzip, deflate',
'Cookie': 'UOR=mozilla.com.cn,widget.weibo.com,http://www.baidu.com; SINAGLOBAL=6055804417730.377.1431913644255; ULV=1432997090967:7:7:6:4613413533035.514.1432997090946:1432865309305; SUB=_2AkMiBcCdf8NhqwJRmPoUy2_kZYRxzArEiebDAHzsJxIyHm8Z7L_3Su3A0O1GNCtReIq1--K5_c73; SUBP=0033WrSXqPxfM72-Ws9jqgMF55529P9D9WFnDhW3rn3vBGTzTJDl0W-K; YF-Page-G0=416186e6974c7d5349e42861f3303251; _s_tentry=-; Apache=4613413533035.514.1432997090946',
'Host': 'd.weibo.com',
'Cache-Control': 'max-age=0'
}
req = urllib2.Request(url)
for key in hea:
req.add_header(key,hea[key])
html = urllib2.urlopen(req).read()
ss = re.search('nick-name=\"(.*?)\"', html, re.S)
print ss
输出 : None
或者说有其他的方法吗?
#coding:utf-8
import re, urllib2
from re import *
url = 'http://d.weibo.com/102803?feed_filter=102803_ctg1_99991_-_ctg1_99991&feed_sort=102803_ctg1_99991_-_ctg1_99991¤t_page=3&since_id=&page=1#feedtop'
hea = {
'Connection': 'Keep-Alive',
'Accept': 'Mozilla/5.0 (Windows NT 6.3; WOW64; rv:38.0) Gecko/20100101 Firefox/38.0',
'User-Agent': 'Mozilla/5.0 (Windows NT 6.3; WOW64; rv:38.0) Gecko/20100101 Firefox/38.0',
'Accept-Language': 'zh-CN,zh;q=0.8,en-US;q=0.5,en;q=0.3',
# 'Accept-Encoding': 'gzip, deflate',
'Cookie': 'UOR=mozilla.com.cn,widget.weibo.com,http://www.baidu.com; SINAGLOBAL=6055804417730.377.1431913644255; ULV=1432997090967:7:7:6:4613413533035.514.1432997090946:1432865309305; SUB=_2AkMiBcCdf8NhqwJRmPoUy2_kZYRxzArEiebDAHzsJxIyHm8Z7L_3Su3A0O1GNCtReIq1--K5_c73; SUBP=0033WrSXqPxfM72-Ws9jqgMF55529P9D9WFnDhW3rn3vBGTzTJDl0W-K; YF-Page-G0=416186e6974c7d5349e42861f3303251; _s_tentry=-; Apache=4613413533035.514.1432997090946',
'Host': 'd.weibo.com',
'Cache-Control': 'max-age=0'
}
req = urllib2.Request(url)
for key in hea:
req.add_header(key,hea[key])
html = urllib2.urlopen(req).read()
ss = re.search('nick-name=\"(.*?)\"', html, re.S)
print ss
输出 : None
或者说有其他的方法吗?