Pythonで株価指数(大盤指数)を読み取る
1161 ワード
#coding=utf-8
import HTMLParser
import time
import urllib2
#
class MyParser(HTMLParser.HTMLParser):
    """Report the text that directly follows ``<span id="targetid">``.

    The parser keeps a small state flag (``is_h4``) that is updated on every
    tag event:

    * ``1``  -- the most recent tag event was a ``<span>`` start tag whose
      ``id`` attribute equals ``targetid``;
    * ``""`` -- the most recent tag event was any other start tag (this is
      also the initial state before any tag has been seen);
    * ``-1`` -- the most recent tag event was an end tag.

    Text is reported only while the flag is ``1``.  Each reported chunk is
    printed and also appended to ``self.matches`` so callers can read the
    result programmatically.

    Args:
        targetid: value of the ``id`` attribute of the ``<span>`` to look for.
    """

    # Class-level default; overwritten per instance in __init__.
    targetid = ''

    def __init__(self, targetid):
        HTMLParser.HTMLParser.__init__(self)
        self.targetid = targetid
        # Initialise the flag here: handle_data() may run before any tag has
        # been seen (e.g. text at the very start of the document), and reading
        # an unset attribute would raise AttributeError.
        self.is_h4 = ""
        # Text chunks found inside the target span, in document order.
        self.matches = []

    def handle_starttag(self, tag, attrs):
        """Set the flag to 1 for the target ``<span>``, reset it otherwise."""
        # Any start tag clears the flag first, so a tag nested inside the
        # target span stops its text from being reported.
        self.is_h4 = ""
        if tag == 'span':
            for name, value in attrs:
                if name == 'id' and value == self.targetid:
                    self.is_h4 = 1

    def handle_endtag(self, tag):
        """Mark that the most recent tag event was an end tag."""
        self.is_h4 = -1

    def handle_data(self, data):
        """Record and print ``data`` when it follows the target start tag."""
        if self.is_h4 == 1:
            self.matches.append(data)
            # Single-argument form prints the same " : <data>" line under
            # both the Python 2 print statement and the Python 3 function.
            print(" : %s" % data)
# Download the quote page, run it through MyParser (which prints the text of
# the span with the requested id), then print the elapsed whole seconds.
st = time.time()
response = urllib2.urlopen('https://www.google.com.hk/finance?client=ob&hl=zh-CN&q=SHA:000001')
try:
    pageContent = response.read()
finally:
    # Always release the HTTP connection, even if read() fails.
    response.close()
my = MyParser('ref_7521596_l')
my.feed(pageContent)
end = time.time()
# %d truncates the elapsed time to whole seconds.
print(' : %d ' % (end - st))