Pythonで大盤指数(株式市場の総合指数)を読み取る

1161 ワード

#coding=utf-8

import HTMLParser
import time
import urllib2

#     
class MyParser(HTMLParser.HTMLParser):
    """HTML parser that extracts the text of ``<span id="targetid">`` elements.

    Each chunk of text found directly inside a matching ``<span>`` is printed
    (prefixed with ``"    : "``) and also appended to ``self.values`` so that
    callers can use the result programmatically.

    Attributes:
        targetid: value of the ``id`` attribute to look for.
        is_h4: True while the parser is positioned directly inside a matching
            ``<span>``; the attribute name is historical.
        values: list of text chunks captured so far, in document order.
    """

    targetid = ''

    def __init__(self, targetid):
        """Create a parser that looks for ``<span id=targetid>``."""
        # Explicit base-class call rather than super(): the Python 2
        # HTMLParser base is an old-style class.
        HTMLParser.HTMLParser.__init__(self)
        self.targetid = targetid
        # Initialise the state up front: text may arrive before any tag has
        # been seen (e.g. whitespace after a doctype), and handle_data reads
        # this flag.
        self.is_h4 = False
        self.values = []

    def handle_starttag(self, tag, attrs):
        """Arm the capture flag only for ``<span>`` tags whose id matches.

        Any other start tag (including one nested inside the target span)
        disarms the flag.
        """
        self.is_h4 = tag == 'span' and any(
            name == 'id' and value == self.targetid
            for name, value in attrs
        )

    def handle_endtag(self, tag):
        """Disarm the capture flag on every closing tag."""
        self.is_h4 = False

    def handle_data(self, data):
        """Print and record text that sits directly inside the target span."""
        if self.is_h4:
            self.values.append(data)
            # Single pre-formatted argument: same output as the Python 2
            # statement `print "    :", data`.
            print("    : %s" % (data,))
            
            
           
# Time the whole fetch-and-parse round trip.
st = time.time()

# Download the Google Finance page queried for SHA:000001.
response = urllib2.urlopen('https://www.google.com.hk/finance?client=ob&hl=zh-CN&q=SHA:000001')
try:
    pageContent = response.read()
finally:
    # Always release the connection, even if the read fails part-way.
    response.close()

# NOTE(review): 'ref_7521596_l' is presumably the id of the element holding
# the index value on that page -- confirm against the live markup.
my = MyParser('ref_7521596_l')
my.feed(pageContent)

end = time.time()
# %d truncates the elapsed time to whole seconds.
print('    : %d  ' % (end - st))