早就想寫一個更新程式
方便我抓 MLB 資訊(又聽說 Python 這方面很強,就摸摸看)
先搞定一個抓取網頁,然後解析(parse)指定區域並寫入 CSV 的陽春程式
紀錄一下
#coding: utf-8
import urllib.request, csv
from html.parser import HTMLParser
# Download the page. The ``with`` block closes the HTTP response even when
# reading or decoding raises.
with urllib.request.urlopen('http://tw.movies.yahoo.com/movieinfo_main.html/id=4569') as data:
    content = data.read().decode('utf_8')
# newline='' lets the csv module control line endings itself (otherwise
# blank rows appear on Windows); an explicit UTF-8 encoding keeps non-ASCII
# page text writable regardless of the system locale.
# The file is intentionally left open here: ``writer`` is used while the
# page is parsed, and ``f`` is closed at the end of the script.
f = open('example.csv', 'wt', newline='', encoding='utf-8')
writer = csv.writer(f)
class myparser(HTMLParser):
    """Capture the text that follows each ``<span>`` carrying class ``dta``.

    After a matching start tag is seen, the next text chunk delivered to
    ``handle_data`` is written as a one-column row through the module-level
    ``writer`` (a ``csv.writer``), printed to stdout, and appended to
    ``self.numbers``.
    """

    def __init__(self):
        super().__init__()
        # 1 while the next text chunk should be captured, 0 otherwise.
        self.isNumber = 0
        # Captured text chunks, in the order they were encountered.
        self.numbers = []

    def handle_data(self, data):
        """Record ``data`` if a matching ``<span>`` armed the capture flag."""
        if self.isNumber != 1:
            return
        self.numbers.append(data)
        writer.writerow([data])
        print(data)
        # Only the first text chunk after the tag is captured.
        self.isNumber = 0

    def handle_starttag(self, tag, attrs):
        """Arm the capture flag when ``tag`` is a ``<span>`` with class ``dta``.

        ``attrs`` is the list of ``(name, value)`` pairs supplied by
        ``HTMLParser``. The class attribute is matched by token, so extra
        attributes or additional class names on the span do not prevent a
        match.
        """
        if tag != 'span':
            return
        for name, value in attrs:
            # ``value`` is None for an attribute written without a value.
            if name == 'class' and value is not None and 'dta' in value.split():
                self.isNumber = 1
                return
# Parse the downloaded page; matching values are written to the CSV as a
# side effect of the parser callbacks.
Parser = myparser()
try:
    Parser.feed(content)
    # close() makes HTMLParser process any text it is still buffering at
    # the end of the input.
    Parser.close()
finally:
    # Always release the CSV file, even if parsing raised.
    f.close()