Python基本爬虫(数据存储器)

2017-12-12  本文已影响0人  原来不语
# -*-encoding:utf-8 -*-
import codecs

class DataOutput(object):
    """Collect crawled records in memory and dump them as an HTML table.

    Each record is looked up with the keys 'url', 'title' and 'summary'
    when it is written, so it must be a mapping providing those keys.
    """

    def __init__(self):
        super(DataOutput, self).__init__()
        # Records queued for the next output_html() call.
        self.datas = []

    def store_data(self, data):
        """Queue one record for output.

        Args:
            data: the record to store; ``None`` is ignored.
        """
        if data is None:
            return
        self.datas.append(data)

    def output_html(self, path='baike.html'):
        """Write every queued record as a table row, then empty the queue.

        Args:
            path: destination file, written as UTF-8 and overwritten if it
                already exists. Defaults to 'baike.html'.

        Raises:
            KeyError: if a record lacks 'url', 'title' or 'summary'. The
                queue is left untouched in that case.
        """
        # The context manager closes the file even when a write or a
        # missing key raises part-way through.
        with codecs.open(path, 'w', encoding='utf-8') as fout:
            fout.write("<html>")
            fout.write("<head><meta charset='utf-8'/></head>")
            fout.write("<body>")
            fout.write("<table>")
            for data in self.datas:
                # NOTE(review): values are inserted verbatim, without HTML
                # escaping - confirm the crawler only stores plain text.
                fout.write("<tr>")
                fout.write("<td>%s</td>" % data['url'])
                fout.write("<td>%s</td>" % data['title'])
                fout.write("<td>%s</td>" % data['summary'])
                fout.write("</tr>")
            fout.write("</table>")
            fout.write("</body>")
            fout.write("</html>")
        # Empty the queue only after the loop: removing items from the list
        # while iterating over it makes the iterator skip every other record.
        del self.datas[:]
上一篇 下一篇

猜你喜欢

热点阅读