def read_csv_from_file(path, num_of_fields):
    """Yield the leading fields of each line of a tab-separated UTF-8 file.

    Args:
        path: Path of the file to read; its content is decoded as UTF-8.
        num_of_fields: Maximum number of leading fields to keep per line.

    Yields:
        For every line, a list holding at most ``num_of_fields`` fields,
        each one re-encoded to UTF-8. A line with fewer fields yields a
        correspondingly shorter list.
    """
    with codecs.open(path, encoding='utf-8') as f:
        for line in f:
            # Strip only the line terminator. Unconditionally slicing off the
            # last character would eat real data when the final line has no
            # trailing newline, and would leave a stray carriage return in
            # the last field of CRLF files (codecs.open does not translate
            # newlines).
            fields = line.rstrip('\r\n').split('\t')
            # Slice before encoding so discarded fields are never encoded.
            yield [x.encode("utf-8") for x in fields[:num_of_fields]]
%s | %s | %s | %s | %s | %s | %s |