Open the table file with codecs.open (encoding='utf-8') during table parsing to enable UTF-8 support
from urlparse import urlparse
from lxml import etree
from urlparse import urlparse
from lxml import etree
self.cols = []
def parse(self):
self.cols = []
def parse(self):
- f = file(self.tablefile, 'r')
+ f = codecs.open(self.tablefile, encoding='utf-8')
+ c = re.split(r'\t+', line.rstrip())
self.cols.append(c)
def db_xml(self):
self.cols.append(c)
def db_xml(self):