#!/usr/bin/python
import os
+import codecs
import re
import shutil
+import sys
import gettext
import tempfile
from lxml import etree
from treecutter import constants as const
from treecutter.trie import Trie
from treecutter.link import Link
-from treecutter.tools import ssh_cmd, publish, mkdir_p
+from treecutter.tools import ssh_cmd, publish, mkdir_p,get_folder_size,sizeof_fmt
+
class Sitemap():
"""Class keeping the internal site structure"""
- def __init__(self):
+ def __init__(self,args):
+ self._output = args.output
+ self._style = args.style
+ self._subdir = args.subdir
self._file = 'sitemap.txt'
self._tree = Trie()
self._sitelang = set()
# representing the text on the site.
# A link can have several pages in different languages.
def add_link(self, link):
- tokens = filter(None,re.split(r'(^/[\w-]*/|[\w-]*/)',link))
+ tokens = filter(None,re.split(r'(^/[\w\.:-]*$|^/[\w\.:-]*/|[\w\.:-]*/)',link,flags=re.UNICODE))
self._tree.add(tokens,Link(link))
def write_map(self):
- f = open(self._file,'w')
- f.write('\n'.join(link.link() for link in self._tree))
+ f = codecs.open(self._file,'w','utf-8')
+ s = '\n'.join(link.link() for link in self._tree)
+ f.write(s)
f.close()
def read_map(self):
try:
- f = open(self._file)
+ f = codecs.open(self._file, 'r', 'utf-8')
sml = f.read().split()
f.close()
for line in sml:
# Main driver in the application processing the documents
# in the collected sitemap
- def process(self, style):
+ def process(self):
t1 = time()
print "Prepareing the input"
for link in self._tree:
languages=[tran])
t3 = time()
print "Language [%5.2f s]" % (round(t3-t2,2))
+ transform = {}
+ transform['xhtml5'] = etree.XSLT(etree.parse(self._style+"docbook.xhtml5.xsl"))
for link in self._tree:
- link.render(style)
+ link.render(transform)
t4 = time()
print "Render [%5.2f s]" % (round(t4-t3,2))
for link in self._tree:
- link.template(self, style, self._tmptarget)
+ link.template(self, self._style, self._tmptarget,self._subdir)
t5 = time()
print "Template [%5.2f s]" % (round(t5-t4,2))
t6 = time()
sitmaplink.add_page((l,'/sitemap.'+l+'.xml'))
for l in self._sitelang:
sitmaplink.page(l).set_article(self.gen_menu(l,None,"tree sitemap"))
- sitmaplink.page(l).template(self,style,self._tmptarget)
+ sitmaplink.page(l).template(self,self._style,self._tmptarget,self._subdir)
t7 = time()
print "Sitemap [%5.2f s]" % (round(t7-t6,2))
self._tree.graph()
def gen_menu(self,lang,page,cssclass):
- return self._tree.menu(lang,page,cssclass)
+ return self._tree.menu(lang,page,cssclass,self._subdir)
def lang_menu(self,lang,link):
html = ElementMaker()
ln = self._isocode.xpath(isoxml)[0].get('name')
if lang != 'en':
ln = self._tranlang[lang].gettext(ln)
- p = link.link()
- if p[-1] == '/':
- p = p +'index'
- p = p+'.'+l
- li = html.li(html.a(ln.decode('utf-8'),href=p,hreflang=l))
+ p = unicode(link.link())
+ if p[-1] == u'/':
+ p = p +u'index'
+ p = p+u'.'+l
+ li = html.li(html.a(ln.decode('utf-8'),
+ href=self._subdir+p,hreflang=l))
menu.append(li)
return etree.tostring(menu,encoding='UTF-8',pretty_print=False)
- def publish(self,output,style):
- ssh_cmd(output,"mkdir -p")
- publish(self._tmptarget, output)
- for res in ["css","images","js","fonts","favicon.ico"]:
- if (os.path.exists(style+res)):
- publish(style+res, output)
- ssh_cmd(output,"chmod a+rx")
+ def publish(self):
+ print "Size [ %7s ]" % (sizeof_fmt(get_folder_size(self._tmptarget)))
+ ssh_cmd(self._output,"mkdir -p")
+ publish(self._tmptarget, self._output)
+ for res in ["stylesheets","images","js","fonts","favicon.ico"]:
+ if (os.path.exists(self._style+res)):
+ publish(self._style+res, self._output)
+ ssh_cmd(self._output,"chmod a+rx")