import shutil
import pygraphviz as pgv
import glob
+import gettext
+import shutil
from amara import bindery
from amara.xslt import transform
from Cheetah.Template import Template
args = parser.parse_args()
style_xslt = args.style+"docbook.xsl"
-style_tmpl = args.style+"index.en.html.tmpl"
outputdir = args.output
tmptarget = tempfile.mkdtemp()+'/'
class Page():
"""Class representing a version of a webpage"""
- def __init__(self,page):
+ def __init__(self,link,page):
+ self._link = link
self._file = page[1]
self._lang = page[0]
self._doc = None
def language(self):
return self._lang
+ def resources(self):
+ """Return a new set built from this page's ``_resources`` collection."""
+ # NOTE(review): _resources is not assigned in the visible part of
+ # __init__ - confirm it is set before this method is called.
+ return set(self._resources)
+
def menu(self):
return self._menu
for c in code:
(p, ext) = os.path.splitext(c.href)
if ext in valid_scripts:
- exe = os.path.join(os.path.abspath(dirname+c.href))
+ exe = os.path.join(os.path.abspath(dirname)+'/'+c.href)
xml = subprocess.Popen([exe],stdout=subprocess.PIPE)
xstr = bindery.parse(str(xml.stdout.read()))
idp = c.xml_index_on_parent
os.chdir(cwd)
def template(self,sitemap):
- htmlmenu = sitemap.gen_menu(self._lang,None,None)
+ htmlmenu = sitemap.gen_menu(self._lang,None,"menu")
levelmenu = sitemap.gen_menu(self._lang,self,"tree")
- template = Template(file=style_tmpl,
+ langmenu = sitemap.lang_menu(self._lang,self._link)
+ template = Template(file=args.style+'index.'+self._lang+'.html.tmpl',
searchList=[{'title':self._title},
{'menu':htmlmenu},
{'article':self._rendered_article},
{'levelmenu':levelmenu},
- {'levelname':'Menu'}])
+ {'langmenu':langmenu}])
outfile = tmptarget+'html'.join(self._file.rsplit('xml',1))
mkdir_p(os.path.dirname(outfile))
out = open(outfile, 'w')
path = path+'index'
lang = self._scan_languages(path)
for l in lang:
- self._pages.append(Page(l))
+ self._pages.append(Page(self,l))
+
+ def add_page(self,l):
+ """Wrap ``l`` in a Page bound to this link and append it to ``_pages``.
+
+ ``l`` is handed unchanged to ``Page(self, l)``, which reads ``l[0]`` as
+ the language and ``l[1]`` as the file.
+ """
+ self._pages.append(Page(self,l))
def _scan_languages(self,path):
lang = []
for page in self._pages:
if page.language()==lang:
return page
+ return None
+
+ def resources(self):
+ res = set()
+ for page in self._pages:
+ res = res.union(page.resources())
+ return res
+
class Node():
def __init__(self,token,value):
html = "<ul%s>\n" % css
for l in trie:
sel = ''
- if l.value().page(lang) == page:
+ p = l.value().page(lang)
+ if p == page:
sel = ' class="selected"'
- html += '<li%s><a href="%s">%s</a>\n' \
- % (sel,l.value().link(),l.value().page(lang).menu())
- html += self._menu(l.children(), lang, page, "")
+ if p != None:
+ html += '<li%s><a href="%s">%s</a>\n' \
+ % (sel,l.value().link(),p.menu())
+ else:
+ html += '<li%s><a href="%s.en" hreflang="en">%s</a>*\n' \
+ % (sel,l.value().link(), l.value().page('en').menu())
+ if l.children():
+ html += self._menu(l.children(), lang, page, "")
html += "</ul>\n"
return html
def __init__(self):
+ """Set up the map file name, an empty trie and the language lookup state."""
self._file = 'sitemap.txt'
self._tree = Trie()
+ # Language codes found across the site; filled in by process().
+ self._sitelang = set()
+ # ISO 639-3 table parsed from the fixed path below; lang_menu() queries
+ # it for language names.
+ self._isocode = bindery.parse('/usr/share/xml/iso-codes/iso_639_3.xml')
+ # Language code -> gettext translation object; process() adds one entry
+ # for every site language other than 'en'.
+ self._tranlang = {}
def add_link(self, link):
+ """Split ``link`` into path tokens and store a Link for it in the trie."""
+ # re.split keeps the captured slash-terminated segments and any remainder;
+ # filter(None, ...) drops the empty strings it produces in between.
- tokens = filter(None,re.split(r'(^/\w*/|\w*/)',link))
+ # [\w-] instead of \w lets segments containing hyphens be captured whole.
+ tokens = filter(None,re.split(r'(^/[\w-]*/|[\w-]*/)',link))
self._tree.add(tokens,Link(link))
def write_map(self):
def set(self):
+ """Return the set of ``link.link()`` values for every entry iterated from the trie."""
return set(link.link() for link in self._tree)
+ def process(self):
+ t1 = time.time()
+ for link in self._tree:
+ link.prepare()
+ t2 = time.time()
+ print "Prepare [%5.2f s]" % (round(t2-t1,2))
+ for link in self._tree:
+ self._sitelang = self._sitelang.union(set(link.languages()))
+ for tran in self._sitelang:
+ if tran != 'en':
+ self._tranlang[tran] = gettext.translation('iso_639_3',
+ languages=[tran])
+ t3 = time.time()
+ print "Language [%5.2f s]" % (round(t3-t2,2))
+ for link in self._tree:
+ link.render()
+ t4 = time.time()
+ print "Render [%5.2f s]" % (round(t4-t3,2))
+ for link in self._tree:
+ link.template(self)
+ t5 = time.time()
+ print "Template [%5.2f s]" % (round(t5-t4,2))
+ t6 = time.time()
+ res = set()
+ cwd = os.getcwd()
+ for link in self._tree:
+ res = res.union(link.resources())
+ for f in res:
+ outfile = tmptarget+f
+ mkdir_p(os.path.dirname(outfile))
+ shutil.copyfile(f,outfile)
+ print "Resources[%5.2f s]" % (round(t6-t5,2))
+ sitmaplink = Link('/sitemap')
+ for l in self._sitelang:
+ sitmaplink.add_page((l,'/sitemap.'+l+'.xml'))
+ for l in self._sitelang:
+ sitmaplink.page(l).set_article(self.gen_menu(l,None,"tree sitemap"))
+ sitmaplink.page(l).template(self)
+ t7 = time.time()
+ print "Sitemap [%5.2f s]" % (round(t7-t6,2))
+
def graph(self):
+ """Delegate to the trie's graph() method."""
self._tree.graph()
def gen_menu(self,lang,page,cssclass):
+ """Return the trie's menu for ``lang``; ``page`` and ``cssclass`` are passed through unchanged."""
return self._tree.menu(lang,page,cssclass)
+ def lang_menu(self,lang,link):
+ html = "<ul>"
+ for l in link.languages():
+ isoxml = u"//iso_639_3_entry[@*='"+l+"']"
+ ln = self._isocode.xml_select(isoxml)[0].name
+ if lang != 'en':
+ ln = self._tranlang[lang].gettext(ln)
+ p = link.link()
+ if p[-1] == '/':
+ p = p +'index'
+ p = p+'.'+l
+ html += '<li><a href="%s" hreflang="%s">%s</a></li>' % (p, l, ln)
+ html += "</ul>"
+ return html
+
+ def publish(self):
+ publish(tmptarget, args.output)
+ publish(args.style+"css", args.output)
+ publish(args.style+"images",args.output)
+
def generateSitemap():
sitemap = []
try:
+# Links known to dir_ but not to the sitemap, and the reverse.
missing = dir_.set() - sitemap.set()
removed = sitemap.set() - dir_.set()
for page in removed:
- print removed+' pages missing!!'
+ # Report the individual link; the whole set cannot be joined to a string.
+ print page+' pages missing!!'
for page in missing:
print 'adding missing page '+page
sitemap.add_link(page)
+# Rewrite the map when either difference is non-empty. The two sets are
+# disjoint by construction, so their intersection is always empty.
-if len(missing & removed) != 0:
+if len(missing)+len(removed) != 0:
print 'writing new sitemap - please adjust if needed'
sitemap.write_map()
sitemap.graph()
+# Build all pages into the temporary tree, then time the publish step.
+sitemap.process()
+
+t1 = time.time()
+sitemap.publish()
+t2 = time.time()
+print "Publish [%5.2f s]" % (round(t2-t1,2))
sitemap = generateSitemap()
tmptarget = tempfile.mkdtemp()+'/'
+tot = 0
for page in sitemap:
t1 = time.time()
print "Page : %-30s %30s" % (page['link'],
writeToTemplate(page,pubdoc,sitemap)
t2 = time.time()
print "[%5.2f s]" % (round(t2-t1,2))
+ tot = tot + (t2-t1)
+print "Total time\t\t\t\t\t\t\t [%5.2f s]" % (round(tot,2))
createSitemap(sitemap)
publish(tmptarget, args.output)
publish(args.style+"css", args.output)