X-Git-Url: https://source.tree.se/git?p=treecutter.git;a=blobdiff_plain;f=src%2Ftree-cutter.py;h=37b893a0961529fcdb66b230f5bb9d68f0e83e31;hp=0be43854431e635270704f59891bf8629db3ca9a;hb=9efe89fdf3454731169d3f51ce357cf16a04bd76;hpb=6d43dd78472d987405abf540be1744dbc7ed4576 diff --git a/src/tree-cutter.py b/src/tree-cutter.py index 0be4385..37b893a 100755 --- a/src/tree-cutter.py +++ b/src/tree-cutter.py @@ -26,6 +26,8 @@ style_xslt = args.style+"docbook.xsl" style_tmpl = args.style+"index.en.html.tmpl" outputdir = args.output +tmptarget = tempfile.mkdtemp()+'/' + valid_scripts = ['.py','.pl'] MAXLEVEL = 10000 @@ -81,6 +83,84 @@ class Page(): self._menu = None self._rendered_article = None + def language(self): + return self._lang + + def menu(self): + return self._menu + + def set_article(self,art): + self._rendered_article = art + + def prepare(self): + self._doc = bindery.parse(self._file, prefixes=PREFIXES) + if self._doc.xml_select(u'/db:article/db:info/db:title'): + self._title = unicode(self._doc.article.info.title) + if self._doc.xml_select(u'/db:article/db:info/db:titleabbrev'): + self._menu = unicode(self._doc.article.info.titleabbrev) + + dirname = os.path.dirname(self._file) + code = self._doc.xml_select(u"//xi:include[@parse='text']") + if code: + for c in code: + (p, ext) = os.path.splitext(c.href) + if ext in valid_scripts: + exe = os.path.join(os.path.abspath(dirname+c.href)) + xml = subprocess.Popen([exe],stdout=subprocess.PIPE) + xstr = bindery.parse(str(xml.stdout.read())) + idp = c.xml_index_on_parent + for x in xstr.xml_children: + c.xml_parent.xml_insert(idp,x) + c.xml_parent.xml_remove(c) + + for r in self._doc.xml_select(u"//db:link[@xl:href]"): + rf = os.path.join(dirname,r.href) + if os.path.isfile(rf): + self._resources.append(rf) + for i in self._doc.xml_select(u"//db:imagedata[@fileref]"): + im = os.path.join(dirname,i.fileref) + if os.path.isfile(im): + self._resources.append(im) + + def render(self): + # amara can not handle the docbook stylesheets + # xmlarticle = transform(doc,style_xslt) + cwd = os.getcwd() + dirname = os.path.dirname(self._file) + os.chdir(dirname) + infile = os.path.basename(tempfile.mktemp()) + outfile = tempfile.mktemp() + tfi = open(infile,'w') + tfi.write(self._doc.xml_encode()) + tfi.close() +# cmd = ["saxon-xslt-xinclude","-o",outfile,infile,style_xslt] + cmd = ["xsltproc","--xinclude","--output",outfile,style_xslt,infile] + retcode = subprocess.call(cmd) + if retcode: + print 'Error: '+' '.join(cmd)+' Returncode ['+str(retcode)+']' + tfo = open(outfile,'r') + self._rendered_article = tfo.read() + tfo.close() + os.remove(infile) + os.remove(outfile) + os.chdir(cwd) + + def template(self,sitemap): + htmlmenu = sitemap.gen_menu(self._lang,None,None) + levelmenu = sitemap.gen_menu(self._lang,self,"tree") + template = Template(file=style_tmpl, + searchList=[{'title':self._title}, + {'menu':htmlmenu}, + {'article':self._rendered_article}, + {'levelmenu':levelmenu}, + {'levelname':'Menu'}]) + outfile = tmptarget+'html'.join(self._file.rsplit('xml',1)) + mkdir_p(os.path.dirname(outfile)) + out = open(outfile, 'w') + out.write(str(template)) + out.close() + + class Link(): """Class representing a webpage on the site""" def __init__(self,link): @@ -105,6 +185,29 @@ class Link(): def link(self): return self._link + def prepare(self): + for page in self._pages: + page.prepare() + + def languages(self): + p = [] + for page in self._pages: + p.append(page.language()) + return p + + def render(self): + for page in self._pages: + page.render() + + def template(self,sitemap): + for page in self._pages: + page.template(sitemap) + + def page(self,lang): + for page in self._pages: + if page.language()==lang: + return page + class Node(): def __init__(self,token,value): self._token = token @@ -124,6 +227,15 @@ class Trie(): def __init__(self): self._root = [] + def __iter__(self): + return self.inorder(self._root) + + def inorder(self,t): + for l in t: + yield l.value() + for x in self.inorder(l.children()): + yield x + def _add(self,trie, key, content): # is the key a leaf k = key.pop(0) @@ -153,7 +265,25 @@ class Trie(): self._graph(self._root, G) # G.layout('dot') # G.draw('g.png') - print G.string() +# print G.string() + + def _menu(self, trie, lang, page, css): + html = "\n" % css + for l in trie: + sel = '' + if l.value().page(lang) == page: + sel = ' class="selected"' + html += '%s\n' \ + % (sel,l.value().link(),l.value().page(lang).menu()) + html += self._menu(l.children(), lang, page, "") + html += "\n" + return html + + def menu(self,lang,page,cssclass): + css = '' + if cssclass: + css = ' class="'+cssclass+'"' + return self._menu(self._root, lang, page, css) class Sitemap(): """Class keeping the internal site structure""" @@ -165,6 +295,11 @@ class Sitemap(): tokens = filter(None,re.split(r'(^/\w*/|\w*/)',link)) self._tree.add(tokens,Link(link)) + def write_map(self): + f = open(self._file,'w') + f.write('\n'.join(link.link() for link in self._tree)) + f.close() + def read_map(self): try: f = open(self._file) @@ -178,9 +313,44 @@ class Sitemap(): def set(self): return set(link.link() for link in self._tree) + def process(self): + t1 = time.time() + for link in self._tree: + link.prepare() + t2 = time.time() + print "Prepare [%5.2f s]" % (round(t2-t1,2)) + sitelang = set() + for link in self._tree: + sitelang = lang.union(set(link.languages())) + t3 = time.time() + print "Language [%5.2f s]" % (round(t3-t2,2)) + for link in self._tree: + link.render() + t4 = time.time() + print "Render [%5.2f s]" % (round(t4-t3,2)) + for link in self._tree: + link.template(self) + t5 = time.time() + print "Template [%5.2f s]" % (round(t5-t4,2)) + sm = {} + for l in sitelang: + sm[l] = Page((l,'/sitemap')) + sm[l].set_article(self.gen_menu(l,None,"tree sitemap")) + sm[l].template(self) + t6 = time.time() + print "Sitemap [%5.2f s]" % (round(t6-t5,2)) + def graph(self): self._tree.graph() + def gen_menu(self,lang,page,cssclass): + return self._tree.menu(lang,page,cssclass) + + def publish(self): + publish(tmptarget, args.output) + publish(args.style+"css", args.output) + publish(args.style+"images",args.output) + def generateSitemap(): sitemap = [] try: @@ -373,13 +543,20 @@ missing = dir_.set() - sitemap.set() removed = sitemap.set() - dir_.set() for page in removed: print removed+' pages missing!!' - for page in missing: print 'adding missing page '+page - sitemap.add_page(page) - + sitemap.add_link(page) +if len(missing & removed) != 0: + print 'writing new sitemap - please adjust if needed' + sitemap.write_map() sitemap.graph() +sitemap.process() + +t1 = time.time() +sitemap.publish() +t2 = time.time() +print "Publish [%5.2f s]" % (round(t2-t1,2)) sitemap = generateSitemap() tmptarget = tempfile.mkdtemp()+'/'