Add the process and publish methods, which mimic the publishing stages of the old scripts.
[treecutter.git] / src / tree-cutter.py
index 0be43854431e635270704f59891bf8629db3ca9a..37b893a0961529fcdb66b230f5bb9d68f0e83e31 100755 (executable)
@@ -26,6 +26,8 @@ style_xslt = args.style+"docbook.xsl"
 style_tmpl = args.style+"index.en.html.tmpl"
 outputdir = args.output
 
+tmptarget = tempfile.mkdtemp()+'/'
+
 valid_scripts = ['.py','.pl']
 MAXLEVEL = 10000
 
@@ -81,6 +83,84 @@ class Page():
         self._menu = None
         self._rendered_article = None
 
+    def language(self):
+        """Return the language stored for this page (self._lang)."""
+        return self._lang
+
+    def menu(self):
+        """Return the menu label of this page.
+
+        The label is taken from the article's titleabbrev by prepare();
+        until then it keeps whatever value the constructor assigned.
+        """
+        return self._menu
+
+    def set_article(self,art):
+        """Store art as the rendered article that template() will emit."""
+        self._rendered_article = art
+
+    def prepare(self):
+        """Parse the page source and collect its title, menu label and resources.
+
+        Reads the title and titleabbrev from the article info, replaces every
+        text xi:include whose href has an extension in valid_scripts with the
+        XML that script prints on stdout, and appends linked files and images
+        that exist on disk to self._resources.
+        """
+        self._doc = bindery.parse(self._file, prefixes=PREFIXES)
+        if self._doc.xml_select(u'/db:article/db:info/db:title'):
+            self._title = unicode(self._doc.article.info.title)
+        if self._doc.xml_select(u'/db:article/db:info/db:titleabbrev'):
+            self._menu = unicode(self._doc.article.info.titleabbrev)
+
+        dirname = os.path.dirname(self._file)
+        for c in self._doc.xml_select(u"//xi:include[@parse='text']"):
+            ext = os.path.splitext(c.href)[1]
+            if ext not in valid_scripts:
+                continue
+            # join() supplies the path separator that dirname+href left out
+            exe = os.path.abspath(os.path.join(dirname,c.href))
+            xml = subprocess.Popen([exe],stdout=subprocess.PIPE)
+            # communicate() reads stdout and waits for the script to exit
+            xstr = bindery.parse(str(xml.communicate()[0]))
+            parent = c.xml_parent
+            idp = c.xml_index_on_parent
+            # iterate over a copy in case inserting detaches nodes from xstr
+            for x in list(xstr.xml_children):
+                parent.xml_insert(idp,x)
+                # advance so that the generated nodes keep their order
+                idp += 1
+            # remove the include exactly once, after the replacement is done
+            parent.xml_remove(c)
+
+        for r in self._doc.xml_select(u"//db:link[@xl:href]"):
+            rf = os.path.join(dirname,r.href)
+            if os.path.isfile(rf):
+                self._resources.append(rf)
+        for i in self._doc.xml_select(u"//db:imagedata[@fileref]"):
+            im = os.path.join(dirname,i.fileref)
+            if os.path.isfile(im):
+                self._resources.append(im)
+
+    def render(self):
+        """Transform the prepared document to HTML with xsltproc.
+
+        The document is written to a temporary file next to the source so
+        that relative XIncludes resolve, xsltproc is run with style_xslt, and
+        its output is stored in self._rendered_article.  A non-zero return
+        code is reported on stdout.  The temporary files are removed and the
+        working directory is restored even when a step fails.
+        """
+        #  amara can not handle the docbook stylesheets
+        #  xmlarticle = transform(doc,style_xslt)
+        cwd = os.getcwd()
+        dirname = os.path.dirname(self._file)
+        # an empty dirname means the current directory; chdir('') would raise
+        if dirname:
+            os.chdir(dirname)
+        infile = None
+        outfile = None
+        try:
+            # mkstemp creates the file atomically, unlike the racy mktemp
+            (fdi, infile) = tempfile.mkstemp(dir='.')
+            tfi = os.fdopen(fdi,'w')
+            try:
+                tfi.write(self._doc.xml_encode())
+            finally:
+                tfi.close()
+            (fdo, outfile) = tempfile.mkstemp()
+            os.close(fdo)
+#  cmd = ["saxon-xslt-xinclude","-o",outfile,infile,style_xslt]
+            cmd = ["xsltproc","--xinclude","--output",outfile,style_xslt,infile]
+            retcode = subprocess.call(cmd)
+            if retcode:
+                print 'Error: '+' '.join(cmd)+' Returncode ['+str(retcode)+']'
+            tfo = open(outfile,'r')
+            try:
+                self._rendered_article = tfo.read()
+            finally:
+                tfo.close()
+        finally:
+            for tmp in (infile, outfile):
+                if tmp and os.path.exists(tmp):
+                    os.remove(tmp)
+            os.chdir(cwd)
+
+    def template(self,sitemap):
+        """Fill the site template for this page and write the HTML file.
+
+        The site menu and the tree menu for this page come from
+        sitemap.gen_menu().  The output path is tmptarget followed by the
+        source path with its last 'xml' replaced by 'html'; missing
+        directories are created first.
+        """
+        site_menu = sitemap.gen_menu(self._lang,None,None)
+        tree_menu = sitemap.gen_menu(self._lang,self,"tree")
+        namespaces = [{'title':self._title},
+                      {'menu':site_menu},
+                      {'article':self._rendered_article},
+                      {'levelmenu':tree_menu},
+                      {'levelname':'Menu'}]
+        filled = Template(file=style_tmpl, searchList=namespaces)
+        pieces = self._file.rsplit('xml',1)
+        target = tmptarget+'html'.join(pieces)
+        mkdir_p(os.path.dirname(target))
+        handle = open(target, 'w')
+        handle.write(str(filled))
+        handle.close()
+
+
 class Link():
     """Class representing a webpage on the site"""
     def __init__(self,link):
@@ -105,6 +185,29 @@ class Link():
     def link(self):
         return self._link
 
+    def prepare(self):
+        """Call prepare() on every page of this link, in order."""
+        for entry in self._pages:
+            entry.prepare()
+
+    def languages(self):
+        """Return a list with the language of each page of this link."""
+        return [entry.language() for entry in self._pages]
+
+    def render(self):
+        """Call render() on every page of this link, in order."""
+        for entry in self._pages:
+            entry.render()
+
+    def template(self,sitemap):
+        """Call template(sitemap) on every page of this link, in order."""
+        for entry in self._pages:
+            entry.template(sitemap)
+
+    def page(self,lang):
+        """Return the first page whose language equals lang, or None."""
+        for candidate in self._pages:
+            if candidate.language()==lang:
+                return candidate
+        return None
+
 class Node():
     def __init__(self,token,value):
         self._token = token
@@ -124,6 +227,15 @@ class Trie():
     def __init__(self):
         self._root = []
 
+    def __iter__(self):
+        """Iterate over all stored values, starting at the root level."""
+        return self.inorder(self._root)
+
+    def inorder(self,t):
+        """Yield the value of every node below t, depth first.
+
+        Each node's value is yielded before the values of its children,
+        and siblings are visited in list order.
+        """
+        # explicit stack of sibling iterators instead of recursion
+        pending = [iter(t)]
+        while pending:
+            try:
+                node = next(pending[-1])
+            except StopIteration:
+                pending.pop()
+                continue
+            yield node.value()
+            pending.append(iter(node.children()))
+
     def _add(self,trie, key, content):
         # is the key a leaf
         k = key.pop(0)
@@ -153,7 +265,25 @@ class Trie():
         self._graph(self._root, G)
 #        G.layout('dot')
 #        G.draw('g.png')
-        print G.string()
+#        print G.string()
+
+    def _menu(self, trie, lang, page, css):
+        """Return nested <ul> markup for the nodes in trie.
+
+        css is inserted verbatim into the outermost <ul> tag; nested lists
+        get none.  The entry whose page for lang equals page is marked with
+        class="selected".
+        """
+        parts = ["<ul%s>\n" % css]
+        for node in trie:
+            link = node.value()
+            current = link.page(lang)
+            marker = ''
+            if current == page:
+                marker = ' class="selected"'
+            parts.append('<li%s><a href="%s">%s</a>\n'
+                         % (marker,link.link(),current.menu()))
+            parts.append(self._menu(node.children(), lang, page, ""))
+        parts.append("</ul>\n")
+        return ''.join(parts)
+
+    def menu(self,lang,page,cssclass):
+        """Return the HTML menu for the whole trie.
+
+        A non-empty cssclass becomes the class attribute of the outermost
+        <ul>; page is the page to mark as selected.
+        """
+        attr = ' class="'+cssclass+'"' if cssclass else ''
+        return self._menu(self._root, lang, page, attr)
 
 class Sitemap():
     """Class keeping the internal site structure"""
@@ -165,6 +295,11 @@ class Sitemap():
         tokens = filter(None,re.split(r'(^/\w*/|\w*/)',link))
         self._tree.add(tokens,Link(link))
 
+    def write_map(self):
+        """Write the link of every entry in the tree to self._file.
+
+        The links are separated by newlines, with no trailing newline.
+        """
+        mapfile = open(self._file,'w')
+        links = [entry.link() for entry in self._tree]
+        mapfile.write('\n'.join(links))
+        mapfile.close()
+
     def read_map(self):
         try:
             f = open(self._file)
@@ -178,9 +313,44 @@ class Sitemap():
     def set(self):
         return set(link.link() for link in self._tree)
 
+    def process(self):
+        """Run the prepare, render and template stages for the whole site.
+
+        Every link in the tree is prepared, the set of languages used on
+        the site is collected, every link is rendered and templated, and
+        finally a '/sitemap' page holding the full menu is templated for
+        each language.  The time spent in each stage is printed.
+        """
+        t1 = time.time()
+        for link in self._tree:
+            link.prepare()
+        t2 = time.time()
+        print "Prepare  [%5.2f s]" % (round(t2-t1,2))
+        sitelang = set()
+        for link in self._tree:
+            # accumulate into sitelang itself; the name 'lang' was undefined
+            sitelang.update(link.languages())
+        t3 = time.time()
+        print "Language [%5.2f s]" % (round(t3-t2,2))
+        for link in self._tree:
+            link.render()
+        t4 = time.time()
+        print "Render   [%5.2f s]" % (round(t4-t3,2))
+        for link in self._tree:
+            link.template(self)
+        t5 = time.time()
+        print "Template [%5.2f s]" % (round(t5-t4,2))
+        for l in sitelang:
+            # the sitemap page shows the complete menu as its article
+            sitemap_page = Page((l,'/sitemap'))
+            sitemap_page.set_article(self.gen_menu(l,None,"tree sitemap"))
+            sitemap_page.template(self)
+        t6 = time.time()
+        print "Sitemap [%5.2f s]" % (round(t6-t5,2))
+
     def graph(self):
         self._tree.graph()
 
+    def gen_menu(self,lang,page,cssclass):
+        """Return the menu built by the tree for lang, page and cssclass."""
+        return self._tree.menu(lang,page,cssclass)
+
+    def publish(self):
+        """Publish the generated pages, then the style's css and images.
+
+        Each source is handed to the module-level publish() together with
+        args.output as the destination.
+        """
+        for source in (tmptarget, args.style+"css", args.style+"images"):
+            publish(source, args.output)
+
 def generateSitemap():
     sitemap = []
     try:
@@ -373,13 +543,20 @@ missing = dir_.set() - sitemap.set()
 removed = sitemap.set() - dir_.set()
 for page in removed:
     print removed+' pages missing!!'
-
 for page in missing:
     print 'adding missing page '+page
-    sitemap.add_page(page)
-
+    sitemap.add_link(page)
+if len(missing & removed) != 0:
+    print 'writing new sitemap - please adjust if needed'
+    sitemap.write_map()
 sitemap.graph()
 
+sitemap.process()
+
+t1 = time.time()
+sitemap.publish()
+t2 = time.time()
+print "Publish  [%5.2f s]" % (round(t2-t1,2))
 
 sitemap = generateSitemap()
 tmptarget = tempfile.mkdtemp()+'/'