better way of generating multiple pages XHTML output

author Stefano Zacchiroli <zack@upsilon.cc>

Sun, 14 May 2006 17:41:30 +0000 (17:41 +0000)

committer Stefano Zacchiroli <zack@upsilon.cc>

Sun, 14 May 2006 17:41:30 +0000 (17:41 +0000)
author Stefano Zacchiroli <zack@upsilon.cc>
Sun, 14 May 2006 17:41:30 +0000 (17:41 +0000)
committer Stefano Zacchiroli <zack@upsilon.cc>
Sun, 14 May 2006 17:41:30 +0000 (17:41 +0000)
diff --git a/helm/software/matita/help/C/Makefile b/helm/software/matita/help/C/Makefile

index 95fe3e3c696c9b381948d6ffdfe5e46361a84d04..dccc62ed6f74cee2f9a6d7369bf78b074fdd6b3c 100644 (file)
--- a/helm/software/matita/help/C/Makefile
+++ b/helm/software/matita/help/C/Makefile
@@ -1,26 +1,34 @@
  XSLTPROC=xsltproc
-XHTML_XSL=http://docbook.sourceforge.net/release/xsl/current/xhtml/docbook.xsl
-FO_XSL=http://docbook.sourceforge.net/release/xsl/current/fo/docbook.xsl
+XHTML_XSL=matita-xhtml.xsl
+FO_XSL=matita-fo.xsl
+MAIN=matita.xml
  
  all: html txt
  
+# XHTMLs generation
+
  .PHONY: html
  html: html-stamp
-html-stamp: matita.html
-       ./split.ml $<
+html-stamp: $(MAIN)
+       xsltproc $(XHTML_XSL) $<
         touch $@
  
+# TXTs generation
+
  TXTS = $(patsubst %.html,%.txt,$(wildcard *.html))
  .PHONY: txt
  txt: txt-stamp
  txt-stamp: html-stamp
         $(MAKE) $(TXTS)
         touch $@
-
  %.txt: %.html
         w3m -dump $< > $@
-%.html: %.xml
-       xsltproc $(XHTML_XSL) $< | xmllint --format - > $@
+
+# PDF generation
+
+pdf: pdf-stamp
+pdf-stamp: $(patsubst %.xml,%.pdf,$(MAIN))
+       touch $@
  %.fo: %.xml
         xsltproc $(FO_XSL) $< | xmllint --format - > $@
  %.pdf: %.fo
diff --git a/helm/software/matita/help/C/matita-fo.xsl b/helm/software/matita/help/C/matita-fo.xsl

new file mode 100644 (file)

index 0000000..3e564b4
--- /dev/null
+++ b/helm/software/matita/help/C/matita-fo.xsl
@@ -0,0 +1,5 @@
+<?xml version="1.0" encoding="utf-8"?>
+<xsl:stylesheet xmlns:xsl="http://www.w3.org/1999/XSL/Transform" version="1.0">
+  <xsl:import href="http://docbook.sourceforge.net/release/xsl/current/fo/docbook.xsl"/>
+  <xsl:output method="xml" encoding="utf-8" indent="yes"/>
+</xsl:stylesheet>
diff --git a/helm/software/matita/help/C/matita-xhtml.xsl b/helm/software/matita/help/C/matita-xhtml.xsl

new file mode 100644 (file)

index 0000000..eb78163
--- /dev/null
+++ b/helm/software/matita/help/C/matita-xhtml.xsl
@@ -0,0 +1,6 @@
+<?xml version="1.0" encoding="utf-8"?>
+<xsl:stylesheet xmlns:xsl="http://www.w3.org/1999/XSL/Transform" version="1.0">
+  <xsl:import href="http://docbook.sourceforge.net/release/xsl/current/xhtml/chunk.xsl"/>
+  <xsl:output method="xml" encoding="utf-8" indent="yes"/>
+  <xsl:param name="use.id.as.filename">1</xsl:param>
+</xsl:stylesheet>
diff --git a/helm/software/matita/help/C/split.ml b/helm/software/matita/help/C/split.ml

deleted file mode 100755 (executable)

index bd9f727..0000000
--- a/helm/software/matita/help/C/split.ml
+++ /dev/null
@@ -1,209 +0,0 @@
-#!/usr/bin/ocamlrun /usr/bin/ocaml
-(* Copyright (C) 2006, HELM Team.
- * 
- * This file is part of HELM, an Hypertextual, Electronic
- * Library of Mathematics, developed at the Computer Science
- * Department, University of Bologna, Italy.
- * 
- * HELM is free software; you can redistribute it and/or
- * modify it under the terms of the GNU General Public License
- * as published by the Free Software Foundation; either version 2
- * of the License, or (at your option) any later version.
- * 
- * HELM is distributed in the hope that it will be useful,
- * but WITHOUT ANY WARRANTY; without even the implied warranty of
- * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
- * GNU General Public License for more details.
- *
- * You should have received a copy of the GNU General Public License
- * along with HELM; if not, write to the Free Software
- * Foundation, Inc., 59 Temple Place - Suite 330, Boston,
- * MA  02111-1307, USA.
- * 
- * For details, see the HELM World-Wide-Web page,
- * http://helm.cs.unibo.it/
- *)
-
-let fname =
-  try Sys.argv.(1)
-  with Invalid_argument _ ->
-    prerr_endline "Usage: split.ml <FILE.html>";
-    exit 1 ;;
-
-#use "topfind";;
-#require "unix";;
-#require "pxp-engine";;
-#require "pxp-lex-utf8";;
-
-open Printf
-
-let xhtml_header title =
-  sprintf
-"<?xml version=\"1.0\" encoding=\"UTF-8\"?>
-<!DOCTYPE html PUBLIC \"-//W3C//DTD XHTML 1.0 Transitional//EN\" \"http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd\">
-<html xmlns=\"http://www.w3.org/1999/xhtml\">
-  <head>
-    <title>%s</title>
-  </head>
-  <body>
-"
-  title
-
-let xhtml_trailer =
-"  </body>
-</html>
-"
-
-type 'a node =
-  ('a Pxp_document.node #Pxp_document.extension as 'a) Pxp_document.node
-
-let resolver =
-  Pxp_reader.lookup_public_id_as_file [
-    "-//W3C//DTD XHTML 1.0 Transitional//EN", "xhtml1-transitional.dtd";
-    "-//W3C//ENTITIES Latin 1 for XHTML//EN", "xhtml-lat1.ent";
-    "-//W3C//ENTITIES Symbols for XHTML//EN", "xhtml-symbol.ent";
-    "-//W3C//ENTITIES Special for XHTML//EN", "xhtml-special.ent"; ]
-
-let parse_xml fname =
-  Pxp_tree_parser.parse_wfdocument_entity
-    { Pxp_types.default_config with Pxp_types.encoding = `Enc_utf8 }
-    (Pxp_types.from_file ~alt:[ resolver ] fname)
-    Pxp_tree_parser.default_spec
-
-  (** pattern matching like predicate on pxp nodes *)
-let match_elt tag attr_name ?attr_value () node =
-  node#node_type = Pxp_document.T_element tag
-  && (match attr_value with
-     | Some attr_value ->
-         (try node#attribute attr_name = Pxp_types.Value attr_value
-          with Not_found -> false)
-     | None -> List.mem attr_name node#attribute_names)
-
-let slice doc =
-  let document =
-    try
-      Pxp_document.find ~deeply:true
-        (match_elt "div" "class" ~attr_value:"book" ()) doc#root
-     with Not_found -> failwith "Can't find book <div>" in
-  let titlepage =
-    Pxp_document.find ~deeply:false
-      (match_elt "div" "class" ~attr_value:"titlepage" ()) document in
-  let toc =
-    Pxp_document.find ~deeply:false
-      (match_elt "div" "class" ~attr_value:"toc" ()) document in
-  let parts =
-    Pxp_document.find_all ~deeply:false
-      (match_elt "div" "class" ~attr_value:"chapter" ()) document in
-  let title =
-    Pxp_document.find ~deeply:true
-      (fun node -> node#node_type = Pxp_document.T_element "title") doc#root in
-  title#data,
-  titlepage :: toc :: parts
-
-let localize_ids parts =
-  let id2part = Hashtbl.create 1023 in
-  let part_ids = ref [] in
-  List.iter
-    (fun part ->
-      match Pxp_document.find_all ~deeply:true (match_elt "a" "id" ()) part with
-      | part_id :: ids ->
-          let part_id = part_id#required_string_attribute "id" in
-          part_ids := part_id :: !part_ids;
-          List.iter
-            (fun id ->
-              let id = id#required_string_attribute "id" in
-              Hashtbl.add id2part id part_id)
-            ids
-      | _ -> failwith "can't find part id")
-    parts;
-  !part_ids, id2part
-
-let fname_of_part part_name = part_name ^ ".html"
-
-let get_part_id part =
-  let id =
-    try
-      Pxp_document.find ~deeply:true (match_elt "a" "id" ()) part
-    with Not_found -> failwith "can't find part id" in
-  id#required_string_attribute "id"
-
-let get_part_title part =
-  let h2 =
-    Pxp_document.find ~deeply:true
-      (match_elt "h2" "class" ~attr_value:"title" ()) part in
-  let text =
-    List.find (fun node -> node#node_type = Pxp_document.T_data) h2#sub_nodes in
-  text#data
-
-let iter_xrefs f node =
-  let a_s = Pxp_document.find_all ~deeply:true (match_elt "a" "href" ()) node in
-  List.iter
-    (fun (node: 'a node) ->
-      let href = node#required_string_attribute "href" in
-      assert (String.length href > 0);
-      if href.[0] = '#' then
-        let xref = String.sub href 1 (String.length href - 1) in
-        f node xref)
-    a_s
-
-let patch_toc part_ids id2part toc =
-  iter_xrefs
-    (fun node xref ->
-      if List.mem xref part_ids then
-        node#set_attribute "href" (Pxp_types.Value (fname_of_part xref))
-      else
-        try
-          let part = Hashtbl.find id2part xref in
-          node#set_attribute "href"
-            (Pxp_types.Value (fname_of_part part ^ "#" ^ xref))
-        with Not_found -> ())
-    toc
-
-let patch_part part_ids id2part part =
-  let part_name = get_part_id part in
-  iter_xrefs
-    (fun node xref ->
-      try
-        let xref_part = Hashtbl.find id2part xref in
-        if xref_part <> part_name then
-          node#set_attribute "href"
-            (Pxp_types.Value (fname_of_part xref_part ^ "#" ^ xref))
-      with Not_found -> ())
-    part
-
-let open_formatter fname =
-  Unix.open_process_out (sprintf "xmllint --format -o %s -" fname)
-
-let close_formatter oc = ignore (Unix.close_process_out oc)
-
-let output_index title (titlepage: 'a node) (toc: 'a node) fname =
-  let oc = open_formatter fname in
-  output_string oc (xhtml_header title);
-  titlepage#write (`Out_channel oc) `Enc_utf8;
-  toc#write (`Out_channel oc) `Enc_utf8;
-  output_string oc xhtml_trailer;
-  close_formatter oc
-
-let output_part title (part: 'a node) fname =
-  let oc = open_formatter fname in
-  output_string oc
-    (xhtml_header (sprintf "%s - %s" title (get_part_title part)));
-  part#write (`Out_channel oc) `Enc_utf8;
-  output_string oc xhtml_trailer;
-  close_formatter oc
-
-let main () =
-  let doc = parse_xml fname in
-  match slice doc with
-  | title, (titlepage :: toc :: parts) ->
-      let part_ids, id2part = localize_ids parts in
-      patch_toc part_ids id2part toc;
-      List.iter (patch_part part_ids id2part) parts;
-      output_index title titlepage toc "index.html";
-      List.iter
-        (fun part -> output_part title part (get_part_id part ^ ".html"))
-        parts
-  | _ -> failwith "Unrecognized document structure"
-
-let _ = main ()
-
author	Stefano Zacchiroli <zack@upsilon.cc>
	Sun, 14 May 2006 17:41:30 +0000 (17:41 +0000)
committer	Stefano Zacchiroli <zack@upsilon.cc>
	Sun, 14 May 2006 17:41:30 +0000 (17:41 +0000)
helm/software/matita/help/C/Makefile		patch \| blob \| history
helm/software/matita/help/C/matita-fo.xsl	[new file with mode: 0644]	patch \| blob
helm/software/matita/help/C/matita-xhtml.xsl	[new file with mode: 0644]	patch \| blob
helm/software/matita/help/C/split.ml	[deleted file]	patch \| blob \| history