(* Copyright (C) 2000, HELM Team. * * This file is part of HELM, an Hypertextual, Electronic * Library of Mathematics, developed at the Computer Science * Department, University of Bologna, Italy. * * HELM is free software; you can redistribute it and/or * modify it under the terms of the GNU General Public License * as published by the Free Software Foundation; either version 2 * of the License, or (at your option) any later version. * * HELM is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with HELM; if not, write to the Free Software * Foundation, Inc., 59 Temple Place - Suite 330, Boston, * MA 02111-1307, USA. * * For details, see the HELM World-Wide-Web page, * http://cs.unibo.it/helm/. *) (******************************************************************************) (* *) (* PROJECT HELM *) (* *) (* Claudio Sacerdoti Coen *) (* 24/01/2000 *) (* *) (* This is the main (top level) module of a parser for cic objects from xml *) (* files to the internal representation. It uses the modules cicParser2 *) (* (objects level) and cicParser3 (terms level) *) (* *) (******************************************************************************) exception Warnings;; class warner = object method warn w = print_endline ("WARNING: " ^ w) ; (raise Warnings : unit) end ;; exception EmptyUri of string;; (* given an uri u it returns the list of tokens of the base uri of u *) (* e.g.: token_of_uri "cic:/a/b/c/d.xml" returns ["a" ; "b" ; "c"] *) let tokens_of_uri uri = let uri' = UriManager.string_of_uri uri in let rec chop_list = function [] -> raise (EmptyUri uri') | [fn] -> [] | he::[fn] -> [he] | he::tl -> he::(chop_list tl) in let trimmed_uri = Str.replace_first (Str.regexp "cic:") "" uri' in let list_of_tokens = Str.split (Str.regexp "/") trimmed_uri in chop_list list_of_tokens ;; (* given the filename of an xml file of a cic object it returns its internal *) (* representation. *) let annobj_of_xml filename uri = let module Y = Pxp_yacc in try let d = (* sets the current base uri to resolve relative URIs *) CicParser3.current_sp := tokens_of_uri uri ; CicParser3.current_uri := uri ; let config = {Y.default_config with Y.warner = new warner} in Y.parse_document_entity config (*PXP (Y.ExtID (Pxp_types.System filename, new Pxp_reader.resolve_as_file ~url_of_id ())) *) (PxpUriResolver.from_file filename) CicParser3.domspec in CicParser2.get_term d#root with e -> print_endline ("Filename: " ^ filename ^ "\nException: ") ; print_endline (Pxp_types.string_of_exn e) ; raise e ;; let obj_of_xml filename uri = Deannotate.deannotate_obj (annobj_of_xml filename uri) ;;