]> matita.cs.unibo.it Git - helm.git/blobdiff - helm/metadata/create_V7_mowgli/METADATA/meta_lex.l
New version for the new DTD.
[helm.git] / helm / metadata / create_V7_mowgli / METADATA / meta_lex.l
diff --git a/helm/metadata/create_V7_mowgli/METADATA/meta_lex.l b/helm/metadata/create_V7_mowgli/METADATA/meta_lex.l
new file mode 100644 (file)
index 0000000..967fbc0
--- /dev/null
@@ -0,0 +1,265 @@
+ /******************************************************************/
+ /*  Copyright (C) 2000, HELM Team                                 */ 
+ /*                                                                */
+ /* This file is part of HELM, an Hypertextual, Electronic         */
+ /* Library of Mathematics, developed at the Computer Science      */
+ /* Department, University of Bologna, Italy.                      */
+ /*                                                                */
+ /* HELM is free software; you can redistribute it and/or          */
+ /* modify it under the terms of the GNU General Public License    */
+ /* as published by the Free Software Foundation; either version   */
+ /* 2 of the License, or (at your option) any later version.       */
+ /*                                                                */
+ /* HELM is distributed in the hope that it will be useful,        */
+ /* but WITHOUT ANY WARRANTY; without even the implied warranty of */
+ /* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the   */
+ /* GNU General Public License for more details.                   */
+ /*                                                                */
+ /* You should have received a copy of the GNU General Public      */
+ /* License along with HELM; if not, write to the Free Software    */
+ /* Foundation, Inc., 59 Temple Place - Suite 330, Boston,         */
+ /* MA  02111-1307, USA.                                           */
+ /*                                                                */
+ /* For details, see the HELM World-Wide-Web page,                 */
+ /* http://cs.unibo.it/helm/.                                      */
+ /******************************************************************/
+
+ /***************************************************************/
+ /*                       META_LEXAN                           */
+ /*                 Automatic Metadata Extractor                */
+ /*           First draft 11/12/2001, by Andrea Asperti         */
+ /*      more bugs added by domenico lordi on mon 12/17/2001    */
+ /***************************************************************/
+
+ /***************************************************************/
+ /* 1. Inclusion of header files.                              */
+ /***************************************************************/
+
+%{
+#include                <string.h>
+#include                <stdlib.h>
+#include                <sys/stat.h>
+#include                "sthandler.h"
+%}
+
+ /***************************************************************/
+ /* 2. Constants and Variables Definitions                      */
+ /***************************************************************/
+
+%{
+#define                 NOWHERE   0
+#define                 CONST     1
+#define                 MUTIND    2
+#define                 MUTCONSTRUCT  3
+
+#define                 INBODY    0
+#define                 MAINHYP   1
+#define                 INHYP     2
+#define                 INCONCL   3
+#define                 MAINCONCL 4
+#define                 INTYPE    5
+#define                 NOTFOUND  6
+
+#define                 HERE      0     
+#define                 AFTER     1
+
+
+int                    where = NOWHERE;
+int                     found = NOTFOUND;
+int                     position = INBODY;
+int                     first_child = HERE;
+int                    skip = 0;     // boolean to skip the insertion of a URI
+int                     no_open_source =0;
+int                     tmp_n;
+char                    sep = '"';
+char                    *xpointer = "#xpointer(1/";
+char                    *uri;
+char                    *tmp;
+%}
+
+ /***************************************************************/
+ /* 3. Regular definitions.                                    */
+ /***************************************************************/
+
+uri                     [^"]+
+digits                  [0-9]+                   
+
+ /***************************************************************/
+ /* 4. Rules.                                                  */
+ /***************************************************************/
+
+
+%%
+
+"<Variable"[^>]*">"(" "|\n)*"<body" {
+                    position = INBODY; // Variables have both a body and a type
+                   }
+
+"</body>"(" "|\n)*"<type" {
+                    position = INTYPE; // Variables have both a body and a type
+                   }
+
+"<decl"            |
+"<def"             {
+                    if ((position == INTYPE) ||
+                        (position == INHYP))
+                        { position = INHYP;
+                          no_open_source++;};
+                   }
+
+"</decl>"          |
+"</def"            {
+                    if (position == INHYP)
+                     {
+                      no_open_source--;
+                      if (no_open_source == 0) 
+                       { position = INTYPE;
+                         first_child = HERE; };
+                     };
+                   }
+
+
+.|\n               {
+                   }
+
+"<LAMBDA"          |
+"<REL"             |
+"<MUTCASE"         |
+"<FIX"             |
+"<COFIX"           { 
+                          first_child = AFTER;
+                   }
+
+"<VAR"             {
+                     skip = 1;
+                     first_child = AFTER;
+                   }
+
+"<CONST"           { 
+                     if (position == INTYPE) /* CONST on the spine */
+                        position = INCONCL;
+                     where = CONST;
+                   }
+
+"<MUTIND"          { 
+                     if (position == INTYPE) /* MUTIND on the spine */
+                        position = INCONCL;
+                     where = MUTIND;
+                   }
+
+"<MUTCONSTRUCT"    { 
+                     if (position == INTYPE) /* MUTCONSTRUCT on the spine */
+                        position = INCONCL;
+                     where = MUTCONSTRUCT;
+                   }
+
+"uri=\""{uri}      {     
+                         if (!skip) {
+                            uri=(char *)malloc((sizeof('a')*200)); 
+                            strcpy(uri,yytext);
+                            strsep(&uri,&sep);
+                            if (where == CONST)
+                                {
+                                   search(uri,first_child,position); 
+                                   where = NOWHERE;
+                                   first_child = AFTER;
+                                   free(uri); 
+                                 };
+                         } else skip = 0;
+                   } 
+
+"noType=\""{digits} {
+                         if ((where == MUTIND) || (where == MUTCONSTRUCT))
+                          { strsep(&yytext,&sep);
+                            tmp=(char *)malloc((sizeof(sep)*(strlen(yytext)+1)));
+                            strcpy(tmp,yytext);
+                            tmp_n = atoi(tmp)+1;
+                            sprintf(tmp,"%d",tmp_n);
+                            strcat(uri,"#xpointer(1/"); 
+                            strcat(uri,tmp); 
+                          };
+                         if (where == MUTIND) 
+                             { 
+                               strcat(uri,")");
+                               search(uri,first_child,position); 
+                               free(uri);
+                               free(tmp);
+                               where = NOWHERE; 
+                               first_child = AFTER;};
+                   } 
+
+"noConstr=\""{digits} {
+                         if (where == MUTCONSTRUCT)
+                          { strsep(&yytext,&sep);
+                            tmp=(char *)malloc((sizeof(sep)*(strlen(yytext)+1)));
+                            strcpy(tmp,yytext);
+                            strcat(uri,"/");
+                            strcat(uri,tmp);
+                            strcat(uri,")");
+                            search(uri,first_child,position);
+                            free(uri);
+                            free(tmp);
+                            where = NOWHERE; 
+                            first_child = AFTER;};
+                   } 
+
+
+
+%%
+
+ /***************************************************************/
+ /* 6. Auxiliary functions.                                    */
+ /***************************************************************/
+
+main(int argc, char *argv[])
+{                  
+                   struct stat buf;
+                   init_symbol_table();
+
+                   // We process the body
+                   if (!stat("tmp/body.xml",&buf)) {
+                      yyin = fopen("tmp/body.xml", "r");
+                      position = INBODY;
+                      yylex();
+                      fclose(yyin);
+                   }
+
+                   // We process the type
+                   yyin = fopen("tmp/type.xml", "r");
+                   position = INTYPE;
+                   first_child = HERE;
+                   yylex();
+
+                   printf("<?xml version=\"1.0\" encoding=\"ISO-8859-1\"?>\n\n");
+                   printf("<rdf:RDF xml:lang=\"en\" xmlns:rdf=\"http://www.w3.org/1999/02/22-rdf-syntax-ns#\" xmlns:h=\"file:mattone.rdf#\">\n");
+                   printf("\t<h:Object rdf:about=\"");
+                   printf("%s",argv[1]);
+                   printf("\">\n");
+                   print_all();
+                   printf("\t</h:Object>\n");
+                   printf("</rdf:RDF>\n");
+                   fclose(yyin);
+                   } 
+
+search(uri,first_child,position)
+char               *uri;
+int                first_child;
+int                position; 
+{                  
+                   if (first_child == HERE)
+                      {
+                       if (position == INHYP)
+                          found = search_bucket(uri,MAINHYP);
+                       else if (position == INCONCL)
+                          found = search_bucket(uri,MAINCONCL);
+                       /* if (found == NOTFOUND)
+                          printf( "pos = %d, uri = %s\n", MAINCONCL, uri); */
+                       }
+                    else found = search_bucket(uri,position);
+                    /* if (found == NOTFOUND)
+                          printf( "pos = %d, uri = %s\n", position, uri); */
+                    }
+
+int yywrap() {
+               return 1;
+             }