X-Git-Url: http://matita.cs.unibo.it/gitweb/?a=blobdiff_plain;f=helm%2FDEVEL%2Fpxp%2Fpxp%2Flexers%2Fpxp_lex_defs_drv_utf8.def;fp=helm%2FDEVEL%2Fpxp%2Fpxp%2Flexers%2Fpxp_lex_defs_drv_utf8.def;h=0000000000000000000000000000000000000000;hb=c7514aaa249a96c5fdd39b1123fbdb38d92f20b6;hp=dc108ef6d408a422a8929e72bfa9f19795a88cc6;hpb=1c7fb836e2af4f2f3d18afd0396701f2094265ff;p=helm.git

diff --git a/helm/DEVEL/pxp/pxp/lexers/pxp_lex_defs_drv_utf8.def b/helm/DEVEL/pxp/pxp/lexers/pxp_lex_defs_drv_utf8.def
deleted file mode 100644
index dc108ef6d..000000000
--- a/helm/DEVEL/pxp/pxp/lexers/pxp_lex_defs_drv_utf8.def
+++ /dev/null
@@ -1,180 +0,0 @@
-(* $Id$
- * ----------------------------------------------------------------------
- * Regular-expression definitions (ocamllex syntax) for UTF-8 encoded input.
- *)
-
-let ws = [ ' ' '\t' '\r' '\n' ]
-
-let ascii_digit = ['0'-'9']
-
-(* Hexadecimal digits: 0-9, a-f, A-F. *)
-let ascii_hexdigit = ['0'-'9' 'a'-'f' 'A'-'F']
-
-(* letter, digit, combiningChar and extender are not defined in this file. *)
-let namechar = letter | digit | '.' | ':' | '-' | '_' | combiningChar | extender
-
-let name = ( letter | '_' | ':' ) namechar*
-
-let nmtoken = namechar+
-
-(* Valid characters are:
- * #9, #10, #13, #32-#xD7FF, #xE000-#xFFFD, #x10000-#x10FFFF
- *
- * #xD7FF as UTF-8 sequence:
- * 1110xxxx 10xxxxxx 10xxxxxx
- * 1110...D 10...7.. 10.F...F = ED 9F BF
- *
- * #xE000 as UTF-8 sequence:
- * 1110xxxx 10xxxxxx 10xxxxxx
- * 1110...E 10...0.. 10.0...0 = EE 80 80
- *
- * UTF-8 sequence EF BE BF as character:
- * 1110xxxx 10xxxxxx 10xxxxxx
- * 1110...F 10111110 10111111 = #FFBF
- *
- * #xFFFD as UTF-8 sequence:
- * 1110xxxx 10xxxxxx 10xxxxxx
- * 1110...F 10...F.. 10.F...D = EF BF BD
- *
- * #x010000 as UTF-8 sequence:
- * 11110xxx 10xxxxxx 10xxxxxx 10xxxxxx
- * 111100.. 10.1...0 10...0.. 10.0...0 = F0 90 80 80
- *
- * #x10FFFF as UTF-8 sequence:
- * 11110xxx 10xxxxxx 10xxxxxx 10xxxxxx
- * 111101.. 10.0...F 10...F.. 10.F...F = F4 8F BF BF
- *
- * Overlong encodings are not valid: a two-byte sequence must start with
- * C2 or above (C0/C1 would encode values below #x80), and after E0 the
- * second byte must be A0 or above (80-9F would encode values below #x800).
- *)
-
-
-let non_ascii_character =
-  ['\194'-'\223'] ['\128'-'\191']                    (* #x80-#x7FF *)
-| '\224' ['\160'-'\191'] ['\128'-'\191']             (* #x800-#xFFF *)
-| ['\225'-'\236'] ['\128'-'\191'] ['\128'-'\191']    (* #x1000-#xCFFF *)
-| '\237' ['\128'-'\159'] ['\128'-'\191']             (* #xD000-#xD7FF *)
-| '\238' ['\128'-'\191'] ['\128'-'\191']             (* #xE000-#xEFFF *)
-| '\239' ['\128'-'\190'] ['\128'-'\191']             (* #xF000-#xFFBF *)
-| '\239' '\191' ['\128'-'\189']                      (* #xFFC0-#xFFFD *)
-| '\240' ['\144'-'\191'] ['\128'-'\191'] ['\128'-'\191']
-                                                     (* #x010000-#x03FFFF *)
-| ['\241'-'\243'] ['\128'-'\191'] ['\128'-'\191'] ['\128'-'\191']
-                                                     (* #x040000-#x0FFFFF *)
-| '\244' ['\128'-'\143'] ['\128'-'\191'] ['\128'-'\191']
-                                                     (* #x100000-#x10FFFF *)
-
-let character =
-  [ '\009' '\010' '\013' '\032'-'\127' ]
-| non_ascii_character
-
-
-let character_except_question_mark = (* '?' = '\063' *)
-  [ '\009' '\010' '\013' '\032'-'\062' '\064'-'\127' ]
-| non_ascii_character
-
-
-let character_except_right_angle_bracket = (* '>' = '\062' *)
-  [ '\009' '\010' '\013' '\032'-'\061' '\063'-'\127' ]
-| non_ascii_character
-
-
-let character_except_question_mark_rangle = (* '?' = '\063', '>' = '\062' *)
-  [ '\009' '\010' '\013' '\032'-'\061' '\064'-'\127' ]
-| non_ascii_character
-
-
-let character_except_minus = (* '-' = '\045' *)
-  [ '\009' '\010' '\013' '\032'-'\044' '\046'-'\127' ]
-| non_ascii_character
-
-
-(* The single-byte classes below stop at '\127': bytes above that are only
- * accepted as part of a complete non_ascii_character sequence.
- *)
-let character_except_quot = (* '"' = '\034' *)
-  [ '\009' '\010' '\013' '\032'-'\033' '\035'-'\127' ]
-| non_ascii_character
-
-
-let character_except_apos = (* '\'' = '\039' *)
-  [ '\009' '\010' '\013' '\032'-'\038' '\040'-'\127' ]
-| non_ascii_character
-
-
-(* Character sequence that does not contain "?>": every run of '?' is either
- * followed by a character other than '?' and '>', or ends the string.
- *)
-let pi_string = character_except_question_mark*
-                ( '?'+ character_except_question_mark_rangle
-                  character_except_question_mark* )*
-                '?'*
-
-
-(* Character sequence that neither contains "--" nor ends with '-'. *)
-let comment_string = character_except_minus*
-                     ('-' character_except_minus+ )*
-
-
-let normal_character =
-  (* Character except '&' = '\038', '<' = '\060', ']' = '\093', and CR LF *)
-  [ '\009' '\032'-'\037' '\039'-'\059' '\061'-'\092' '\094'-'\127' ]
-| non_ascii_character
-
-
-let character_except_rbracket = (* ']' = '\093' *)
-  [ '\009' '\010' '\013' '\032'-'\092' '\094'-'\127' ]
-| non_ascii_character
-
-
-let character_except_rbracket_rangle = (* ']' = '\093', '>' = '\062' *)
-  [ '\009' '\010' '\013' '\032'-'\061' '\063'-'\092' '\094'-'\127' ]
-| non_ascii_character
-
-
-(* Character sequence that does not contain "]]>". *)
-let cdata_string =
-  character_except_rbracket*
-  ( "]" character_except_rbracket+ |
-    "]]" ']'* character_except_rbracket_rangle character_except_rbracket*
-  )*
-  ']'*
-
-
-let printable_character_except_amp_lt =
-  (* '&' = '\038', '<' = '\060' *)
-  [ '\032'-'\037' '\039'-'\059' '\061'-'\127']
-| non_ascii_character
-
-
-let printable_character_except_amp_percent =
-  (* '%' = '\037', '&' = '\038' *)
-  [ '\032'-'\036' '\039'-'\127']
-| non_ascii_character
-
-
-let character_except_special =
-  (* '<'=060, ']'=093, '"'=034, '\''=039 *)
-  [ '\009' '\010' '\013' '\032'-'\033' '\035'-'\038' '\040'-'\059'
-    '\061'-'\092' '\094'-'\127' ]
-| non_ascii_character
-
-
-
-(* ======================================================================
- * History:
- *
- * $Log$
- * Revision 1.1 2000/11/17 09:57:32 lpadovan
- * Initial revision
- *
- * Revision 1.2 2000/08/26 19:58:08 gerd
- * Bugfix in character_except_apos. The bug caused that attribute
- * values delimited by ' could not be scanned at all.
- *
- * Revision 1.1 2000/05/20 20:33:25 gerd
- * Initial revision.
- *
- *
- *)