1*cdf0e10cSrcweir#************************************************************************* 2*cdf0e10cSrcweir# 3*cdf0e10cSrcweir# DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. 4*cdf0e10cSrcweir# 5*cdf0e10cSrcweir# Copyright 2000, 2010 Oracle and/or its affiliates. 6*cdf0e10cSrcweir# 7*cdf0e10cSrcweir# OpenOffice.org - a multi-platform office productivity suite 8*cdf0e10cSrcweir# 9*cdf0e10cSrcweir# This file is part of OpenOffice.org. 10*cdf0e10cSrcweir# 11*cdf0e10cSrcweir# OpenOffice.org is free software: you can redistribute it and/or modify 12*cdf0e10cSrcweir# it under the terms of the GNU Lesser General Public License version 3 13*cdf0e10cSrcweir# only, as published by the Free Software Foundation. 14*cdf0e10cSrcweir# 15*cdf0e10cSrcweir# OpenOffice.org is distributed in the hope that it will be useful, 16*cdf0e10cSrcweir# but WITHOUT ANY WARRANTY; without even the implied warranty of 17*cdf0e10cSrcweir# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the 18*cdf0e10cSrcweir# GNU Lesser General Public License version 3 for more details 19*cdf0e10cSrcweir# (a copy is included in the LICENSE file that accompanied this code). 20*cdf0e10cSrcweir# 21*cdf0e10cSrcweir# You should have received a copy of the GNU Lesser General Public License 22*cdf0e10cSrcweir# version 3 along with OpenOffice.org. If not, see 23*cdf0e10cSrcweir# <http://www.openoffice.org/license.html> 24*cdf0e10cSrcweir# for a copy of the LGPLv3 License. 25*cdf0e10cSrcweir# 26*cdf0e10cSrcweir#************************************************************************* 27*cdf0e10cSrcweir 28*cdf0e10cSrcweir$ARGV0 = shift @ARGV; 29*cdf0e10cSrcweir$ARGV1 = shift @ARGV; 30*cdf0e10cSrcweir$ARGV2 = shift @ARGV; 31*cdf0e10cSrcweir$ARGV3 = shift @ARGV; 32*cdf0e10cSrcweir 33*cdf0e10cSrcweiropen( INFILE, $ARGV0 ) or die "Error: cannot open input file: $!"; 34*cdf0e10cSrcweirmy %tokens; 35*cdf0e10cSrcweirwhile ( <INFILE> ) 36*cdf0e10cSrcweir{ 37*cdf0e10cSrcweir # trim newline 38*cdf0e10cSrcweir chomp( $_ ); 39*cdf0e10cSrcweir # trim leading/trailing whitespace 40*cdf0e10cSrcweir $_ =~ s/^\s*//g; 41*cdf0e10cSrcweir $_ =~ s/\s*$//g; 42*cdf0e10cSrcweir # check for valid characters 43*cdf0e10cSrcweir $_ =~ /^[a-zA-Z0-9-_]+$/ or die "Error: invalid character in token '$_'"; 44*cdf0e10cSrcweir $id = "XML_$_"; 45*cdf0e10cSrcweir $id =~ s/-/_/g; 46*cdf0e10cSrcweir $tokens{$_} = $id; 47*cdf0e10cSrcweir} 48*cdf0e10cSrcweirclose ( INFILE ); 49*cdf0e10cSrcweir 50*cdf0e10cSrcweir# generate output files 51*cdf0e10cSrcweir 52*cdf0e10cSrcweiropen ( IDFILE, ">$ARGV1" ) or die "Error: cannot open output file: $!"; 53*cdf0e10cSrcweiropen ( NAMEFILE, ">$ARGV2" ) or die "Error: cannot open output file: $!"; 54*cdf0e10cSrcweiropen ( GPERFFILE, ">$ARGV3" ) or die "Error: cannot open output file: $!"; 55*cdf0e10cSrcweir 56*cdf0e10cSrcweirprint( GPERFFILE "%language=C++\n" ); 57*cdf0e10cSrcweirprint( GPERFFILE "%global-table\n" ); 58*cdf0e10cSrcweirprint( GPERFFILE "%null-strings\n" ); 59*cdf0e10cSrcweirprint( GPERFFILE "%struct-type\n" ); 60*cdf0e10cSrcweirprint( GPERFFILE "struct xmltoken {\n" ); 61*cdf0e10cSrcweirprint( GPERFFILE " const sal_Char *name;\n" ); 62*cdf0e10cSrcweirprint( GPERFFILE " sal_Int32 nToken;\n" ); 63*cdf0e10cSrcweirprint( GPERFFILE "};\n" ); 64*cdf0e10cSrcweirprint( GPERFFILE "%%\n" ); 65*cdf0e10cSrcweir 66*cdf0e10cSrcweir$i = 0; 67*cdf0e10cSrcweirforeach( sort( keys( %tokens ) ) ) 68*cdf0e10cSrcweir{ 69*cdf0e10cSrcweir print( IDFILE "const sal_Int32 $tokens{$_} = $i;\n" ); 70*cdf0e10cSrcweir print( NAMEFILE "\"$_\",\n" ); 71*cdf0e10cSrcweir print( GPERFFILE "$_,$tokens{$_}\n" ); 72*cdf0e10cSrcweir ++$i; 73*cdf0e10cSrcweir} 74*cdf0e10cSrcweir 75*cdf0e10cSrcweirprint( IDFILE "const sal_Int32 XML_TOKEN_COUNT = $i;\n" ); 76*cdf0e10cSrcweirprint( GPERFFILE "%%\n" ); 77*cdf0e10cSrcweir 78*cdf0e10cSrcweirclose( IDFILE ); 79*cdf0e10cSrcweirclose( NAMEFILE ); 80*cdf0e10cSrcweirclose( GPERFFILE ); 81