xref: /trunk/main/oox/source/token/tokens.pl (revision cdf0e10c4e3984b49a9502b011690b615761d4a3)
1*cdf0e10cSrcweir#*************************************************************************
2*cdf0e10cSrcweir#
3*cdf0e10cSrcweir# DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
4*cdf0e10cSrcweir#
5*cdf0e10cSrcweir# Copyright 2000, 2010 Oracle and/or its affiliates.
6*cdf0e10cSrcweir#
7*cdf0e10cSrcweir# OpenOffice.org - a multi-platform office productivity suite
8*cdf0e10cSrcweir#
9*cdf0e10cSrcweir# This file is part of OpenOffice.org.
10*cdf0e10cSrcweir#
11*cdf0e10cSrcweir# OpenOffice.org is free software: you can redistribute it and/or modify
12*cdf0e10cSrcweir# it under the terms of the GNU Lesser General Public License version 3
13*cdf0e10cSrcweir# only, as published by the Free Software Foundation.
14*cdf0e10cSrcweir#
15*cdf0e10cSrcweir# OpenOffice.org is distributed in the hope that it will be useful,
16*cdf0e10cSrcweir# but WITHOUT ANY WARRANTY; without even the implied warranty of
17*cdf0e10cSrcweir# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
18*cdf0e10cSrcweir# GNU Lesser General Public License version 3 for more details
19*cdf0e10cSrcweir# (a copy is included in the LICENSE file that accompanied this code).
20*cdf0e10cSrcweir#
21*cdf0e10cSrcweir# You should have received a copy of the GNU Lesser General Public License
22*cdf0e10cSrcweir# version 3 along with OpenOffice.org.  If not, see
23*cdf0e10cSrcweir# <http://www.openoffice.org/license.html>
24*cdf0e10cSrcweir# for a copy of the LGPLv3 License.
25*cdf0e10cSrcweir#
26*cdf0e10cSrcweir#*************************************************************************
27*cdf0e10cSrcweir
28*cdf0e10cSrcweir$ARGV0 = shift @ARGV;
29*cdf0e10cSrcweir$ARGV1 = shift @ARGV;
30*cdf0e10cSrcweir$ARGV2 = shift @ARGV;
31*cdf0e10cSrcweir$ARGV3 = shift @ARGV;
32*cdf0e10cSrcweir
33*cdf0e10cSrcweiropen( INFILE, $ARGV0 ) or die "Error: cannot open input file: $!";
34*cdf0e10cSrcweirmy %tokens;
35*cdf0e10cSrcweirwhile ( <INFILE> )
36*cdf0e10cSrcweir{
37*cdf0e10cSrcweir    # trim newline
38*cdf0e10cSrcweir    chomp( $_ );
39*cdf0e10cSrcweir    # trim leading/trailing whitespace
40*cdf0e10cSrcweir    $_ =~ s/^\s*//g;
41*cdf0e10cSrcweir    $_ =~ s/\s*$//g;
42*cdf0e10cSrcweir    # check for valid characters
43*cdf0e10cSrcweir    $_ =~ /^[a-zA-Z0-9-_]+$/ or die "Error: invalid character in token '$_'";
44*cdf0e10cSrcweir    $id = "XML_$_";
45*cdf0e10cSrcweir    $id =~ s/-/_/g;
46*cdf0e10cSrcweir    $tokens{$_} = $id;
47*cdf0e10cSrcweir}
48*cdf0e10cSrcweirclose ( INFILE );
49*cdf0e10cSrcweir
50*cdf0e10cSrcweir# generate output files
51*cdf0e10cSrcweir
52*cdf0e10cSrcweiropen ( IDFILE, ">$ARGV1" ) or die "Error: cannot open output file: $!";
53*cdf0e10cSrcweiropen ( NAMEFILE, ">$ARGV2" ) or die "Error: cannot open output file: $!";
54*cdf0e10cSrcweiropen ( GPERFFILE, ">$ARGV3" ) or die "Error: cannot open output file: $!";
55*cdf0e10cSrcweir
56*cdf0e10cSrcweirprint( GPERFFILE "%language=C++\n" );
57*cdf0e10cSrcweirprint( GPERFFILE "%global-table\n" );
58*cdf0e10cSrcweirprint( GPERFFILE "%null-strings\n" );
59*cdf0e10cSrcweirprint( GPERFFILE "%struct-type\n" );
60*cdf0e10cSrcweirprint( GPERFFILE "struct xmltoken {\n" );
61*cdf0e10cSrcweirprint( GPERFFILE "    const sal_Char *name;\n" );
62*cdf0e10cSrcweirprint( GPERFFILE "    sal_Int32 nToken;\n" );
63*cdf0e10cSrcweirprint( GPERFFILE "};\n" );
64*cdf0e10cSrcweirprint( GPERFFILE "%%\n" );
65*cdf0e10cSrcweir
66*cdf0e10cSrcweir$i = 0;
67*cdf0e10cSrcweirforeach( sort( keys( %tokens ) ) )
68*cdf0e10cSrcweir{
69*cdf0e10cSrcweir    print( IDFILE "const sal_Int32 $tokens{$_} = $i;\n" );
70*cdf0e10cSrcweir    print( NAMEFILE "\"$_\",\n" );
71*cdf0e10cSrcweir    print( GPERFFILE "$_,$tokens{$_}\n" );
72*cdf0e10cSrcweir    ++$i;
73*cdf0e10cSrcweir}
74*cdf0e10cSrcweir
75*cdf0e10cSrcweirprint( IDFILE "const sal_Int32 XML_TOKEN_COUNT = $i;\n" );
76*cdf0e10cSrcweirprint( GPERFFILE "%%\n" );
77*cdf0e10cSrcweir
78*cdf0e10cSrcweirclose( IDFILE );
79*cdf0e10cSrcweirclose( NAMEFILE );
80*cdf0e10cSrcweirclose( GPERFFILE );
81