xref: /aoo41x/main/rsc/source/tools/rscchar.cxx (revision 477794c1)
1*477794c1SAndrew Rist /**************************************************************
2*477794c1SAndrew Rist  *
3*477794c1SAndrew Rist  * Licensed to the Apache Software Foundation (ASF) under one
4*477794c1SAndrew Rist  * or more contributor license agreements.  See the NOTICE file
5*477794c1SAndrew Rist  * distributed with this work for additional information
6*477794c1SAndrew Rist  * regarding copyright ownership.  The ASF licenses this file
7*477794c1SAndrew Rist  * to you under the Apache License, Version 2.0 (the
8*477794c1SAndrew Rist  * "License"); you may not use this file except in compliance
9*477794c1SAndrew Rist  * with the License.  You may obtain a copy of the License at
10*477794c1SAndrew Rist  *
11*477794c1SAndrew Rist  *   http://www.apache.org/licenses/LICENSE-2.0
12cdf0e10cSrcweir  *
13*477794c1SAndrew Rist  * Unless required by applicable law or agreed to in writing,
14*477794c1SAndrew Rist  * software distributed under the License is distributed on an
15*477794c1SAndrew Rist  * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
16*477794c1SAndrew Rist  * KIND, either express or implied.  See the License for the
17*477794c1SAndrew Rist  * specific language governing permissions and limitations
18*477794c1SAndrew Rist  * under the License.
19*477794c1SAndrew Rist  *
20*477794c1SAndrew Rist  *************************************************************/
21*477794c1SAndrew Rist 
22*477794c1SAndrew Rist 
23cdf0e10cSrcweir 
24cdf0e10cSrcweir // MARKER(update_precomp.py): autogen include statement, do not remove
25cdf0e10cSrcweir #include "precompiled_rsc.hxx"
26cdf0e10cSrcweir /****************** I N C L U D E S **************************************/
27cdf0e10cSrcweir #include <stdio.h>
28cdf0e10cSrcweir #include <string.h>
29cdf0e10cSrcweir #include <ctype.h>
30cdf0e10cSrcweir 
31cdf0e10cSrcweir #ifndef _TABLE_HXX //autogen
32cdf0e10cSrcweir #include <tools/table.hxx>
33cdf0e10cSrcweir #endif
34cdf0e10cSrcweir 
35cdf0e10cSrcweir // Solar Definitionen
36cdf0e10cSrcweir #include <tools/solar.h>
37cdf0e10cSrcweir #include <rsctools.hxx>
38cdf0e10cSrcweir 
39cdf0e10cSrcweir #include <rtl/textcvt.h>
40cdf0e10cSrcweir #include <rtl/textenc.h>
41cdf0e10cSrcweir #include <rtl/alloc.h>
42cdf0e10cSrcweir 
43cdf0e10cSrcweir /*************************************************************************
44cdf0e10cSrcweir |*
45cdf0e10cSrcweir |*    RscChar::MakeChar()
46cdf0e10cSrcweir |*
47cdf0e10cSrcweir |*    Beschreibung      Der String wird nach C-Konvention umgesetzt
48cdf0e10cSrcweir |*    Ersterstellung    MM 20.03.91
49cdf0e10cSrcweir |*    Letzte Aenderung  MM 20.03.91
50cdf0e10cSrcweir |*
51cdf0e10cSrcweir *************************************************************************/
MakeUTF8(char * pStr,sal_uInt16 nTextEncoding)52cdf0e10cSrcweir char * RscChar::MakeUTF8( char * pStr, sal_uInt16 nTextEncoding )
53cdf0e10cSrcweir {
54cdf0e10cSrcweir 	sal_Size nMaxUniCodeBuf = strlen( pStr ) + 1;
55cdf0e10cSrcweir 	if( nMaxUniCodeBuf * 6 > 0x0FFFFF )
56cdf0e10cSrcweir         RscExit( 10 );
57cdf0e10cSrcweir 
58cdf0e10cSrcweir 	char *			pOrgStr = new char[ nMaxUniCodeBuf ];
59cdf0e10cSrcweir 	sal_uInt32		nOrgLen = 0;
60cdf0e10cSrcweir 
61cdf0e10cSrcweir 	char cOld = '1';
62cdf0e10cSrcweir 	while( cOld != 0 )
63cdf0e10cSrcweir 	{
64cdf0e10cSrcweir 		char c;
65cdf0e10cSrcweir 
66cdf0e10cSrcweir 		if( *pStr == '\\' )
67cdf0e10cSrcweir 		{
68cdf0e10cSrcweir 			++pStr;
69cdf0e10cSrcweir 			switch( *pStr )
70cdf0e10cSrcweir 			{
71cdf0e10cSrcweir 				case 'a':
72cdf0e10cSrcweir 					c = '\a';
73cdf0e10cSrcweir 					break;
74cdf0e10cSrcweir 				case 'b':
75cdf0e10cSrcweir 					c = '\b';
76cdf0e10cSrcweir 					break;
77cdf0e10cSrcweir 				case 'f':
78cdf0e10cSrcweir 					c = '\f';
79cdf0e10cSrcweir 					break;
80cdf0e10cSrcweir 				case 'n':
81cdf0e10cSrcweir 					c = '\n';
82cdf0e10cSrcweir 					break;
83cdf0e10cSrcweir 				case 'r':
84cdf0e10cSrcweir 					c = '\r';
85cdf0e10cSrcweir 					break;
86cdf0e10cSrcweir 				case 't':
87cdf0e10cSrcweir 					c = '\t';
88cdf0e10cSrcweir 					break;
89cdf0e10cSrcweir 				case 'v':
90cdf0e10cSrcweir 					c = '\v';
91cdf0e10cSrcweir 					break;
92cdf0e10cSrcweir 				case '\\':
93cdf0e10cSrcweir 					c = '\\';
94cdf0e10cSrcweir 					break;
95cdf0e10cSrcweir 				case '?':
96cdf0e10cSrcweir 					c = '\?';
97cdf0e10cSrcweir 					break;
98cdf0e10cSrcweir 				case '\'':
99cdf0e10cSrcweir 					c = '\'';
100cdf0e10cSrcweir 					break;
101cdf0e10cSrcweir 				case '\"':
102cdf0e10cSrcweir 					c = '\"';
103cdf0e10cSrcweir 					break;
104cdf0e10cSrcweir 				default:
105cdf0e10cSrcweir 				{
106cdf0e10cSrcweir 					if( '0' <= *pStr && '7' >= *pStr )
107cdf0e10cSrcweir 					{
108cdf0e10cSrcweir 						sal_uInt16  nChar = 0;
109cdf0e10cSrcweir 						int  i = 0;
110cdf0e10cSrcweir 						while( '0' <= *pStr && '7' >= *pStr && i != 3 )
111cdf0e10cSrcweir 						{
112cdf0e10cSrcweir 							nChar = nChar * 8 + (sal_uInt8)*pStr - (sal_uInt8)'0';
113cdf0e10cSrcweir 							++pStr;
114cdf0e10cSrcweir 							i++;
115cdf0e10cSrcweir 						}
116cdf0e10cSrcweir 						if( nChar > 255 )
117cdf0e10cSrcweir 						{
118cdf0e10cSrcweir 							// Wert zu gross, oder kein 3 Ziffern
119cdf0e10cSrcweir 							delete [] pOrgStr;
120cdf0e10cSrcweir 							return( NULL );
121cdf0e10cSrcweir 						}
122cdf0e10cSrcweir 						c = (char)nChar;
123cdf0e10cSrcweir 						pStr--;
124cdf0e10cSrcweir 					}
125cdf0e10cSrcweir 					else if( 'x' == *pStr )
126cdf0e10cSrcweir 					{
127cdf0e10cSrcweir 						sal_uInt16  nChar = 0;
128cdf0e10cSrcweir 						int  i = 0;
129cdf0e10cSrcweir 						++pStr;
130cdf0e10cSrcweir 						while( isxdigit( *pStr ) && i != 2 )
131cdf0e10cSrcweir 						{
132cdf0e10cSrcweir 							if( isdigit( *pStr ) )
133cdf0e10cSrcweir 								nChar = nChar * 16 + (sal_uInt8)*pStr - (sal_uInt8)'0';
134cdf0e10cSrcweir 							else if( isupper( *pStr ) )
135cdf0e10cSrcweir 								nChar = nChar * 16 + (sal_uInt8)*pStr - (sal_uInt8)'A' +10;
136cdf0e10cSrcweir 							else
137cdf0e10cSrcweir 								nChar = nChar * 16 + (sal_uInt8)*pStr - (sal_uInt8)'a' +10;
138cdf0e10cSrcweir 							++pStr;
139cdf0e10cSrcweir 							i++;
140cdf0e10cSrcweir 						}
141cdf0e10cSrcweir 						c = (char)nChar;
142cdf0e10cSrcweir 						pStr--;
143cdf0e10cSrcweir 					}
144cdf0e10cSrcweir 					else
145cdf0e10cSrcweir 						c = *pStr;
146cdf0e10cSrcweir 				};
147cdf0e10cSrcweir 			}
148cdf0e10cSrcweir 		}
149cdf0e10cSrcweir 		else
150cdf0e10cSrcweir 			c = *pStr;
151cdf0e10cSrcweir 		pOrgStr[ nOrgLen++ ] = c;
152cdf0e10cSrcweir 		cOld = *pStr;
153cdf0e10cSrcweir 		pStr++;
154cdf0e10cSrcweir 	}
155cdf0e10cSrcweir 
156cdf0e10cSrcweir 	sal_Unicode *	pUniCode = new sal_Unicode[ nMaxUniCodeBuf ];
157cdf0e10cSrcweir 	rtl_TextToUnicodeConverter hConv = rtl_createTextToUnicodeConverter( nTextEncoding );
158cdf0e10cSrcweir 
159cdf0e10cSrcweir 	sal_uInt32 nInfo;
160cdf0e10cSrcweir 	sal_Size   nSrcCvtBytes;
161cdf0e10cSrcweir 	sal_Size nUniSize = rtl_convertTextToUnicode( hConv, 0,
162cdf0e10cSrcweir 												pOrgStr, nOrgLen,
163cdf0e10cSrcweir 												pUniCode, nMaxUniCodeBuf,
164cdf0e10cSrcweir 												RTL_TEXTTOUNICODE_FLAGS_UNDEFINED_DEFAULT
165cdf0e10cSrcweir 												| RTL_TEXTTOUNICODE_FLAGS_MBUNDEFINED_DEFAULT
166cdf0e10cSrcweir 												| RTL_TEXTTOUNICODE_FLAGS_INVALID_DEFAULT
167cdf0e10cSrcweir 												| RTL_TEXTTOUNICODE_FLAGS_FLUSH,
168cdf0e10cSrcweir 												&nInfo,
169cdf0e10cSrcweir 												&nSrcCvtBytes );
170cdf0e10cSrcweir 
171cdf0e10cSrcweir 	rtl_destroyTextToUnicodeConverter( hConv );
172cdf0e10cSrcweir 	delete[] pOrgStr, pOrgStr = 0;
173cdf0e10cSrcweir 
174cdf0e10cSrcweir 	hConv = rtl_createUnicodeToTextConverter( RTL_TEXTENCODING_UTF8 );
175cdf0e10cSrcweir 	// factor fo 6 is the maximum size of an UNICODE character as utf8
176cdf0e10cSrcweir     char * pUtf8 = (char *)rtl_allocateMemory( nUniSize * 6 );
177cdf0e10cSrcweir 	rtl_convertUnicodeToText( hConv, 0,
178cdf0e10cSrcweir 							pUniCode, nUniSize,
179cdf0e10cSrcweir 							pUtf8, nUniSize * 6,
180cdf0e10cSrcweir 							RTL_UNICODETOTEXT_FLAGS_UNDEFINED_DEFAULT
181cdf0e10cSrcweir 							| RTL_UNICODETOTEXT_FLAGS_INVALID_DEFAULT
182cdf0e10cSrcweir 							| RTL_UNICODETOTEXT_FLAGS_FLUSH,
183cdf0e10cSrcweir 							&nInfo,
184cdf0e10cSrcweir 							&nSrcCvtBytes );
185cdf0e10cSrcweir 
186cdf0e10cSrcweir 	rtl_destroyTextToUnicodeConverter( hConv );
187cdf0e10cSrcweir 	delete[] pUniCode, pUniCode = 0;
188cdf0e10cSrcweir 
189cdf0e10cSrcweir 	return pUtf8;
190cdf0e10cSrcweir };
191