xref: /AOO41X/main/sal/textenc/textcvt.c (revision cdf0e10c4e3984b49a9502b011690b615761d4a3)
1*cdf0e10cSrcweir /*************************************************************************
2*cdf0e10cSrcweir  *
3*cdf0e10cSrcweir  * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER.
4*cdf0e10cSrcweir  *
5*cdf0e10cSrcweir  * Copyright 2000, 2010 Oracle and/or its affiliates.
6*cdf0e10cSrcweir  *
7*cdf0e10cSrcweir  * OpenOffice.org - a multi-platform office productivity suite
8*cdf0e10cSrcweir  *
9*cdf0e10cSrcweir  * This file is part of OpenOffice.org.
10*cdf0e10cSrcweir  *
11*cdf0e10cSrcweir  * OpenOffice.org is free software: you can redistribute it and/or modify
12*cdf0e10cSrcweir  * it under the terms of the GNU Lesser General Public License version 3
13*cdf0e10cSrcweir  * only, as published by the Free Software Foundation.
14*cdf0e10cSrcweir  *
15*cdf0e10cSrcweir  * OpenOffice.org is distributed in the hope that it will be useful,
16*cdf0e10cSrcweir  * but WITHOUT ANY WARRANTY; without even the implied warranty of
17*cdf0e10cSrcweir  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
18*cdf0e10cSrcweir  * GNU Lesser General Public License version 3 for more details
19*cdf0e10cSrcweir  * (a copy is included in the LICENSE file that accompanied this code).
20*cdf0e10cSrcweir  *
21*cdf0e10cSrcweir  * You should have received a copy of the GNU Lesser General Public License
22*cdf0e10cSrcweir  * version 3 along with OpenOffice.org.  If not, see
23*cdf0e10cSrcweir  * <http://www.openoffice.org/license.html>
24*cdf0e10cSrcweir  * for a copy of the LGPLv3 License.
25*cdf0e10cSrcweir  *
26*cdf0e10cSrcweir  ************************************************************************/
27*cdf0e10cSrcweir 
28*cdf0e10cSrcweir #include "rtl/textcvt.h"
29*cdf0e10cSrcweir #include "gettextencodingdata.h"
30*cdf0e10cSrcweir #include "tenchelp.h"
31*cdf0e10cSrcweir 
32*cdf0e10cSrcweir /* ======================================================================= */
33*cdf0e10cSrcweir 
34*cdf0e10cSrcweir static sal_Size ImplDummyToUnicode( const sal_Char* pSrcBuf, sal_Size nSrcBytes,
35*cdf0e10cSrcweir                                     sal_Unicode* pDestBuf, sal_Size nDestChars,
36*cdf0e10cSrcweir                                     sal_uInt32 nFlags, sal_uInt32* pInfo,
37*cdf0e10cSrcweir                                     sal_Size* pSrcCvtBytes )
38*cdf0e10cSrcweir {
39*cdf0e10cSrcweir     sal_Unicode*        pEndDestBuf;
40*cdf0e10cSrcweir     const sal_Char*     pEndSrcBuf;
41*cdf0e10cSrcweir 
42*cdf0e10cSrcweir     if ( ((nFlags & RTL_TEXTTOUNICODE_FLAGS_UNDEFINED_MASK) == RTL_TEXTTOUNICODE_FLAGS_UNDEFINED_ERROR) ||
43*cdf0e10cSrcweir          ((nFlags & RTL_TEXTTOUNICODE_FLAGS_MBUNDEFINED_MASK) == RTL_TEXTTOUNICODE_FLAGS_MBUNDEFINED_ERROR) )
44*cdf0e10cSrcweir     {
45*cdf0e10cSrcweir         *pInfo |= RTL_TEXTTOUNICODE_INFO_ERROR |
46*cdf0e10cSrcweir                   RTL_TEXTTOUNICODE_INFO_UNDEFINED |
47*cdf0e10cSrcweir                   RTL_TEXTTOUNICODE_INFO_MBUNDEFINED;
48*cdf0e10cSrcweir         return 0;
49*cdf0e10cSrcweir     }
50*cdf0e10cSrcweir 
51*cdf0e10cSrcweir     *pInfo = 0;
52*cdf0e10cSrcweir     pEndDestBuf = pDestBuf+nDestChars;
53*cdf0e10cSrcweir     pEndSrcBuf  = pSrcBuf+nSrcBytes;
54*cdf0e10cSrcweir     while ( pSrcBuf < pEndSrcBuf )
55*cdf0e10cSrcweir     {
56*cdf0e10cSrcweir         if ( pDestBuf == pEndDestBuf )
57*cdf0e10cSrcweir         {
58*cdf0e10cSrcweir             *pInfo |= RTL_TEXTTOUNICODE_INFO_ERROR | RTL_TEXTTOUNICODE_INFO_DESTBUFFERTOSMALL;
59*cdf0e10cSrcweir             break;
60*cdf0e10cSrcweir         }
61*cdf0e10cSrcweir 
62*cdf0e10cSrcweir         *pDestBuf = (sal_Unicode)(sal_uChar)*pSrcBuf;
63*cdf0e10cSrcweir         pDestBuf++;
64*cdf0e10cSrcweir         pSrcBuf++;
65*cdf0e10cSrcweir     }
66*cdf0e10cSrcweir 
67*cdf0e10cSrcweir     *pSrcCvtBytes = nSrcBytes - (pEndSrcBuf-pSrcBuf);
68*cdf0e10cSrcweir     return (nDestChars - (pEndDestBuf-pDestBuf));
69*cdf0e10cSrcweir }
70*cdf0e10cSrcweir 
71*cdf0e10cSrcweir /* ----------------------------------------------------------------------- */
72*cdf0e10cSrcweir 
73*cdf0e10cSrcweir static sal_Size ImplUnicodeToDummy( const sal_Unicode* pSrcBuf, sal_Size nSrcChars,
74*cdf0e10cSrcweir                                     sal_Char* pDestBuf, sal_Size nDestBytes,
75*cdf0e10cSrcweir                                     sal_uInt32 nFlags, sal_uInt32* pInfo,
76*cdf0e10cSrcweir                                     sal_Size* pSrcCvtChars )
77*cdf0e10cSrcweir {
78*cdf0e10cSrcweir     sal_Char*               pEndDestBuf;
79*cdf0e10cSrcweir     const sal_Unicode*      pEndSrcBuf;
80*cdf0e10cSrcweir 
81*cdf0e10cSrcweir     if ( ((nFlags & RTL_UNICODETOTEXT_FLAGS_UNDEFINED_MASK) == RTL_UNICODETOTEXT_FLAGS_UNDEFINED_ERROR) )
82*cdf0e10cSrcweir     {
83*cdf0e10cSrcweir         *pInfo |= RTL_UNICODETOTEXT_INFO_ERROR |
84*cdf0e10cSrcweir                   RTL_UNICODETOTEXT_INFO_UNDEFINED;
85*cdf0e10cSrcweir         return 0;
86*cdf0e10cSrcweir     }
87*cdf0e10cSrcweir 
88*cdf0e10cSrcweir     *pInfo = 0;
89*cdf0e10cSrcweir     pEndDestBuf = pDestBuf+nDestBytes;
90*cdf0e10cSrcweir     pEndSrcBuf  = pSrcBuf+nSrcChars;
91*cdf0e10cSrcweir     while ( pSrcBuf < pEndSrcBuf )
92*cdf0e10cSrcweir     {
93*cdf0e10cSrcweir         if ( pDestBuf == pEndDestBuf )
94*cdf0e10cSrcweir         {
95*cdf0e10cSrcweir             *pInfo |= RTL_UNICODETOTEXT_INFO_ERROR | RTL_UNICODETOTEXT_INFO_DESTBUFFERTOSMALL;
96*cdf0e10cSrcweir             break;
97*cdf0e10cSrcweir         }
98*cdf0e10cSrcweir 
99*cdf0e10cSrcweir         *pDestBuf = (sal_Char)(sal_uChar)(*pSrcBuf & 0x00FF);
100*cdf0e10cSrcweir         pDestBuf++;
101*cdf0e10cSrcweir         pSrcBuf++;
102*cdf0e10cSrcweir     }
103*cdf0e10cSrcweir 
104*cdf0e10cSrcweir     *pSrcCvtChars = nSrcChars - (pEndSrcBuf-pSrcBuf);
105*cdf0e10cSrcweir     return (nDestBytes - (pEndDestBuf-pDestBuf));
106*cdf0e10cSrcweir }
107*cdf0e10cSrcweir 
108*cdf0e10cSrcweir /* ======================================================================= */
109*cdf0e10cSrcweir 
110*cdf0e10cSrcweir rtl_TextToUnicodeConverter SAL_CALL rtl_createTextToUnicodeConverter( rtl_TextEncoding eTextEncoding )
111*cdf0e10cSrcweir {
112*cdf0e10cSrcweir     const ImplTextEncodingData* pData = Impl_getTextEncodingData( eTextEncoding );
113*cdf0e10cSrcweir     if ( pData )
114*cdf0e10cSrcweir         return (rtl_TextToUnicodeConverter) &pData->maConverter;
115*cdf0e10cSrcweir     else
116*cdf0e10cSrcweir         return 0;
117*cdf0e10cSrcweir }
118*cdf0e10cSrcweir 
119*cdf0e10cSrcweir /* ----------------------------------------------------------------------- */
120*cdf0e10cSrcweir 
121*cdf0e10cSrcweir void SAL_CALL rtl_destroyTextToUnicodeConverter( rtl_TextToUnicodeConverter hContext )
122*cdf0e10cSrcweir {
123*cdf0e10cSrcweir     (void) hContext; /* unused */
124*cdf0e10cSrcweir }
125*cdf0e10cSrcweir 
126*cdf0e10cSrcweir /* ----------------------------------------------------------------------- */
127*cdf0e10cSrcweir 
128*cdf0e10cSrcweir rtl_TextToUnicodeContext SAL_CALL rtl_createTextToUnicodeContext( rtl_TextToUnicodeConverter hConverter )
129*cdf0e10cSrcweir {
130*cdf0e10cSrcweir     const ImplTextConverter* pConverter = (const ImplTextConverter*)hConverter;
131*cdf0e10cSrcweir     if ( !pConverter )
132*cdf0e10cSrcweir         return 0;
133*cdf0e10cSrcweir     else if ( pConverter->mpCreateTextToUnicodeContext )
134*cdf0e10cSrcweir         return (rtl_TextToUnicodeContext)pConverter->mpCreateTextToUnicodeContext();
135*cdf0e10cSrcweir     else
136*cdf0e10cSrcweir         return (rtl_TextToUnicodeContext)1;
137*cdf0e10cSrcweir }
138*cdf0e10cSrcweir 
139*cdf0e10cSrcweir /* ----------------------------------------------------------------------- */
140*cdf0e10cSrcweir 
141*cdf0e10cSrcweir void SAL_CALL rtl_destroyTextToUnicodeContext( rtl_TextToUnicodeConverter hConverter,
142*cdf0e10cSrcweir                                                rtl_TextToUnicodeContext hContext )
143*cdf0e10cSrcweir {
144*cdf0e10cSrcweir     const ImplTextConverter* pConverter = (const ImplTextConverter*)hConverter;
145*cdf0e10cSrcweir     if ( pConverter && hContext && pConverter->mpDestroyTextToUnicodeContext )
146*cdf0e10cSrcweir         pConverter->mpDestroyTextToUnicodeContext( (void*)hContext );
147*cdf0e10cSrcweir }
148*cdf0e10cSrcweir 
149*cdf0e10cSrcweir /* ----------------------------------------------------------------------- */
150*cdf0e10cSrcweir 
151*cdf0e10cSrcweir void SAL_CALL rtl_resetTextToUnicodeContext( rtl_TextToUnicodeConverter hConverter,
152*cdf0e10cSrcweir                                              rtl_TextToUnicodeContext hContext )
153*cdf0e10cSrcweir {
154*cdf0e10cSrcweir     const ImplTextConverter* pConverter = (const ImplTextConverter*)hConverter;
155*cdf0e10cSrcweir     if ( pConverter && hContext && pConverter->mpResetTextToUnicodeContext )
156*cdf0e10cSrcweir         pConverter->mpResetTextToUnicodeContext( (void*)hContext );
157*cdf0e10cSrcweir }
158*cdf0e10cSrcweir 
159*cdf0e10cSrcweir /* ----------------------------------------------------------------------- */
160*cdf0e10cSrcweir 
161*cdf0e10cSrcweir sal_Size SAL_CALL rtl_convertTextToUnicode( rtl_TextToUnicodeConverter hConverter,
162*cdf0e10cSrcweir                                             rtl_TextToUnicodeContext hContext,
163*cdf0e10cSrcweir                                             const sal_Char* pSrcBuf, sal_Size nSrcBytes,
164*cdf0e10cSrcweir                                             sal_Unicode* pDestBuf, sal_Size nDestChars,
165*cdf0e10cSrcweir                                             sal_uInt32 nFlags, sal_uInt32* pInfo,
166*cdf0e10cSrcweir                                             sal_Size* pSrcCvtBytes )
167*cdf0e10cSrcweir {
168*cdf0e10cSrcweir     const ImplTextConverter* pConverter = (const ImplTextConverter*)hConverter;
169*cdf0e10cSrcweir 
170*cdf0e10cSrcweir     /* Only temporaer, because we don't want die, if we don't have a
171*cdf0e10cSrcweir        converter, because not all converters are implemented yet */
172*cdf0e10cSrcweir     if ( !pConverter )
173*cdf0e10cSrcweir     {
174*cdf0e10cSrcweir         return ImplDummyToUnicode( pSrcBuf, nSrcBytes,
175*cdf0e10cSrcweir                                    pDestBuf, nDestChars,
176*cdf0e10cSrcweir                                    nFlags, pInfo, pSrcCvtBytes );
177*cdf0e10cSrcweir     }
178*cdf0e10cSrcweir 
179*cdf0e10cSrcweir     return pConverter->mpConvertTextToUnicodeProc( pConverter->mpConvertData,
180*cdf0e10cSrcweir                                                    (void*)hContext,
181*cdf0e10cSrcweir                                                    pSrcBuf, nSrcBytes,
182*cdf0e10cSrcweir                                                    pDestBuf, nDestChars,
183*cdf0e10cSrcweir                                                    nFlags, pInfo,
184*cdf0e10cSrcweir                                                    pSrcCvtBytes );
185*cdf0e10cSrcweir }
186*cdf0e10cSrcweir 
187*cdf0e10cSrcweir /* ======================================================================= */
188*cdf0e10cSrcweir 
189*cdf0e10cSrcweir rtl_UnicodeToTextConverter SAL_CALL rtl_createUnicodeToTextConverter( rtl_TextEncoding eTextEncoding )
190*cdf0e10cSrcweir {
191*cdf0e10cSrcweir     const ImplTextEncodingData* pData = Impl_getTextEncodingData( eTextEncoding );
192*cdf0e10cSrcweir     if ( pData )
193*cdf0e10cSrcweir         return (rtl_TextToUnicodeConverter) &pData->maConverter;
194*cdf0e10cSrcweir     else
195*cdf0e10cSrcweir         return 0;
196*cdf0e10cSrcweir }
197*cdf0e10cSrcweir 
198*cdf0e10cSrcweir /* ----------------------------------------------------------------------- */
199*cdf0e10cSrcweir 
200*cdf0e10cSrcweir void SAL_CALL rtl_destroyUnicodeToTextConverter( rtl_UnicodeToTextConverter hConverter )
201*cdf0e10cSrcweir {
202*cdf0e10cSrcweir     (void) hConverter; /* unused */
203*cdf0e10cSrcweir }
204*cdf0e10cSrcweir 
205*cdf0e10cSrcweir /* ----------------------------------------------------------------------- */
206*cdf0e10cSrcweir 
207*cdf0e10cSrcweir rtl_UnicodeToTextContext SAL_CALL rtl_createUnicodeToTextContext( rtl_UnicodeToTextConverter hConverter )
208*cdf0e10cSrcweir {
209*cdf0e10cSrcweir     const ImplTextConverter* pConverter = (const ImplTextConverter*)hConverter;
210*cdf0e10cSrcweir     if ( !pConverter )
211*cdf0e10cSrcweir         return 0;
212*cdf0e10cSrcweir     else if ( pConverter->mpCreateUnicodeToTextContext )
213*cdf0e10cSrcweir         return (rtl_UnicodeToTextContext)pConverter->mpCreateUnicodeToTextContext();
214*cdf0e10cSrcweir     else
215*cdf0e10cSrcweir         return (rtl_UnicodeToTextContext)1;
216*cdf0e10cSrcweir }
217*cdf0e10cSrcweir 
218*cdf0e10cSrcweir /* ----------------------------------------------------------------------- */
219*cdf0e10cSrcweir 
220*cdf0e10cSrcweir void SAL_CALL rtl_destroyUnicodeToTextContext( rtl_UnicodeToTextConverter hConverter,
221*cdf0e10cSrcweir                                                rtl_UnicodeToTextContext hContext )
222*cdf0e10cSrcweir {
223*cdf0e10cSrcweir     const ImplTextConverter* pConverter = (const ImplTextConverter*)hConverter;
224*cdf0e10cSrcweir     if ( pConverter && hContext && pConverter->mpDestroyUnicodeToTextContext )
225*cdf0e10cSrcweir         pConverter->mpDestroyUnicodeToTextContext( (void*)hContext );
226*cdf0e10cSrcweir }
227*cdf0e10cSrcweir 
228*cdf0e10cSrcweir /* ----------------------------------------------------------------------- */
229*cdf0e10cSrcweir 
230*cdf0e10cSrcweir void SAL_CALL rtl_resetUnicodeToTextContext( rtl_UnicodeToTextConverter hConverter,
231*cdf0e10cSrcweir                                              rtl_UnicodeToTextContext hContext )
232*cdf0e10cSrcweir {
233*cdf0e10cSrcweir     const ImplTextConverter* pConverter = (const ImplTextConverter*)hConverter;
234*cdf0e10cSrcweir     if ( pConverter && hContext && pConverter->mpResetUnicodeToTextContext )
235*cdf0e10cSrcweir         pConverter->mpResetUnicodeToTextContext( (void*)hContext );
236*cdf0e10cSrcweir }
237*cdf0e10cSrcweir 
238*cdf0e10cSrcweir /* ----------------------------------------------------------------------- */
239*cdf0e10cSrcweir 
240*cdf0e10cSrcweir sal_Size SAL_CALL rtl_convertUnicodeToText( rtl_UnicodeToTextConverter hConverter,
241*cdf0e10cSrcweir                                             rtl_UnicodeToTextContext hContext,
242*cdf0e10cSrcweir                                             const sal_Unicode* pSrcBuf, sal_Size nSrcChars,
243*cdf0e10cSrcweir                                             sal_Char* pDestBuf, sal_Size nDestBytes,
244*cdf0e10cSrcweir                                             sal_uInt32 nFlags, sal_uInt32* pInfo,
245*cdf0e10cSrcweir                                             sal_Size* pSrcCvtChars )
246*cdf0e10cSrcweir {
247*cdf0e10cSrcweir     const ImplTextConverter* pConverter = (const ImplTextConverter*)hConverter;
248*cdf0e10cSrcweir 
249*cdf0e10cSrcweir     /* Only temporaer, because we don't want die, if we don't have a
250*cdf0e10cSrcweir        converter, because not all converters are implemented yet */
251*cdf0e10cSrcweir     if ( !pConverter )
252*cdf0e10cSrcweir     {
253*cdf0e10cSrcweir         return ImplUnicodeToDummy( pSrcBuf, nSrcChars,
254*cdf0e10cSrcweir                                    pDestBuf, nDestBytes,
255*cdf0e10cSrcweir                                    nFlags, pInfo, pSrcCvtChars );
256*cdf0e10cSrcweir     }
257*cdf0e10cSrcweir 
258*cdf0e10cSrcweir     return pConverter->mpConvertUnicodeToTextProc( pConverter->mpConvertData,
259*cdf0e10cSrcweir                                                    (void*)hContext,
260*cdf0e10cSrcweir                                                    pSrcBuf, nSrcChars,
261*cdf0e10cSrcweir                                                    pDestBuf, nDestBytes,
262*cdf0e10cSrcweir                                                    nFlags, pInfo,
263*cdf0e10cSrcweir                                                    pSrcCvtChars );
264*cdf0e10cSrcweir }
265