LCOV - code coverage report
Current view: top level - i18nutil/source/utility - casefolding.cxx (source / functions) Hit Total Coverage
Test: commit 10e77ab3ff6f4314137acd6e2702a6e5c1ce1fae Lines: 38 62 61.3 %
Date: 2014-11-03 Functions: 3 4 75.0 %
Legend: Lines: hit not hit

          Line data    Source code
       1             : /* -*- Mode: C++; tab-width: 4; indent-tabs-mode: nil; c-basic-offset: 4 -*- */
       2             : /*
       3             :  * This file is part of the LibreOffice project.
       4             :  *
       5             :  * This Source Code Form is subject to the terms of the Mozilla Public
       6             :  * License, v. 2.0. If a copy of the MPL was not distributed with this
       7             :  * file, You can obtain one at http://mozilla.org/MPL/2.0/.
       8             :  *
       9             :  * This file incorporates work covered by the following license notice:
      10             :  *
      11             :  *   Licensed to the Apache Software Foundation (ASF) under one or more
      12             :  *   contributor license agreements. See the NOTICE file distributed
      13             :  *   with this work for additional information regarding copyright
      14             :  *   ownership. The ASF licenses this file to you under the Apache
      15             :  *   License, Version 2.0 (the "License"); you may not use this file
      16             :  *   except in compliance with the License. You may obtain a copy of
      17             :  *   the License at http://www.apache.org/licenses/LICENSE-2.0 .
      18             :  */
      19             : 
      20             : #include "i18nutil/casefolding.hxx"
      21             : #include "casefolding_data.h"
      22             : #include "i18nutil/widthfolding.hxx"
      23             : 
      24             : using namespace com::sun::star::lang;
      25             : using namespace com::sun::star::uno;
      26             : 
      27             : namespace com { namespace sun { namespace star { namespace i18n {
      28             : 
      29             : static Mapping mapping_03a3[] = {{0, 1, {0x03c2, 0, 0}},{0, 1, {0x03c3, 0, 0}}};
      30             : static Mapping mapping_0307[] = {{0, 0, {0, 0, 0}},{0, 1, {0x0307, 0, 0}}};
      31             : static Mapping mapping_004a[] = {{0, 2, {0x006a, 0x0307, 0}},{0, 1, {0x006a, 0, 0}}};
      32             : static Mapping mapping_012e[] = {{0, 2, {0x012f, 0x0307, 0}},{0, 1, {0x012f, 0, 0}}};
      33             : static Mapping mapping_00cc[] = {{0, 3, {0x0069, 0x0307, 0x0300}},{0, 1, {0x00ec, 0, 0}}};
      34             : static Mapping mapping_00cd[] = {{0, 3, {0x0069, 0x0307, 0x0301}},{0, 1, {0x00ed, 0, 0}}};
      35             : static Mapping mapping_0128[] = {{0, 3, {0x0069, 0x0307, 0x0303}},{0, 1, {0x0129, 0, 0}}};
      36             : static Mapping mapping_0049[] = {{0, 2, {0x0069, 0x0307, 0}},{0, 1, {0x0131, 0, 0}},{0, 1, {0x0069, 0, 0}}};
      37             : static Mapping mapping_0069[] = {{0, 1, {0x0130, 0, 0}},{0, 1, {0x0049, 0, 0}}};
      38             : static Mapping mapping_0130[] = {{0, 1, {0x0069, 0, 0}},{0, 1, {0x0130, 0, 0}}};
      39             : 
      40             : #define langIs(lang) (aLocale.Language == lang)
      41             : 
      42             : // only check simple case, there is more complicated case need to be checked.
      43             : #define type_i(ch) ((ch) == 0x0069 || (ch) == 0x006a)
      44             : 
      45             : #define cased_letter(ch) (CaseMappingIndex[(ch)>>8] >= 0 && (CaseMappingValue[(CaseMappingIndex[(ch)>>8] << 8) + ((ch)&0xff)].type & CasedLetter))
      46             : 
      47             : // for Lithuanian, condition to make explicit dot above when lowercasing capital I's and J's
      48             : // whenever there are more accents above.
      49             : #define accent_above(ch) (((ch) >= 0x0300 && (ch) <= 0x0314) || ((ch) >= 0x033D && (ch) <= 0x0344) || (ch) == 0x0346 || ((ch) >= 0x034A && (ch) <= 0x034C))
      50             : 
      51      499520 : Mapping& casefolding::getConditionalValue(const sal_Unicode* str, sal_Int32 pos, sal_Int32 len, Locale& aLocale, sal_uInt8 nMappingType) throw (RuntimeException)
      52             : {
      53      499520 :         switch(str[pos]) {
      54             :         case 0x03a3:
      55             :             // final_sigma (not followed by cased and preceded by cased character)
      56             :             // DOES NOT check ignorable sequence yet (more complicated implementation).
      57           0 :             return !(pos < len && cased_letter(str[pos+1])) && (pos > 0 && cased_letter(str[pos-1])) ?
      58           0 :                 mapping_03a3[0] : mapping_03a3[1];
      59             :         case 0x0307:
      60           0 :             return (((nMappingType == MappingTypeLowerToUpper && langIs("lt")) ||
      61           0 :                 (nMappingType == MappingTypeUpperToLower && (langIs("tr") || langIs("az")))) &&
      62           0 :                 (pos > 0 && type_i(str[pos-1]))) ?      // after_i
      63           0 :                     mapping_0307[0] : mapping_0307[1];
      64             :         case 0x0130:
      65           0 :             return (langIs("tr") || langIs("az")) ? mapping_0130[0] : mapping_0130[1];
      66             :         case 0x0069:
      67      492659 :             return (langIs("tr") || langIs("az")) ? mapping_0069[0] : mapping_0069[1];
      68        5213 :         case 0x0049: return langIs("lt") && pos > len && accent_above(str[pos+1]) ? mapping_0049[0] :
      69       10426 :                     (langIs("tr") || langIs("az")) ? mapping_0049[1] : mapping_0049[2];
      70        1648 :         case 0x004a: return langIs("lt") && pos > len && accent_above(str[pos+1]) ? mapping_004a[0] : mapping_004a[1];
      71           0 :         case 0x012e: return langIs("lt") && pos > len && accent_above(str[pos+1]) ? mapping_012e[0] : mapping_012e[1];
      72           0 :         case 0x00cc: return langIs("lt") ? mapping_00cc[0] : mapping_00cc[1];
      73           0 :         case 0x00cd: return langIs("lt") ? mapping_00cd[0] : mapping_00cd[1];
      74           0 :         case 0x0128: return langIs("lt") ? mapping_0128[0] : mapping_0128[1];
      75             :         }
      76             :         // Should not come here
      77           0 :         throw RuntimeException();
      78             : }
      79             : 
      80    27424284 : Mapping& casefolding::getValue(const sal_Unicode* str, sal_Int32 pos, sal_Int32 len, Locale& aLocale, sal_uInt8 nMappingType) throw (RuntimeException)
      81             : {
      82             :     static Mapping dummy = { 0, 1, { 0, 0, 0 } };
      83    27424284 :     sal_Int16 address = CaseMappingIndex[str[pos] >> 8];
      84             : 
      85    27424284 :     dummy.map[0] = str[pos];
      86             : 
      87    27424284 :     if (address >= 0) {
      88    27416162 :         address = (address << 8) + (str[pos] & 0xFF);
      89    27416162 :         if (CaseMappingValue[address].type & nMappingType) {
      90     4257560 :             sal_uInt8 type = CaseMappingValue[address].type;
      91     4257560 :             if (type & ValueTypeNotValue) {
      92      499870 :                 if (CaseMappingValue[address].value == 0)
      93      497872 :                     return getConditionalValue(str, pos, len, aLocale, nMappingType);
      94             :                 else {
      95        7296 :                     for (int map = CaseMappingValue[address].value;
      96        3648 :                             map < CaseMappingValue[address].value + MaxCaseMappingExtras; map++) {
      97        3648 :                         if (CaseMappingExtra[map].type & nMappingType) {
      98        1998 :                             if (CaseMappingExtra[map].type & ValueTypeNotValue)
      99        1648 :                                 return getConditionalValue(str, pos, len, aLocale, nMappingType);
     100             :                             else
     101         350 :                                 return CaseMappingExtra[map];
     102             :                         }
     103             :                     }
     104             :                     // Should not come here
     105           0 :                     throw RuntimeException();
     106             :                 }
     107             :             } else
     108     3757690 :                 dummy.map[0] = CaseMappingValue[address].value;
     109             :         }
     110             :     }
     111    26924414 :     return dummy;
     112             : }
     113             : 
     114             : inline bool SAL_CALL
     115           0 : is_ja_voice_sound_mark(sal_Unicode& current, sal_Unicode next)
     116             : {
     117           0 :         sal_Unicode c = 0;
     118             : 
     119           0 :         if ((next == 0x3099 || next == 0x309a) && ( (c = widthfolding::getCompositionChar(current, next)) != 0 ))
     120           0 :             current = c;
     121           0 :         return c != 0;
     122             : }
     123             : 
     124      177284 : sal_Unicode casefolding::getNextChar(const sal_Unicode *str, sal_Int32& idx, sal_Int32 len, MappingElement& e, Locale& aLocale, sal_uInt8 nMappingType, TransliterationModules moduleLoaded) throw (RuntimeException)
     125             : {
     126      177284 :         if( idx >= len )
     127             :         {
     128           0 :             e = MappingElement();
     129           0 :             return 0;
     130             :         }
     131             : 
     132             :         sal_Unicode c;
     133             : 
     134      177284 :         if (moduleLoaded & TransliterationModules_IGNORE_CASE) {
     135      177284 :             if( e.current >= e.element.nmap ) {
     136      177284 :                 e.element = getValue(str, idx++, len, aLocale, nMappingType);
     137      177284 :                 e.current = 0;
     138             :             }
     139      177284 :             c = e.element.map[e.current++];
     140             :         } else {
     141           0 :             c = *(str + idx++);
     142             :         }
     143             : 
     144      177284 :         if (moduleLoaded & TransliterationModules_IGNORE_KANA) {
     145       74336 :             if ((0x3040 <= c && c <= 0x3094) || (0x309d <= c && c <= 0x309f))
     146           0 :                 c += 0x60;
     147             :         }
     148             : 
     149             :         // composition: KA + voice-mark --> GA. see halfwidthToFullwidth.cxx for detail
     150      177284 :         if (moduleLoaded & TransliterationModules_IGNORE_WIDTH) {
     151      156388 :             static oneToOneMapping& half2fullTable = widthfolding::gethalf2fullTable();
     152      156388 :             c = half2fullTable[c];
     153      156388 :             if (0x3040 <= c && c <= 0x30ff && idx < len &&
     154           0 :                     is_ja_voice_sound_mark(c, half2fullTable[*(str + idx)]))
     155           0 :                 idx++;
     156             :         }
     157             : 
     158      177284 :         return c;
     159             : }
     160             : 
     161             : } } } }
     162             : 
     163             : /* vim:set shiftwidth=4 softtabstop=4 expandtab: */

Generated by: LCOV version 1.10