mirror of
https://github.com/mozilla/gecko-dev.git
synced 2024-11-24 05:11:16 +00:00
e96ab7f00d
Differential Revision: https://phabricator.services.mozilla.com/D49443 --HG-- rename : intl/icu/source/i18n/numparse_stringsegment.cpp => intl/icu/source/i18n/string_segment.cpp rename : intl/icu/source/data/buildtool/__init__.py => intl/icu/source/python/icutools/databuilder/__init__.py rename : intl/icu/source/data/buildtool/comment_stripper.py => intl/icu/source/python/icutools/databuilder/comment_stripper.py rename : intl/icu/source/data/buildtool/locale_dependencies.py => intl/icu/source/python/icutools/databuilder/locale_dependencies.py rename : intl/icu/source/data/buildtool/renderers/__init__.py => intl/icu/source/python/icutools/databuilder/renderers/__init__.py rename : intl/icu/source/data/buildtool/renderers/makefile.py => intl/icu/source/python/icutools/databuilder/renderers/makefile.py rename : intl/icu/source/data/buildtool/test/__init__.py => intl/icu/source/python/icutools/databuilder/test/__init__.py rename : intl/icu/source/data/buildtool/test/__main__.py => intl/icu/source/python/icutools/databuilder/test/__main__.py rename : intl/icu/source/data/buildtool/test/filtration_test.py => intl/icu/source/python/icutools/databuilder/test/filtration_test.py extra : moz-landing-system : lando
194 lines
5.0 KiB
C++
194 lines
5.0 KiB
C++
// © 2016 and later: Unicode, Inc. and others.
// License & terms of use: http://www.unicode.org/copyright.html
/*
*******************************************************************************
*
*   Copyright (C) 2001-2011, International Business Machines
*   Corporation and others.  All Rights Reserved.
*
*******************************************************************************
*   file name:  casetrn.cpp
*   encoding:   UTF-8
*   tab size:   8 (not used)
*   indentation:4
*
*   created on: 2004sep03
*   created by: Markus W. Scherer
*
*   Implementation class for lower-/upper-/title-casing transliterators.
*/
|
|
|
|
#include "unicode/utypes.h"
|
|
|
|
#if !UCONFIG_NO_TRANSLITERATION
|
|
|
|
#include "unicode/uchar.h"
|
|
#include "unicode/ustring.h"
|
|
#include "unicode/utf.h"
|
|
#include "unicode/utf16.h"
|
|
#include "tolowtrn.h"
|
|
#include "ucase.h"
|
|
#include "cpputils.h"
|
|
|
|
/* case context iterator using a Replaceable */
|
|
U_CFUNC UChar32 U_CALLCONV
|
|
utrans_rep_caseContextIterator(void *context, int8_t dir)
|
|
{
|
|
U_NAMESPACE_USE
|
|
|
|
UCaseContext *csc=(UCaseContext *)context;
|
|
Replaceable *rep=(Replaceable *)csc->p;
|
|
UChar32 c;
|
|
|
|
if(dir<0) {
|
|
/* reset for backward iteration */
|
|
csc->index=csc->cpStart;
|
|
csc->dir=dir;
|
|
} else if(dir>0) {
|
|
/* reset for forward iteration */
|
|
csc->index=csc->cpLimit;
|
|
csc->dir=dir;
|
|
} else {
|
|
/* continue current iteration direction */
|
|
dir=csc->dir;
|
|
}
|
|
|
|
// automatically adjust start and limit if the Replaceable disagrees
|
|
// with the original values
|
|
if(dir<0) {
|
|
if(csc->start<csc->index) {
|
|
c=rep->char32At(csc->index-1);
|
|
if(c<0) {
|
|
csc->start=csc->index;
|
|
} else {
|
|
csc->index-=U16_LENGTH(c);
|
|
return c;
|
|
}
|
|
}
|
|
} else {
|
|
// detect, and store in csc->b1, if we hit the limit
|
|
if(csc->index<csc->limit) {
|
|
c=rep->char32At(csc->index);
|
|
if(c<0) {
|
|
csc->limit=csc->index;
|
|
csc->b1=TRUE;
|
|
} else {
|
|
csc->index+=U16_LENGTH(c);
|
|
return c;
|
|
}
|
|
} else {
|
|
csc->b1=TRUE;
|
|
}
|
|
}
|
|
return U_SENTINEL;
|
|
}
|
|
|
|
U_NAMESPACE_BEGIN
|
|
|
|
// NOTE(review): presumably expands to the RTTI (class ID) definitions for
// CaseMapTransliterator, using the "abstract" flavor of the macro -- confirm
// against the macro's definition, which is not part of this file.
UOBJECT_DEFINE_ABSTRACT_RTTI_IMPLEMENTATION(CaseMapTransliterator)
|
|
|
|
/**
|
|
* Constructs a transliterator.
|
|
*/
|
|
CaseMapTransliterator::CaseMapTransliterator(const UnicodeString &id, UCaseMapFull *map) :
|
|
Transliterator(id, 0),
|
|
fMap(map)
|
|
{
|
|
// TODO test incremental mode with context-sensitive text (e.g. greek sigma)
|
|
// TODO need to call setMaximumContextLength()?!
|
|
}
|
|
|
|
/**
|
|
* Destructor.
|
|
*/
|
|
CaseMapTransliterator::~CaseMapTransliterator() {
|
|
}
|
|
|
|
/**
|
|
* Copy constructor.
|
|
*/
|
|
CaseMapTransliterator::CaseMapTransliterator(const CaseMapTransliterator& o) :
|
|
Transliterator(o),
|
|
fMap(o.fMap)
|
|
{
|
|
}
|
|
|
|
/**
 * Assignment operator.
 * Currently disabled: the implementation below is commented out.
 */
/*CaseMapTransliterator& CaseMapTransliterator::operator=(const CaseMapTransliterator& o) {
    Transliterator::operator=(o);
    fMap = o.fMap;
    return *this;
}*/
|
|
|
|
/**
 * Transliterator API: clone().
 * Currently disabled: the implementation below is commented out.
 */
/*CaseMapTransliterator* CaseMapTransliterator::clone() const {
    return new CaseMapTransliterator(*this);
}*/
|
|
|
|
/**
|
|
* Implements {@link Transliterator#handleTransliterate}.
|
|
*/
|
|
void CaseMapTransliterator::handleTransliterate(Replaceable& text,
|
|
UTransPosition& offsets,
|
|
UBool isIncremental) const
|
|
{
|
|
if (offsets.start >= offsets.limit) {
|
|
return;
|
|
}
|
|
|
|
UCaseContext csc;
|
|
uprv_memset(&csc, 0, sizeof(csc));
|
|
csc.p = &text;
|
|
csc.start = offsets.contextStart;
|
|
csc.limit = offsets.contextLimit;
|
|
|
|
UnicodeString tmp;
|
|
const UChar *s;
|
|
UChar32 c;
|
|
int32_t textPos, delta, result;
|
|
|
|
for(textPos=offsets.start; textPos<offsets.limit;) {
|
|
csc.cpStart=textPos;
|
|
c=text.char32At(textPos);
|
|
csc.cpLimit=textPos+=U16_LENGTH(c);
|
|
|
|
result=fMap(c, utrans_rep_caseContextIterator, &csc, &s, UCASE_LOC_ROOT);
|
|
|
|
if(csc.b1 && isIncremental) {
|
|
// fMap() tried to look beyond the context limit
|
|
// wait for more input
|
|
offsets.start=csc.cpStart;
|
|
return;
|
|
}
|
|
|
|
if(result>=0) {
|
|
// replace the current code point with its full case mapping result
|
|
// see UCASE_MAX_STRING_LENGTH
|
|
if(result<=UCASE_MAX_STRING_LENGTH) {
|
|
// string s[result]
|
|
tmp.setTo(FALSE, s, result);
|
|
delta=result-U16_LENGTH(c);
|
|
} else {
|
|
// single code point
|
|
tmp.setTo(result);
|
|
delta=tmp.length()-U16_LENGTH(c);
|
|
}
|
|
text.handleReplaceBetween(csc.cpStart, textPos, tmp);
|
|
if(delta!=0) {
|
|
textPos+=delta;
|
|
csc.limit=offsets.contextLimit+=delta;
|
|
offsets.limit+=delta;
|
|
}
|
|
}
|
|
}
|
|
offsets.start=textPos;
|
|
}
|
|
|
|
U_NAMESPACE_END
|
|
|
|
#endif /* #if !UCONFIG_NO_TRANSLITERATION */
|