// © 2016 and later: Unicode, Inc. and others. // License & terms of use: http://www.unicode.org/copyright.html /* ******************************************************************************* * Copyright (C) 1997-2009,2014 International Business Machines * Corporation and others. All Rights Reserved. ******************************************************************************* * Date Name Description * 06/21/00 aliu Creation. ******************************************************************************* */ #include "unicode/utypes.h" #if !UCONFIG_NO_TRANSLITERATION #include "unicode/utrans.h" #include "unicode/putil.h" #include "unicode/rep.h" #include "unicode/translit.h" #include "unicode/unifilt.h" #include "unicode/uniset.h" #include "unicode/ustring.h" #include "unicode/uenum.h" #include "unicode/uset.h" #include "uenumimp.h" #include "cpputils.h" #include "rbt.h" // Following macro is to be followed by ';' or just ';' #define utrans_ENTRY(s) if ((s)==nullptr || U_FAILURE(*(s))) return /******************************************************************** * Replaceable-UReplaceableCallbacks glue ********************************************************************/ /** * Make a UReplaceable + UReplaceableCallbacks into a Replaceable object. */ U_NAMESPACE_BEGIN class ReplaceableGlue : public Replaceable { UReplaceable *rep; const UReplaceableCallbacks *func; public: ReplaceableGlue(UReplaceable *replaceable, const UReplaceableCallbacks *funcCallback); virtual ~ReplaceableGlue(); virtual void handleReplaceBetween(int32_t start, int32_t limit, const UnicodeString& text) override; virtual void extractBetween(int32_t start, int32_t limit, UnicodeString& target) const override; virtual void copy(int32_t start, int32_t limit, int32_t dest) override; // virtual Replaceable *clone() const { return nullptr; } same as default /** * ICU "poor man's RTTI", returns a UClassID for the actual class. * * @draft ICU 2.2 */ virtual UClassID getDynamicClassID() const override; /** * ICU "poor man's RTTI", returns a UClassID for this class. * * @draft ICU 2.2 */ static UClassID U_EXPORT2 getStaticClassID(); protected: virtual int32_t getLength() const override; virtual char16_t getCharAt(int32_t offset) const override; virtual UChar32 getChar32At(int32_t offset) const override; }; UOBJECT_DEFINE_RTTI_IMPLEMENTATION(ReplaceableGlue) ReplaceableGlue::ReplaceableGlue(UReplaceable *replaceable, const UReplaceableCallbacks *funcCallback) : Replaceable() { this->rep = replaceable; this->func = funcCallback; } ReplaceableGlue::~ReplaceableGlue() {} int32_t ReplaceableGlue::getLength() const { return (*func->length)(rep); } char16_t ReplaceableGlue::getCharAt(int32_t offset) const { return (*func->charAt)(rep, offset); } UChar32 ReplaceableGlue::getChar32At(int32_t offset) const { return (*func->char32At)(rep, offset); } void ReplaceableGlue::handleReplaceBetween(int32_t start, int32_t limit, const UnicodeString& text) { (*func->replace)(rep, start, limit, text.getBuffer(), text.length()); } void ReplaceableGlue::extractBetween(int32_t start, int32_t limit, UnicodeString& target) const { (*func->extract)(rep, start, limit, target.getBuffer(limit-start)); target.releaseBuffer(limit-start); } void ReplaceableGlue::copy(int32_t start, int32_t limit, int32_t dest) { (*func->copy)(rep, start, limit, dest); } U_NAMESPACE_END /******************************************************************** * General API ********************************************************************/ U_NAMESPACE_USE U_CAPI UTransliterator* U_EXPORT2 utrans_openU(const char16_t *id, int32_t idLength, UTransDirection dir, const char16_t *rules, int32_t rulesLength, UParseError *parseError, UErrorCode *status) { if(status==nullptr || U_FAILURE(*status)) { return nullptr; } if (id == nullptr) { *status = U_ILLEGAL_ARGUMENT_ERROR; return nullptr; } UParseError temp; if(parseError == nullptr){ parseError = &temp; } UnicodeString ID(idLength<0, id, idLength); // r-o alias if(rules==nullptr){ Transliterator *trans = nullptr; trans = Transliterator::createInstance(ID, dir, *parseError, *status); if(U_FAILURE(*status)){ return nullptr; } return (UTransliterator*) trans; }else{ UnicodeString ruleStr(rulesLength < 0, rules, rulesLength); // r-o alias Transliterator *trans = nullptr; trans = Transliterator::createFromRules(ID, ruleStr, dir, *parseError, *status); if(U_FAILURE(*status)) { return nullptr; } return (UTransliterator*) trans; } } U_CAPI UTransliterator* U_EXPORT2 utrans_open(const char* id, UTransDirection dir, const char16_t* rules, /* may be Null */ int32_t rulesLength, /* -1 if null-terminated */ UParseError* parseError, /* may be Null */ UErrorCode* status) { UnicodeString ID(id, -1, US_INV); // use invariant converter return utrans_openU(ID.getBuffer(), ID.length(), dir, rules, rulesLength, parseError, status); } U_CAPI UTransliterator* U_EXPORT2 utrans_openInverse(const UTransliterator* trans, UErrorCode* status) { utrans_ENTRY(status) nullptr; UTransliterator* result = (UTransliterator*) ((Transliterator*) trans)->createInverse(*status); return result; } U_CAPI UTransliterator* U_EXPORT2 utrans_clone(const UTransliterator* trans, UErrorCode* status) { utrans_ENTRY(status) nullptr; if (trans == nullptr) { *status = U_ILLEGAL_ARGUMENT_ERROR; return nullptr; } Transliterator *t = ((Transliterator*) trans)->clone(); if (t == nullptr) { *status = U_MEMORY_ALLOCATION_ERROR; } return (UTransliterator*) t; } U_CAPI void U_EXPORT2 utrans_close(UTransliterator* trans) { delete (Transliterator*) trans; } U_CAPI const char16_t * U_EXPORT2 utrans_getUnicodeID(const UTransliterator *trans, int32_t *resultLength) { // Transliterator keeps its ID NUL-terminated const UnicodeString &ID=((Transliterator*) trans)->getID(); if(resultLength!=nullptr) { *resultLength=ID.length(); } return ID.getBuffer(); } U_CAPI int32_t U_EXPORT2 utrans_getID(const UTransliterator* trans, char* buf, int32_t bufCapacity) { return ((Transliterator*) trans)->getID().extract(0, 0x7fffffff, buf, bufCapacity, US_INV); } U_CAPI void U_EXPORT2 utrans_register(UTransliterator* adoptedTrans, UErrorCode* status) { utrans_ENTRY(status); // status currently ignored; may remove later Transliterator::registerInstance((Transliterator*) adoptedTrans); } U_CAPI void U_EXPORT2 utrans_unregisterID(const char16_t* id, int32_t idLength) { UnicodeString ID(idLength<0, id, idLength); // r-o alias Transliterator::unregister(ID); } U_CAPI void U_EXPORT2 utrans_unregister(const char* id) { UnicodeString ID(id, -1, US_INV); // use invariant converter Transliterator::unregister(ID); } U_CAPI void U_EXPORT2 utrans_setFilter(UTransliterator* trans, const char16_t* filterPattern, int32_t filterPatternLen, UErrorCode* status) { utrans_ENTRY(status); UnicodeFilter* filter = nullptr; if (filterPattern != nullptr && *filterPattern != 0) { // Create read only alias of filterPattern: UnicodeString pat(filterPatternLen < 0, filterPattern, filterPatternLen); filter = new UnicodeSet(pat, *status); /* test for nullptr */ if (filter == nullptr) { *status = U_MEMORY_ALLOCATION_ERROR; return; } if (U_FAILURE(*status)) { delete filter; filter = nullptr; } } ((Transliterator*) trans)->adoptFilter(filter); } U_CAPI int32_t U_EXPORT2 utrans_countAvailableIDs() { return Transliterator::countAvailableIDs(); } U_CAPI int32_t U_EXPORT2 utrans_getAvailableID(int32_t index, char* buf, // may be nullptr int32_t bufCapacity) { return Transliterator::getAvailableID(index).extract(0, 0x7fffffff, buf, bufCapacity, US_INV); } /* Transliterator UEnumeration ---------------------------------------------- */ typedef struct UTransEnumeration { UEnumeration uenum; int32_t index, count; } UTransEnumeration; U_CDECL_BEGIN static int32_t U_CALLCONV utrans_enum_count(UEnumeration *uenum, UErrorCode *pErrorCode) { if(pErrorCode==nullptr || U_FAILURE(*pErrorCode)) { return 0; } return ((UTransEnumeration *)uenum)->count; } static const char16_t* U_CALLCONV utrans_enum_unext(UEnumeration *uenum, int32_t* resultLength, UErrorCode *pErrorCode) { if(pErrorCode==nullptr || U_FAILURE(*pErrorCode)) { return nullptr; } UTransEnumeration *ute=(UTransEnumeration *)uenum; int32_t index=ute->index; if(indexcount) { const UnicodeString &ID=Transliterator::getAvailableID(index); ute->index=index+1; if(resultLength!=nullptr) { *resultLength=ID.length(); } // Transliterator keeps its ID NUL-terminated return ID.getBuffer(); } if(resultLength!=nullptr) { *resultLength=0; } return nullptr; } static void U_CALLCONV utrans_enum_reset(UEnumeration *uenum, UErrorCode *pErrorCode) { if(pErrorCode==nullptr || U_FAILURE(*pErrorCode)) { return; } UTransEnumeration *ute=(UTransEnumeration *)uenum; ute->index=0; ute->count=Transliterator::countAvailableIDs(); } static void U_CALLCONV utrans_enum_close(UEnumeration *uenum) { uprv_free(uenum); } U_CDECL_END static const UEnumeration utransEnumeration={ nullptr, nullptr, utrans_enum_close, utrans_enum_count, utrans_enum_unext, uenum_nextDefault, utrans_enum_reset }; U_CAPI UEnumeration * U_EXPORT2 utrans_openIDs(UErrorCode *pErrorCode) { UTransEnumeration *ute; if(pErrorCode==nullptr || U_FAILURE(*pErrorCode)) { return nullptr; } ute=(UTransEnumeration *)uprv_malloc(sizeof(UTransEnumeration)); if(ute==nullptr) { *pErrorCode=U_MEMORY_ALLOCATION_ERROR; return nullptr; } ute->uenum=utransEnumeration; ute->index=0; ute->count=Transliterator::countAvailableIDs(); return (UEnumeration *)ute; } /******************************************************************** * Transliteration API ********************************************************************/ U_CAPI void U_EXPORT2 utrans_trans(const UTransliterator* trans, UReplaceable* rep, const UReplaceableCallbacks* repFunc, int32_t start, int32_t* limit, UErrorCode* status) { utrans_ENTRY(status); if (trans == nullptr || rep == nullptr || repFunc == nullptr || limit == nullptr) { *status = U_ILLEGAL_ARGUMENT_ERROR; return; } ReplaceableGlue r(rep, repFunc); *limit = ((Transliterator*) trans)->transliterate(r, start, *limit); } U_CAPI void U_EXPORT2 utrans_transIncremental(const UTransliterator* trans, UReplaceable* rep, const UReplaceableCallbacks* repFunc, UTransPosition* pos, UErrorCode* status) { utrans_ENTRY(status); if (trans == nullptr || rep == nullptr || repFunc == nullptr || pos == nullptr) { *status = U_ILLEGAL_ARGUMENT_ERROR; return; } ReplaceableGlue r(rep, repFunc); ((Transliterator*) trans)->transliterate(r, *pos, *status); } U_CAPI void U_EXPORT2 utrans_transUChars(const UTransliterator* trans, char16_t* text, int32_t* textLength, int32_t textCapacity, int32_t start, int32_t* limit, UErrorCode* status) { utrans_ENTRY(status); if (trans == nullptr || text == nullptr || limit == nullptr) { *status = U_ILLEGAL_ARGUMENT_ERROR; return; } int32_t textLen = (textLength == nullptr || *textLength < 0) ? u_strlen(text) : *textLength; // writeable alias: for this ct, len CANNOT be -1 (why?) UnicodeString str(text, textLen, textCapacity); *limit = ((Transliterator*) trans)->transliterate(str, start, *limit); // Copy the string buffer back to text (only if necessary) // and fill in *neededCapacity (if neededCapacity != nullptr). textLen = str.extract(text, textCapacity, *status); if(textLength != nullptr) { *textLength = textLen; } } U_CAPI void U_EXPORT2 utrans_transIncrementalUChars(const UTransliterator* trans, char16_t* text, int32_t* textLength, int32_t textCapacity, UTransPosition* pos, UErrorCode* status) { utrans_ENTRY(status); if (trans == nullptr || text == nullptr || pos == nullptr) { *status = U_ILLEGAL_ARGUMENT_ERROR; return; } int32_t textLen = (textLength == nullptr || *textLength < 0) ? u_strlen(text) : *textLength; // writeable alias: for this ct, len CANNOT be -1 (why?) UnicodeString str(text, textLen, textCapacity); ((Transliterator*) trans)->transliterate(str, *pos, *status); // Copy the string buffer back to text (only if necessary) // and fill in *neededCapacity (if neededCapacity != nullptr). textLen = str.extract(text, textCapacity, *status); if(textLength != nullptr) { *textLength = textLen; } } U_CAPI int32_t U_EXPORT2 utrans_toRules( const UTransliterator* trans, UBool escapeUnprintable, char16_t* result, int32_t resultLength, UErrorCode* status) { utrans_ENTRY(status) 0; if ( (result==nullptr)? resultLength!=0: resultLength<0 ) { *status = U_ILLEGAL_ARGUMENT_ERROR; return 0; } UnicodeString res; res.setTo(result, 0, resultLength); ((Transliterator*) trans)->toRules(res, escapeUnprintable); return res.extract(result, resultLength, *status); } U_CAPI USet* U_EXPORT2 utrans_getSourceSet(const UTransliterator* trans, UBool ignoreFilter, USet* fillIn, UErrorCode* status) { utrans_ENTRY(status) fillIn; if (fillIn == nullptr) { fillIn = uset_openEmpty(); } if (ignoreFilter) { ((Transliterator*) trans)->handleGetSourceSet(*((UnicodeSet*)fillIn)); } else { ((Transliterator*) trans)->getSourceSet(*((UnicodeSet*)fillIn)); } return fillIn; } #endif /* #if !UCONFIG_NO_TRANSLITERATION */