summaryrefslogtreecommitdiffstats
path: root/intl/uconv/util/nsUnicodeDecodeHelper.cpp
diff options
context:
space:
mode:
Diffstat (limited to 'intl/uconv/util/nsUnicodeDecodeHelper.cpp')
-rw-r--r--intl/uconv/util/nsUnicodeDecodeHelper.cpp234
1 files changed, 234 insertions, 0 deletions
diff --git a/intl/uconv/util/nsUnicodeDecodeHelper.cpp b/intl/uconv/util/nsUnicodeDecodeHelper.cpp
new file mode 100644
index 000000000..9d3491d86
--- /dev/null
+++ b/intl/uconv/util/nsUnicodeDecodeHelper.cpp
@@ -0,0 +1,234 @@
+/* -*- Mode: C++; tab-width: 2; indent-tabs-mode: nil; c-basic-offset: 2 -*- */
+/* This Source Code Form is subject to the terms of the Mozilla Public
+ * License, v. 2.0. If a copy of the MPL was not distributed with this
+ * file, You can obtain one at http://mozilla.org/MPL/2.0/. */
+
+#include "unicpriv.h"
+#include "nsUnicodeDecodeHelper.h"
+#include "mozilla/UniquePtr.h"
+
+//----------------------------------------------------------------------
+// Class nsUnicodeDecodeHelper [implementation]
+nsresult nsUnicodeDecodeHelper::ConvertByTable(
+ const char * aSrc,
+ int32_t * aSrcLength,
+ char16_t * aDest,
+ int32_t * aDestLength,
+ uScanClassID aScanClass,
+ uShiftInTable * aShiftInTable,
+ uMappingTable * aMappingTable,
+ bool aErrorSignal)
+{
+ const char * src = aSrc;
+ int32_t srcLen = *aSrcLength;
+ char16_t * dest = aDest;
+ char16_t * destEnd = aDest + *aDestLength;
+
+ char16_t med;
+ int32_t bcr; // byte count for read
+ nsresult res = NS_OK;
+
+ while ((srcLen > 0) && (dest < destEnd)) {
+ bool charFound;
+ if (aScanClass == uMultibytesCharset) {
+ NS_ASSERTION(aShiftInTable, "shift table missing");
+ charFound = uScanShift(aShiftInTable, nullptr, (uint8_t *)src,
+ reinterpret_cast<uint16_t*>(&med), srcLen,
+ (uint32_t *)&bcr);
+ } else {
+ charFound = uScan(aScanClass, nullptr, (uint8_t *)src,
+ reinterpret_cast<uint16_t*>(&med),
+ srcLen, (uint32_t *)&bcr);
+ }
+ if (!charFound) {
+ res = NS_OK_UDEC_MOREINPUT;
+ break;
+ }
+
+ if (!uMapCode((uTable*) aMappingTable, static_cast<uint16_t>(med), reinterpret_cast<uint16_t*>(dest))) {
+ if (med < 0x20) {
+ // somehow some table miss the 0x00 - 0x20 part
+ *dest = med;
+ } else {
+ if (aErrorSignal) {
+ res = NS_ERROR_ILLEGAL_INPUT;
+ break;
+ }
+ // Unicode replacement value for unmappable chars
+ *dest = 0xfffd;
+ }
+ }
+
+ src += bcr;
+ srcLen -= bcr;
+ dest++;
+ }
+
+ if ((srcLen > 0) && (res == NS_OK)) res = NS_OK_UDEC_MOREOUTPUT;
+
+ *aSrcLength = src - aSrc;
+ *aDestLength = dest - aDest;
+ return res;
+}
+
+nsresult nsUnicodeDecodeHelper::ConvertByMultiTable(
+ const char * aSrc,
+ int32_t * aSrcLength,
+ char16_t * aDest,
+ int32_t * aDestLength,
+ int32_t aTableCount,
+ const uRange * aRangeArray,
+ uScanClassID * aScanClassArray,
+ uMappingTable ** aMappingTable,
+ bool aErrorSignal)
+{
+ uint8_t * src = (uint8_t *)aSrc;
+ int32_t srcLen = *aSrcLength;
+ char16_t * dest = aDest;
+ char16_t * destEnd = aDest + *aDestLength;
+
+ char16_t med;
+ int32_t bcr; // byte count for read
+ nsresult res = NS_OK;
+ int32_t i;
+
+ while ((srcLen > 0) && (dest < destEnd))
+ {
+ bool done= false;
+ bool passRangeCheck = false;
+ bool passScan = false;
+ for (i=0; (!done) && (i<aTableCount); i++)
+ {
+ if ((aRangeArray[i].min <= *src) && (*src <= aRangeArray[i].max))
+ {
+ passRangeCheck = true;
+ if (uScan(aScanClassArray[i], nullptr, src,
+ reinterpret_cast<uint16_t*>(&med), srcLen,
+ (uint32_t *)&bcr))
+ {
+ passScan = true;
+ done = uMapCode((uTable*) aMappingTable[i],
+ static_cast<uint16_t>(med),
+ reinterpret_cast<uint16_t*>(dest));
+ } // if (uScan ... )
+ } // if Range
+ } // for loop
+
+ if(passRangeCheck && (! passScan))
+ {
+ if (res != NS_ERROR_ILLEGAL_INPUT)
+ res = NS_OK_UDEC_MOREINPUT;
+ break;
+ }
+ if(! done)
+ {
+ bcr = 1;
+ if ((uint8_t)*src < 0x20) {
+ // somehow some table miss the 0x00 - 0x20 part
+ *dest = *src;
+ } else if(*src == (uint8_t) 0xa0) {
+ // handle nbsp
+ *dest = 0x00a0;
+ } else {
+ // we need to decide how many byte we skip. We can use uScan to do this
+ for (i=0; i<aTableCount; i++)
+ {
+ if ((aRangeArray[i].min <= *src) && (*src <= aRangeArray[i].max))
+ {
+ if (uScan(aScanClassArray[i], nullptr, src,
+ reinterpret_cast<uint16_t*>(&med), srcLen,
+ (uint32_t*)&bcr))
+ {
+ // match the patten
+
+ int32_t k;
+ for(k = 1; k < bcr; k++)
+ {
+ if(0 == (src[k] & 0x80))
+ { // only skip if all bytes > 0x80
+ // if we hit bytes <= 0x80, skip only one byte
+ bcr = 1;
+ break;
+ }
+ }
+ break;
+ }
+ }
+ }
+ // treat it as NSBR if bcr == 1 and it is 0xa0
+ if ((1==bcr)&&(*src == (uint8_t)0xa0 )) {
+ *dest = 0x00a0;
+ } else {
+ if (aErrorSignal) {
+ res = NS_ERROR_ILLEGAL_INPUT;
+ break;
+ }
+ *dest = 0xfffd;
+ }
+ }
+ }
+
+ src += bcr;
+ srcLen -= bcr;
+ dest++;
+ } // while
+
+ if ((srcLen > 0) && (res == NS_OK)) res = NS_OK_UDEC_MOREOUTPUT;
+
+ *aSrcLength = src - (uint8_t *)aSrc;
+ *aDestLength = dest - aDest;
+ return res;
+}
+
+nsresult nsUnicodeDecodeHelper::ConvertByFastTable(
+ const char * aSrc,
+ int32_t * aSrcLength,
+ char16_t * aDest,
+ int32_t * aDestLength,
+ const char16_t * aFastTable,
+ int32_t aTableSize,
+ bool aErrorSignal)
+{
+ uint8_t * src = (uint8_t *)aSrc;
+ uint8_t * srcEnd = src;
+ char16_t * dest = aDest;
+
+ nsresult res;
+ if (*aSrcLength > *aDestLength) {
+ srcEnd += (*aDestLength);
+ res = NS_PARTIAL_MORE_OUTPUT;
+ } else {
+ srcEnd += (*aSrcLength);
+ res = NS_OK;
+ }
+
+ for (; src<srcEnd;) {
+ *dest = aFastTable[*src];
+ if (*dest == 0xfffd && aErrorSignal) {
+ res = NS_ERROR_ILLEGAL_INPUT;
+ break;
+ }
+ src++;
+ dest++;
+ }
+
+ *aSrcLength = src - (uint8_t *)aSrc;
+ *aDestLength = dest - aDest;
+ return res;
+}
+
+nsresult nsUnicodeDecodeHelper::CreateFastTable(
+ uMappingTable * aMappingTable,
+ char16_t * aFastTable,
+ int32_t aTableSize)
+{
+ int32_t tableSize = aTableSize;
+ int32_t buffSize = aTableSize;
+ auto buff = mozilla::MakeUnique<char[]>(buffSize);
+
+ char * p = buff.get();
+ for (int32_t i=0; i<aTableSize; i++) *(p++) = i;
+ return ConvertByTable(buff.get(), &buffSize, aFastTable, &tableSize,
+ u1ByteCharset, nullptr, aMappingTable);
+}
+