summaryrefslogtreecommitdiff
path: root/fxbarcode/pdf417/BC_PDF417HighLevelEncoder.cpp
diff options
context:
space:
mode:
Diffstat (limited to 'fxbarcode/pdf417/BC_PDF417HighLevelEncoder.cpp')
-rw-r--r--fxbarcode/pdf417/BC_PDF417HighLevelEncoder.cpp430
1 files changed, 430 insertions, 0 deletions
diff --git a/fxbarcode/pdf417/BC_PDF417HighLevelEncoder.cpp b/fxbarcode/pdf417/BC_PDF417HighLevelEncoder.cpp
new file mode 100644
index 0000000000..ac8b0186f6
--- /dev/null
+++ b/fxbarcode/pdf417/BC_PDF417HighLevelEncoder.cpp
@@ -0,0 +1,430 @@
+// Copyright 2014 PDFium Authors. All rights reserved.
+// Use of this source code is governed by a BSD-style license that can be
+// found in the LICENSE file.
+
+// Original code copyright 2014 Foxit Software Inc. http://www.foxitsoftware.com
+// Original code is licensed as follows:
+/*
+ * Copyright 2006 Jeremias Maerki in part, and ZXing Authors in part
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License");
+ * you may not use this file except in compliance with the License.
+ * You may obtain a copy of the License at
+ *
+ * http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * Unless required by applicable law or agreed to in writing, software
+ * distributed under the License is distributed on an "AS IS" BASIS,
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+ * See the License for the specific language governing permissions and
+ * limitations under the License.
+ */
+
+#include "fxbarcode/pdf417/BC_PDF417HighLevelEncoder.h"
+
+#include "fxbarcode/BC_UtilCodingConvert.h"
+#include "fxbarcode/pdf417/BC_PDF417Compaction.h"
+#include "fxbarcode/utils.h"
+#include "third_party/bigint/BigIntegerLibrary.hh"
+
+#define SUBMODE_ALPHA 0  // Text sub-mode: upper-case letters and space; the sub-mode encodeHighLevel() starts in.
+#define SUBMODE_LOWER 1  // Text sub-mode: lower-case letters and space.
+#define SUBMODE_MIXED 2  // Text sub-mode: the characters listed in TEXT_MIXED_RAW.
+
+int32_t CBC_PDF417HighLevelEncoder::TEXT_COMPACTION = 0;  // Encoding-mode id tracked by encodeHighLevel().
+int32_t CBC_PDF417HighLevelEncoder::BYTE_COMPACTION = 1;  // Encoding-mode id tracked by encodeHighLevel().
+int32_t CBC_PDF417HighLevelEncoder::NUMERIC_COMPACTION = 2;  // Encoding-mode id tracked by encodeHighLevel().
+int32_t CBC_PDF417HighLevelEncoder::SUBMODE_PUNCTUATION = 3;  // Fourth text sub-mode; handled by the default case in encodeText().
+int32_t CBC_PDF417HighLevelEncoder::LATCH_TO_TEXT = 900;  // Codeword appended when encodeHighLevel() switches to text encoding.
+int32_t CBC_PDF417HighLevelEncoder::LATCH_TO_BYTE_PADDED = 901;  // Codeword appended by encodeBinary() before bytes written one per codeword.
+int32_t CBC_PDF417HighLevelEncoder::LATCH_TO_NUMERIC = 902;  // Codeword appended before numerically encoded digits.
+int32_t CBC_PDF417HighLevelEncoder::SHIFT_TO_BYTE = 913;  // Codeword appended by encodeBinary() for one byte while in text mode.
+int32_t CBC_PDF417HighLevelEncoder::LATCH_TO_BYTE = 924;  // Codeword appended by encodeBinary() before 6-byte groups.
+uint8_t CBC_PDF417HighLevelEncoder::TEXT_MIXED_RAW[] = {  // Index = mixed sub-mode value, entry = character code; 0 = unused slot.
+ 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 38, 13, 9, 44, 58,  // '0'-'9', '&', CR, TAB, ',', ':'
+ 35, 45, 46, 36, 47, 43, 37, 42, 61, 94, 0, 32, 0, 0, 0};  // '#', '-', '.', '$', '/', '+', '%', '*', '=', '^', unused, ' ', unused x3
+uint8_t CBC_PDF417HighLevelEncoder::TEXT_PUNCTUATION_RAW[] = {  // Index = punctuation sub-mode value, entry = character code; 0 = unused slot.
+ 59, 60, 62, 64, 91, 92, 93, 95, 96, 126, 33, 13, 9, 44, 58,  // ';', '<', '>', '@', '[', backslash, ']', '_', '`', '~', '!', CR, TAB, ',', ':'
+ 10, 45, 46, 36, 47, 34, 124, 42, 40, 41, 63, 123, 125, 39, 0};  // LF, '-', '.', '$', '/', '"', '|', '*', '(', ')', '?', '{', '}', apostrophe, unused
+int32_t CBC_PDF417HighLevelEncoder::MIXED[128] = {0};  // Character code -> mixed sub-mode value, -1 if absent; filled by Inverse().
+int32_t CBC_PDF417HighLevelEncoder::PUNCTUATION[128] = {0};  // Character code -> punctuation sub-mode value, -1 if absent; filled by Inverse().
+
+// One-time setup: builds the MIXED and PUNCTUATION reverse lookup tables by
+// delegating to Inverse().
+void CBC_PDF417HighLevelEncoder::Initialize() {
+  Inverse();
+}
+
+// Counterpart of Initialize(). Intentionally empty: this function performs no
+// work.
+void CBC_PDF417HighLevelEncoder::Finalize() {}
+
+// Converts |wideMsg| to UTF-8 and encodes the resulting bytes into a string
+// whose characters are codeword values.
+//
+// |compaction| selects the strategy:
+//   TEXT    - the whole message is passed to encodeText().
+//   BYTES   - the whole message is passed to encodeBinary().
+//   NUMERIC - LATCH_TO_NUMERIC is emitted, then encodeNumeric() is used.
+//   other   - the message is scanned and, per run, numeric (13 or more
+//             digits), text (5 or more text characters) or binary encoding
+//             is chosen.
+//
+// |e| is only written on failure; it receives the error reported by
+// determineConsecutiveBinaryCount(), in which case L" " is returned. The
+// caller is expected to pass it in already set to BCExceptionNO.
+CFX_WideString CBC_PDF417HighLevelEncoder::encodeHighLevel(
+    CFX_WideString wideMsg,
+    Compaction compaction,
+    int32_t& e) {
+  CFX_ByteString bytes;
+  CBC_UtilCodingConvert::UnicodeToUTF8(wideMsg, bytes);
+
+  // |msg| holds one wide character per UTF-8 byte and |byteArr| holds the same
+  // bytes as raw values, so both can be indexed with the same position. Every
+  // byte maps to exactly one wide character, so no per-character validity
+  // check is needed while copying.
+  const int32_t byteCount = bytes.GetLength();
+  CFX_WideString msg;
+  std::vector<uint8_t> byteArr;
+  byteArr.reserve(byteCount);
+  for (int32_t i = 0; i < byteCount; i++) {
+    msg += (wchar_t)(bytes.GetAt(i) & 0xff);
+    byteArr.push_back(bytes.GetAt(i));
+  }
+
+  CFX_WideString sb;
+  const int32_t len = msg.GetLength();
+  int32_t p = 0;
+  int32_t textSubMode = SUBMODE_ALPHA;
+  if (compaction == TEXT) {
+    // Nothing to encode for an empty message; do not ask encodeText() to read
+    // a character that does not exist.
+    if (len > 0)
+      encodeText(msg, p, len, sb, textSubMode);
+  } else if (compaction == BYTES) {
+    encodeBinary(&byteArr, p, byteArr.size(), BYTE_COMPACTION, sb);
+  } else if (compaction == NUMERIC) {
+    sb += (wchar_t)LATCH_TO_NUMERIC;
+    encodeNumeric(msg, p, len, sb);
+  } else {
+    // Starts out different from TEXT_COMPACTION, so the first text run is
+    // preceded by an explicit LATCH_TO_TEXT codeword.
+    int32_t encodingMode = LATCH_TO_TEXT;
+    while (p < len) {
+      int32_t n = determineConsecutiveDigitCount(msg, p);
+      if (n >= 13) {
+        sb += (wchar_t)LATCH_TO_NUMERIC;
+        encodingMode = NUMERIC_COMPACTION;
+        textSubMode = SUBMODE_ALPHA;
+        encodeNumeric(msg, p, n, sb);
+        p += n;
+        continue;
+      }
+
+      int32_t t = determineConsecutiveTextCount(msg, p);
+      if (t >= 5 || n == len) {
+        if (encodingMode != TEXT_COMPACTION) {
+          sb += (wchar_t)LATCH_TO_TEXT;
+          encodingMode = TEXT_COMPACTION;
+          textSubMode = SUBMODE_ALPHA;
+        }
+        textSubMode = encodeText(msg, p, t, sb, textSubMode);
+        p += t;
+        continue;
+      }
+
+      int32_t b = determineConsecutiveBinaryCount(msg, &byteArr, p, e);
+      if (e != BCExceptionNO)
+        return L" ";
+      // Always make progress, even when no binary run was detected.
+      if (b == 0)
+        b = 1;
+      if (b == 1 && encodingMode == TEXT_COMPACTION) {
+        // A single byte inside text: encoded as a shift, so the text mode and
+        // sub-mode stay in effect afterwards.
+        encodeBinary(&byteArr, p, 1, TEXT_COMPACTION, sb);
+      } else {
+        encodeBinary(&byteArr, p, b, encodingMode, sb);
+        encodingMode = BYTE_COMPACTION;
+        textSubMode = SUBMODE_ALPHA;
+      }
+      p += b;
+    }
+  }
+  return sb;
+}
+
+// Builds the reverse lookup tables MIXED and PUNCTUATION: for each character
+// code listed in TEXT_MIXED_RAW / TEXT_PUNCTUATION_RAW the table stores the
+// position of that code in the raw array; every other entry is -1. Raw
+// entries equal to 0 are placeholders and are skipped.
+void CBC_PDF417HighLevelEncoder::Inverse() {
+  size_t slot = FX_ArraySize(MIXED);
+  while (slot > 0)
+    MIXED[--slot] = -1;
+
+  for (size_t value = 0; value < FX_ArraySize(TEXT_MIXED_RAW); ++value) {
+    const uint8_t code = TEXT_MIXED_RAW[value];
+    if (code == 0)
+      continue;
+    MIXED[code] = static_cast<int32_t>(value);
+  }
+
+  slot = FX_ArraySize(PUNCTUATION);
+  while (slot > 0)
+    PUNCTUATION[--slot] = -1;
+
+  for (size_t value = 0; value < FX_ArraySize(TEXT_PUNCTUATION_RAW); ++value) {
+    const uint8_t code = TEXT_PUNCTUATION_RAW[value];
+    if (code == 0)
+      continue;
+    PUNCTUATION[code] = static_cast<int32_t>(value);
+  }
+}
+
+// Encodes |count| characters of |msg|, starting at |startpos|, using the text
+// sub-modes (alpha, lower, mixed, punctuation) and appends the resulting
+// codewords to |sb|.
+//
+// Each character becomes one or more values below 30 (sub-mode switches and
+// shifts are values 25-29); two consecutive values are then packed into one
+// codeword as high * 30 + low, and an odd trailing value is padded with 29.
+//
+// |initialSubmode| is the sub-mode in effect on entry. Returns the sub-mode in
+// effect after the last character, or |initialSubmode| unchanged when |count|
+// is not positive (nothing is appended in that case).
+//
+// NOTE: the function has no error channel. A character that belongs to none
+// of the sub-modes is emitted as a punctuation shift followed by the value -1.
+int32_t CBC_PDF417HighLevelEncoder::encodeText(CFX_WideString msg,
+                                               int32_t startpos,
+                                               int32_t count,
+                                               CFX_WideString& sb,
+                                               int32_t initialSubmode) {
+  // Nothing to encode; in particular, do not read msg[startpos].
+  if (count <= 0)
+    return initialSubmode;
+
+  CFX_WideString tmp;
+  int32_t submode = initialSubmode;
+  int32_t idx = 0;
+  while (idx < count) {
+    wchar_t ch = msg.GetAt(startpos + idx);
+    // Punctuation value of |ch|, or -1 when |ch| is not a punctuation
+    // character. The range check keeps characters with codes beyond the table
+    // from indexing outside PUNCTUATION.
+    const wchar_t punct =
+        static_cast<uint32_t>(ch) < FX_ArraySize(PUNCTUATION)
+            ? static_cast<wchar_t>(PUNCTUATION[ch])
+            : static_cast<wchar_t>(-1);
+    // In every case below, "continue" re-processes the same character in the
+    // newly selected sub-mode, while "break" moves on to the next character.
+    switch (submode) {
+      case SUBMODE_ALPHA:
+        if (isAlphaUpper(ch)) {
+          if (ch == ' ') {
+            tmp += (wchar_t)26;
+          } else {
+            tmp += (wchar_t)(ch - 65);
+          }
+        } else {
+          if (isAlphaLower(ch)) {
+            submode = SUBMODE_LOWER;
+            tmp += (wchar_t)27;
+            continue;
+          } else if (isMixed(ch)) {
+            submode = SUBMODE_MIXED;
+            tmp += (wchar_t)28;
+            continue;
+          } else {
+            // Shift to punctuation for this one character only.
+            tmp += (wchar_t)29;
+            tmp += punct;
+            break;
+          }
+        }
+        break;
+      case SUBMODE_LOWER:
+        if (isAlphaLower(ch)) {
+          if (ch == ' ') {
+            tmp += (wchar_t)26;
+          } else {
+            tmp += (wchar_t)(ch - 97);
+          }
+        } else {
+          if (isAlphaUpper(ch)) {
+            // Shift to alpha for this one character only.
+            tmp += (wchar_t)27;
+            tmp += (wchar_t)(ch - 65);
+            break;
+          } else if (isMixed(ch)) {
+            submode = SUBMODE_MIXED;
+            tmp += (wchar_t)28;
+            continue;
+          } else {
+            // Shift to punctuation for this one character only.
+            tmp += (wchar_t)29;
+            tmp += punct;
+            break;
+          }
+        }
+        break;
+      case SUBMODE_MIXED:
+        if (isMixed(ch)) {
+          tmp += MIXED[ch];
+        } else {
+          if (isAlphaUpper(ch)) {
+            submode = SUBMODE_ALPHA;
+            tmp += (wchar_t)28;
+            continue;
+          } else if (isAlphaLower(ch)) {
+            submode = SUBMODE_LOWER;
+            tmp += (wchar_t)27;
+            continue;
+          } else {
+            // Latch to punctuation when the following character is
+            // punctuation as well; otherwise shift for this character only.
+            if (startpos + idx + 1 < count) {
+              wchar_t next = msg.GetAt(startpos + idx + 1);
+              if (isPunctuation(next)) {
+                submode = SUBMODE_PUNCTUATION;
+                tmp += (wchar_t)25;
+                continue;
+              }
+            }
+            tmp += (wchar_t)29;
+            tmp += punct;
+          }
+        }
+        break;
+      default:
+        // SUBMODE_PUNCTUATION.
+        if (isPunctuation(ch)) {
+          tmp += punct;
+        } else {
+          submode = SUBMODE_ALPHA;
+          tmp += (wchar_t)29;
+          continue;
+        }
+    }
+    idx++;
+  }
+
+  // Pack pairs of sub-mode values into codewords.
+  wchar_t h = 0;
+  int32_t len = tmp.GetLength();
+  for (int32_t i = 0; i < len; i++) {
+    bool odd = (i % 2) != 0;
+    if (odd) {
+      h = (wchar_t)((h * 30) + tmp.GetAt(i));
+      sb += h;
+    } else {
+      h = tmp.GetAt(i);
+    }
+  }
+  // An unpaired trailing value is completed with the padding value 29.
+  if ((len % 2) != 0) {
+    sb += (wchar_t)((h * 30) + 29);
+  }
+  return submode;
+}
+// Encodes |count| bytes of |bytes|, starting at |startpos|, as byte-compaction
+// codewords appended to |sb|.
+//
+// Exactly one mode codeword is emitted first:
+//   SHIFT_TO_BYTE        - a single byte while |startmode| is TEXT_COMPACTION;
+//                          the shift applies to the next codeword only, so it
+//                          must be followed directly by the byte value.
+//   LATCH_TO_BYTE        - |count| is a multiple of six.
+//   LATCH_TO_BYTE_PADDED - any other |count|.
+// Then every full group of six bytes is written as five base-900 codewords
+// (most significant first) and any remaining bytes as one codeword each.
+// Nothing is appended when |count| is not positive.
+//
+// The caller must ensure that [startpos, startpos + count) lies inside
+// |bytes|.
+void CBC_PDF417HighLevelEncoder::encodeBinary(std::vector<uint8_t>* bytes,
+                                              int32_t startpos,
+                                              int32_t count,
+                                              int32_t startmode,
+                                              CFX_WideString& sb) {
+  if (count <= 0)
+    return;
+
+  if (count == 1 && startmode == TEXT_COMPACTION) {
+    sb += (wchar_t)SHIFT_TO_BYTE;
+  } else if (count % 6 == 0) {
+    sb += (wchar_t)LATCH_TO_BYTE;
+  } else {
+    sb += (wchar_t)LATCH_TO_BYTE_PADDED;
+  }
+
+  const int32_t end = startpos + count;
+  int32_t idx = startpos;
+  wchar_t chars[5];
+  while (end - idx >= 6) {
+    // Six bytes form a 48-bit number ...
+    int64_t t = 0;
+    for (int32_t i = 0; i < 6; i++) {
+      t <<= 8;
+      t += (*bytes)[idx + i] & 0xff;
+    }
+    // ... which is written as five base-900 digits, most significant first.
+    for (int32_t i = 0; i < 5; i++) {
+      chars[i] = (wchar_t)(t % 900);
+      t /= 900;
+    }
+    for (int32_t i = 4; i >= 0; i--) {
+      sb += (chars[i]);
+    }
+    idx += 6;
+  }
+
+  // Remaining bytes (fewer than six) are written one per codeword.
+  for (; idx < end; idx++) {
+    int32_t ch = (*bytes)[idx] & 0xff;
+    sb += (wchar_t)ch;
+  }
+}
+// Encodes |count| digits of |msg|, starting at |startpos|, as numeric
+// codewords appended to |sb|. The digits are processed in chunks of at most
+// 44; each chunk is prefixed with the digit '1', read as one big decimal
+// number and written out as its base-900 digits, most significant first.
+void CBC_PDF417HighLevelEncoder::encodeNumeric(CFX_WideString msg,
+                                               int32_t startpos,
+                                               int32_t count,
+                                               CFX_WideString& sb) {
+  BigInteger base = 900;
+  int32_t done = 0;
+  while (done < count) {
+    const int32_t remaining = count - done;
+    const int32_t chunkLen = remaining > 44 ? 44 : remaining;
+
+    CFX_WideString chunk = msg.Mid(startpos + done, chunkLen);
+    CFX_ByteString decimal = ((wchar_t)'1' + chunk).UTF8Encode();
+    BigInteger value = stringToBigInteger(decimal.c_str());
+
+    // Collect the base-900 digits least significant first ...
+    CFX_WideString reversed;
+    do {
+      int32_t digit = (value % base).toInt();
+      reversed += (wchar_t)(digit);
+      value = value / base;
+    } while (!value.isZero());
+
+    // ... then append them in the opposite order.
+    int32_t i = reversed.GetLength();
+    while (i-- > 0) {
+      sb += reversed.GetAt(i);
+    }
+    done += chunkLen;
+  }
+}
+// True when |ch| is one of the characters '0' through '9'.
+bool CBC_PDF417HighLevelEncoder::isDigit(wchar_t ch) {
+  if (ch < '0')
+    return false;
+  return ch <= '9';
+}
+// True when |ch| can be encoded in the alpha sub-mode: a space or one of the
+// letters 'A' through 'Z'.
+bool CBC_PDF417HighLevelEncoder::isAlphaUpper(wchar_t ch) {
+  if (ch == ' ')
+    return true;
+  return 'A' <= ch && ch <= 'Z';
+}
+// True when |ch| can be encoded in the lower sub-mode: a space or one of the
+// letters 'a' through 'z'.
+bool CBC_PDF417HighLevelEncoder::isAlphaLower(wchar_t ch) {
+  if (ch == ' ')
+    return true;
+  return 'a' <= ch && ch <= 'z';
+}
+// True when |ch| has an entry in the MIXED lookup table, i.e. it is one of the
+// characters listed in TEXT_MIXED_RAW. Characters whose code lies outside the
+// table are never mixed characters; the range check keeps them from indexing
+// past the end of MIXED.
+bool CBC_PDF417HighLevelEncoder::isMixed(wchar_t ch) {
+  return static_cast<uint32_t>(ch) < FX_ArraySize(MIXED) && MIXED[ch] != -1;
+}
+// True when |ch| has an entry in the PUNCTUATION lookup table, i.e. it is one
+// of the characters listed in TEXT_PUNCTUATION_RAW. Characters whose code lies
+// outside the table are never punctuation characters; the range check keeps
+// them from indexing past the end of PUNCTUATION.
+bool CBC_PDF417HighLevelEncoder::isPunctuation(wchar_t ch) {
+  return static_cast<uint32_t>(ch) < FX_ArraySize(PUNCTUATION) &&
+         PUNCTUATION[ch] != -1;
+}
+// True when |ch| counts as a text character: any code from 32 through 126, or
+// one of tab, line feed and carriage return.
+bool CBC_PDF417HighLevelEncoder::isText(wchar_t ch) {
+  if (ch >= 32 && ch <= 126)
+    return true;
+  return ch == '\t' || ch == '\n' || ch == '\r';
+}
+// Returns the number of consecutive digits in |msg| beginning at |startpos|
+// (0 when |startpos| is at or past the end, or the character there is not a
+// digit).
+int32_t CBC_PDF417HighLevelEncoder::determineConsecutiveDigitCount(
+    CFX_WideString msg,
+    int32_t startpos) {
+  const int32_t msgLen = msg.GetLength();
+  int32_t pos = startpos;
+  while (pos < msgLen && isDigit(msg.GetAt(pos))) {
+    ++pos;
+  }
+  return pos - startpos;
+}
+// Returns how many characters of |msg|, beginning at |startpos|, should be
+// handled as text. The scan stops at the first non-text character, at the end
+// of the message, or in front of a run of 13 digits (that run is excluded
+// from the count). Shorter digit runs are counted as text.
+int32_t CBC_PDF417HighLevelEncoder::determineConsecutiveTextCount(
+    CFX_WideString msg,
+    int32_t startpos) {
+  const int32_t msgLen = msg.GetLength();
+  int32_t pos = startpos;
+  while (pos < msgLen) {
+    // Consume up to 13 digits starting at the current position.
+    int32_t digitRun = 0;
+    while (digitRun < 13 && pos < msgLen && isDigit(msg.GetAt(pos))) {
+      ++digitRun;
+      ++pos;
+    }
+    if (digitRun >= 13) {
+      // Report only the characters in front of the digit run.
+      return pos - startpos - digitRun;
+    }
+    if (digitRun == 0) {
+      // Not a digit: it either extends the text run or ends it.
+      if (!isText(msg.GetAt(pos))) {
+        break;
+      }
+      ++pos;
+    }
+  }
+  return pos - startpos;
+}
+// Returns how many characters of |msg|, beginning at |startpos|, should be
+// encoded as bytes. The scan advances one position at a time and stops in
+// front of the first position from which 13 digits, or 5 text characters, can
+// be read.
+//
+// If a position holds the byte value 63 in |bytes| while the character in
+// |msg| is not '?', |e| is set to BCExceptionNonEncodableCharacterDetected and
+// -1 is returned. |e| is not modified otherwise.
+int32_t CBC_PDF417HighLevelEncoder::determineConsecutiveBinaryCount(
+    CFX_WideString msg,
+    std::vector<uint8_t>* bytes,
+    int32_t startpos,
+    int32_t& e) {
+  const int32_t msgLen = msg.GetLength();
+  int32_t pos = startpos;
+  for (; pos < msgLen; ++pos) {
+    wchar_t cur = msg.GetAt(pos);
+
+    // Look ahead for up to 13 digits.
+    int32_t digits = 0;
+    while (digits < 13 && isDigit(cur)) {
+      ++digits;
+      if (pos + digits >= msgLen) {
+        break;
+      }
+      cur = msg.GetAt(pos + digits);
+    }
+    if (digits >= 13) {
+      return pos - startpos;
+    }
+
+    // Look ahead for up to 5 text characters. |cur| deliberately keeps the
+    // value the digit scan left in it, so the first character tested here is
+    // the one on which that scan stopped.
+    int32_t texts = 0;
+    while (texts < 5 && isText(cur)) {
+      ++texts;
+      if (pos + texts >= msgLen) {
+        break;
+      }
+      cur = msg.GetAt(pos + texts);
+    }
+    if (texts >= 5) {
+      return pos - startpos;
+    }
+
+    if ((*bytes)[pos] == 63 && msg.GetAt(pos) != '?') {
+      e = BCExceptionNonEncodableCharacterDetected;
+      return -1;
+    }
+  }
+  return pos - startpos;
+}