UNPKG

@zxing/library

Version:

TypeScript port of ZXing multi-format 1D/2D barcode image processing library.

194 lines (193 loc) 8.63 kB
/* * Copyright 2013 ZXing authors * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ // import java.util.Collection; // import java.util.Collections; import Collections from '../../util/Collections'; // import java.util.Comparator; // import java.util.Iterator; // import java.util.LinkedList; import State from './State'; import * as C from './EncoderConstants'; import * as CharMap from './CharMap'; import * as ShiftTable from './ShiftTable'; import StringUtils from '../../common/StringUtils'; /** * This produces nearly optimal encodings of text into the first-level of * encoding used by Aztec code. * * It uses a dynamic algorithm. For each prefix of the string, it determines * a set of encodings that could lead to this prefix. We repeatedly add a * character and generate a new set of optimal encodings until we have read * through the entire input. * * @author Frank Yellin * @author Rustam Abdullaev */ export default /*public final*/ class HighLevelEncoder { constructor(text) { this.text = text; } /** * @return text represented by this encoder encoded as a {@link BitArray} */ encode() { const spaceCharCode = StringUtils.getCharCode(' '); const lineBreakCharCode = StringUtils.getCharCode('\n'); let states = Collections.singletonList(State.INITIAL_STATE); for (let index = 0; index < this.text.length; index++) { let pairCode; let nextChar = index + 1 < this.text.length ? this.text[index + 1] : 0; switch (this.text[index]) { case StringUtils.getCharCode('\r'): pairCode = nextChar === lineBreakCharCode ? 2 : 0; break; case StringUtils.getCharCode('.'): pairCode = nextChar === spaceCharCode ? 3 : 0; break; case StringUtils.getCharCode(','): pairCode = nextChar === spaceCharCode ? 4 : 0; break; case StringUtils.getCharCode(':'): pairCode = nextChar === spaceCharCode ? 5 : 0; break; default: pairCode = 0; } if (pairCode > 0) { // We have one of the four special PUNCT pairs. Treat them specially. // Get a new set of states for the two new characters. states = HighLevelEncoder.updateStateListForPair(states, index, pairCode); index++; } else { // Get a new set of states for the new character. states = this.updateStateListForChar(states, index); } } // We are left with a set of states. Find the shortest one. const minState = Collections.min(states, (a, b) => { return a.getBitCount() - b.getBitCount(); }); // Convert it to a bit array, and return. return minState.toBitArray(this.text); } // We update a set of states for a new character by updating each state // for the new character, merging the results, and then removing the // non-optimal states. updateStateListForChar(states, index) { const result = []; for (let state /*State*/ of states) { this.updateStateForChar(state, index, result); } return HighLevelEncoder.simplifyStates(result); } // Return a set of states that represent the possible ways of updating this // state for the next character. The resulting set of states are added to // the "result" list. updateStateForChar(state, index, result) { let ch = (this.text[index] & 0xff); let charInCurrentTable = CharMap.CHAR_MAP[state.getMode()][ch] > 0; let stateNoBinary = null; for (let mode /*int*/ = 0; mode <= C.MODE_PUNCT; mode++) { let charInMode = CharMap.CHAR_MAP[mode][ch]; if (charInMode > 0) { if (stateNoBinary == null) { // Only create stateNoBinary the first time it's required. stateNoBinary = state.endBinaryShift(index); } // Try generating the character by latching to its mode if (!charInCurrentTable || mode === state.getMode() || mode === C.MODE_DIGIT) { // If the character is in the current table, we don't want to latch to // any other mode except possibly digit (which uses only 4 bits). Any // other latch would be equally successful *after* this character, and // so wouldn't save any bits. const latchState = stateNoBinary.latchAndAppend(mode, charInMode); result.push(latchState); } // Try generating the character by switching to its mode. if (!charInCurrentTable && ShiftTable.SHIFT_TABLE[state.getMode()][mode] >= 0) { // It never makes sense to temporarily shift to another mode if the // character exists in the current mode. That can never save bits. const shiftState = stateNoBinary.shiftAndAppend(mode, charInMode); result.push(shiftState); } } } if (state.getBinaryShiftByteCount() > 0 || CharMap.CHAR_MAP[state.getMode()][ch] === 0) { // It's never worthwhile to go into binary shift mode if you're not already // in binary shift mode, and the character exists in your current mode. // That can never save bits over just outputting the char in the current mode. let binaryState = state.addBinaryShiftChar(index); result.push(binaryState); } } static updateStateListForPair(states, index, pairCode) { const result = []; for (let state /*State*/ of states) { this.updateStateForPair(state, index, pairCode, result); } return this.simplifyStates(result); } static updateStateForPair(state, index, pairCode, result) { let stateNoBinary = state.endBinaryShift(index); // Possibility 1. Latch to C.MODE_PUNCT, and then append this code result.push(stateNoBinary.latchAndAppend(C.MODE_PUNCT, pairCode)); if (state.getMode() !== C.MODE_PUNCT) { // Possibility 2. Shift to C.MODE_PUNCT, and then append this code. // Every state except C.MODE_PUNCT (handled above) can shift result.push(stateNoBinary.shiftAndAppend(C.MODE_PUNCT, pairCode)); } if (pairCode === 3 || pairCode === 4) { // both characters are in DIGITS. Sometimes better to just add two digits let digitState = stateNoBinary .latchAndAppend(C.MODE_DIGIT, 16 - pairCode) // period or comma in DIGIT .latchAndAppend(C.MODE_DIGIT, 1); // space in DIGIT result.push(digitState); } if (state.getBinaryShiftByteCount() > 0) { // It only makes sense to do the characters as binary if we're already // in binary mode. let binaryState = state .addBinaryShiftChar(index) .addBinaryShiftChar(index + 1); result.push(binaryState); } } static simplifyStates(states) { let result = []; for (const newState of states) { let add = true; for (const oldState of result) { if (oldState.isBetterThanOrEqualTo(newState)) { add = false; break; } if (newState.isBetterThanOrEqualTo(oldState)) { // iterator.remove(); result = result.filter(x => x !== oldState); // remove old state } } if (add) { result.push(newState); } } return result; } }