123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652 |
- <?php
- declare(strict_types = 1);
- namespace BaconQrCode\Encoder;
- use BaconQrCode\Common\BitArray;
- use BaconQrCode\Common\CharacterSetEci;
- use BaconQrCode\Common\ErrorCorrectionLevel;
- use BaconQrCode\Common\Mode;
- use BaconQrCode\Common\ReedSolomonCodec;
- use BaconQrCode\Common\Version;
- use BaconQrCode\Exception\WriterException;
- use SplFixedArray;
- /**
- * Encoder.
- */
- final class Encoder
- {
- /**
- * Default byte encoding.
- */
- public const DEFAULT_BYTE_MODE_ECODING = 'ISO-8859-1';
- /**
- * The original table is defined in the table 5 of JISX0510:2004 (p.19).
- */
- private const ALPHANUMERIC_TABLE = [
- -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, // 0x00-0x0f
- -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, // 0x10-0x1f
- 36, -1, -1, -1, 37, 38, -1, -1, -1, -1, 39, 40, -1, 41, 42, 43, // 0x20-0x2f
- 0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 44, -1, -1, -1, -1, -1, // 0x30-0x3f
- -1, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, // 0x40-0x4f
- 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, -1, -1, -1, -1, -1, // 0x50-0x5f
- ];
- /**
- * Codec cache.
- *
- * @var array
- */
- private static $codecs = [];
- /**
- * Encodes "content" with the error correction level "ecLevel".
- */
- public static function encode(
- string $content,
- ErrorCorrectionLevel $ecLevel,
- string $encoding = self::DEFAULT_BYTE_MODE_ECODING
- ) : QrCode {
- // Pick an encoding mode appropriate for the content. Note that this
- // will not attempt to use multiple modes / segments even if that were
- // more efficient. Would be nice.
- $mode = self::chooseMode($content, $encoding);
- // This will store the header information, like mode and length, as well
- // as "header" segments like an ECI segment.
- $headerBits = new BitArray();
- // Append ECI segment if applicable
- if (Mode::BYTE() === $mode && self::DEFAULT_BYTE_MODE_ECODING !== $encoding) {
- $eci = CharacterSetEci::getCharacterSetEciByName($encoding);
- if (null !== $eci) {
- self::appendEci($eci, $headerBits);
- }
- }
- // (With ECI in place,) Write the mode marker
- self::appendModeInfo($mode, $headerBits);
- // Collect data within the main segment, separately, to count its size
- // if needed. Don't add it to main payload yet.
- $dataBits = new BitArray();
- self::appendBytes($content, $mode, $dataBits, $encoding);
- // Hard part: need to know version to know how many bits length takes.
- // But need to know how many bits it takes to know version. First we
- // take a guess at version by assuming version will be the minimum, 1:
- $provisionalBitsNeeded = $headerBits->getSize()
- + $mode->getCharacterCountBits(Version::getVersionForNumber(1))
- + $dataBits->getSize();
- $provisionalVersion = self::chooseVersion($provisionalBitsNeeded, $ecLevel);
- // Use that guess to calculate the right version. I am still not sure
- // this works in 100% of cases.
- $bitsNeeded = $headerBits->getSize()
- + $mode->getCharacterCountBits($provisionalVersion)
- + $dataBits->getSize();
- $version = self::chooseVersion($bitsNeeded, $ecLevel);
- $headerAndDataBits = new BitArray();
- $headerAndDataBits->appendBitArray($headerBits);
- // Find "length" of main segment and write it.
- $numLetters = (Mode::BYTE() === $mode ? $dataBits->getSizeInBytes() : strlen($content));
- self::appendLengthInfo($numLetters, $version, $mode, $headerAndDataBits);
- // Put data together into the overall payload.
- $headerAndDataBits->appendBitArray($dataBits);
- $ecBlocks = $version->getEcBlocksForLevel($ecLevel);
- $numDataBytes = $version->getTotalCodewords() - $ecBlocks->getTotalEcCodewords();
- // Terminate the bits properly.
- self::terminateBits($numDataBytes, $headerAndDataBits);
- // Interleave data bits with error correction code.
- $finalBits = self::interleaveWithEcBytes(
- $headerAndDataBits,
- $version->getTotalCodewords(),
- $numDataBytes,
- $ecBlocks->getNumBlocks()
- );
- // Choose the mask pattern.
- $dimension = $version->getDimensionForVersion();
- $matrix = new ByteMatrix($dimension, $dimension);
- $maskPattern = self::chooseMaskPattern($finalBits, $ecLevel, $version, $matrix);
- // Build the matrix.
- MatrixUtil::buildMatrix($finalBits, $ecLevel, $version, $maskPattern, $matrix);
- return new QrCode($mode, $ecLevel, $version, $maskPattern, $matrix);
- }
- /**
- * Gets the alphanumeric code for a byte.
- */
- private static function getAlphanumericCode(int $code) : int
- {
- if (isset(self::ALPHANUMERIC_TABLE[$code])) {
- return self::ALPHANUMERIC_TABLE[$code];
- }
- return -1;
- }
- /**
- * Chooses the best mode for a given content.
- */
- private static function chooseMode(string $content, string $encoding = null) : Mode
- {
- if (null !== $encoding && 0 === strcasecmp($encoding, 'SHIFT-JIS')) {
- return self::isOnlyDoubleByteKanji($content) ? Mode::KANJI() : Mode::BYTE();
- }
- $hasNumeric = false;
- $hasAlphanumeric = false;
- $contentLength = strlen($content);
- for ($i = 0; $i < $contentLength; ++$i) {
- $char = $content[$i];
- if (ctype_digit($char)) {
- $hasNumeric = true;
- } elseif (-1 !== self::getAlphanumericCode(ord($char))) {
- $hasAlphanumeric = true;
- } else {
- return Mode::BYTE();
- }
- }
- if ($hasAlphanumeric) {
- return Mode::ALPHANUMERIC();
- } elseif ($hasNumeric) {
- return Mode::NUMERIC();
- }
- return Mode::BYTE();
- }
- /**
- * Calculates the mask penalty for a matrix.
- */
- private static function calculateMaskPenalty(ByteMatrix $matrix) : int
- {
- return (
- MaskUtil::applyMaskPenaltyRule1($matrix)
- + MaskUtil::applyMaskPenaltyRule2($matrix)
- + MaskUtil::applyMaskPenaltyRule3($matrix)
- + MaskUtil::applyMaskPenaltyRule4($matrix)
- );
- }
- /**
- * Checks if content only consists of double-byte kanji characters.
- */
- private static function isOnlyDoubleByteKanji(string $content) : bool
- {
- $bytes = @iconv('utf-8', 'SHIFT-JIS', $content);
- if (false === $bytes) {
- return false;
- }
- $length = strlen($bytes);
- if (0 !== $length % 2) {
- return false;
- }
- for ($i = 0; $i < $length; $i += 2) {
- $byte = $bytes[$i] & 0xff;
- if (($byte < 0x81 || $byte > 0x9f) && $byte < 0xe0 || $byte > 0xeb) {
- return false;
- }
- }
- return true;
- }
- /**
- * Chooses the best mask pattern for a matrix.
- */
- private static function chooseMaskPattern(
- BitArray $bits,
- ErrorCorrectionLevel $ecLevel,
- Version $version,
- ByteMatrix $matrix
- ) : int {
- $minPenalty = PHP_INT_MAX;
- $bestMaskPattern = -1;
- for ($maskPattern = 0; $maskPattern < QrCode::NUM_MASK_PATTERNS; ++$maskPattern) {
- MatrixUtil::buildMatrix($bits, $ecLevel, $version, $maskPattern, $matrix);
- $penalty = self::calculateMaskPenalty($matrix);
- if ($penalty < $minPenalty) {
- $minPenalty = $penalty;
- $bestMaskPattern = $maskPattern;
- }
- }
- return $bestMaskPattern;
- }
- /**
- * Chooses the best version for the input.
- *
- * @throws WriterException if data is too big
- */
- private static function chooseVersion(int $numInputBits, ErrorCorrectionLevel $ecLevel) : Version
- {
- for ($versionNum = 1; $versionNum <= 40; ++$versionNum) {
- $version = Version::getVersionForNumber($versionNum);
- $numBytes = $version->getTotalCodewords();
- $ecBlocks = $version->getEcBlocksForLevel($ecLevel);
- $numEcBytes = $ecBlocks->getTotalEcCodewords();
- $numDataBytes = $numBytes - $numEcBytes;
- $totalInputBytes = intdiv($numInputBits + 8, 8);
- if ($numDataBytes >= $totalInputBytes) {
- return $version;
- }
- }
- throw new WriterException('Data too big');
- }
- /**
- * Terminates the bits in a bit array.
- *
- * @throws WriterException if data bits cannot fit in the QR code
- * @throws WriterException if bits size does not equal the capacity
- */
- private static function terminateBits(int $numDataBytes, BitArray $bits) : void
- {
- $capacity = $numDataBytes << 3;
- if ($bits->getSize() > $capacity) {
- throw new WriterException('Data bits cannot fit in the QR code');
- }
- for ($i = 0; $i < 4 && $bits->getSize() < $capacity; ++$i) {
- $bits->appendBit(false);
- }
- $numBitsInLastByte = $bits->getSize() & 0x7;
- if ($numBitsInLastByte > 0) {
- for ($i = $numBitsInLastByte; $i < 8; ++$i) {
- $bits->appendBit(false);
- }
- }
- $numPaddingBytes = $numDataBytes - $bits->getSizeInBytes();
- for ($i = 0; $i < $numPaddingBytes; ++$i) {
- $bits->appendBits(0 === ($i & 0x1) ? 0xec : 0x11, 8);
- }
- if ($bits->getSize() !== $capacity) {
- throw new WriterException('Bits size does not equal capacity');
- }
- }
- /**
- * Gets number of data- and EC bytes for a block ID.
- *
- * @return int[]
- * @throws WriterException if block ID is too large
- * @throws WriterException if EC bytes mismatch
- * @throws WriterException if RS blocks mismatch
- * @throws WriterException if total bytes mismatch
- */
- private static function getNumDataBytesAndNumEcBytesForBlockId(
- int $numTotalBytes,
- int $numDataBytes,
- int $numRsBlocks,
- int $blockId
- ) : array {
- if ($blockId >= $numRsBlocks) {
- throw new WriterException('Block ID too large');
- }
- $numRsBlocksInGroup2 = $numTotalBytes % $numRsBlocks;
- $numRsBlocksInGroup1 = $numRsBlocks - $numRsBlocksInGroup2;
- $numTotalBytesInGroup1 = intdiv($numTotalBytes, $numRsBlocks);
- $numTotalBytesInGroup2 = $numTotalBytesInGroup1 + 1;
- $numDataBytesInGroup1 = intdiv($numDataBytes, $numRsBlocks);
- $numDataBytesInGroup2 = $numDataBytesInGroup1 + 1;
- $numEcBytesInGroup1 = $numTotalBytesInGroup1 - $numDataBytesInGroup1;
- $numEcBytesInGroup2 = $numTotalBytesInGroup2 - $numDataBytesInGroup2;
- if ($numEcBytesInGroup1 !== $numEcBytesInGroup2) {
- throw new WriterException('EC bytes mismatch');
- }
- if ($numRsBlocks !== $numRsBlocksInGroup1 + $numRsBlocksInGroup2) {
- throw new WriterException('RS blocks mismatch');
- }
- if ($numTotalBytes !==
- (($numDataBytesInGroup1 + $numEcBytesInGroup1) * $numRsBlocksInGroup1)
- + (($numDataBytesInGroup2 + $numEcBytesInGroup2) * $numRsBlocksInGroup2)
- ) {
- throw new WriterException('Total bytes mismatch');
- }
- if ($blockId < $numRsBlocksInGroup1) {
- return [$numDataBytesInGroup1, $numEcBytesInGroup1];
- } else {
- return [$numDataBytesInGroup2, $numEcBytesInGroup2];
- }
- }
- /**
- * Interleaves data with EC bytes.
- *
- * @throws WriterException if number of bits and data bytes does not match
- * @throws WriterException if data bytes does not match offset
- * @throws WriterException if an interleaving error occurs
- */
- private static function interleaveWithEcBytes(
- BitArray $bits,
- int $numTotalBytes,
- int $numDataBytes,
- int $numRsBlocks
- ) : BitArray {
- if ($bits->getSizeInBytes() !== $numDataBytes) {
- throw new WriterException('Number of bits and data bytes does not match');
- }
- $dataBytesOffset = 0;
- $maxNumDataBytes = 0;
- $maxNumEcBytes = 0;
- $blocks = new SplFixedArray($numRsBlocks);
- for ($i = 0; $i < $numRsBlocks; ++$i) {
- list($numDataBytesInBlock, $numEcBytesInBlock) = self::getNumDataBytesAndNumEcBytesForBlockId(
- $numTotalBytes,
- $numDataBytes,
- $numRsBlocks,
- $i
- );
- $size = $numDataBytesInBlock;
- $dataBytes = $bits->toBytes(8 * $dataBytesOffset, $size);
- $ecBytes = self::generateEcBytes($dataBytes, $numEcBytesInBlock);
- $blocks[$i] = new BlockPair($dataBytes, $ecBytes);
- $maxNumDataBytes = max($maxNumDataBytes, $size);
- $maxNumEcBytes = max($maxNumEcBytes, count($ecBytes));
- $dataBytesOffset += $numDataBytesInBlock;
- }
- if ($numDataBytes !== $dataBytesOffset) {
- throw new WriterException('Data bytes does not match offset');
- }
- $result = new BitArray();
- for ($i = 0; $i < $maxNumDataBytes; ++$i) {
- foreach ($blocks as $block) {
- $dataBytes = $block->getDataBytes();
- if ($i < count($dataBytes)) {
- $result->appendBits($dataBytes[$i], 8);
- }
- }
- }
- for ($i = 0; $i < $maxNumEcBytes; ++$i) {
- foreach ($blocks as $block) {
- $ecBytes = $block->getErrorCorrectionBytes();
- if ($i < count($ecBytes)) {
- $result->appendBits($ecBytes[$i], 8);
- }
- }
- }
- if ($numTotalBytes !== $result->getSizeInBytes()) {
- throw new WriterException(
- 'Interleaving error: ' . $numTotalBytes . ' and ' . $result->getSizeInBytes() . ' differ'
- );
- }
- return $result;
- }
- /**
- * Generates EC bytes for given data.
- *
- * @param SplFixedArray<int> $dataBytes
- * @return SplFixedArray<int>
- */
- private static function generateEcBytes(SplFixedArray $dataBytes, int $numEcBytesInBlock) : SplFixedArray
- {
- $numDataBytes = count($dataBytes);
- $toEncode = new SplFixedArray($numDataBytes + $numEcBytesInBlock);
- for ($i = 0; $i < $numDataBytes; $i++) {
- $toEncode[$i] = $dataBytes[$i] & 0xff;
- }
- $ecBytes = new SplFixedArray($numEcBytesInBlock);
- $codec = self::getCodec($numDataBytes, $numEcBytesInBlock);
- $codec->encode($toEncode, $ecBytes);
- return $ecBytes;
- }
- /**
- * Gets an RS codec and caches it.
- */
- private static function getCodec(int $numDataBytes, int $numEcBytesInBlock) : ReedSolomonCodec
- {
- $cacheId = $numDataBytes . '-' . $numEcBytesInBlock;
- if (isset(self::$codecs[$cacheId])) {
- return self::$codecs[$cacheId];
- }
- return self::$codecs[$cacheId] = new ReedSolomonCodec(
- 8,
- 0x11d,
- 0,
- 1,
- $numEcBytesInBlock,
- 255 - $numDataBytes - $numEcBytesInBlock
- );
- }
- /**
- * Appends mode information to a bit array.
- */
- private static function appendModeInfo(Mode $mode, BitArray $bits) : void
- {
- $bits->appendBits($mode->getBits(), 4);
- }
- /**
- * Appends length information to a bit array.
- *
- * @throws WriterException if num letters is bigger than expected
- */
- private static function appendLengthInfo(int $numLetters, Version $version, Mode $mode, BitArray $bits) : void
- {
- $numBits = $mode->getCharacterCountBits($version);
- if ($numLetters >= (1 << $numBits)) {
- throw new WriterException($numLetters . ' is bigger than ' . ((1 << $numBits) - 1));
- }
- $bits->appendBits($numLetters, $numBits);
- }
- /**
- * Appends bytes to a bit array in a specific mode.
- *
- * @throws WriterException if an invalid mode was supplied
- */
- private static function appendBytes(string $content, Mode $mode, BitArray $bits, string $encoding) : void
- {
- switch ($mode) {
- case Mode::NUMERIC():
- self::appendNumericBytes($content, $bits);
- break;
- case Mode::ALPHANUMERIC():
- self::appendAlphanumericBytes($content, $bits);
- break;
- case Mode::BYTE():
- self::append8BitBytes($content, $bits, $encoding);
- break;
- case Mode::KANJI():
- self::appendKanjiBytes($content, $bits);
- break;
- default:
- throw new WriterException('Invalid mode: ' . $mode);
- }
- }
- /**
- * Appends numeric bytes to a bit array.
- */
- private static function appendNumericBytes(string $content, BitArray $bits) : void
- {
- $length = strlen($content);
- $i = 0;
- while ($i < $length) {
- $num1 = (int) $content[$i];
- if ($i + 2 < $length) {
- // Encode three numeric letters in ten bits.
- $num2 = (int) $content[$i + 1];
- $num3 = (int) $content[$i + 2];
- $bits->appendBits($num1 * 100 + $num2 * 10 + $num3, 10);
- $i += 3;
- } elseif ($i + 1 < $length) {
- // Encode two numeric letters in seven bits.
- $num2 = (int) $content[$i + 1];
- $bits->appendBits($num1 * 10 + $num2, 7);
- $i += 2;
- } else {
- // Encode one numeric letter in four bits.
- $bits->appendBits($num1, 4);
- ++$i;
- }
- }
- }
- /**
- * Appends alpha-numeric bytes to a bit array.
- *
- * @throws WriterException if an invalid alphanumeric code was found
- */
- private static function appendAlphanumericBytes(string $content, BitArray $bits) : void
- {
- $length = strlen($content);
- $i = 0;
- while ($i < $length) {
- $code1 = self::getAlphanumericCode(ord($content[$i]));
- if (-1 === $code1) {
- throw new WriterException('Invalid alphanumeric code');
- }
- if ($i + 1 < $length) {
- $code2 = self::getAlphanumericCode(ord($content[$i + 1]));
- if (-1 === $code2) {
- throw new WriterException('Invalid alphanumeric code');
- }
- // Encode two alphanumeric letters in 11 bits.
- $bits->appendBits($code1 * 45 + $code2, 11);
- $i += 2;
- } else {
- // Encode one alphanumeric letter in six bits.
- $bits->appendBits($code1, 6);
- ++$i;
- }
- }
- }
- /**
- * Appends regular 8-bit bytes to a bit array.
- *
- * @throws WriterException if content cannot be encoded to target encoding
- */
- private static function append8BitBytes(string $content, BitArray $bits, string $encoding) : void
- {
- $bytes = @iconv('utf-8', $encoding, $content);
- if (false === $bytes) {
- throw new WriterException('Could not encode content to ' . $encoding);
- }
- $length = strlen($bytes);
- for ($i = 0; $i < $length; $i++) {
- $bits->appendBits(ord($bytes[$i]), 8);
- }
- }
- /**
- * Appends KANJI bytes to a bit array.
- *
- * @throws WriterException if content does not seem to be encoded in SHIFT-JIS
- * @throws WriterException if an invalid byte sequence occurs
- */
- private static function appendKanjiBytes(string $content, BitArray $bits) : void
- {
- if (strlen($content) % 2 > 0) {
- // We just do a simple length check here. The for loop will check
- // individual characters.
- throw new WriterException('Content does not seem to be encoded in SHIFT-JIS');
- }
- $length = strlen($content);
- for ($i = 0; $i < $length; $i += 2) {
- $byte1 = ord($content[$i]) & 0xff;
- $byte2 = ord($content[$i + 1]) & 0xff;
- $code = ($byte1 << 8) | $byte2;
- if ($code >= 0x8140 && $code <= 0x9ffc) {
- $subtracted = $code - 0x8140;
- } elseif ($code >= 0xe040 && $code <= 0xebbf) {
- $subtracted = $code - 0xc140;
- } else {
- throw new WriterException('Invalid byte sequence');
- }
- $encoded = (($subtracted >> 8) * 0xc0) + ($subtracted & 0xff);
- $bits->appendBits($encoded, 13);
- }
- }
- /**
- * Appends ECI information to a bit array.
- */
- private static function appendEci(CharacterSetEci $eci, BitArray $bits) : void
- {
- $mode = Mode::ECI();
- $bits->appendBits($mode->getBits(), 4);
- $bits->appendBits($eci->getValue(), 8);
- }
- }
|