| 123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652 | <?phpdeclare(strict_types = 1);namespace BaconQrCode\Encoder;use BaconQrCode\Common\BitArray;use BaconQrCode\Common\CharacterSetEci;use BaconQrCode\Common\ErrorCorrectionLevel;use BaconQrCode\Common\Mode;use BaconQrCode\Common\ReedSolomonCodec;use BaconQrCode\Common\Version;use BaconQrCode\Exception\WriterException;use SplFixedArray;/** * Encoder. */final class Encoder{    /**     * Default byte encoding.     */    public const DEFAULT_BYTE_MODE_ECODING = 'ISO-8859-1';    /**     * The original table is defined in the table 5 of JISX0510:2004 (p.19).     */    private const ALPHANUMERIC_TABLE = [        -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,  // 0x00-0x0f        -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1, -1,  // 0x10-0x1f        36, -1, -1, -1, 37, 38, -1, -1, -1, -1, 39, 40, -1, 41, 42, 43,  // 0x20-0x2f        0,   1,  2,  3,  4,  5,  6,  7,  8,  9, 44, -1, -1, -1, -1, -1,  // 0x30-0x3f        -1, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24,  // 0x40-0x4f        25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, -1, -1, -1, -1, -1,  // 0x50-0x5f    ];    /**     * Codec cache.     *     * @var array     */    private static $codecs = [];    /**     * Encodes "content" with the error correction level "ecLevel".     */    public static function encode(        string $content,        ErrorCorrectionLevel $ecLevel,        string $encoding = self::DEFAULT_BYTE_MODE_ECODING    ) : QrCode {        // Pick an encoding mode appropriate for the content. Note that this        // will not attempt to use multiple modes / segments even if that were        // more efficient. Would be nice.        $mode = self::chooseMode($content, $encoding);        // This will store the header information, like mode and length, as well        // as "header" segments like an ECI segment.        $headerBits = new BitArray();        // Append ECI segment if applicable        if (Mode::BYTE() === $mode && self::DEFAULT_BYTE_MODE_ECODING !== $encoding) {            $eci = CharacterSetEci::getCharacterSetEciByName($encoding);            if (null !== $eci) {                self::appendEci($eci, $headerBits);            }        }        // (With ECI in place,) Write the mode marker        self::appendModeInfo($mode, $headerBits);        // Collect data within the main segment, separately, to count its size        // if needed. Don't add it to main payload yet.        $dataBits = new BitArray();        self::appendBytes($content, $mode, $dataBits, $encoding);        // Hard part: need to know version to know how many bits length takes.        // But need to know how many bits it takes to know version. First we        // take a guess at version by assuming version will be the minimum, 1:        $provisionalBitsNeeded = $headerBits->getSize()            + $mode->getCharacterCountBits(Version::getVersionForNumber(1))            + $dataBits->getSize();        $provisionalVersion = self::chooseVersion($provisionalBitsNeeded, $ecLevel);        // Use that guess to calculate the right version. I am still not sure        // this works in 100% of cases.        $bitsNeeded = $headerBits->getSize()            + $mode->getCharacterCountBits($provisionalVersion)            + $dataBits->getSize();        $version = self::chooseVersion($bitsNeeded, $ecLevel);        $headerAndDataBits = new BitArray();        $headerAndDataBits->appendBitArray($headerBits);        // Find "length" of main segment and write it.        $numLetters = (Mode::BYTE() === $mode ? $dataBits->getSizeInBytes() : strlen($content));        self::appendLengthInfo($numLetters, $version, $mode, $headerAndDataBits);        // Put data together into the overall payload.        $headerAndDataBits->appendBitArray($dataBits);        $ecBlocks = $version->getEcBlocksForLevel($ecLevel);        $numDataBytes = $version->getTotalCodewords() - $ecBlocks->getTotalEcCodewords();        // Terminate the bits properly.        self::terminateBits($numDataBytes, $headerAndDataBits);        // Interleave data bits with error correction code.        $finalBits = self::interleaveWithEcBytes(            $headerAndDataBits,            $version->getTotalCodewords(),            $numDataBytes,            $ecBlocks->getNumBlocks()        );        // Choose the mask pattern.        $dimension = $version->getDimensionForVersion();        $matrix = new ByteMatrix($dimension, $dimension);        $maskPattern = self::chooseMaskPattern($finalBits, $ecLevel, $version, $matrix);        // Build the matrix.        MatrixUtil::buildMatrix($finalBits, $ecLevel, $version, $maskPattern, $matrix);        return new QrCode($mode, $ecLevel, $version, $maskPattern, $matrix);    }    /**     * Gets the alphanumeric code for a byte.     */    private static function getAlphanumericCode(int $code) : int    {        if (isset(self::ALPHANUMERIC_TABLE[$code])) {            return self::ALPHANUMERIC_TABLE[$code];        }        return -1;    }    /**     * Chooses the best mode for a given content.     */    private static function chooseMode(string $content, string $encoding = null) : Mode    {        if (null !== $encoding && 0 === strcasecmp($encoding, 'SHIFT-JIS')) {            return self::isOnlyDoubleByteKanji($content) ? Mode::KANJI() : Mode::BYTE();        }        $hasNumeric = false;        $hasAlphanumeric = false;        $contentLength = strlen($content);        for ($i = 0; $i < $contentLength; ++$i) {            $char = $content[$i];            if (ctype_digit($char)) {                $hasNumeric = true;            } elseif (-1 !== self::getAlphanumericCode(ord($char))) {                $hasAlphanumeric = true;            } else {                return Mode::BYTE();            }        }        if ($hasAlphanumeric) {            return Mode::ALPHANUMERIC();        } elseif ($hasNumeric) {            return Mode::NUMERIC();        }        return Mode::BYTE();    }    /**     * Calculates the mask penalty for a matrix.     */    private static function calculateMaskPenalty(ByteMatrix $matrix) : int    {        return (            MaskUtil::applyMaskPenaltyRule1($matrix)            + MaskUtil::applyMaskPenaltyRule2($matrix)            + MaskUtil::applyMaskPenaltyRule3($matrix)            + MaskUtil::applyMaskPenaltyRule4($matrix)        );    }    /**     * Checks if content only consists of double-byte kanji characters.     */    private static function isOnlyDoubleByteKanji(string $content) : bool    {        $bytes = @iconv('utf-8', 'SHIFT-JIS', $content);        if (false === $bytes) {            return false;        }        $length = strlen($bytes);        if (0 !== $length % 2) {            return false;        }        for ($i = 0; $i < $length; $i += 2) {            $byte = $bytes[$i] & 0xff;            if (($byte < 0x81 || $byte > 0x9f) && $byte < 0xe0 || $byte > 0xeb) {                return false;            }        }        return true;    }    /**     * Chooses the best mask pattern for a matrix.     */    private static function chooseMaskPattern(        BitArray $bits,        ErrorCorrectionLevel $ecLevel,        Version $version,        ByteMatrix $matrix    ) : int {        $minPenalty = PHP_INT_MAX;        $bestMaskPattern = -1;        for ($maskPattern = 0; $maskPattern < QrCode::NUM_MASK_PATTERNS; ++$maskPattern) {            MatrixUtil::buildMatrix($bits, $ecLevel, $version, $maskPattern, $matrix);            $penalty = self::calculateMaskPenalty($matrix);            if ($penalty < $minPenalty) {                $minPenalty = $penalty;                $bestMaskPattern = $maskPattern;            }        }        return $bestMaskPattern;    }    /**     * Chooses the best version for the input.     *     * @throws WriterException if data is too big     */    private static function chooseVersion(int $numInputBits, ErrorCorrectionLevel $ecLevel) : Version    {        for ($versionNum = 1; $versionNum <= 40; ++$versionNum) {            $version = Version::getVersionForNumber($versionNum);            $numBytes = $version->getTotalCodewords();            $ecBlocks = $version->getEcBlocksForLevel($ecLevel);            $numEcBytes = $ecBlocks->getTotalEcCodewords();            $numDataBytes = $numBytes - $numEcBytes;            $totalInputBytes = intdiv($numInputBits + 8, 8);            if ($numDataBytes >= $totalInputBytes) {                return $version;            }        }        throw new WriterException('Data too big');    }    /**     * Terminates the bits in a bit array.     *     * @throws WriterException if data bits cannot fit in the QR code     * @throws WriterException if bits size does not equal the capacity     */    private static function terminateBits(int $numDataBytes, BitArray $bits) : void    {        $capacity = $numDataBytes << 3;        if ($bits->getSize() > $capacity) {            throw new WriterException('Data bits cannot fit in the QR code');        }        for ($i = 0; $i < 4 && $bits->getSize() < $capacity; ++$i) {            $bits->appendBit(false);        }        $numBitsInLastByte = $bits->getSize() & 0x7;        if ($numBitsInLastByte > 0) {            for ($i = $numBitsInLastByte; $i < 8; ++$i) {                $bits->appendBit(false);            }        }        $numPaddingBytes = $numDataBytes - $bits->getSizeInBytes();        for ($i = 0; $i < $numPaddingBytes; ++$i) {            $bits->appendBits(0 === ($i & 0x1) ? 0xec : 0x11, 8);        }        if ($bits->getSize() !== $capacity) {            throw new WriterException('Bits size does not equal capacity');        }    }    /**     * Gets number of data- and EC bytes for a block ID.     *     * @return int[]     * @throws WriterException if block ID is too large     * @throws WriterException if EC bytes mismatch     * @throws WriterException if RS blocks mismatch     * @throws WriterException if total bytes mismatch     */    private static function getNumDataBytesAndNumEcBytesForBlockId(        int $numTotalBytes,        int $numDataBytes,        int $numRsBlocks,        int $blockId    ) : array {        if ($blockId >= $numRsBlocks) {            throw new WriterException('Block ID too large');        }        $numRsBlocksInGroup2 = $numTotalBytes % $numRsBlocks;        $numRsBlocksInGroup1 = $numRsBlocks - $numRsBlocksInGroup2;        $numTotalBytesInGroup1 = intdiv($numTotalBytes, $numRsBlocks);        $numTotalBytesInGroup2 = $numTotalBytesInGroup1 + 1;        $numDataBytesInGroup1 = intdiv($numDataBytes, $numRsBlocks);        $numDataBytesInGroup2 = $numDataBytesInGroup1 + 1;        $numEcBytesInGroup1 = $numTotalBytesInGroup1 - $numDataBytesInGroup1;        $numEcBytesInGroup2 = $numTotalBytesInGroup2 - $numDataBytesInGroup2;        if ($numEcBytesInGroup1 !== $numEcBytesInGroup2) {            throw new WriterException('EC bytes mismatch');        }        if ($numRsBlocks !== $numRsBlocksInGroup1 + $numRsBlocksInGroup2) {            throw new WriterException('RS blocks mismatch');        }        if ($numTotalBytes !==            (($numDataBytesInGroup1 + $numEcBytesInGroup1) * $numRsBlocksInGroup1)            + (($numDataBytesInGroup2 + $numEcBytesInGroup2) * $numRsBlocksInGroup2)        ) {            throw new WriterException('Total bytes mismatch');        }        if ($blockId < $numRsBlocksInGroup1) {            return [$numDataBytesInGroup1, $numEcBytesInGroup1];        } else {            return [$numDataBytesInGroup2, $numEcBytesInGroup2];        }    }    /**     * Interleaves data with EC bytes.     *     * @throws WriterException if number of bits and data bytes does not match     * @throws WriterException if data bytes does not match offset     * @throws WriterException if an interleaving error occurs     */    private static function interleaveWithEcBytes(        BitArray $bits,        int $numTotalBytes,        int $numDataBytes,        int $numRsBlocks    ) : BitArray {        if ($bits->getSizeInBytes() !== $numDataBytes) {            throw new WriterException('Number of bits and data bytes does not match');        }        $dataBytesOffset = 0;        $maxNumDataBytes = 0;        $maxNumEcBytes   = 0;        $blocks = new SplFixedArray($numRsBlocks);        for ($i = 0; $i < $numRsBlocks; ++$i) {            list($numDataBytesInBlock, $numEcBytesInBlock) = self::getNumDataBytesAndNumEcBytesForBlockId(                $numTotalBytes,                $numDataBytes,                $numRsBlocks,                $i            );            $size = $numDataBytesInBlock;            $dataBytes = $bits->toBytes(8 * $dataBytesOffset, $size);            $ecBytes = self::generateEcBytes($dataBytes, $numEcBytesInBlock);            $blocks[$i] = new BlockPair($dataBytes, $ecBytes);            $maxNumDataBytes = max($maxNumDataBytes, $size);            $maxNumEcBytes = max($maxNumEcBytes, count($ecBytes));            $dataBytesOffset += $numDataBytesInBlock;        }        if ($numDataBytes !== $dataBytesOffset) {            throw new WriterException('Data bytes does not match offset');        }        $result = new BitArray();        for ($i = 0; $i < $maxNumDataBytes; ++$i) {            foreach ($blocks as $block) {                $dataBytes = $block->getDataBytes();                if ($i < count($dataBytes)) {                    $result->appendBits($dataBytes[$i], 8);                }            }        }        for ($i = 0; $i < $maxNumEcBytes; ++$i) {            foreach ($blocks as $block) {                $ecBytes = $block->getErrorCorrectionBytes();                if ($i < count($ecBytes)) {                    $result->appendBits($ecBytes[$i], 8);                }            }        }        if ($numTotalBytes !== $result->getSizeInBytes()) {            throw new WriterException(                'Interleaving error: ' . $numTotalBytes . ' and ' . $result->getSizeInBytes() . ' differ'            );        }        return $result;    }    /**     * Generates EC bytes for given data.     *     * @param  SplFixedArray<int> $dataBytes     * @return SplFixedArray<int>     */    private static function generateEcBytes(SplFixedArray $dataBytes, int $numEcBytesInBlock) : SplFixedArray    {        $numDataBytes = count($dataBytes);        $toEncode = new SplFixedArray($numDataBytes + $numEcBytesInBlock);        for ($i = 0; $i < $numDataBytes; $i++) {            $toEncode[$i] = $dataBytes[$i] & 0xff;        }        $ecBytes = new SplFixedArray($numEcBytesInBlock);        $codec = self::getCodec($numDataBytes, $numEcBytesInBlock);        $codec->encode($toEncode, $ecBytes);        return $ecBytes;    }    /**     * Gets an RS codec and caches it.     */    private static function getCodec(int $numDataBytes, int $numEcBytesInBlock) : ReedSolomonCodec    {        $cacheId = $numDataBytes . '-' . $numEcBytesInBlock;        if (isset(self::$codecs[$cacheId])) {            return self::$codecs[$cacheId];        }        return self::$codecs[$cacheId] = new ReedSolomonCodec(            8,            0x11d,            0,            1,            $numEcBytesInBlock,            255 - $numDataBytes - $numEcBytesInBlock        );    }    /**     * Appends mode information to a bit array.     */    private static function appendModeInfo(Mode $mode, BitArray $bits) : void    {        $bits->appendBits($mode->getBits(), 4);    }    /**     * Appends length information to a bit array.     *     * @throws WriterException if num letters is bigger than expected     */    private static function appendLengthInfo(int $numLetters, Version $version, Mode $mode, BitArray $bits) : void    {        $numBits = $mode->getCharacterCountBits($version);        if ($numLetters >= (1 << $numBits)) {            throw new WriterException($numLetters . ' is bigger than ' . ((1 << $numBits) - 1));        }        $bits->appendBits($numLetters, $numBits);    }    /**     * Appends bytes to a bit array in a specific mode.     *     * @throws WriterException if an invalid mode was supplied     */    private static function appendBytes(string $content, Mode $mode, BitArray $bits, string $encoding) : void    {        switch ($mode) {            case Mode::NUMERIC():                self::appendNumericBytes($content, $bits);                break;            case Mode::ALPHANUMERIC():                self::appendAlphanumericBytes($content, $bits);                break;            case Mode::BYTE():                self::append8BitBytes($content, $bits, $encoding);                break;            case Mode::KANJI():                self::appendKanjiBytes($content, $bits);                break;            default:                throw new WriterException('Invalid mode: ' . $mode);        }    }    /**     * Appends numeric bytes to a bit array.     */    private static function appendNumericBytes(string $content, BitArray $bits) : void    {        $length = strlen($content);        $i = 0;        while ($i < $length) {            $num1 = (int) $content[$i];            if ($i + 2 < $length) {                // Encode three numeric letters in ten bits.                $num2 = (int) $content[$i + 1];                $num3 = (int) $content[$i + 2];                $bits->appendBits($num1 * 100 + $num2 * 10 + $num3, 10);                $i += 3;            } elseif ($i + 1 < $length) {                // Encode two numeric letters in seven bits.                $num2 = (int) $content[$i + 1];                $bits->appendBits($num1 * 10 + $num2, 7);                $i += 2;            } else {                // Encode one numeric letter in four bits.                $bits->appendBits($num1, 4);                ++$i;            }        }    }    /**     * Appends alpha-numeric bytes to a bit array.     *     * @throws WriterException if an invalid alphanumeric code was found     */    private static function appendAlphanumericBytes(string $content, BitArray $bits) : void    {        $length = strlen($content);        $i = 0;        while ($i < $length) {            $code1 = self::getAlphanumericCode(ord($content[$i]));            if (-1 === $code1) {                throw new WriterException('Invalid alphanumeric code');            }            if ($i + 1 < $length) {                $code2 = self::getAlphanumericCode(ord($content[$i + 1]));                if (-1 === $code2) {                    throw new WriterException('Invalid alphanumeric code');                }                // Encode two alphanumeric letters in 11 bits.                $bits->appendBits($code1 * 45 + $code2, 11);                $i += 2;            } else {                // Encode one alphanumeric letter in six bits.                $bits->appendBits($code1, 6);                ++$i;            }        }    }    /**     * Appends regular 8-bit bytes to a bit array.     *     * @throws WriterException if content cannot be encoded to target encoding     */    private static function append8BitBytes(string $content, BitArray $bits, string $encoding) : void    {        $bytes = @iconv('utf-8', $encoding, $content);        if (false === $bytes) {            throw new WriterException('Could not encode content to ' . $encoding);        }        $length = strlen($bytes);        for ($i = 0; $i < $length; $i++) {            $bits->appendBits(ord($bytes[$i]), 8);        }    }    /**     * Appends KANJI bytes to a bit array.     *     * @throws WriterException if content does not seem to be encoded in SHIFT-JIS     * @throws WriterException if an invalid byte sequence occurs     */    private static function appendKanjiBytes(string $content, BitArray $bits) : void    {        if (strlen($content) % 2 > 0) {            // We just do a simple length check here. The for loop will check            // individual characters.            throw new WriterException('Content does not seem to be encoded in SHIFT-JIS');        }        $length = strlen($content);        for ($i = 0; $i < $length; $i += 2) {            $byte1 = ord($content[$i]) & 0xff;            $byte2 = ord($content[$i + 1]) & 0xff;            $code = ($byte1 << 8) | $byte2;            if ($code >= 0x8140 && $code <= 0x9ffc) {                $subtracted = $code - 0x8140;            } elseif ($code >= 0xe040 && $code <= 0xebbf) {                $subtracted = $code - 0xc140;            } else {                throw new WriterException('Invalid byte sequence');            }            $encoded = (($subtracted >> 8) * 0xc0) + ($subtracted & 0xff);            $bits->appendBits($encoded, 13);        }    }    /**     * Appends ECI information to a bit array.     */    private static function appendEci(CharacterSetEci $eci, BitArray $bits) : void    {        $mode = Mode::ECI();        $bits->appendBits($mode->getBits(), 4);        $bits->appendBits($eci->getValue(), 8);    }}
 |