diff options
author | Evgenii Kliuchnikov <eustas@google.com> | 2023-07-04 13:01:14 +0000 |
---|---|---|
committer | Evgenii Kliuchnikov <eustas.ru@gmail.com> | 2023-07-05 19:15:11 +0000 |
commit | bc32ae12d575520fcf7b0a82f0e660b7e2705043 (patch) | |
tree | fd566426f185c84c82ee5dcad24087ab234baafc | |
parent | 6ee96e291db87ccea9b8451a23de0aa0d93d194d (diff) | |
download | brotli-bc32ae12d575520fcf7b0a82f0e660b7e2705043.zip brotli-bc32ae12d575520fcf7b0a82f0e660b7e2705043.tar.gz brotli-bc32ae12d575520fcf7b0a82f0e660b7e2705043.tar.bz2 |
add tests with UTF8/UTF16 non-ASCII text
PiperOrigin-RevId: 545424981
-rw-r--r-- | .github/workflows/codeql.yml | 5 | ||||
-rw-r--r-- | python/tests/_test_utils.py | 2 | ||||
-rw-r--r-- | tests/testdata/cp1251-utf16le | bin | 0 -> 1554 bytes | |||
-rw-r--r-- | tests/testdata/cp1251-utf16le.compressed | bin | 0 -> 632 bytes | |||
-rw-r--r-- | tests/testdata/cp852-utf8 | 12 | ||||
-rw-r--r-- | tests/testdata/cp852-utf8.compressed | bin | 0 -> 362 bytes |
6 files changed, 18 insertions, 1 deletion
diff --git a/.github/workflows/codeql.yml b/.github/workflows/codeql.yml index bd043c9..1df6419 100644 --- a/.github/workflows/codeql.yml +++ b/.github/workflows/codeql.yml @@ -34,9 +34,12 @@ jobs: uses: github/codeql-action/init@v2 with: languages: ${{ matrix.language }} + # CodeQL is currently crashing on files with large lists: + # https://github.com/github/codeql/issues/13656 config: | - paths-ignore: + paths-ignore: - research + - js/test_data.* - if: matrix.language == 'cpp' name: Build CPP diff --git a/python/tests/_test_utils.py b/python/tests/_test_utils.py index 059cb43..38afec3 100644 --- a/python/tests/_test_utils.py +++ b/python/tests/_test_utils.py @@ -45,6 +45,8 @@ TESTDATA_FILES = [ 'random_org_10k.bin', # Small data 'mapsdatazrh', # Large data 'ukkonooa', # Poem + 'cp1251-utf16le', # Codepage 1251 table saved in UTF16-LE encoding + 'cp852-utf8', # Codepage 852 table saved in UTF8 encoding ] # Some files might be missing in a lightweight sources pack. diff --git a/tests/testdata/cp1251-utf16le b/tests/testdata/cp1251-utf16le Binary files differ new file mode 100644 index 0000000..d1cb042 --- /dev/null +++ b/tests/testdata/cp1251-utf16le diff --git a/tests/testdata/cp1251-utf16le.compressed b/tests/testdata/cp1251-utf16le.compressed Binary files differ new file mode 100644 index 0000000..2706963 --- /dev/null +++ b/tests/testdata/cp1251-utf16le.compressed diff --git a/tests/testdata/cp852-utf8 b/tests/testdata/cp852-utf8 new file mode 100644 index 0000000..fa14705 --- /dev/null +++ b/tests/testdata/cp852-utf8 @@ -0,0 +1,12 @@ +The following table shows code page 852. Each character is shown with its equivalent Unicode code point. Only the second half of the table (128–255) is shown, the first half (0–127) being the same as code page 437. 
+ +Code page 852 +0 1 2 3 4 5 6 7 8 9 A B C D E F +8x Ç ü é â ä ů ć ç ł ë Ő ő î Ź Ä Ć +9x É Ĺ ĺ ô ö Ľ ľ Ś ś Ö Ü Ť ť Ł × č +Ax á í ó ú Ą ą Ž ž Ę ę ¬ ź Č ş « » +Bx ░ ▒ ▓ │ ┤ Á Â Ě Ş ╣ ║ ╗ ╝ Ż ż ┐ +Cx └ ┴ ┬ ├ ─ ┼ Ă ă ╚ ╔ ╩ ╦ ╠ ═ ╬ ¤ +Dx đ Đ Ď Ë ď Ň Í Î ě ┘ ┌ █ ▄ Ţ Ů ▀ +Ex Ó ß Ô Ń ń ň Š š Ŕ Ú ŕ Ű ý Ý ţ ´ +Fx SHY ˝ ˛ ˇ ˘ § ÷ ¸ ° ¨ ˙ ű Ř ř ■ NBSP diff --git a/tests/testdata/cp852-utf8.compressed b/tests/testdata/cp852-utf8.compressed Binary files differ new file mode 100644 index 0000000..12ba6c2 --- /dev/null +++ b/tests/testdata/cp852-utf8.compressed |