aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
author: Evgenii Kliuchnikov <eustas@google.com> 2023-07-04 13:01:14 +0000
committer: Evgenii Kliuchnikov <eustas.ru@gmail.com> 2023-07-05 19:15:11 +0000
commit: bc32ae12d575520fcf7b0a82f0e660b7e2705043 (patch)
tree: fd566426f185c84c82ee5dcad24087ab234baafc
parent: 6ee96e291db87ccea9b8451a23de0aa0d93d194d (diff)
download: brotli-bc32ae12d575520fcf7b0a82f0e660b7e2705043.zip
brotli-bc32ae12d575520fcf7b0a82f0e660b7e2705043.tar.gz
brotli-bc32ae12d575520fcf7b0a82f0e660b7e2705043.tar.bz2
add tests with UTF8/UTF16 non-ASCII text
PiperOrigin-RevId: 545424981
-rw-r--r-- .github/workflows/codeql.yml | 5
-rw-r--r-- python/tests/_test_utils.py | 2
-rw-r--r-- tests/testdata/cp1251-utf16le | bin 0 -> 1554 bytes
-rw-r--r-- tests/testdata/cp1251-utf16le.compressed | bin 0 -> 632 bytes
-rw-r--r-- tests/testdata/cp852-utf8 | 12
-rw-r--r-- tests/testdata/cp852-utf8.compressed | bin 0 -> 362 bytes
6 files changed, 18 insertions, 1 deletion
diff --git a/.github/workflows/codeql.yml b/.github/workflows/codeql.yml
index bd043c9..1df6419 100644
--- a/.github/workflows/codeql.yml
+++ b/.github/workflows/codeql.yml
@@ -34,9 +34,12 @@ jobs:
uses: github/codeql-action/init@v2
with:
languages: ${{ matrix.language }}
+ # CodeQL is currently crashing on files with large lists:
+ # https://github.com/github/codeql/issues/13656
config: |
- paths-ignore:
+ paths-ignore:
- research
+ - js/test_data.*
- if: matrix.language == 'cpp'
name: Build CPP
diff --git a/python/tests/_test_utils.py b/python/tests/_test_utils.py
index 059cb43..38afec3 100644
--- a/python/tests/_test_utils.py
+++ b/python/tests/_test_utils.py
@@ -45,6 +45,8 @@ TESTDATA_FILES = [
'random_org_10k.bin', # Small data
'mapsdatazrh', # Large data
'ukkonooa', # Poem
+ 'cp1251-utf16le', # Codepage 1251 table saved in UTF16-LE encoding
+ 'cp852-utf8', # Codepage 852 table saved in UTF8 encoding
]
# Some files might be missing in a lightweight sources pack.
diff --git a/tests/testdata/cp1251-utf16le b/tests/testdata/cp1251-utf16le
new file mode 100644
index 0000000..d1cb042
--- /dev/null
+++ b/tests/testdata/cp1251-utf16le
Binary files differ
diff --git a/tests/testdata/cp1251-utf16le.compressed b/tests/testdata/cp1251-utf16le.compressed
new file mode 100644
index 0000000..2706963
--- /dev/null
+++ b/tests/testdata/cp1251-utf16le.compressed
Binary files differ
diff --git a/tests/testdata/cp852-utf8 b/tests/testdata/cp852-utf8
new file mode 100644
index 0000000..fa14705
--- /dev/null
+++ b/tests/testdata/cp852-utf8
@@ -0,0 +1,12 @@
+The following table shows code page 852. Each character is shown with its equivalent Unicode code point. Only the second half of the table (128–255) is shown, the first half (0–127) being the same as code page 437.
+
+Code page 852
+0 1 2 3 4 5 6 7 8 9 A B C D E F
+8x Ç ü é â ä ů ć ç ł ë Ő ő î Ź Ä Ć
+9x É Ĺ ĺ ô ö Ľ ľ Ś ś Ö Ü Ť ť Ł × č
+Ax á í ó ú Ą ą Ž ž Ę ę ¬ ź Č ş « »
+Bx ░ ▒ ▓ │ ┤ Á Â Ě Ş ╣ ║ ╗ ╝ Ż ż ┐
+Cx └ ┴ ┬ ├ ─ ┼ Ă ă ╚ ╔ ╩ ╦ ╠ ═ ╬ ¤
+Dx đ Đ Ď Ë ď Ň Í Î ě ┘ ┌ █ ▄ Ţ Ů ▀
+Ex Ó ß Ô Ń ń ň Š š Ŕ Ú ŕ Ű ý Ý ţ ´
+Fx SHY ˝ ˛ ˇ ˘ § ÷ ¸ ° ¨ ˙ ű Ř ř ■ NBSP
diff --git a/tests/testdata/cp852-utf8.compressed b/tests/testdata/cp852-utf8.compressed
new file mode 100644
index 0000000..12ba6c2
--- /dev/null
+++ b/tests/testdata/cp852-utf8.compressed
Binary files differ