diff options
author | c8ef <c8ef@outlook.com> | 2024-12-31 09:28:34 +0800 |
---|---|---|
committer | GitHub <noreply@github.com> | 2024-12-31 09:28:34 +0800 |
commit | f385542f62fa1f57001c95c476165e1618cb54ba (patch) | |
tree | 2143a7f87787f9bba5655ff02157dc5dc3b37230 /clang/tools/include-mapping/cppreference_parser.py | |
parent | 9abcca5e25296aea49288ad63901f9e0a332dad4 (diff) | |
download | llvm-f385542f62fa1f57001c95c476165e1618cb54ba.zip llvm-f385542f62fa1f57001c95c476165e1618cb54ba.tar.gz llvm-f385542f62fa1f57001c95c476165e1618cb54ba.tar.bz2 |
[Tooling/Inclusion] Modify the Python script to open the C++ reference with UTF-8 encoding. (#121341)
This prevents a `UnicodeDecodeError` on systems whose default encoding is
not UTF-8, for example:
```
UnicodeDecodeError: 'gbk' codec can't decode byte 0xb6 in position 12958: illegal multibyte sequence
```
Diffstat (limited to 'clang/tools/include-mapping/cppreference_parser.py')
-rw-r--r-- | clang/tools/include-mapping/cppreference_parser.py | 4 |
1 file changed, 2 insertions, 2 deletions
```diff
diff --git a/clang/tools/include-mapping/cppreference_parser.py b/clang/tools/include-mapping/cppreference_parser.py
index 9101f3d..f7da2ba 100644
--- a/clang/tools/include-mapping/cppreference_parser.py
+++ b/clang/tools/include-mapping/cppreference_parser.py
@@ -139,7 +139,7 @@ def _ParseIndexPage(index_page_html):
 
 
 def _ReadSymbolPage(path, name, qual_name):
-    with open(path) as f:
+    with open(path, encoding="utf-8") as f:
         return _ParseSymbolPage(f.read(), name, qual_name)
 
 
@@ -156,7 +156,7 @@ def _GetSymbols(pool, root_dir, index_page_name, namespace, variants_to_accept):
     # contains the defined header.
     # 2. Parse the symbol page to get the defined header.
     index_page_path = os.path.join(root_dir, index_page_name)
-    with open(index_page_path, "r") as f:
+    with open(index_page_path, "r", encoding="utf-8") as f:
         # Read each symbol page in parallel.
         results = []  # (symbol_name, promise of [header...])
         for symbol_name, symbol_page_path, variant in _ParseIndexPage(f.read()):
```