aboutsummaryrefslogtreecommitdiff
path: root/clang/tools/include-mapping/cppreference_parser.py
diff options
context:
space:
mode:
author: c8ef <c8ef@outlook.com>, 2024-12-31 09:28:34 +0800
committer: GitHub <noreply@github.com>, 2024-12-31 09:28:34 +0800
commit: f385542f62fa1f57001c95c476165e1618cb54ba (patch)
tree: 2143a7f87787f9bba5655ff02157dc5dc3b37230 /clang/tools/include-mapping/cppreference_parser.py
parent: 9abcca5e25296aea49288ad63901f9e0a332dad4 (diff)
downloadllvm-f385542f62fa1f57001c95c476165e1618cb54ba.zip
llvm-f385542f62fa1f57001c95c476165e1618cb54ba.tar.gz
llvm-f385542f62fa1f57001c95c476165e1618cb54ba.tar.bz2
[Tooling/Inclusion] Modify the Python script to open the C++ reference with UTF-8 encoding. (#121341)
This prevents the following error on systems whose default encoding is not UTF-8:
```
UnicodeDecodeError: 'gbk' codec can't decode byte 0xb6 in position 12958: illegal multibyte sequence
```
Diffstat (limited to 'clang/tools/include-mapping/cppreference_parser.py')
-rw-r--r-- clang/tools/include-mapping/cppreference_parser.py | 4
1 files changed, 2 insertions, 2 deletions
diff --git a/clang/tools/include-mapping/cppreference_parser.py b/clang/tools/include-mapping/cppreference_parser.py
index 9101f3d..f7da2ba 100644
--- a/clang/tools/include-mapping/cppreference_parser.py
+++ b/clang/tools/include-mapping/cppreference_parser.py
@@ -139,7 +139,7 @@ def _ParseIndexPage(index_page_html):
def _ReadSymbolPage(path, name, qual_name):
- with open(path) as f:
+ with open(path, encoding="utf-8") as f:
return _ParseSymbolPage(f.read(), name, qual_name)
@@ -156,7 +156,7 @@ def _GetSymbols(pool, root_dir, index_page_name, namespace, variants_to_accept):
# contains the defined header.
# 2. Parse the symbol page to get the defined header.
index_page_path = os.path.join(root_dir, index_page_name)
- with open(index_page_path, "r") as f:
+ with open(index_page_path, "r", encoding="utf-8") as f:
# Read each symbol page in parallel.
results = [] # (symbol_name, promise of [header...])
for symbol_name, symbol_page_path, variant in _ParseIndexPage(f.read()):