From 16856529d75ffe9b84614df8986142517022ddbe Mon Sep 17 00:00:00 2001
From: VincyZhang
Date: Thu, 14 Dec 2023 11:18:23 +0800
Subject: [PATCH] adapt to windows (#916)

Signed-off-by: Wenxin Zhang
---
 .../pipeline/plugins/retrieval/indexing/context_utils.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/intel_extension_for_transformers/neural_chat/pipeline/plugins/retrieval/indexing/context_utils.py b/intel_extension_for_transformers/neural_chat/pipeline/plugins/retrieval/indexing/context_utils.py
index cc8436cc8e6..0263bb0cb42 100644
--- a/intel_extension_for_transformers/neural_chat/pipeline/plugins/retrieval/indexing/context_utils.py
+++ b/intel_extension_for_transformers/neural_chat/pipeline/plugins/retrieval/indexing/context_utils.py
@@ -48,7 +48,7 @@ def read_pdf(pdf_path):
 
 def read_html(html_path):
     """Read the html file."""
-    with open(html_path, 'r') as file:
+    with open(html_path, 'r', encoding="utf-8") as file:
         html = file.read()
     soup = BeautifulSoup(html, 'html.parser')
     text = soup.get_text(strip=True)