From 947ebd2895408c5ebd00b9a3da1b220937553c4a Mon Sep 17 00:00:00 2001 From: Marco Vinciguerra Date: Tue, 10 Sep 2024 08:41:08 +0200 Subject: [PATCH] fix: parse node --- scrapegraphai/nodes/parse_node.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/scrapegraphai/nodes/parse_node.py b/scrapegraphai/nodes/parse_node.py index 3e8ed5ac..a28b2e86 100644 --- a/scrapegraphai/nodes/parse_node.py +++ b/scrapegraphai/nodes/parse_node.py @@ -65,7 +65,7 @@ class ParseNode(BaseNode): docs_transformed = input_data[0] if self.parse_html: - docs_transformed = Html2TextTransformer().transform_documents(input_data[0]) + docs_transformed = Html2TextTransformer(ignore_links=False).transform_documents(input_data[0]) docs_transformed = docs_transformed[0] chunks = chunk(text=docs_transformed.page_content,