diff --git a/scrapegraphai/nodes/fetch_node.py b/scrapegraphai/nodes/fetch_node.py index ec202f3f..2637a70a 100644 --- a/scrapegraphai/nodes/fetch_node.py +++ b/scrapegraphai/nodes/fetch_node.py @@ -356,7 +356,7 @@ def handle_web_source(self, state, source): compressed_document = [ Document(page_content=parsed_content, metadata={"source": "html file"}) ] - state["original_html"] = document + state["doc"] = document state.update( { self.output[0]: compressed_document, diff --git a/scrapegraphai/nodes/parse_node.py b/scrapegraphai/nodes/parse_node.py index 1c409da2..44cd5896 100644 --- a/scrapegraphai/nodes/parse_node.py +++ b/scrapegraphai/nodes/parse_node.py @@ -121,7 +121,6 @@ def execute(self, state: dict) -> dict: state.update({self.output[0]: chunks}) state.update({"parsed_doc": chunks}) - state.update({"content": chunks}) if self.parse_urls: state.update({self.output[1]: link_urls})