Skip to content

Commit fd0a902

Browse files
authored
Merge pull request #619 from tm-robinson/543-ScriptCreatorGraph-only-use-first-chunk
543 script creator graph only use first chunk
2 parents ba5c7ad + e741602 commit fd0a902

14 files changed

+73
-22
lines changed

CHANGELOG.md

Lines changed: 6 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,5 @@
1-
## [1.16.0-beta.4](https://github.com/ScrapeGraphAI/Scrapegraph-ai/compare/v1.16.0-beta.3...v1.16.0-beta.4) (2024-09-02)
1+
## [1.16.0](https://github.com/ScrapeGraphAI/Scrapegraph-ai/compare/v1.15.2...v1.16.0) (2024-09-01)
2+
23

34

45
### Features
@@ -11,6 +12,9 @@
1112
* deepcopy failure when copying model_instance config ([cd07418](https://github.com/ScrapeGraphAI/Scrapegraph-ai/commit/cd07418474112cecd53ab47866262f2f31294223))
1213
* fix pydantic object copy ([553527a](https://github.com/ScrapeGraphAI/Scrapegraph-ai/commit/553527a269cdd70c0c174ad5c78cbf35c00b22c1))
1314

15+
## [1.15.2](https://github.com/ScrapeGraphAI/Scrapegraph-ai/compare/v1.15.1...v1.15.2) (2024-09-01)
16+
17+
1418
## [1.16.0-beta.3](https://github.com/ScrapeGraphAI/Scrapegraph-ai/compare/v1.16.0-beta.2...v1.16.0-beta.3) (2024-09-01)
1519

1620

@@ -27,6 +31,7 @@
2731

2832

2933

34+
3035
### Bug Fixes
3136

3237
* pyproject.toml ([360ce1c](https://github.com/ScrapeGraphAI/Scrapegraph-ai/commit/360ce1c0e468c959e63555120ac7cecf55563846))

pyproject.toml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,6 @@
11
[project]
22
name = "scrapegraphai"
3+
34
version = "1.16.0b4"
45

56
description = "A web scraping library based on LangChain which uses LLM and direct graph logic to create scraping pipelines."

scrapegraphai/graphs/abstract_graph.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -141,7 +141,7 @@ def _create_llm(self, llm_config: dict) -> object:
141141
try:
142142
self.model_token = models_tokens[llm_params["model_provider"]][llm_params["model"]]
143143
except KeyError:
144-
print("Model not found, using default token size (8192)")
144+
print(f"Model {llm_params['model_provider']}/{llm_params['model']} not found, using default token size (8192)")
145145
self.model_token = 8192
146146

147147
try:

scrapegraphai/graphs/deep_scraper_graph.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -75,7 +75,8 @@ def _create_repeated_graph(self) -> BaseGraph:
7575
input="doc",
7676
output=["parsed_doc"],
7777
node_config={
78-
"chunk_size": self.model_token
78+
"chunk_size": self.model_token,
79+
"llm_model": self.llm_model
7980
}
8081
)
8182

scrapegraphai/graphs/markdown_scraper_graph.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -60,7 +60,8 @@ def _create_graph(self) -> BaseGraph:
6060
output=["parsed_doc"],
6161
node_config={
6262
"parse_html": False,
63-
"chunk_size": self.model_token
63+
"chunk_size": self.model_token,
64+
"llm_model": self.llm_model
6465
}
6566
)
6667
generate_answer_node = GenerateAnswerNode(

scrapegraphai/graphs/omni_scraper_graph.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -74,7 +74,8 @@ def _create_graph(self) -> BaseGraph:
7474
input="doc",
7575
output=["parsed_doc"],
7676
node_config={
77-
"chunk_size": self.model_token
77+
"chunk_size": self.model_token,
78+
"llm_model": self.llm_model
7879
}
7980
)
8081
image_to_text_node = ImageToTextNode(

scrapegraphai/graphs/pdf_scraper_graph.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -68,7 +68,8 @@ def _create_graph(self) -> BaseGraph:
6868
output=["parsed_doc"],
6969
node_config={
7070
"parse_html": False,
71-
"chunk_size": self.model_token
71+
"chunk_size": self.model_token,
72+
"llm_model": self.llm_model
7273
}
7374
)
7475

scrapegraphai/graphs/script_creator_graph.py

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -73,11 +73,12 @@ def _create_graph(self) -> BaseGraph:
7373
input="doc",
7474
output=["parsed_doc"],
7575
node_config={"chunk_size": self.model_token,
76-
"parse_html": False
76+
"parse_html": False,
77+
"llm_model": self.llm_model
7778
}
7879
)
7980
generate_scraper_node = GenerateScraperNode(
80-
input="user_prompt & (doc)",
81+
input="user_prompt & (parsed_doc)",
8182
output=["answer"],
8283
node_config={
8384
"llm_model": self.llm_model,

scrapegraphai/graphs/search_link_graph.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -64,7 +64,8 @@ def _create_graph(self) -> BaseGraph:
6464
input="doc",
6565
output=["parsed_doc"],
6666
node_config={
67-
"chunk_size": self.model_token
67+
"chunk_size": self.model_token,
68+
"llm_model": self.llm_model
6869
}
6970
)
7071
search_link_node = SearchLinkNode(

scrapegraphai/graphs/speech_graph.py

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -68,7 +68,8 @@ def _create_graph(self) -> BaseGraph:
6868
input="doc",
6969
output=["parsed_doc"],
7070
node_config={
71-
"chunk_size": self.model_token
71+
"chunk_size": self.model_token,
72+
"llm_model": self.llm_model
7273
}
7374
)
7475
generate_answer_node = GenerateAnswerNode(

0 commit comments

Comments
 (0)