Skip to content

Commit 9a5948e

Browse files
authored
Merge branch 'main' into temp
2 parents 1756e85 + 879a554 commit 9a5948e

File tree

7 files changed

+43
-6
lines changed

7 files changed

+43
-6
lines changed

CHANGELOG.md

Lines changed: 20 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -18,17 +18,37 @@
1818
### Features
1919

2020
* add new toml ([fcb3220](https://github.com/ScrapeGraphAI/Scrapegraph-ai/commit/fcb3220868e7ef1127a7a47f40d0379be282e6eb))
21+
* add gpt4o omni ([431edb7](https://github.com/ScrapeGraphAI/Scrapegraph-ai/commit/431edb7bb2504f4c1335c3ae3ce2f91867fa7222))
22+
* add searchngx integration ([5c92186](https://github.com/ScrapeGraphAI/Scrapegraph-ai/commit/5c9218608140bf694fbfd96aa90276bc438bb475))
23+
* refactoring_to_md function ([602dd00](https://github.com/ScrapeGraphAI/Scrapegraph-ai/commit/602dd00209ee1d72a1223fc4793759450921fcf9))
24+
25+
2126

2227

2328
### chore
2429

2530
* **pyproject:** upgrade dependencies ([0425124](https://github.com/ScrapeGraphAI/Scrapegraph-ai/commit/0425124c570f765b98fcf67ba6649f4f9fe76b15))
2631

2732

33+
2834
### Docs
2935

3036
* **gpt-4o-mini:** added new gpt, fixed chromium lazy loading ([99dc849](https://github.com/ScrapeGraphAI/Scrapegraph-ai/commit/99dc8497d85289759286a973e4aecc3f924d3ada))
3137

38+
39+
40+
### CI
41+
42+
* **release:** 1.10.0-beta.1 [skip ci] ([8f619de](https://github.com/ScrapeGraphAI/Scrapegraph-ai/commit/8f619de23540216934b53bcf3426702e56c48f31))
43+
* **release:** 1.10.0-beta.2 [skip ci] ([aa7d4f0](https://github.com/ScrapeGraphAI/Scrapegraph-ai/commit/aa7d4f0ebfc2623a51ce1e4887ff26c9906b0a95))
44+
* **release:** 1.10.0-beta.3 [skip ci] ([bf0a2f3](https://github.com/ScrapeGraphAI/Scrapegraph-ai/commit/bf0a2f386f38cbe81d1e5ea3e05357f8ecabcab2))
45+
* **release:** 1.10.0-beta.4 [skip ci] ([a91807a](https://github.com/ScrapeGraphAI/Scrapegraph-ai/commit/a91807a20cc07b15feb1ddd5cf7a1c323ff32b46))
46+
* **release:** 1.10.0-beta.5 [skip ci] ([0d5f925](https://github.com/ScrapeGraphAI/Scrapegraph-ai/commit/0d5f9259d8fb148de7c95cf6f67f9562c5d2c880))
47+
* **release:** 1.9.0-beta.3 [skip ci] ([d3e63d9](https://github.com/ScrapeGraphAI/Scrapegraph-ai/commit/d3e63d91be79f74e8a3fdb00e692d546c24cead5))
48+
* **release:** 1.9.0-beta.4 [skip ci] ([2fa04b5](https://github.com/ScrapeGraphAI/Scrapegraph-ai/commit/2fa04b58159abf7af890ebc0768fe23d51bf177f))
49+
* **release:** 1.9.0-beta.5 [skip ci] ([bb62439](https://github.com/ScrapeGraphAI/Scrapegraph-ai/commit/bb624399cfc3924825892dd48697fc298ad3b002))
50+
* **release:** 1.9.0-beta.6 [skip ci] ([54a69de](https://github.com/ScrapeGraphAI/Scrapegraph-ai/commit/54a69de69e8077e02fd5584783ca62cc2e0ec5bb))
51+
3252
## [1.10.0-beta.5](https://github.com/ScrapeGraphAI/Scrapegraph-ai/compare/v1.10.0-beta.4...v1.10.0-beta.5) (2024-07-20)
3353

3454

examples/local_models/smart_scraper_ollama.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -28,8 +28,8 @@
2828
# ************************************************
2929

3030
smart_scraper_graph = SmartScraperGraph(
31-
prompt="List me all the titles",
32-
source="https://perinim.github.io/projects",
31+
prompt="List me all the titles of the website",
32+
source="https://sport.sky.it/nba?gr=www",
3333
config=graph_config
3434
)
3535

requirements-dev.lock

Lines changed: 7 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -51,6 +51,7 @@ blinker==1.8.2
5151
boto3==1.34.146
5252
# via langchain-aws
5353
botocore==1.34.146
54+
5455
# via boto3
5556
# via s3transfer
5657
burr==0.22.1
@@ -179,6 +180,7 @@ greenlet==3.0.3
179180
# via playwright
180181
# via sqlalchemy
181182
groq==0.9.0
183+
182184
# via langchain-groq
183185
grpc-google-iam-v1==0.13.1
184186
# via google-cloud-resource-manager
@@ -253,6 +255,7 @@ langchain==0.2.10
253255
langchain-anthropic==0.1.20
254256
# via scrapegraphai
255257
langchain-aws==0.1.12
258+
256259
# via scrapegraphai
257260
langchain-core==0.2.22
258261
# via langchain
@@ -268,15 +271,17 @@ langchain-core==0.2.22
268271
langchain-fireworks==0.1.5
269272
# via scrapegraphai
270273
langchain-google-genai==1.0.8
274+
271275
# via scrapegraphai
272276
langchain-google-vertexai==1.0.7
273277
# via scrapegraphai
274278
langchain-groq==0.1.6
275279
# via scrapegraphai
276-
langchain-nvidia-ai-endpoints==0.1.6
280+
langchain-nvidia-ai-endpoints==0.1.6
277281
# via scrapegraphai
278282
langchain-openai==0.1.17
279283
# via scrapegraphai
284+
280285
langchain-text-splitters==0.2.2
281286
# via langchain
282287
langsmith==0.1.93
@@ -291,6 +296,7 @@ markdown-it-py==3.0.0
291296
markupsafe==2.1.5
292297
# via jinja2
293298
matplotlib==3.9.1
299+
294300
# via burr
295301
mccabe==0.7.0
296302
# via pylint

requirements.lock

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -127,6 +127,7 @@ greenlet==3.0.3
127127
# via playwright
128128
# via sqlalchemy
129129
groq==0.9.0
130+
130131
# via langchain-groq
131132
grpc-google-iam-v1==0.13.1
132133
# via google-cloud-resource-manager
@@ -174,6 +175,7 @@ langchain==0.2.10
174175
langchain-anthropic==0.1.20
175176
# via scrapegraphai
176177
langchain-aws==0.1.12
178+
177179
# via scrapegraphai
178180
langchain-core==0.2.22
179181
# via langchain
@@ -189,6 +191,7 @@ langchain-core==0.2.22
189191
langchain-fireworks==0.1.5
190192
# via scrapegraphai
191193
langchain-google-genai==1.0.8
194+
192195
# via scrapegraphai
193196
langchain-google-vertexai==1.0.7
194197
# via scrapegraphai
@@ -198,6 +201,7 @@ langchain-nvidia-ai-endpoints==0.1.6
198201
# via scrapegraphai
199202
langchain-openai==0.1.17
200203
# via scrapegraphai
204+
201205
langchain-text-splitters==0.2.2
202206
# via langchain
203207
langsmith==0.1.93
@@ -214,6 +218,7 @@ multidict==6.0.5
214218
# via yarl
215219
multiprocess==0.70.16
216220
# via mpire
221+
217222
numpy==1.26.4
218223
# via faiss-cpu
219224
# via langchain
@@ -322,6 +327,7 @@ soupsieve==2.5
322327
sqlalchemy==2.0.31
323328
# via langchain
324329
tenacity==8.5.0
330+
325331
# via langchain
326332
# via langchain-core
327333
tiktoken==0.7.0

scrapegraphai/graphs/abstract_graph.py

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -150,6 +150,10 @@ def _create_llm(self, llm_config: dict, chat=False) -> object:
150150

151151
# If model instance is passed directly instead of the model details
152152
if "model_instance" in llm_params:
153+
try:
154+
self.model_token = llm_params["model_tokens"]
155+
except KeyError as exc:
156+
raise KeyError("model_tokens not specified") from exc
153157
return llm_params["model_instance"]
154158

155159
# Instantiate the language model based on the model name

scrapegraphai/nodes/parse_node.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -94,4 +94,4 @@ def execute(self, state: dict) -> dict:
9494

9595
state.update({self.output[0]: chunks})
9696

97-
return state
97+
return state

scrapegraphai/telemetry/telemetry.py

Lines changed: 3 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -91,7 +91,7 @@ def _check_config_and_environ_for_telemetry_flag(
9191
"python_version": f"{platform.python_version()}/{platform.python_implementation()}",
9292
"distinct_id": g_anonymous_id,
9393
"scrapegraphai_version": VERSION,
94-
"telemetry_version": "0.0.1",
94+
"telemetry_version": "0.0.3",
9595
}
9696

9797

@@ -156,7 +156,7 @@ def log_event(event: str, properties: Dict[str, any]):
156156
send_event_json(event_json)
157157

158158

159-
def log_graph_execution(graph_name: str, source: str, prompt:str, schema:dict, llm_model: str, embedder_model: str, source_type: str, execution_time: float, response: dict = None, error_node: str = None, exception: str = None, total_tokens: int = None):
159+
def log_graph_execution(graph_name: str, source: str, prompt:str, schema:dict, llm_model: str, embedder_model: str, source_type: str, execution_time: float, response: dict = None, error_node: str = None, exception: str = None, total_tokens: int = None, is_library=True):
160160
properties = {
161161
"graph_name": graph_name,
162162
"source": source,
@@ -170,6 +170,7 @@ def log_graph_execution(graph_name: str, source: str, prompt:str, schema:dict, l
170170
"error_node": error_node,
171171
"exception": exception,
172172
"total_tokens": total_tokens,
173+
"is_library": is_library
173174
}
174175
log_event("graph_execution", properties)
175176

0 commit comments

Comments
 (0)