@@ -4,9 +4,7 @@ name = "scrapegraphai"
4
4
5
5
version = "1.14.1"
6
6
7
-
8
7
description = "A web scraping library based on LangChain which uses LLM and direct graph logic to create scraping pipelines."
9
-
10
8
authors = [
11
9
{ name = "Marco Vinciguerra", email = "mvincig11@gmail.com" },
12
10
{ name = "Marco Perini", email = "perinim.98@gmail.com" },
@@ -15,32 +13,24 @@ authors = [
15
13
16
14
dependencies = [
17
15
"langchain>=0.2.14",
18
- "langchain-fireworks>=0.1.3",
19
- "langchain_community>=0.2.9",
20
16
"langchain-google-genai>=1.0.7",
21
- "langchain-google-vertexai>=1.0.7",
22
17
"langchain-openai>=0.1.22",
23
- "langchain-groq>=0.1.3",
24
- "langchain-aws>=0.1.3",
25
- "langchain-anthropic>=0.1.11",
26
18
"langchain-mistralai>=0.1.12",
27
- "langchain-huggingface>=0.0.3",
28
- "langchain-nvidia-ai-endpoints>=0.1.6",
19
+ "langchain_community>=0.2.9",
20
+ "langchain-aws>=0.1.3",
29
21
"html2text>=2024.2.26",
30
22
"faiss-cpu>=1.8.0",
31
23
"beautifulsoup4>=4.12.3",
32
24
"pandas>=2.2.2",
33
25
"python-dotenv>=1.0.1",
34
26
"tiktoken>=0.7",
35
27
"tqdm>=4.66.4",
36
- "graphviz>=0.20.3",
37
28
"minify-html>=0.15.0",
38
29
"free-proxy>=1.1.1",
39
30
"playwright>=1.43.0",
40
- "google>=3.0.0",
41
31
"undetected-playwright>=0.3.0",
32
+ "google>=3.0.0",
42
33
"semchunk>=1.0.1",
43
- "browserbase>=0.3.0",
44
34
]
45
35
46
36
license = "MIT"
@@ -79,6 +69,25 @@ requires-python = ">=3.9,<4.0"
79
69
burr = ["burr[start]==0.22.1"]
80
70
docs = ["sphinx==6.0", "furo==2024.5.6"]
81
71
72
+ # Group 1: Other Language Models
73
+ other-language-models = [
74
+ "langchain-fireworks>=0.1.3",
75
+ "langchain-groq>=0.1.3",
76
+ "langchain-anthropic>=0.1.11",
77
+ "langchain-huggingface>=0.0.3",
78
+ "langchain-nvidia-ai-endpoints>=0.1.6",
79
+ ]
80
+
81
+ # Group 2: More Semantic Options
82
+ more-semantic-options = [
83
+ "graphviz>=0.20.3",
84
+ ]
85
+
86
+ # Group 3: More Browser Options
87
+ more-browser-options = [
88
+ "browserbase>=0.3.0",
89
+ ]
90
+
82
91
[build-system]
83
92
requires = ["hatchling"]
84
93
build-backend = "hatchling.build"
0 commit comments