-
-
Notifications
You must be signed in to change notification settings - Fork 1.4k
/
Copy pathpyproject.toml
121 lines (108 loc) · 2.82 KB
/
pyproject.toml
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
[project]
name = "scrapegraphai"
version = "1.36.0"
description = "A web scraping library based on LangChain which uses LLM and direct graph logic to create scraping pipelines."
authors = [
{ name = "Marco Vinciguerra", email = "[email protected]" },
{ name = "Marco Perini", email = "[email protected]" },
{ name = "Lorenzo Padoan", email = "[email protected]" }
]
dependencies = [
"langchain>=0.3.0",
"langchain-openai>=0.1.22",
"langchain-mistralai>=0.1.12",
"langchain_community>=0.2.9",
"langchain-aws>=0.1.3",
"langchain-ollama>=0.1.3",
"html2text>=2024.2.26",
"beautifulsoup4>=4.12.3",
"python-dotenv>=1.0.1",
"tiktoken>=0.7",
"tqdm>=4.66.4",
"minify-html>=0.15.0",
"free-proxy>=1.1.1",
"playwright>=1.43.0",
"undetected-playwright>=0.3.0",
"semchunk>=2.2.0",
"googlesearch-python>=1.2.5",
"async-timeout>=4.0.3",
"simpleeval>=1.0.0",
"jsonschema>=4.23.0"
]
readme = "README.md"
homepage = "https://scrapegraphai.com/"
repository = "https://github.com/ScrapeGraphAI/Scrapegraph-ai"
documentation = "https://scrapegraph-ai.readthedocs.io/en/latest/"
keywords = [
"scrapegraph",
"scrapegraphai",
"langchain",
"ai",
"artificial intelligence",
"gpt",
"machine learning",
"rag",
"nlp",
"natural language processing",
"openai",
"scraping",
"web scraping",
"web scraping library",
"web scraping tool",
"webscraping",
"graph",
"llm"
]
classifiers = [
"Intended Audience :: Developers",
"Topic :: Software Development :: Libraries :: Python Modules",
"Programming Language :: Python :: 3",
"Operating System :: OS Independent",
]
requires-python = ">=3.10,<4.0"
[project.optional-dependencies]
burr = ["burr[start]==0.22.1"]
docs = ["sphinx==6.0", "furo==2024.5.6"]
ocr = [
"surya-ocr>=0.5.0",
"matplotlib>=3.7.2",
"ipywidgets>=8.1.0",
"pillow>=10.4.0",
]
[build-system]
requires = ["hatchling==1.26.3"]
build-backend = "hatchling.build"
[tool.uv]
dev-dependencies = [
"pytest>=8.0.0",
"pytest-mock>=3.14.0",
"pytest-asyncio>=0.25.0",
"pytest-sugar>=1.0.0",
"pytest-cov>=4.1.0",
"pylint>=3.2.5",
"poethepoet>=0.32.0",
"black>=24.2.0",
"ruff>=0.2.0",
"isort>=5.13.2",
"pre-commit>=3.6.0",
"mypy>=1.8.0",
"types-setuptools>=75.1.0"
]
[tool.black]
line-length = 88
target-version = ["py310"]
[tool.isort]
profile = "black"
[tool.ruff]
line-length = 88
[tool.ruff.lint]
select = ["F", "E", "W", "C"]
ignore = ["E203", "E501", "C901"] # Ignore conflicts with Black
[tool.mypy]
python_version = "3.10"
strict = true
disallow_untyped_calls = true
ignore_missing_imports = true
[tool.poe.tasks]
pylint-local = "pylint scraperaphai/**/*.py"
pylint-ci = "pylint --disable=C0114,C0115,C0116 --exit-zero scrapegraphai/**/*.py"