-
Notifications
You must be signed in to change notification settings - Fork 7
Expand file tree
/
Copy pathpyproject.toml
More file actions
116 lines (107 loc) · 2.54 KB
/
pyproject.toml
File metadata and controls
116 lines (107 loc) · 2.54 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
# Build backend declaration (PEP 517/518).
# [project].license in this file is written as a bare SPDX expression string
# (PEP 639). setuptools accepts that form only from 77.0.0 onward; older
# releases expect a `{ text = ... }` / `{ file = ... }` table and reject the
# metadata, so the floor has to be at least that high.
[build-system]
requires = ["setuptools>=77.0.3", "wheel"]
build-backend = "setuptools.build_meta"
# Core distribution metadata (PEP 621).
[project]
name = "web2json-agent"
version = "1.1.6"
description = "Web Structured Data Extraction Agent"
readme = "README.md"
requires-python = ">=3.10"
# SPDX license expression (PEP 639 string form).
license = "Apache-2.0"
authors = [
    { name = "YangGuoqiang", email = "1041206149@qq.com" },
]
keywords = [
    "web scraping",
    "html parser",
    "ai agent",
    "code generation",
    "langchain",
    "web automation",
    "data pipeline",
    "structured data",
]
classifiers = [
    "Development Status :: 4 - Beta",
    "Intended Audience :: Developers",
    "Programming Language :: Python :: 3",
    "Programming Language :: Python :: 3.10",
    "Programming Language :: Python :: 3.11",
    "Programming Language :: Python :: 3.12",
    "Programming Language :: Python :: 3.13",
    "Topic :: Software Development :: Code Generators",
    "Topic :: Internet :: WWW/HTTP :: Indexing/Search",
    "Topic :: Text Processing :: Markup :: HTML",
]
# Runtime requirements (PEP 508). Most entries are exact pins; numpy and
# scikit-learn only carry a lower bound.
dependencies = [
    "langchain==1.0.1",
    "langchain-core==1.0.5",
    "langchain-openai==1.0.3",
    "langchain-anthropic==1.1.0",
    "openai==2.8.1",
    "pydantic==2.10.3",
    "pydantic-settings==2.6.1",
    "python-dotenv==1.1.0",
    "loguru==0.7.3",
    "DrissionPage==4.1.1.2",
    "beautifulsoup4==4.12.3",
    "lxml==5.3.0",
    "requests==2.32.3",
    "numpy>=1.24.0",
    "scikit-learn>=1.3.0",
    # Apify SDK for Actor platform integration
    "apify==1.7.2",
    # Web API dependencies
    # fastapi 0.109.0 / python-multipart 0.0.6 are affected by the
    # Content-Type header ReDoS (CVE-2024-24762); 0.109.1 and 0.0.7 are the
    # first patched releases, so the pins are moved up by one patch level.
    "fastapi==0.109.1",
    "uvicorn[standard]==0.27.0",
    "python-multipart==0.0.7",
    "aiofiles==23.2.1",
]
# Extras. Install with `pip install "web2json-agent[dev]"` to get the
# test, formatting, lint and type-check tools listed here.
[project.optional-dependencies]
dev = [
    "pytest>=7.0.0",
    "pytest-cov>=4.0.0",
    "black>=23.0.0",
    "flake8>=6.0.0",
    "mypy>=1.0.0",
]
# Project links published with the package metadata. The last key is quoted
# because it contains a space, which a bare TOML key cannot.
[project.urls]
Homepage = "https://github.com/ccprocessor/web2json-agent"
Repository = "https://github.com/ccprocessor/web2json-agent.git"
"Bug Tracker" = "https://github.com/ccprocessor/web2json-agent/issues"
# Console entry point: installs a `web2json` command that calls `main` in the
# `web2json.cli` module.
[project.scripts]
web2json = "web2json.cli:main"
# Package discovery, rooted at the repository top level. Only the two
# `web2json*` families are packaged; the exclude patterns name the other
# top-level directories that must stay out of the distribution.
[tool.setuptools.packages.find]
where = ["."]
include = ["web2json*", "web2json_api*"]
exclude = [
    "tests*",
    "docs*",
    "examples*",
    "output*",
    "logs*",
    "input_html*",
    "input_url*",
    "evaluation*",
    "evaluationSet*",
    "swde_*",
    "web2json_ui*",
]
# Non-Python files to ship. The "*" key applies the patterns to every
# package rather than to one named package.
[tool.setuptools.package-data]
"*" = ["*.txt", "*.json", "*.yaml", "*.md"]
# Formatter settings. `py310` matches the `requires-python = ">=3.10"` floor
# declared under [project].
[tool.black]
line-length = 100
target-version = ["py310"]
# Static type-checking settings. Checks against the 3.10 language level,
# the same floor as `requires-python` under [project].
[tool.mypy]
python_version = "3.10"
# Warn when a function with a declared return type returns an `Any` value.
warn_return_any = true
# Warn about mypy config sections that end up matching nothing.
warn_unused_configs = true
# Functions without annotations are not reported as errors.
disallow_untyped_defs = false