# pyproject.toml — repository forked from CocoRoF/Contextifier
# Build configuration: the package is built with Hatchling, which is both the
# only build-time requirement and the build backend entry point.
[build-system]
requires = ["hatchling"]
build-backend = "hatchling.build"
[project]
# Distribution identity.
name = "contextifier"
version = "0.2.2"
description = "Convert raw documents into AI-understandable context with intelligent text extraction, table detection, and semantic chunking"
readme = "README.md"
license = { text = "Apache-2.0" }

# Minimum supported interpreter; keep the "Programming Language" classifiers
# below in step with this floor.
requires-python = ">=3.12"

authors = [
    { name = "CocoRoF", email = "gkfua00@gmail.com" },
]
maintainers = [
    { name = "CocoRoF", email = "gkfua00@gmail.com" },
]

# Free-form search keywords for the package index.
keywords = [
    "document-processing",
    "pdf",
    "ocr",
    "text-extraction",
    "chunking",
    "ai",
    "llm",
    "langchain",
    "hwp",
    "docx",
    "xlsx",
]

# Trove classifiers.
classifiers = [
    "Development Status :: 4 - Beta",
    "Intended Audience :: Developers",
    "License :: OSI Approved :: Apache Software License",
    "Programming Language :: Python :: 3",
    "Programming Language :: Python :: 3.12",
    "Programming Language :: Python :: 3.13",
    "Programming Language :: Python :: 3.14",
    "Topic :: Software Development :: Libraries :: Python Modules",
    "Topic :: Text Processing",
    "Topic :: Scientific/Engineering :: Artificial Intelligence",
]

# Runtime requirements (PEP 508 strings).
# NOTE(review): every requirement is pinned to an exact version (`==`). That is
# reproducible, but for a published library it can make co-installation with
# other packages difficult — confirm exact pins are intended here.
dependencies = [
    # Data models, settings, and general utilities.
    # NOTE(review): pydantic-core is pinned separately from pydantic — confirm
    # the two pins are kept compatible whenever pydantic is bumped.
    "pydantic==2.12.5",
    "pydantic-core==2.41.5",
    "pydantic-settings==2.12.0",
    "python-dotenv==1.2.1",
    "python-multipart==0.0.20",
    "orjson==3.11.5",
    "psutil==7.0.0",
    "pandas==2.3.3",

    # LangChain / LangGraph stack.
    "langchain==1.2.3",
    "langchain-aws==1.2.0",
    "langchain-community==0.4.1",
    "langchain-core==1.2.6",
    "langchain-openai==1.1.7",
    "langchain-anthropic==1.3.1",
    "langchain-google-genai==4.1.3",
    "langchain-text-splitters==1.1.0",
    "langgraph==1.0.5",
    "langsmith==0.6.2",

    # Document and file-format handling (HTML, Office, PDF, HWP, images, OCR, RTF).
    "beautifulsoup4==4.14.3",
    "docx2pdf==0.1.8",
    "python-docx==1.2.0",
    "python-pptx==1.0.2",
    "pymupdf==1.26.5",
    "pdfplumber==0.11.5",
    "openpyxl==3.1.5",
    "xlrd==2.0.2",
    "olefile==0.47",
    "pyhwp==0.1b15",
    "chardet==5.2.0",
    "pi-heif==1.1.1",
    "pdfminer-six==20231228",
    "pdf2image==1.17.0",
    "pytesseract==0.3.13",
    "striprtf==0.0.29",

    # Caching helpers.
    "cachetools==6.2.4",
]
# Project links published with the package metadata; all of them point at the
# CocoRoF/Contextifier GitHub repository.
[project.urls]
Homepage = "https://github.com/CocoRoF/Contextifier"
Documentation = "https://github.com/CocoRoF/Contextifier#readme"
Repository = "https://github.com/CocoRoF/Contextifier.git"
Issues = "https://github.com/CocoRoF/Contextifier/issues"
Changelog = "https://github.com/CocoRoF/Contextifier/releases"
# Wheel target: ship the `contextifier` package directory.
[tool.hatch.build.targets.wheel]
packages = ["contextifier"]
# Source-distribution target. Hatch interprets these entries as Git-style glob
# patterns: a leading "/" anchors a pattern to the project root, while an
# unanchored pattern matches at any depth.
[tool.hatch.build.targets.sdist]
# Only these paths are considered for the sdist.
include = [
    "contextifier/",
    "README.md",
    "LICENSE",
    "pyproject.toml",
]
# Paths removed from the selection above.
exclude = [
    "/.git",
    "/.venv",
    # Unanchored on purpose: bytecode cache directories live next to every
    # package module, not just at the project root, so a root-anchored
    # "/__pycache__" would miss the ones inside contextifier/.
    "__pycache__",
    "*.pyc",
    # NOTE(review): these three are unanchored, so they also match same-named
    # directories nested inside contextifier/ — confirm that is intended.
    "test/",
    "temp/",
    "libs/",
]