|
23 | 23 | }, |
24 | 24 | { |
25 | 25 | "cell_type": "code", |
26 | | - "execution_count": 1, |
| 26 | + "execution_count": null, |
27 | 27 | "metadata": {}, |
28 | | - "outputs": [ |
29 | | - { |
30 | | - "name": "stdout", |
31 | | - "output_type": "stream", |
32 | | - "text": [ |
33 | | - "Collecting datafog==3.2.0b20\n", |
34 | | - " Downloading datafog-3.2.0b20.tar.gz (15 kB)\n", |
35 | | - " Installing build dependencies ... \u001b[?25ldone\n", |
36 | | - "\u001b[?25h Getting requirements to build wheel ... \u001b[?25ldone\n", |
37 | | - "\u001b[?25h Preparing metadata (pyproject.toml) ... \u001b[?25ldone\n", |
38 | | - "\u001b[?25hRequirement already satisfied: pandas in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from datafog==3.2.0b20) (2.0.3)\n", |
39 | | - "Requirement already satisfied: Requests==2.31.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from datafog==3.2.0b20) (2.31.0)\n", |
40 | | - "Requirement already satisfied: spacy==3.4.4 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from datafog==3.2.0b20) (3.4.4)\n", |
41 | | - "Requirement already satisfied: en-spacy-pii-fast==0.0.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from datafog==3.2.0b20) (0.0.0)\n", |
42 | | - "Requirement already satisfied: pyspark==3.4.1 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from datafog==3.2.0b20) (3.4.1)\n", |
43 | | - "Requirement already satisfied: pydantic==1.10.8 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from datafog==3.2.0b20) (1.10.8)\n", |
44 | | - "Requirement already satisfied: Pillow in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from datafog==3.2.0b20) (8.4.0)\n", |
45 | | - "Requirement already satisfied: sentencepiece in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from datafog==3.2.0b20) (0.2.0)\n", |
46 | | - "Requirement already satisfied: protobuf in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from datafog==3.2.0b20) (4.25.3)\n", |
47 | | - "Requirement already satisfied: pytesseract in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from datafog==3.2.0b20) (0.3.10)\n", |
48 | | - "Requirement already satisfied: aiohttp in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from datafog==3.2.0b20) (3.9.5)\n", |
49 | | - "Requirement already satisfied: pytest-asyncio in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from datafog==3.2.0b20) (0.23.6)\n", |
50 | | - "Requirement already satisfied: typing-extensions>=4.2.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from pydantic==1.10.8->datafog==3.2.0b20) (4.11.0)\n", |
51 | | - "Requirement already satisfied: py4j==0.10.9.7 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from pyspark==3.4.1->datafog==3.2.0b20) (0.10.9.7)\n", |
52 | | - "Requirement already satisfied: charset-normalizer<4,>=2 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from Requests==2.31.0->datafog==3.2.0b20) (2.0.12)\n", |
53 | | - "Requirement already satisfied: idna<4,>=2.5 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from Requests==2.31.0->datafog==3.2.0b20) (3.3)\n", |
54 | | - "Requirement already satisfied: urllib3<3,>=1.21.1 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from Requests==2.31.0->datafog==3.2.0b20) (1.26.7)\n", |
55 | | - "Requirement already satisfied: certifi>=2017.4.17 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from Requests==2.31.0->datafog==3.2.0b20) (2021.10.8)\n", |
56 | | - "Requirement already satisfied: spacy-legacy<3.1.0,>=3.0.10 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (3.0.12)\n", |
57 | | - "Requirement already satisfied: spacy-loggers<2.0.0,>=1.0.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (1.0.5)\n", |
58 | | - "Requirement already satisfied: murmurhash<1.1.0,>=0.28.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (1.0.10)\n", |
59 | | - "Requirement already satisfied: cymem<2.1.0,>=2.0.2 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (2.0.8)\n", |
60 | | - "Requirement already satisfied: preshed<3.1.0,>=3.0.2 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (3.0.9)\n", |
61 | | - "Requirement already satisfied: thinc<8.2.0,>=8.1.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (8.1.12)\n", |
62 | | - "Requirement already satisfied: wasabi<1.1.0,>=0.9.1 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (0.10.1)\n", |
63 | | - "Requirement already satisfied: srsly<3.0.0,>=2.4.3 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (2.4.8)\n", |
64 | | - "Requirement already satisfied: catalogue<2.1.0,>=2.0.6 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (2.0.10)\n", |
65 | | - "Requirement already satisfied: typer<0.8.0,>=0.3.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (0.7.0)\n", |
66 | | - "Requirement already satisfied: pathy>=0.3.5 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (0.11.0)\n", |
67 | | - "Requirement already satisfied: smart-open<7.0.0,>=5.2.1 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (5.2.1)\n", |
68 | | - "Requirement already satisfied: tqdm<5.0.0,>=4.38.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (4.66.4)\n", |
69 | | - "Requirement already satisfied: numpy>=1.15.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (1.25.2)\n", |
70 | | - "Requirement already satisfied: jinja2 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (3.1.3)\n", |
71 | | - "Requirement already satisfied: setuptools in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (69.1.1)\n", |
72 | | - "Requirement already satisfied: packaging>=20.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (23.2)\n", |
73 | | - "Requirement already satisfied: langcodes<4.0.0,>=3.2.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (3.3.0)\n", |
74 | | - "Requirement already satisfied: aiosignal>=1.1.2 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from aiohttp->datafog==3.2.0b20) (1.3.1)\n", |
75 | | - "Requirement already satisfied: attrs>=17.3.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from aiohttp->datafog==3.2.0b20) (22.2.0)\n", |
76 | | - "Requirement already satisfied: frozenlist>=1.1.1 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from aiohttp->datafog==3.2.0b20) (1.3.3)\n", |
77 | | - "Requirement already satisfied: multidict<7.0,>=4.5 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from aiohttp->datafog==3.2.0b20) (6.0.4)\n", |
78 | | - "Requirement already satisfied: yarl<2.0,>=1.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from aiohttp->datafog==3.2.0b20) (1.8.2)\n", |
79 | | - "Requirement already satisfied: python-dateutil>=2.8.2 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from pandas->datafog==3.2.0b20) (2.8.2)\n", |
80 | | - "Requirement already satisfied: pytz>=2020.1 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from pandas->datafog==3.2.0b20) (2021.3)\n", |
81 | | - "Requirement already satisfied: tzdata>=2022.1 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from pandas->datafog==3.2.0b20) (2024.1)\n", |
82 | | - "Requirement already satisfied: pytest<9,>=7.0.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from pytest-asyncio->datafog==3.2.0b20) (7.4.4)\n", |
83 | | - "Requirement already satisfied: pathlib-abc==0.1.1 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from pathy>=0.3.5->spacy==3.4.4->datafog==3.2.0b20) (0.1.1)\n", |
84 | | - "Requirement already satisfied: iniconfig in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from pytest<9,>=7.0.0->pytest-asyncio->datafog==3.2.0b20) (2.0.0)\n", |
85 | | - "Requirement already satisfied: pluggy<2.0,>=0.12 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from pytest<9,>=7.0.0->pytest-asyncio->datafog==3.2.0b20) (1.4.0)\n", |
86 | | - "Requirement already satisfied: six>=1.5 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from python-dateutil>=2.8.2->pandas->datafog==3.2.0b20) (1.16.0)\n", |
87 | | - "Requirement already satisfied: blis<0.8.0,>=0.7.8 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from thinc<8.2.0,>=8.1.0->spacy==3.4.4->datafog==3.2.0b20) (0.7.11)\n", |
88 | | - "Requirement already satisfied: confection<1.0.0,>=0.0.1 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from thinc<8.2.0,>=8.1.0->spacy==3.4.4->datafog==3.2.0b20) (0.1.4)\n", |
89 | | - "Requirement already satisfied: click<9.0.0,>=7.1.1 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from typer<0.8.0,>=0.3.0->spacy==3.4.4->datafog==3.2.0b20) (8.1.7)\n", |
90 | | - "Requirement already satisfied: MarkupSafe>=2.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from jinja2->spacy==3.4.4->datafog==3.2.0b20) (2.1.5)\n", |
91 | | - "Building wheels for collected packages: datafog\n", |
92 | | - " Building wheel for datafog (pyproject.toml) ... \u001b[?25ldone\n", |
93 | | - "\u001b[?25h Created wheel for datafog: filename=datafog-3.2.0b20-py3-none-any.whl size=16437 sha256=85772be41af732abed8ff3306701762a3d9df24129bf2a6392ea7accf0f99467\n", |
94 | | - " Stored in directory: /Users/sidmohan/Library/Caches/pip/wheels/e3/1d/bb/ac5c7ef27ba420864a19f0c53491bd68324cbb71082b15b3e4\n", |
95 | | - "Successfully built datafog\n", |
96 | | - "Installing collected packages: datafog\n", |
97 | | - " Attempting uninstall: datafog\n", |
98 | | - " Found existing installation: datafog 3.2.0b12\n", |
99 | | - " Uninstalling datafog-3.2.0b12:\n", |
100 | | - " Successfully uninstalled datafog-3.2.0b12\n", |
101 | | - "Successfully installed datafog-3.2.0b20\n", |
102 | | - "\n", |
103 | | - "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m A new release of pip is available: \u001b[0m\u001b[31;49m23.2.1\u001b[0m\u001b[39;49m -> \u001b[0m\u001b[32;49m24.0\u001b[0m\n", |
104 | | - "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m To update, run: \u001b[0m\u001b[32;49mpip install --upgrade pip\u001b[0m\n" |
105 | | - ] |
106 | | - } |
107 | | - ], |
| 28 | + "outputs": [], |
108 | 29 | "source": [ |
109 | 30 | "!pip install \"datafog==3.2.0\"" |
110 | 31 | ] |
|
118 | 39 | }, |
119 | 40 | { |
120 | 41 | "cell_type": "code", |
121 | | - "execution_count": 2, |
| 42 | + "execution_count": null, |
122 | 43 | "metadata": {}, |
123 | | - "outputs": [ |
124 | | - { |
125 | | - "name": "stdout", |
126 | | - "output_type": "stream", |
127 | | - "text": [ |
128 | | - "The operation couldn’t be completed. Unable to locate a Java Runtime that supports apt.\n", |
129 | | - "Please visit http://www.java.com for information on installing Java.\n", |
130 | | - "\n", |
131 | | - "The operation couldn’t be completed. Unable to locate a Java Runtime that supports apt.\n", |
132 | | - "Please visit http://www.java.com for information on installing Java.\n", |
133 | | - "\n" |
134 | | - ] |
135 | | - } |
136 | | - ], |
| 44 | + "outputs": [], |
137 | 45 | "source": [ |
138 | 46 | "! apt install tesseract-ocr\n", |
139 | 47 | "! apt install libtesseract-dev" |
140 | 48 | ] |
141 | 49 | }, |
142 | 50 | { |
143 | 51 | "cell_type": "code", |
144 | | - "execution_count": 3, |
| 52 | + "execution_count": null, |
145 | 53 | "metadata": {}, |
146 | | - "outputs": [ |
147 | | - { |
148 | | - "name": "stdout", |
149 | | - "output_type": "stream", |
150 | | - "text": [ |
151 | | - "Requirement already satisfied: nest_asyncio in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (1.6.0)\n", |
152 | | - "\n", |
153 | | - "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m A new release of pip is available: \u001b[0m\u001b[31;49m23.2.1\u001b[0m\u001b[39;49m -> \u001b[0m\u001b[32;49m24.0\u001b[0m\n", |
154 | | - "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m To update, run: \u001b[0m\u001b[32;49mpip install --upgrade pip\u001b[0m\n" |
155 | | - ] |
156 | | - } |
157 | | - ], |
| 54 | + "outputs": [], |
158 | 55 | "source": [ |
159 | 56 | "!pip install nest_asyncio" |
160 | 57 | ] |
|
0 commit comments