|
23 | 23 | },
|
24 | 24 | {
|
25 | 25 | "cell_type": "code",
|
26 |
| - "execution_count": 1, |
| 26 | + "execution_count": null, |
27 | 27 | "metadata": {},
|
28 |
| - "outputs": [ |
29 |
| - { |
30 |
| - "name": "stdout", |
31 |
| - "output_type": "stream", |
32 |
| - "text": [ |
33 |
| - "Collecting datafog==3.2.0b20\n", |
34 |
| - " Downloading datafog-3.2.0b20.tar.gz (15 kB)\n", |
35 |
| - " Installing build dependencies ... \u001b[?25ldone\n", |
36 |
| - "\u001b[?25h Getting requirements to build wheel ... \u001b[?25ldone\n", |
37 |
| - "\u001b[?25h Preparing metadata (pyproject.toml) ... \u001b[?25ldone\n", |
38 |
| - "\u001b[?25hRequirement already satisfied: pandas in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from datafog==3.2.0b20) (2.0.3)\n", |
39 |
| - "Requirement already satisfied: Requests==2.31.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from datafog==3.2.0b20) (2.31.0)\n", |
40 |
| - "Requirement already satisfied: spacy==3.4.4 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from datafog==3.2.0b20) (3.4.4)\n", |
41 |
| - "Requirement already satisfied: en-spacy-pii-fast==0.0.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from datafog==3.2.0b20) (0.0.0)\n", |
42 |
| - "Requirement already satisfied: pyspark==3.4.1 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from datafog==3.2.0b20) (3.4.1)\n", |
43 |
| - "Requirement already satisfied: pydantic==1.10.8 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from datafog==3.2.0b20) (1.10.8)\n", |
44 |
| - "Requirement already satisfied: Pillow in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from datafog==3.2.0b20) (8.4.0)\n", |
45 |
| - "Requirement already satisfied: sentencepiece in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from datafog==3.2.0b20) (0.2.0)\n", |
46 |
| - "Requirement already satisfied: protobuf in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from datafog==3.2.0b20) (4.25.3)\n", |
47 |
| - "Requirement already satisfied: pytesseract in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from datafog==3.2.0b20) (0.3.10)\n", |
48 |
| - "Requirement already satisfied: aiohttp in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from datafog==3.2.0b20) (3.9.5)\n", |
49 |
| - "Requirement already satisfied: pytest-asyncio in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from datafog==3.2.0b20) (0.23.6)\n", |
50 |
| - "Requirement already satisfied: typing-extensions>=4.2.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from pydantic==1.10.8->datafog==3.2.0b20) (4.11.0)\n", |
51 |
| - "Requirement already satisfied: py4j==0.10.9.7 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from pyspark==3.4.1->datafog==3.2.0b20) (0.10.9.7)\n", |
52 |
| - "Requirement already satisfied: charset-normalizer<4,>=2 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from Requests==2.31.0->datafog==3.2.0b20) (2.0.12)\n", |
53 |
| - "Requirement already satisfied: idna<4,>=2.5 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from Requests==2.31.0->datafog==3.2.0b20) (3.3)\n", |
54 |
| - "Requirement already satisfied: urllib3<3,>=1.21.1 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from Requests==2.31.0->datafog==3.2.0b20) (1.26.7)\n", |
55 |
| - "Requirement already satisfied: certifi>=2017.4.17 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from Requests==2.31.0->datafog==3.2.0b20) (2021.10.8)\n", |
56 |
| - "Requirement already satisfied: spacy-legacy<3.1.0,>=3.0.10 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (3.0.12)\n", |
57 |
| - "Requirement already satisfied: spacy-loggers<2.0.0,>=1.0.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (1.0.5)\n", |
58 |
| - "Requirement already satisfied: murmurhash<1.1.0,>=0.28.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (1.0.10)\n", |
59 |
| - "Requirement already satisfied: cymem<2.1.0,>=2.0.2 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (2.0.8)\n", |
60 |
| - "Requirement already satisfied: preshed<3.1.0,>=3.0.2 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (3.0.9)\n", |
61 |
| - "Requirement already satisfied: thinc<8.2.0,>=8.1.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (8.1.12)\n", |
62 |
| - "Requirement already satisfied: wasabi<1.1.0,>=0.9.1 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (0.10.1)\n", |
63 |
| - "Requirement already satisfied: srsly<3.0.0,>=2.4.3 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (2.4.8)\n", |
64 |
| - "Requirement already satisfied: catalogue<2.1.0,>=2.0.6 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (2.0.10)\n", |
65 |
| - "Requirement already satisfied: typer<0.8.0,>=0.3.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (0.7.0)\n", |
66 |
| - "Requirement already satisfied: pathy>=0.3.5 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (0.11.0)\n", |
67 |
| - "Requirement already satisfied: smart-open<7.0.0,>=5.2.1 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (5.2.1)\n", |
68 |
| - "Requirement already satisfied: tqdm<5.0.0,>=4.38.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (4.66.4)\n", |
69 |
| - "Requirement already satisfied: numpy>=1.15.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (1.25.2)\n", |
70 |
| - "Requirement already satisfied: jinja2 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (3.1.3)\n", |
71 |
| - "Requirement already satisfied: setuptools in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (69.1.1)\n", |
72 |
| - "Requirement already satisfied: packaging>=20.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (23.2)\n", |
73 |
| - "Requirement already satisfied: langcodes<4.0.0,>=3.2.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from spacy==3.4.4->datafog==3.2.0b20) (3.3.0)\n", |
74 |
| - "Requirement already satisfied: aiosignal>=1.1.2 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from aiohttp->datafog==3.2.0b20) (1.3.1)\n", |
75 |
| - "Requirement already satisfied: attrs>=17.3.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from aiohttp->datafog==3.2.0b20) (22.2.0)\n", |
76 |
| - "Requirement already satisfied: frozenlist>=1.1.1 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from aiohttp->datafog==3.2.0b20) (1.3.3)\n", |
77 |
| - "Requirement already satisfied: multidict<7.0,>=4.5 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from aiohttp->datafog==3.2.0b20) (6.0.4)\n", |
78 |
| - "Requirement already satisfied: yarl<2.0,>=1.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from aiohttp->datafog==3.2.0b20) (1.8.2)\n", |
79 |
| - "Requirement already satisfied: python-dateutil>=2.8.2 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from pandas->datafog==3.2.0b20) (2.8.2)\n", |
80 |
| - "Requirement already satisfied: pytz>=2020.1 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from pandas->datafog==3.2.0b20) (2021.3)\n", |
81 |
| - "Requirement already satisfied: tzdata>=2022.1 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from pandas->datafog==3.2.0b20) (2024.1)\n", |
82 |
| - "Requirement already satisfied: pytest<9,>=7.0.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from pytest-asyncio->datafog==3.2.0b20) (7.4.4)\n", |
83 |
| - "Requirement already satisfied: pathlib-abc==0.1.1 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from pathy>=0.3.5->spacy==3.4.4->datafog==3.2.0b20) (0.1.1)\n", |
84 |
| - "Requirement already satisfied: iniconfig in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from pytest<9,>=7.0.0->pytest-asyncio->datafog==3.2.0b20) (2.0.0)\n", |
85 |
| - "Requirement already satisfied: pluggy<2.0,>=0.12 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from pytest<9,>=7.0.0->pytest-asyncio->datafog==3.2.0b20) (1.4.0)\n", |
86 |
| - "Requirement already satisfied: six>=1.5 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from python-dateutil>=2.8.2->pandas->datafog==3.2.0b20) (1.16.0)\n", |
87 |
| - "Requirement already satisfied: blis<0.8.0,>=0.7.8 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from thinc<8.2.0,>=8.1.0->spacy==3.4.4->datafog==3.2.0b20) (0.7.11)\n", |
88 |
| - "Requirement already satisfied: confection<1.0.0,>=0.0.1 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from thinc<8.2.0,>=8.1.0->spacy==3.4.4->datafog==3.2.0b20) (0.1.4)\n", |
89 |
| - "Requirement already satisfied: click<9.0.0,>=7.1.1 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from typer<0.8.0,>=0.3.0->spacy==3.4.4->datafog==3.2.0b20) (8.1.7)\n", |
90 |
| - "Requirement already satisfied: MarkupSafe>=2.0 in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (from jinja2->spacy==3.4.4->datafog==3.2.0b20) (2.1.5)\n", |
91 |
| - "Building wheels for collected packages: datafog\n", |
92 |
| - " Building wheel for datafog (pyproject.toml) ... \u001b[?25ldone\n", |
93 |
| - "\u001b[?25h Created wheel for datafog: filename=datafog-3.2.0b20-py3-none-any.whl size=16437 sha256=85772be41af732abed8ff3306701762a3d9df24129bf2a6392ea7accf0f99467\n", |
94 |
| - " Stored in directory: /Users/sidmohan/Library/Caches/pip/wheels/e3/1d/bb/ac5c7ef27ba420864a19f0c53491bd68324cbb71082b15b3e4\n", |
95 |
| - "Successfully built datafog\n", |
96 |
| - "Installing collected packages: datafog\n", |
97 |
| - " Attempting uninstall: datafog\n", |
98 |
| - " Found existing installation: datafog 3.2.0b12\n", |
99 |
| - " Uninstalling datafog-3.2.0b12:\n", |
100 |
| - " Successfully uninstalled datafog-3.2.0b12\n", |
101 |
| - "Successfully installed datafog-3.2.0b20\n", |
102 |
| - "\n", |
103 |
| - "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m A new release of pip is available: \u001b[0m\u001b[31;49m23.2.1\u001b[0m\u001b[39;49m -> \u001b[0m\u001b[32;49m24.0\u001b[0m\n", |
104 |
| - "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m To update, run: \u001b[0m\u001b[32;49mpip install --upgrade pip\u001b[0m\n" |
105 |
| - ] |
106 |
| - } |
107 |
| - ], |
| 28 | + "outputs": [], |
108 | 29 | "source": [
|
109 | 30 | "!pip install \"datafog==3.2.0\""
|
110 | 31 | ]
|
|
118 | 39 | },
|
119 | 40 | {
|
120 | 41 | "cell_type": "code",
|
121 |
| - "execution_count": 2, |
| 42 | + "execution_count": null, |
122 | 43 | "metadata": {},
|
123 |
| - "outputs": [ |
124 |
| - { |
125 |
| - "name": "stdout", |
126 |
| - "output_type": "stream", |
127 |
| - "text": [ |
128 |
| - "The operation couldn’t be completed. Unable to locate a Java Runtime that supports apt.\n", |
129 |
| - "Please visit http://www.java.com for information on installing Java.\n", |
130 |
| - "\n", |
131 |
| - "The operation couldn’t be completed. Unable to locate a Java Runtime that supports apt.\n", |
132 |
| - "Please visit http://www.java.com for information on installing Java.\n", |
133 |
| - "\n" |
134 |
| - ] |
135 |
| - } |
136 |
| - ], |
| 44 | + "outputs": [], |
137 | 45 | "source": [
|
138 | 46 | "! apt install tesseract-ocr\n",
|
139 | 47 | "! apt install libtesseract-dev"
|
140 | 48 | ]
|
141 | 49 | },
|
142 | 50 | {
|
143 | 51 | "cell_type": "code",
|
144 |
| - "execution_count": 3, |
| 52 | + "execution_count": null, |
145 | 53 | "metadata": {},
|
146 |
| - "outputs": [ |
147 |
| - { |
148 |
| - "name": "stdout", |
149 |
| - "output_type": "stream", |
150 |
| - "text": [ |
151 |
| - "Requirement already satisfied: nest_asyncio in /Users/sidmohan/.pyenv/versions/3.11.7/envs/2.2.0b1/lib/python3.11/site-packages (1.6.0)\n", |
152 |
| - "\n", |
153 |
| - "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m A new release of pip is available: \u001b[0m\u001b[31;49m23.2.1\u001b[0m\u001b[39;49m -> \u001b[0m\u001b[32;49m24.0\u001b[0m\n", |
154 |
| - "\u001b[1m[\u001b[0m\u001b[34;49mnotice\u001b[0m\u001b[1;39;49m]\u001b[0m\u001b[39;49m To update, run: \u001b[0m\u001b[32;49mpip install --upgrade pip\u001b[0m\n" |
155 |
| - ] |
156 |
| - } |
157 |
| - ], |
| 54 | + "outputs": [], |
158 | 55 | "source": [
|
159 | 56 | "!pip install nest_asyncio"
|
160 | 57 | ]
|
|
0 commit comments