Skip to content

Commit 2065783

Browse files
committed
chore: refactor data storage folder structure
1 parent 25784b8 commit 2065783

File tree

2 files changed

+7
-8
lines changed

2 files changed

+7
-8
lines changed

.gitignore

Lines changed: 1 addition & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,4 @@
1-
jupyter/house_prices
2-
jupyter/support_tickets
1+
jupyter/data/
32

43

54
# application data

jupyter/k-means-it-support-tickets.ipynb

Lines changed: 6 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -87,7 +87,7 @@
8787
},
8888
{
8989
"cell_type": "code",
90-
"execution_count": 37,
90+
"execution_count": 40,
9191
"metadata": {},
9292
"outputs": [
9393
{
@@ -102,10 +102,10 @@
102102
"source": [
103103
"# Download the IT Support Tickets dataset from Kaggle (only if not already downloaded)\n",
104104
"# Check if the support_tickets directory already exists\n",
105-
"if not os.path.exists('support_tickets'):\n",
105+
"if not os.path.exists('data/support_tickets'):\n",
106106
" print(\"\\nDownloading dataset...\")\n",
107107
" !kaggle datasets download -d tobiasbueck/multilingual-customer-support-tickets\n",
108-
" !unzip -q multilingual-customer-support-tickets.zip -d support_tickets\n",
108+
" !unzip -q multilingual-customer-support-tickets.zip -d data/support_tickets\n",
109109
" print(\"Dataset downloaded and extracted successfully!\")\n",
110110
"else:\n",
111111
" print(\"\\nDataset already exists in 'support_tickets' directory. Skipping download.\")"
@@ -138,7 +138,7 @@
138138
},
139139
{
140140
"cell_type": "code",
141-
"execution_count": null,
141+
"execution_count": 41,
142142
"metadata": {},
143143
"outputs": [
144144
{
@@ -325,14 +325,14 @@
325325
"4 Feedback Tech Support NaN NaN NaN NaN "
326326
]
327327
},
328-
"execution_count": 27,
328+
"execution_count": 41,
329329
"metadata": {},
330330
"output_type": "execute_result"
331331
}
332332
],
333333
"source": [
334334
"# Load the IT Support Tickets dataset from local file\n",
335-
"df = pd.read_csv('support_tickets/aa_dataset-tickets-multi-lang-5-2-50-version.csv')\n",
335+
"df = pd.read_csv('data/support_tickets/aa_dataset-tickets-multi-lang-5-2-50-version.csv')\n",
336336
"print(f\"Dataset shape: {df.shape}\")\n",
337337
"print(f\"Columns: {df.columns.tolist()}\")\n",
338338
"df.head()"

0 commit comments

Comments
 (0)