- Added venv instruction + requirements.txt

- Added data folder structure with .gitkeep
- Added .gitignore
- Added load.py to load IMDB dataset and preview with D-Tale
This commit is contained in:
prabhaavp
2026-02-03 22:21:41 -05:00
parent c18b412867
commit 2d2ee64c0e
7 changed files with 279 additions and 1 deletions

12
scripts/load.py Normal file
View File

@@ -0,0 +1,12 @@
import pandas as pd
import dtale
# Preview script: read the first row of the IMDB title.basics TSV, print it,
# and serve it in D-Tale.
#
# NOTE: the path is relative to the current working directory, so it only
# resolves when the script is launched from inside the scripts/ folder.
file_path = '../data/raw/imdb_datasets/title.basics.tsv'

# Print wide frames in full: show every column and keep rows on one line.
pd.set_option('display.max_columns', None)
pd.set_option('display.width', 1000)

# nrows=1 reads only the first data row, so this is a quick look at the
# columns rather than a load of the whole file.
df = pd.read_csv(file_path, sep='\t', nrows=1)
print(df)

# subprocess=False runs the D-Tale server in the foreground, so show() does
# not return until the server is stopped. Ask show() to open the browser
# during startup; a separate d.open_browser() call placed after show() would
# only execute once the server had already shut down.
d = dtale.show(df, subprocess=False, open_browser=True)