{
 "cells": [
  {
   "cell_type": "markdown",
   "id": "8f2bf560",
   "metadata": {},
   "source": [
    "# Data Exploration\n",
    "Load the U.S. Accidents dataset, inspect the Description field, and validate the text filtering logic."
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "id": "811a068e",
   "metadata": {},
   "outputs": [],
   "source": [
    "from pathlib import Path\n",
    "\n",
    "import pandas as pd\n",
    "\n",
    "# Location of the raw Kaggle CSV, relative to the notebook's working directory.\n",
    "path = Path('../data/raw/US_Accidents_March23.csv')\n",
    "\n",
    "if path.exists():\n",
    "    # low_memory=False makes pandas infer each column's dtype from the whole file\n",
    "    # instead of chunk by chunk, which avoids mixed-type columns.\n",
    "    df = pd.read_csv(path, low_memory=False)\n",
    "    # display() is provided by the IPython kernel; it renders the frame as a rich\n",
    "    # table instead of the plain-text dump that print() produces.\n",
    "    display(df[['Description']].head())\n",
    "    # Summary statistics of the Description length, in characters.\n",
    "    display(df['Description'].str.len().describe())\n",
    "else:\n",
    "    # The dataset is not shipped with the repository; tell the reader where to put it\n",
    "    # instead of failing with a traceback.\n",
    "    print('Place the Kaggle CSV under data/raw/ before running this notebook.')"
   ]
  }
 ],
 "metadata": {},
 "nbformat": 4,
 "nbformat_minor": 5
}