Spaces:
Running
Running
Update DSIP/preprocess.py
Browse files
- DSIP/preprocess.py +3 -0
DSIP/preprocess.py
CHANGED
@@ -11,6 +11,9 @@ def parse(csv_path):
 # Step 1: Load the dataset
 # file_path = "dataset.csv" # Path to the original dataset
 data = pd.read_csv(csv_path)
+
+# Drop dupes
+data = data.drop_duplicates()
 
 # Step 2: Define the feature columns (X) and target column (y)
 X = data[["name", "attendance percentage", "average sleep time", "average screen time"]] # Feature columns