Spaces:
Running
Running
Update DSIP/preprocess.py
Browse files
- DSIP/preprocess.py +3 -0
DSIP/preprocess.py
CHANGED
@@ -11,6 +11,9 @@ def parse(csv_path):
|
|
11 |
# Step 1: Load the dataset
|
12 |
# file_path = "dataset.csv" # Path to the original dataset
|
13 |
data = pd.read_csv(csv_path)
|
|
|
|
|
|
|
14 |
|
15 |
# Step 2: Define the feature columns (X) and target column (y)
|
16 |
X = data[["name", "attendance percentage", "average sleep time", "average screen time"]] # Feature columns
|
|
|
11 |
# Step 1: Load the dataset
|
12 |
# file_path = "dataset.csv" # Path to the original dataset
|
13 |
data = pd.read_csv(csv_path)
|
14 |
+
|
15 |
+
# Drop dupes
|
16 |
+
data = data.drop_duplicates()
|
17 |
|
18 |
# Step 2: Define the feature columns (X) and target column (y)
|
19 |
X = data[["name", "attendance percentage", "average sleep time", "average screen time"]] # Feature columns
|