KaiquanMah committed on
Commit
540d32a
·
verified ·
1 Parent(s): d8bbbd8

Update DSIP/preprocess.py

Browse files
Files changed (1) hide show
  1. DSIP/preprocess.py +3 -0
DSIP/preprocess.py CHANGED
@@ -11,6 +11,9 @@ def parse(csv_path):
11
  # Step 1: Load the dataset
12
  # file_path = "dataset.csv" # Path to the original dataset
13
  data = pd.read_csv(csv_path)
 
 
 
14
 
15
  # Step 2: Define the feature columns (X) and target column (y)
16
  X = data[["name", "attendance percentage", "average sleep time", "average screen time"]] # Feature columns
 
11
  # Step 1: Load the dataset
12
  # file_path = "dataset.csv" # Path to the original dataset
13
  data = pd.read_csv(csv_path)
14
+
15
+ # Drop dupes
16
+ data = data.drop_duplicates()
17
 
18
  # Step 2: Define the feature columns (X) and target column (y)
19
  X = data[["name", "attendance percentage", "average sleep time", "average screen time"]] # Feature columns