Updated the commits for sanity checks.

This commit is contained in:
Batuhan Berk Başoğlu 2025-09-17 21:06:20 -04:00
parent 2a7c9cd28b
commit 5702c3c1b8
Signed by: batuhan-basoglu
SSH key fingerprint: SHA256:kEsnuHX+qbwhxSAXPUQ4ox535wFHu/hIRaa53FzxRpo
4 changed files with 157 additions and 13 deletions

View file

@@ -43,7 +43,7 @@ if __name__ == "__main__":
for col in num_cols:
df = df[df[col] >= 0]
-# sanity checks for data validity
+# sanity checks for data validity - max tumor sizes possible
df = df[(df['radius_mean'] > 0) & (df['radius_mean'] <= 30)]
df = df[(df['radius_worst'] > 0) & (df['radius_worst'] <= 30)]
df = df[(df['texture_mean'] >= 0) & (df['texture_mean'] <= 100)]