import numpy as np
import pandas as pd
from sklearn.impute import SimpleImputer, KNNImputer
# Small demonstration table: seven rows, three numeric columns, with
# np.nan marking the missing entries (two in 'age', two in 'income',
# one in 'score').
df = pd.DataFrame(
    data={
        'age': [25, 30, np.nan, 35, 28, np.nan, 40],
        'income': [5000, 8000, 6000, np.nan, 5500, 7000, np.nan],
        'score': [85, 90, 78, 92, np.nan, 88, 95],
    }
)
# Mean imputation: every NaN is replaced by the arithmetic mean of the
# observed (non-missing) values in the same column.
imputer_mean = SimpleImputer(strategy='mean')
df_mean = pd.DataFrame(
    imputer_mean.fit_transform(df),
    columns=df.columns,
    # fit_transform returns a bare ndarray; re-attach the original row
    # labels so the result stays aligned with df even for a non-default index.
    index=df.index,
)
# Median imputation: every NaN is replaced by the median of the observed
# values in the same column (less sensitive to outliers than the mean).
imputer_median = SimpleImputer(strategy='median')
df_median = pd.DataFrame(
    imputer_median.fit_transform(df),
    columns=df.columns,
    # fit_transform returns a bare ndarray; re-attach the original row
    # labels so the result stays aligned with df even for a non-default index.
    index=df.index,
)
# Mode imputation: every NaN is replaced by the most frequent observed
# value in the same column.
# NOTE: when several values tie for most frequent, SimpleImputer keeps the
# smallest one. Every observed value in df is unique, so here the fill
# value is effectively the column minimum.
imputer_mode = SimpleImputer(strategy='most_frequent')
df_mode = pd.DataFrame(
    imputer_mode.fit_transform(df),
    columns=df.columns,
    # fit_transform returns a bare ndarray; re-attach the original row
    # labels so the result stays aligned with df even for a non-default index.
    index=df.index,
)
# KNN imputation: every NaN is replaced by the average of that feature over
# the 3 nearest rows, where nearness is measured on the features both rows
# have observed.
# NOTE(review): distances are computed on the raw, unscaled columns, so
# 'income' (thousands) dominates 'age' and 'score' -- consider scaling first.
imputer_knn = KNNImputer(n_neighbors=3)
df_knn = pd.DataFrame(
    imputer_knn.fit_transform(df),
    columns=df.columns,
    # fit_transform returns a bare ndarray; re-attach the original row
    # labels so the result stays aligned with df even for a non-default index.
    index=df.index,
)