Finding the Mean, Median, and Most Frequent Values
# -*- coding: utf-8 -*-
"""
Created on Sun Oct 22 19:30:20 2023
@author: Syed Kamran Bukhari
"""
import numpy as np
import pandas as pd
import matplotlib.pyplot as plt
# Compare three strategies for filling missing values in the first three
# columns of the data set: most frequent value, median, and mean.
from sklearn.impute import SimpleImputer

# Read the CSV file.
dataset = pd.read_csv('Assi_1_data.csv')

# Keep only strictly positive entries. Boolean-mask indexing on a DataFrame
# replaces every entry where the mask is False (zeros, negatives, and values
# that were already NaN) with NaN, so those are what get imputed below.
dataset = dataset[dataset > 0]

# Complete-case variant: drop every row that still contains a NaN.
dna = np.array(dataset.dropna())

# np.array() copies by default, so each strategy works on its own
# independent array and the in-place column assignments do not interfere.
data = np.array(dataset)
data1 = np.array(dataset)
data2 = np.array(dataset)

# Strategy 1: replace NaN in columns 0-2 with the most frequent column value.
Imputer = SimpleImputer(missing_values=np.nan, strategy='most_frequent')
data[:, 0:3] = Imputer.fit_transform(data[:, 0:3])
data = pd.DataFrame(data)

# Strategy 2: replace NaN in columns 0-2 with the column median.
Imputer = SimpleImputer(missing_values=np.nan, strategy='median')
data1[:, 0:3] = Imputer.fit_transform(data1[:, 0:3])
# Store the median result under its own name; assigning it to `data` here
# would discard the most-frequent result computed above.
data1 = pd.DataFrame(data1)

# Strategy 3: replace NaN in columns 0-2 with the column mean.
Imputer = SimpleImputer(missing_values=np.nan, strategy='mean')
data2[:, 0:3] = Imputer.fit_transform(data2[:, 0:3])
data2 = pd.DataFrame(data2)
Comments
Post a Comment