PYTHON PROGRAM RELATED TO INFORMATION RETRIEVAL AND WEB SEARCH

profileNANI1012
DataPreprocessing.py

# importing libraries import pandas import scipy import numpy from sklearn.preprocessing import MinMaxScaler # data set link url = "https://archive.ics.uci.edu/ml/machine-learning-databases/pima-indians-diabetes/pima-indians-diabetes.data" # data parameters names = ['preg', 'plas', 'pres', 'skin', 'test', 'mass', 'pedi', 'age', 'class'] # preparating of dataframe using the data at given link and defined columns list dataframe = pandas.read_csv(url, names = names) array = dataframe.values # separate array into input and output components X = array[:,0:8] Y = array[:,8] # initialising the MinMaxScaler scaler = MinMaxScaler(feature_range=(0, 1)) # learning the statistical parameters for each of the data and transforming rescaledX = scaler.fit_transform(X) # summarize transformed data numpy.set_printoptions(precision=3) print(rescaledX[0:5,:])