0% found this document useful (0 votes)

37 views7 pages

Normalization Dataset

Normalization Dataset in Deep Learning

Uploaded by

mohitdubey42551

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

37 views7 pages

Normalization Dataset

Normalization Dataset in Deep Learning

Uploaded by

mohitdubey42551

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as PDF, TXT or read online on Scribd

You are on page 1/ 7

from sklearn import preprocessing

import numpy as np

# Scale a small sample vector to unit Euclidean (L2) length.
x_array = np.array([1000, 50, 71, 5006, 80])
# normalize() operates row-wise on 2-D input, so present the vector as one row.
normalized_arr = preprocessing.normalize(x_array.reshape(1, -1))
print(normalized_arr)

[[0.19583773 0.00979189 0.01390448 0.98036366 0.01566702]]

import numpy as np
import pandas as pd
from sklearn import preprocessing

# Load the California housing data from a local CSV file into a DataFrame.

california_housing = pd.read_csv("housing.csv")

# Preview the first five rows. (A DataFrame read from CSV carries no DESCR
# attribute, so there is no bundled dataset description to print here.)

california_housing.head()

longitude latitude housing_median_age total_rooms

total_bedrooms \
0 -122.23 37.88 41.0 880.0
129.0
1 -122.22 37.86 21.0 7099.0
1106.0
2 -122.24 37.85 52.0 1467.0
190.0
3 -122.25 37.85 52.0 1274.0
235.0
4 -122.25 37.85 52.0 1627.0
280.0

population households median_income median_house_value

ocean_proximity
0 322.0 126.0 8.3252 452600.0
NEAR BAY
1 2401.0 1138.0 8.3014 358500.0
NEAR BAY
2 496.0 177.0 7.2574 352100.0
NEAR BAY
3 558.0 219.0 5.6431 341300.0
NEAR BAY
4 565.0 259.0 3.8462 342200.0
NEAR BAY

# Extract the housing_median_age column as a standalone NumPy array.
x_array = np.array(california_housing['housing_median_age'])
print("HouseAge array: ",x_array)

HouseAge array: [41. 21. 52. ... 17. 18. 16.]

# Wrapping x_array in a list makes it a single row, so the whole column is
# rescaled as one vector (normalize defaults to unit L2 norm per row).
normalized_arr = preprocessing.normalize([x_array])
print("Normalized HouseAge array: ",normalized_arr)

Normalized HouseAge array: [[0.00912272 0.00467261 0.01157028 ...

0.00378259 0.0040051 0.00356009]]

d = preprocessing.normalize(california_housing)
scaled_df = pd.DataFrame(d, columns=california_housing.columns)
print(scaled_df)
# NOTE: the normalize() call on the first line raises ValueError because the
# frame still contains the text column ocean_proximity ('NEAR BAY', ...);
# the two statements after it never execute.

----------------------------------------------------------------------
-----
ValueError Traceback (most recent call
last)
Cell In[8], line 1
----> 1 d = preprocessing.normalize(california_housing)
2 scaled_df = pd.DataFrame(d,
columns=california_housing.columns)
3 print(scaled_df)

File ~\AppData\Local\Programs\Python\Python310\lib\site-packages\
sklearn\preprocessing\_data.py:1817, in normalize(X, norm, axis, copy,
return_norm)
1814 else:
1815 raise ValueError("'%d' is not a supported axis" % axis)
-> 1817 X = check_array(
1818 X,
1819 accept_sparse=sparse_format,
1820 copy=copy,
1821 estimator="the normalize function",
1822 dtype=FLOAT_DTYPES,
1823 )
1824 if axis == 0:
1825 X = X.T

File ~\AppData\Local\Programs\Python\Python310\lib\site-packages\
sklearn\utils\validation.py:877, in check_array(array, accept_sparse,
accept_large_sparse, dtype, order, copy, force_all_finite, ensure_2d,
allow_nd, ensure_min_samples, ensure_min_features, estimator,
input_name)
875 array = xp.astype(array, dtype, copy=False)
876 else:
--> 877 array = _asarray_with_order(array, order=order,
dtype=dtype, xp=xp)
878 except ComplexWarning as complex_warning:
879 raise ValueError(
880 "Complex data not supported\n{}\n".format(array)
881 ) from complex_warning

File ~\AppData\Local\Programs\Python\Python310\lib\site-packages\
sklearn\utils\_array_api.py:185, in _asarray_with_order(array, dtype,
order, copy, xp)
182 xp, _ = get_namespace(array)
183 if xp.__name__ in {"numpy", "numpy.array_api"}:
184 # Use NumPy API to support order
--> 185 array = numpy.asarray(array, order=order, dtype=dtype)
186 return xp.asarray(array, copy=copy)
187 else:

File ~\AppData\Local\Programs\Python\Python310\lib\site-packages\
pandas\core\generic.py:2070, in NDFrame.__array__(self, dtype)
2069 def __array__(self, dtype: npt.DTypeLike | None = None) ->
np.ndarray:
-> 2070 return np.asarray(self._values, dtype=dtype)

ValueError: could not convert string to float: 'NEAR BAY'

from sklearn import preprocessing

import pandas as pd

# Keep only the numeric columns for scaling. Selecting by dtype, rather than
# slicing off the last column by position, still works if the column order
# changes or additional text columns are present.
data = california_housing.select_dtypes(include="number")

data.head()

longitude latitude housing_median_age total_rooms

total_bedrooms \
0 -122.23 37.88 41.0 880.0
129.0
1 -122.22 37.86 21.0 7099.0
1106.0
2 -122.24 37.85 52.0 1467.0
190.0
3 -122.25 37.85 52.0 1274.0
235.0
4 -122.25 37.85 52.0 1627.0
280.0

population households median_income median_house_value

0 322.0 126.0 8.3252 452600.0
1 2401.0 1138.0 8.3014 358500.0
2 496.0 177.0 7.2574 352100.0
3 558.0 219.0 5.6431 341300.0
4 565.0 259.0 3.8462 342200.0

# Min-max scale each column independently, then rebuild a labelled DataFrame
# from the NumPy array the scaler returns.
scaler = preprocessing.MinMaxScaler()
scaler.fit(data)
d = scaler.transform(data)
scaled_df = pd.DataFrame(data=d, columns=data.columns)
print(scaled_df)
longitude latitude housing_median_age total_rooms
total_bedrooms \
0 0.211155 0.567481 0.784314 0.022331
0.019863
1 0.212151 0.565356 0.392157 0.180503
0.171477
2 0.210159 0.564293 1.000000 0.037260
0.029330
3 0.209163 0.564293 1.000000 0.032352
0.036313
4 0.209163 0.564293 1.000000 0.041330
0.043296
... ... ... ... ...
...
20635 0.324701 0.737513 0.470588 0.042296
0.057883
20636 0.312749 0.738576 0.333333 0.017676
0.023122
20637 0.311753 0.732200 0.313725 0.057277
0.075109
20638 0.301793 0.732200 0.333333 0.047256
0.063315
20639 0.309761 0.725824 0.294118 0.070782
0.095438

population households median_income median_house_value

0 0.008941 0.020556 0.539668 0.902266
1 0.067210 0.186976 0.538027 0.708247
2 0.013818 0.028943 0.466028 0.695051
3 0.015555 0.035849 0.354699 0.672783
4 0.015752 0.042427 0.230776 0.674638
... ... ... ... ...
20635 0.023599 0.054103 0.073130 0.130105
20636 0.009894 0.018582 0.141853 0.128043
20637 0.028140 0.071041 0.082764 0.159383
20638 0.020684 0.057227 0.094295 0.143713
20639 0.038790 0.086992 0.130253 0.153403

[20640 rows x 9 columns]

# Show dtypes and non-null counts for the numeric subset.
data.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 20640 entries, 0 to 20639
Data columns (total 9 columns):
# Column Non-Null Count Dtype
--- ------ -------------- -----
0 longitude 20640 non-null float64
1 latitude 20640 non-null float64
2 housing_median_age 20640 non-null float64
3 total_rooms 20640 non-null float64
4 total_bedrooms 20433 non-null float64
5 population 20640 non-null float64
6 households 20640 non-null float64
7 median_income 20640 non-null float64
8 median_house_value 20640 non-null float64
dtypes: float64(9)
memory usage: 1.4 MB

# Show dtypes and non-null counts for the full frame, text column included.
california_housing.info()

<class 'pandas.core.frame.DataFrame'>
RangeIndex: 20640 entries, 0 to 20639
Data columns (total 10 columns):
# Column Non-Null Count Dtype
--- ------ -------------- -----
0 longitude 20640 non-null float64
1 latitude 20640 non-null float64
2 housing_median_age 20640 non-null float64
3 total_rooms 20640 non-null float64
4 total_bedrooms 20433 non-null float64
5 population 20640 non-null float64
6 households 20640 non-null float64
7 median_income 20640 non-null float64
8 median_house_value 20640 non-null float64
9 ocean_proximity 20640 non-null object
dtypes: float64(9), object(1)
memory usage: 1.6+ MB

# Summary statistics (count, mean, std, min, quartiles, max) per numeric column.
california_housing.describe()

longitude latitude housing_median_age total_rooms \

count 20640.000000 20640.000000 20640.000000 20640.000000
mean -119.569704 35.631861 28.639486 2635.763081
std 2.003532 2.135952 12.585558 2181.615252
min -124.350000 32.540000 1.000000 2.000000
25% -121.800000 33.930000 18.000000 1447.750000
50% -118.490000 34.260000 29.000000 2127.000000
75% -118.010000 37.710000 37.000000 3148.000000
max -114.310000 41.950000 52.000000 39320.000000

total_bedrooms population households median_income \

count 20433.000000 20640.000000 20640.000000 20640.000000
mean 537.870553 1425.476744 499.539680 3.870671
std 421.385070 1132.462122 382.329753 1.899822
min 1.000000 3.000000 1.000000 0.499900
25% 296.000000 787.000000 280.000000 2.563400
50% 435.000000 1166.000000 409.000000 3.534800
75% 647.000000 1725.000000 605.000000 4.743250
max 6445.000000 35682.000000 6082.000000 15.000100

median_house_value
count 20640.000000
mean 206855.816909
std 115395.615874
min 14999.000000
25% 119600.000000
50% 179700.000000
75% 264725.000000
max 500001.000000

# Element-wise missing-value mask: True wherever a cell is NaN.
# (Chain .sum() onto it to get a per-column count of missing values instead.)
california_housing.isna()

longitude latitude housing_median_age total_rooms

total_bedrooms \
0 False False False False
False
1 False False False False
False
2 False False False False
False
3 False False False False
False
4 False False False False
False
... ... ... ... ...
...
20635 False False False False
False
20636 False False False False
False
20637 False False False False
False
20638 False False False False
False
20639 False False False False
False

population households median_income median_house_value \

0 False False False False
1 False False False False
2 False False False False
3 False False False False
4 False False False False
... ... ... ... ...
20635 False False False False
20636 False False False False
20637 False False False False
20638 False False False False
20639 False False False False

ocean_proximity
0 False
1 False
2 False
3 False
4 False
... ...
20635 False
20636 False
20637 False
20638 False
20639 False

[20640 rows x 10 columns]

Yh-305d Power Supply Schematic: Read/Download
18% (17)
Yh-305d Power Supply Schematic: Read/Download
2 pages
Java - Co - Po - Mapping
No ratings yet
Java - Co - Po - Mapping
4 pages
CSS NC II Institutional Assessment
100% (1)
CSS NC II Institutional Assessment
3 pages
Asus F8v (A) L80v N80 N81 Schematic Diagrams
No ratings yet
Asus F8v (A) L80v N80 N81 Schematic Diagrams
94 pages
Unit 3 Notes Computer Fundamentals
No ratings yet
Unit 3 Notes Computer Fundamentals
18 pages
Nt35310draft Spec v0.02
No ratings yet
Nt35310draft Spec v0.02
385 pages
The Data Science Process
100% (1)
The Data Science Process
53 pages
Eda Project
No ratings yet
Eda Project
28 pages
House Price Prediction: # Importing Necessary Libraries
No ratings yet
House Price Prediction: # Importing Necessary Libraries
18 pages
Unit 1: Shobana T S Assistant Professor Dept. of ISE, BMSCE
No ratings yet
Unit 1: Shobana T S Assistant Professor Dept. of ISE, BMSCE
127 pages
Untitled6.Ipynb - Colab
No ratings yet
Untitled6.Ipynb - Colab
6 pages
Housing Prices Notebook
No ratings yet
Housing Prices Notebook
14 pages
Shivajees MCQ On Microprocessor (Instruction Set) - GATE
No ratings yet
Shivajees MCQ On Microprocessor (Instruction Set) - GATE
13 pages
Data Center: Technology Solutions
100% (1)
Data Center: Technology Solutions
28 pages
One Hot Encoding
No ratings yet
One Hot Encoding
12 pages
Billing System Using Python
100% (1)
Billing System Using Python
2 pages
House Price Prediction
No ratings yet
House Price Prediction
14 pages
ML Lab - BCSL606
No ratings yet
ML Lab - BCSL606
67 pages
Example Project California Data Anaylsis Jupyter Notebook
No ratings yet
Example Project California Data Anaylsis Jupyter Notebook
28 pages
Teach Pendant Scripting Interface Manual (V4.5.4)
No ratings yet
Teach Pendant Scripting Interface Manual (V4.5.4)
59 pages
Regression Analysis - Lasso and Ridge Regularization
No ratings yet
Regression Analysis - Lasso and Ridge Regularization
17 pages
Exp - 2-EDA - CaliforniaData Set - HeatMap - PairPlot-checkpoint - Jupyter Notebook
No ratings yet
Exp - 2-EDA - CaliforniaData Set - HeatMap - PairPlot-checkpoint - Jupyter Notebook
12 pages
Sumit Singh Resume
No ratings yet
Sumit Singh Resume
1 page
Printer Setting Tools Instructions - V3.2
No ratings yet
Printer Setting Tools Instructions - V3.2
3 pages
Linear Regression With Python - Part 1
No ratings yet
Linear Regression With Python - Part 1
167 pages
Cp4252 Machine Learning Lab Manual
No ratings yet
Cp4252 Machine Learning Lab Manual
27 pages
Asr04 HMM Intro
No ratings yet
Asr04 HMM Intro
38 pages
Bigdata - Ipynb - Colab
No ratings yet
Bigdata - Ipynb - Colab
28 pages
ML Lab34
No ratings yet
ML Lab34
29 pages
18Cs53: Database Management Systems: Introduction To Transaction Processing Concepts and Theory
No ratings yet
18Cs53: Database Management Systems: Introduction To Transaction Processing Concepts and Theory
37 pages
Real Estate Price Prediction Model
No ratings yet
Real Estate Price Prediction Model
33 pages
HW 3
No ratings yet
HW 3
20 pages
ML Observation
No ratings yet
ML Observation
29 pages
SY-5005005 HMI EngineersManual
No ratings yet
SY-5005005 HMI EngineersManual
136 pages
Machine Learning Laboratory
No ratings yet
Machine Learning Laboratory
23 pages
Linear Regression Analysis - Polynomial Regression
No ratings yet
Linear Regression Analysis - Polynomial Regression
25 pages
Faseeh Chap 2 Report
No ratings yet
Faseeh Chap 2 Report
30 pages
ML Merged
No ratings yet
ML Merged
28 pages
Multi-Tenant User Collaboration Patterns in Azure Active Directory
No ratings yet
Multi-Tenant User Collaboration Patterns in Azure Active Directory
25 pages
Document From Jahnavi
No ratings yet
Document From Jahnavi
20 pages
SOE Getting Started Guide
No ratings yet
SOE Getting Started Guide
22 pages
Machine Learning Lab
No ratings yet
Machine Learning Lab
20 pages
Two Marks Questions With Answers Embedded System
100% (1)
Two Marks Questions With Answers Embedded System
4 pages
MiniProject BI
No ratings yet
MiniProject BI
16 pages
Merged
No ratings yet
Merged
35 pages
Machinelearning
No ratings yet
Machinelearning
26 pages
02 End To End Machine Learning Project
No ratings yet
02 End To End Machine Learning Project
26 pages
Housing Main
No ratings yet
Housing Main
23 pages
DL 1
No ratings yet
DL 1
11 pages
P04 The Regression Pipeline - Preprocessing Ans
No ratings yet
P04 The Regression Pipeline - Preprocessing Ans
19 pages
Regression Algorithm
No ratings yet
Regression Algorithm
9 pages
Exercise3 Solution
No ratings yet
Exercise3 Solution
19 pages
DALab Part-B BCU&BU
No ratings yet
DALab Part-B BCU&BU
12 pages
Setup: Chapter 2 - End-To-End Machine Learning Project
No ratings yet
Setup: Chapter 2 - End-To-End Machine Learning Project
31 pages
Real Estate Valuation Data Set: Section Order
No ratings yet
Real Estate Valuation Data Set: Section Order
17 pages
House Price Prediction Models
No ratings yet
House Price Prediction Models
16 pages
Compte Rendu Data Visualisation
No ratings yet
Compte Rendu Data Visualisation
5 pages
Predicting Home Prices in Bangalore
No ratings yet
Predicting Home Prices in Bangalore
18 pages
Medium Com Omarelgabrys Blog Microservices With Spring Boot Authentication With JWT Part 3 Fafc9d7187e8
No ratings yet
Medium Com Omarelgabrys Blog Microservices With Spring Boot Authentication With JWT Part 3 Fafc9d7187e8
19 pages
DL - LR - 1.ipynb - Colab
No ratings yet
DL - LR - 1.ipynb - Colab
5 pages
Resume Vimal Patel
No ratings yet
Resume Vimal Patel
5 pages
Project 4 - House Price Prediction - Ipynb - Colab
No ratings yet
Project 4 - House Price Prediction - Ipynb - Colab
5 pages
Emllab
No ratings yet
Emllab
6 pages
Assignment 1
No ratings yet
Assignment 1
3 pages
California Housing Project
No ratings yet
California Housing Project
5 pages
4819 Tha Eng Squadnet Brochure 4pp - Mar 2017 v2 Web
No ratings yet
4819 Tha Eng Squadnet Brochure 4pp - Mar 2017 v2 Web
4 pages
Boston Housing Solutions
No ratings yet
Boston Housing Solutions
3 pages
Kaggle Machine Learning
No ratings yet
Kaggle Machine Learning
6 pages
Tarea - Prediccion de Casas en California
No ratings yet
Tarea - Prediccion de Casas en California
5 pages
Adobe Research - MDSRTeamFlyerV3
No ratings yet
Adobe Research - MDSRTeamFlyerV3
3 pages
Q 1
No ratings yet
Q 1
2 pages
Assignement 4
No ratings yet
Assignement 4
6 pages
G8 - CSS Microproject (SR NO-19,20,21)
No ratings yet
G8 - CSS Microproject (SR NO-19,20,21)
18 pages
DSA7s Catalog
No ratings yet
DSA7s Catalog
2 pages
Oop 9
No ratings yet
Oop 9
6 pages
Python Assignment 1.ipynb - Colaboratory
No ratings yet
Python Assignment 1.ipynb - Colaboratory
3 pages
Eccouncil Ecihv2 8 1 1 Cloud Computing Concepts
No ratings yet
Eccouncil Ecihv2 8 1 1 Cloud Computing Concepts
2 pages
Python Skill Test
No ratings yet
Python Skill Test
6 pages
Project Linear Regression
No ratings yet
Project Linear Regression
7 pages
BTVN1 - Colaboratory
No ratings yet
BTVN1 - Colaboratory
4 pages
Ahd-Dpu 9 Dat en V9 20221025
No ratings yet
Ahd-Dpu 9 Dat en V9 20221025
2 pages
Prac - 8 (1) - Jupyter Notebook
No ratings yet
Prac - 8 (1) - Jupyter Notebook
6 pages
Online Banking
No ratings yet
Online Banking
2 pages
Introduction To Machine Learning (ML) With Sklearn
No ratings yet
Introduction To Machine Learning (ML) With Sklearn
10 pages
Import As Import As From Import: "Mean Squared Errors: "
No ratings yet
Import As Import As From Import: "Mean Squared Errors: "
1 page
House Price Prediction
No ratings yet
House Price Prediction
1 page
Datagate New User Setup PDF
No ratings yet
Datagate New User Setup PDF
5 pages
California Housing Price Prediction .
No ratings yet
California Housing Price Prediction .
1 page
Project PDF
No ratings yet
Project PDF
13 pages

Normalization Dataset

Uploaded by

Normalization Dataset

Uploaded by

from sklearn import preprocessing

[[0.19583773 0.00979189 0.01390448 0.98036366 0.01566702]]

# create the DataFrame

# print the dataset description

longitude latitude housing_median_age total_rooms

population households median_income median_house_value

HouseAge array: [41. 21. 52. ... 17. 18. 16.]

Normalized HouseAge array: [[0.00912272 0.00467261 0.01157028 ...

ValueError: could not convert string to float: 'NEAR BAY'

from sklearn import preprocessing

longitude latitude housing_median_age total_rooms

population households median_income median_house_value

population households median_income median_house_value

[20640 rows x 9 columns]

longitude latitude housing_median_age total_rooms \

total_bedrooms population households median_income \

longitude latitude housing_median_age total_rooms

population households median_income median_house_value \

[20640 rows x 10 columns]

You might also like