# To normalize or not to normalize
## How to normalize
# 10 random values in [0, 2), stored as a (10, 1) column array:
import random
import numpy as np
import matplotlib.pyplot as plt
import math
# np.random.rand samples uniformly from [0, 1); doubling stretches the
# range to [0, 2). The result is a single column of 10 values.
data = 2 * np.random.rand(10, 1)
print(data)
[[0.65619743]
[0.14339821]
[1.26453043]
[0.51684767]
[1.5084185 ]
[0.60104288]
[1.8014257 ]
[0.67697867]
[0.01956461]
[1.2869027 ]]
# Min-max normalization, column by column: shift so the smallest value
# becomes 0, then divide by the column's range so the largest becomes 1.
data_min = data.min(axis=0)
data_range = data.max(axis=0) - data_min
normalize_data = (data - data_min) / data_range
print(normalize_data)
[[0.35728533]
[0.06949678]
[0.69868849]
[0.27908071]
[0.83556114]
[0.32633199]
[1. ]
[0.36894799]
[0. ]
[0.71124405]]
# Plot every sample twice: the raw value at x=1 (red) and its min-max
# normalized value at x=2 (blue), to show how each point moved.
# The x positions are sized from the arrays themselves rather than a
# hard-coded 10, so the plot keeps working if the sample count changes.
plt.scatter(np.full(data.size, 1.0), data, color='r')
plt.scatter(np.full(normalize_data.size, 2.0), normalize_data, color='b')
# Legend labels are assigned in the order the scatter calls were made.
plt.legend(['data', 'normalize_data'])
plt.show()
## Meaning of normalization
