normalize_utils
1import pandas as pd 2import numpy as np 3import sys 4import matplotlib.pyplot as plt 5import os 6 7"""File containing code used as utility to normalize files, vector, etc""" 8 9def getFileName(argument): 10 """Given a full path name, returns only the name of the file""" 11 index = argument.rfind('/') 12 return argument[index:] 13 14def normalizeFile(filename, des_path, source_path): 15 """Normalize an entire file""" 16 dataframe = pd.read_csv(source_path + filename, index_col=0) 17 dataframe.plot(title=f"{filename}") 18 19 data_array = [] 20 21 max_value = 0 22 min_value = 999999999 23 24 for index,row in dataframe.iterrows(): 25 data_array.append(row[0]) 26 if row[0] > max_value: 27 max_value = row[0] 28 if row[0] < min_value: 29 min_value = row[0] 30 31 normalized_data_array = [] 32 33 for value in data_array: 34 normalized_value = (value - min_value) / (max_value - min_value) 35 normalized_data_array.append(normalized_value) 36 37 normalized_data_dict = {"Precio": normalized_data_array} 38 39 normalized_dataframe = pd.DataFrame(normalized_data_dict) 40 normalized_dataframe.plot() 41 42 normalized_dataframe.to_csv(des_path + filename) 43 44def normalizeVector(vector): 45 """Normalize a given vector with max min normalization""" 46 max_number = 0 47 min_number = 99999999 48 for number in vector: 49 number = float(number) 50 if number > max_number: 51 max_number = number 52 if number < min_number: 53 min_number = number 54 55 normalized_vector = [] 56 57 for number in vector: 58 number = float(number) 59 normalized_number = (number - min_number) / (max_number - min_number) 60 normalized_vector.append(round(normalized_number, 3)) 61 62 return normalized_vector 63 64# file_list = os.listdir(sys.argv[1]) 65# for file in file_list: 66# normalizeFile(file, sys.argv[2], sys.argv[1]) 67# plt.show()
def
getFileName(argument)
10def getFileName(argument): 11 """Given a full path name, returns only the name of the file""" 12 index = argument.rfind('/') 13 return argument[index:]
Given a full path name, returns only the name of the file
def
normalizeFile(filename, des_path, source_path)
15def normalizeFile(filename, des_path, source_path): 16 """Normalize an entire file""" 17 dataframe = pd.read_csv(source_path + filename, index_col=0) 18 dataframe.plot(title=f"{filename}") 19 20 data_array = [] 21 22 max_value = 0 23 min_value = 999999999 24 25 for index,row in dataframe.iterrows(): 26 data_array.append(row[0]) 27 if row[0] > max_value: 28 max_value = row[0] 29 if row[0] < min_value: 30 min_value = row[0] 31 32 normalized_data_array = [] 33 34 for value in data_array: 35 normalized_value = (value - min_value) / (max_value - min_value) 36 normalized_data_array.append(normalized_value) 37 38 normalized_data_dict = {"Precio": normalized_data_array} 39 40 normalized_dataframe = pd.DataFrame(normalized_data_dict) 41 normalized_dataframe.plot() 42 43 normalized_dataframe.to_csv(des_path + filename)
Normalize an entire file
def
normalizeVector(vector)
45def normalizeVector(vector): 46 """Normalize a given vector with max min normalization""" 47 max_number = 0 48 min_number = 99999999 49 for number in vector: 50 number = float(number) 51 if number > max_number: 52 max_number = number 53 if number < min_number: 54 min_number = number 55 56 normalized_vector = [] 57 58 for number in vector: 59 number = float(number) 60 normalized_number = (number - min_number) / (max_number - min_number) 61 normalized_vector.append(round(normalized_number, 3)) 62 63 return normalized_vector
Normalize a given vector with max min normalization