Is it over?

This commit is contained in:
2023-03-30 19:32:42 +02:00
parent 86107d5bb6
commit 4c36817a85
3 changed files with 20 additions and 12 deletions

View File

@@ -108,7 +108,7 @@ gammas['Critic_Score_Norm'] = scout.scaling_zscore(gammas, 'Critic_Score')
print(gammas['Critic_Score_Norm'].head(10))
# Saving all into a file
gammas.to_csv("output.csv", index=False)
gammas.to_csv("datasets/videogames/games_cleanish.csv", index=False)
# Need similarity and dissimilarity, scipy time
# Selecting 5 random rows
@@ -116,4 +116,4 @@ chosen_idx = np.random.choice(len(gammas), replace = False, size = 5)
sample_rows = gammas.iloc[chosen_idx]
print(sample_rows.head())
# scout.dissimilarity(sample_rows.select_dtypes(include = np.number))
scout.dissimilarity(sample_rows)

View File

@@ -49,11 +49,15 @@ def scaling_zscore(dataframe, col):
return stats.zscore(dataframe[col],axis = 0, nan_policy= "omit")
def dissimilarity(row_arr):
    """Print a pairwise Euclidean dissimilarity table for the rows of a frame.

    Only the numeric columns take part in the distance, and the 'Rank'
    column is left out when it is present.  The table is written to stdout;
    nothing is returned and ``row_arr`` itself is not modified.

    Args:
        row_arr: pandas DataFrame whose rows are compared with each other.
    """
    # Euclidean distance needs numbers, so non-numeric columns are dropped.
    numeric = row_arr.select_dtypes(include=np.number)
    # errors='ignore' lets frames without a 'Rank' column through instead of
    # raising KeyError.
    # NOTE(review): 'Rank' is presumably an ordinal position rather than a
    # feature, which would be why it is excluded - confirm.
    numeric = numeric.drop(columns='Rank', errors='ignore')

    # Convert once up front rather than doing two .iloc lookups per cell.
    points = numeric.to_numpy()

    # Header is sized to the actual number of rows instead of a fixed five.
    header_cells = "".join(
        f" Entry {k} |" for k in range(1, len(points) + 1)
    )
    print(" |" + header_cells)

    for row_no, left in enumerate(points, start=1):
        print("Entry ", row_no, " | ", end="")
        for right in points:
            euc_dist = distance.euclidean(left, right)
            print(" {:#.6g} |".format(euc_dist), end="")
        # Terminates the row and leaves a blank line before the next one.
        print("\n")
def scaling_range(datashitter, col):