Refactoring killed muh bebe

2023-03-28 14:07:50 +02:00
parent a7abb05567
commit fea7af62f6
2 changed files with 22 additions and 42 deletions
--- a/py_scripts/gunner.py
+++ b/py_scripts/gunner.py
@@ -3,34 +3,7 @@

 import pandas as pd
 import numpy as np
-import mining_hq

-# Sharing the dataset variables
-# Games' data
-
-# Loading Datasets
-games_merged = mining_hq.games_merged_dat
-
-victim1 = pd.read_excel("datasets/crime/clean_crime_canada_dataset.xlsx")
-victim2 = pd.read_csv("datasets/crime/report.csv")
-
-# Printing information regarding datasets
-print("Game Datasets' Info:\n")
-games_merged.info()
-
-print("Crime Datasets' Info:\n")
-victim2.info()
-victim1.info()
-
-
-# Regarding the Games.xls dataset:
-# Coercing the non-numeric values will result in NaN
-# thus allowing easier removal through `.notnull()`
-
-
-# Regarding the vgsales-12-4-2019 dataset
-# Considering we will be using a US (probs CA too) crime datasets
-# It wouldn't be that useful to have other columns regarding other regions
 def drop_kick(col_list, dataframe):
     """Return a new DataFrame without the columns named in ``col_list``.

     ``dataframe`` itself is not modified: ``DataFrame.drop`` is called with
     its default ``inplace=False`` and therefore returns a new object.

     Args:
         col_list: A single column label or a list of column labels to drop.
         dataframe: The pandas DataFrame to drop the columns from.

     Returns:
         A DataFrame holding every column of ``dataframe`` except those
         listed in ``col_list``.

     Raises:
         KeyError: If a label in ``col_list`` is not a column of
             ``dataframe`` (pandas' default ``errors="raise"``).
     """
     # ``columns=`` already selects the column axis, so the former
     # ``axis=1`` argument was redundant and has been removed.
     return dataframe.drop(columns=col_list)

@@ -38,8 +11,8 @@ def drop_kick(col_list, dataframe):
 # Getting the range of years which both datasets share
 def year_interval(victim1, victim2, col1, col2):
     # Builds a tuple from two values: the larger of the two columns'
     # minimums and the smaller of the two columns' maximums, i.e. the
     # bounds of the value range covered by both victim1[col1] and
     # victim2[col2].
     # No overlap check is made: if the two ranges do not overlap, the
     # "max of minimums" value is greater than the "min of maximums" value.
     return (
-        min(victim2[col2].max(), victim1[col1].max()),
         max(victim2[col2].min(), victim1[col1].min()),
+        min(victim2[col2].max(), victim1[col1].max()),
     )