feat: tests now test different algorithms

2026-07-04 19:03:01 +02:00 · 2023-06-11 20:08:50 +02:00 · 2023-06-11 20:08:50 +02:00 · cc803f1d66
commit cc803f1d66
parent 5816866342
1 changed files with 12 additions and 5 deletions
--- a/final/code/main.py
+++ b/final/code/main.py
@@ -222,8 +222,11 @@ def create_model(pivot_table, rows_number, metric="cosine", algorithm="brute", n
    """
    neighbors_number = calculate_neighbors(pivot_table.shape[0], neighbors)
    pivot_table_matrix = csr_matrix(pivot_table.values)
-    model = NearestNeighbors(n_neighbors=neighbors_number,
-                             metric=metric, algorithm=algorithm)
+    if algorithm == "brute":
+        model = NearestNeighbors(n_neighbors=neighbors_number,
+                                metric=metric, algorithm=algorithm)
+    else:
+        model = NearestNeighbors(n_neighbors=neighbors_number, algorithm=algorithm)                         
    try:
        model.fit(pivot_table_matrix)
    except:
@@ -290,7 +293,7 @@ def handle_arguments():

 def auto_mode(data_limit = -1, seed = 42, anime="RANDOM"):
    print("Started auto mode")
-    algorithm_spread = ['ball_tree', 'kd_tree', 'brute']
+    algorithm_spread = ['auto', 'ball_tree', 'kd_tree', 'brute']
    neighbor_spread = [5, "sqrt", "half", "log", "n-1"]
    # No reason to access and waste computational power every time we run the simulation
    starting_rating_data, starting_anime_contact_data, starting_rows_number = get_data(limit_data=data_limit)
@@ -299,8 +302,12 @@ def auto_mode(data_limit = -1, seed = 42, anime="RANDOM"):
    if os.path.exists('test_results'):
        shutil.rmtree('test_results')
    for algorithm in algorithm_spread:
-        print("testing for algorithm: ", algorithm)
-        possibleMetrics = sorted(VALID_METRICS_SPARSE[algorithm])
+        possibleMetrics = []
+        if algorithm != 'auto':
+            possibleMetrics = sorted(VALID_METRICS_SPARSE[algorithm])
+        print("testing for algorithm: ", algorithm, possibleMetrics)
+        if possibleMetrics == []:
+            possibleMetrics = [""]
        for metric in possibleMetrics:
            print("testing for algorithm, metric: ", algorithm, metric)
            for neighbor_amount in neighbor_spread: