experiments_ssl_data_term.py

import sys
sys.path.insert(0, '..')
import os
os.environ['KMP_DUPLICATE_LIB_OK']='True'
import warnings
warnings.filterwarnings("ignore")

import numpy as np
import networkx as nx
import torch
from problem.spectral_subgraph_localization import edgelist_to_adjmatrix
from optimization.prox.prox import ProxSphere, ProxL21ForSymmetricCenteredMatrix
from problem.spectral_subgraph_localization import SubgraphIsomorphismSolver, VotingSubgraphIsomorpishmSolver, VotingSubgraphIsomorpishmSolver, Solution_algo, lap_from_adj
import pickle
import sys
from copy import deepcopy
from pathlib import Path
import math

from sklearn.metrics import balanced_accuracy_score, recall_score, precision_score, f1_score, precision_recall_fscore_support

def balanced_acc(y_true, y_pred):
    return balanced_accuracy_score(y_true, y_pred)

def recall(y_true, y_pred):
    return recall_score(y_true, y_pred, pos_label=0)

def precision(y_true, y_pred):
    return precision_score(y_true, y_pred, pos_label=0)

def f1(y_true, y_pred):
    return f1_score(y_true, y_pred, pos_label=0)

def prec_recall_fscore(y_true, y_pred):
    prec, recall, fscore, _ = precision_recall_fscore_support(y_true, y_pred)
    return prec, recall, fscore

def graph_edit_distance(y_true, y_pred):
    return nx.graph_edit_distance(y_true, y_pred, timeout=30)

def use_graph_edit_distance_generator(generator_object, description=None):
    num_iterations = 0
    if description is None:
        description = ""

    distance = None
    for distance in generator_object:
        num_iterations += 1
        print(distance, description)
        if num_iterations == 3:
            break
    
    return distance

def solution_graph(G, solution_vector):
    _G = G.copy()
    solution_indices = [i for i, res in enumerate(solution_vector) if res == 0]
    S = _G.subgraph(solution_indices)
    return S

def spectrum_from_graph(G):
    A = torch.tensor(nx.to_numpy_array(G))
    D = torch.diag(A.sum(dim=1))
    L = D - A
    return torch.linalg.eigvalsh(L)

# Calculates the sum of the absolute entry-wise difference between two torch tensors.
# If |X| < |Y|, the last eigenvalue of G2 is copied, untill the length of both lists are of same length.
def spectrum_abs_diff(X, Y):
    if len(X) > len(Y):
        return 999999

    eigenvalues_to_compare = min(len(X), len(Y)) # If 
    Y = Y[:eigenvalues_to_compare]
    X = X[:eigenvalues_to_compare]
    return torch.sum(torch.abs(torch.sub(X, Y))).item()

def spectrum_square_diff(X, Y):
    if len(X) > len(Y):
        n = len(X)-len(Y)

        listofzeros = [0] * n
        listofzeros = torch.tensor(listofzeros)
        Y = torch.cat((listofzeros, Y))

        #print(len(X), len(Y))

    eigenvalues_to_compare = min(len(X), len(Y)) # If 
    Y = Y[:eigenvalues_to_compare]
    X = X[:eigenvalues_to_compare]

    return torch.sum(torch.square(torch.sub(X, Y))).item()

def greedy_remove_node_by_spectrum(G, solution_vector, ref_spectrum):
    solution_indices = [i for i, res in enumerate(solution_vector) if res == 0]
    return greedy_remove_node_by_spectrum_aux(G, solution_indices, ref_spectrum)

def greedy_remove_node_by_spectrum_aux(G, solution_indices, ref_spectrum):
    if len(solution_indices) == len(ref_spectrum):
        return solution_indices

    smallest_spectrum_diff = math.inf
    best_idx_to_remove = None
    for idx in solution_indices:
        new_solution_indices = solution_indices.copy()
        new_solution_indices.remove(idx)
        new_solution = G.subgraph(new_solution_indices)
        new_spectrum = spectrum_from_graph(new_solution)
        new_spectrum_diff = spectrum_square_diff(ref_spectrum, new_spectrum)
        if new_spectrum_diff < smallest_spectrum_diff:
            smallest_spectrum_diff = new_spectrum_diff
            best_idx_to_remove = idx

    solution_indices.remove(best_idx_to_remove)
    return greedy_remove_node_by_spectrum_aux(G, solution_indices, ref_spectrum)

def greedy_add_node_by_spectrum_v2(G, solution_vector, ref_spectrum):
    solution_indices = [i for i, res in enumerate(solution_vector) if res == 0]
    remaining_indices = [i for i, res in enumerate(solution_vector) if res == 1]
    return greedy_add_node_by_spectrum_v2_aux(G, solution_indices, remaining_indices, ref_spectrum)

def greedy_add_node_by_spectrum_v2_aux(G, solution_indices, remaining_indices, ref_spectrum):
    if len(solution_indices) == len(ref_spectrum):
        return solution_indices

    smallest_spectrum_diff = math.inf
    best_idx_to_add = None
    for idx in remaining_indices:
        new_solution_indices = solution_indices.copy()
        new_solution_indices.append(idx)
        new_solution = G.subgraph(new_solution_indices)
        new_spectrum = spectrum_from_graph(new_solution)
        new_spectrum_diff = spectrum_square_diff(ref_spectrum, new_spectrum)
        if new_spectrum_diff < smallest_spectrum_diff:
            smallest_spectrum_diff = new_spectrum_diff
            best_idx_to_add = idx

    solution_indices.append(best_idx_to_add)
    remaining_indices.remove(best_idx_to_add)
    return greedy_add_node_by_spectrum_v2_aux(G, solution_indices, remaining_indices, ref_spectrum)

# TODO clean up kode, så vi ikke har aux metoder, men at de pågældende metoder bare bliver kaldt herfra
# TODO overvej at restricte greedy add nodes, så den kun overvejer nodes, der faktisk er blevet stemt på
# TODO ændr hvordan vi sammenligner spektrum når |S| < |Q|, ifht hvad end Petros har skrevet
def enforce_cardinality_constraint_by_spectrum(G, solution_vector, ref_spectrum):
    solution_indices = [i for i, res in enumerate(solution_vector) if res == 0]

    nodes_solution = len(solution_indices)
    nodes_query = len(ref_spectrum)

    final_solution_indices = None
    if nodes_solution == nodes_query:
        final_solution_indices = solution_indices
    elif nodes_solution < nodes_query:
        remaining_indices = [i for i, res in enumerate(solution_vector) if res == 1]
        final_solution_indices = greedy_add_node_by_spectrum_v2_aux(G, solution_indices, remaining_indices, ref_spectrum)
    else:
        final_solution_indices = greedy_remove_node_by_spectrum_aux(G, solution_indices, ref_spectrum)

    final_solution_vector = [1] * len(solution_vector)
    for idx in final_solution_indices:
        final_solution_vector[idx] = 0
    return final_solution_vector

def test_greedy_remove(G, A, part_nodes, ref_spectrum):
    n, _ = A.shape

    part_nodes_altered = [node for node in part_nodes]

    nodes_to_add = [42, 69, 80, 100]
    # print("Nodes added to query:", nodes_to_add)
    part_nodes_altered.extend(nodes_to_add)
    part_nodes_altered = np.array(part_nodes_altered)

    n2 = len(part_nodes_altered)

    A_sub = A[0:n2, 0:n2]
    A_sub = A[:,part_nodes_altered]
    A_sub = A_sub[part_nodes_altered,:]

    Q_altered_solution_vector = [0 if idx in part_nodes_altered else 1 for idx in range(n)]

    enforce_cardinality_constraint_by_spectrum(G, Q_altered_solution_vector, ref_spectrum)

def test_greedy_add(G, A, part_nodes, ref_spectrum):
    n, _ = A.shape

    part_nodes_altered = [node for node in part_nodes[:-4]]

    n2 = len(part_nodes_altered)

    A_sub = A[0:n2, 0:n2]
    A_sub = A[:,part_nodes_altered]
    A_sub = A_sub[part_nodes_altered,:]
    Q_altered_solution_vector = [0 if idx in part_nodes_altered else 1 for idx in range(n)]

    enforce_cardinality_constraint_by_spectrum(G, Q_altered_solution_vector, ref_spectrum)


def accur(y_true, y_pred):
    counter = 0
    correct = 0
    for i in range(len(y_true)):
        if y_true[i] == 0:
            counter += 1
            if y_true[i] == y_pred[i]:
                correct += 1
    return 1.0*correct/counter

def prune_graph(G, part_nodes):
    lowest_degree = np.inf
    sub_G = nx.subgraph(G, part_nodes)
    for degree_view in nx.degree(sub_G):
        lowest_degree = min(lowest_degree,degree_view[1])
    # print("removing edges:", list(n for n in G.nodes if nx.degree(G,n)<lowest_degree))
    G.remove_nodes_from(list(n for n in G.nodes if nx.degree(G,n)<lowest_degree))

def run_opt(edgefile,part_nodes, mu=1, standard_voting_thresholds=[], neighborhood_thresholds=[], edge_removal=0.3):
    # TODO fix test?
    # test_spectrum_abs_diff()

    # print(f'Reading from {edgefile}')
    A1=edgelist_to_adjmatrix(edgefile)
    G=nx.from_numpy_array(A1)
    A = torch.tensor(nx.to_numpy_array(G))

    n1 = len(part_nodes)
    n = len(G.nodes)
    # print(f"|Vq| = {n1}")
    # print(f"|V| = {n}")
    # print(f"|Vq|/|V| = {n1/n}")
    
    condac = nx.conductance(G, part_nodes)
    # print(f"Conductance equals to {condac}")

    # prune_graph(G, part_nodes) # TODO gør noget med G, lav A ud fra G? Vær opmærksom på om originale indices stadig passer...

    color_map=[]
    for node in G:
        if node in part_nodes:
            color_map.append('blue')
        else: 
            color_map.append('green') 
    
    D = torch.diag(A.sum(dim=1))
    L = D - A

    A_sub = A[0:n1, 0:n1]
    A_sub = A[:,part_nodes]
    A_sub=A_sub[part_nodes,:]

    Q = nx.from_numpy_array(A_sub.clone().detach().numpy())

    D_sub = torch.diag(A_sub.sum(dim=1))
    L_sub = D_sub - A_sub
    ref_spectrum = torch.linalg.eigvalsh(L_sub)

    v_val = float(np.max(ref_spectrum.numpy()))
    c = np.sqrt(n-len(part_nodes)) * v_val
    v_gt = v_val * np.ones(n)

    for i in range(n):
        if(i in part_nodes):
            v_gt[i] = 0.0

    problem_params = {'mu_spectral': 1,
                      'mu_l21': 0,
                      'mu_MS': 0,# / (c ** 2), #The μ regularizer eq. 11 TODO NO REGULARIZER!
                      'mu_split': 0,
                      'mu_trace': 0.0,
                      'trace_val': 0,
                      'weighted_flag': False
                      }

    solver_params = {'lr': 0.02, #learning rate
                 'a_tol': -1, # not used because its negative
                 'r_tol': -1e-5/c**2, # not used because its negative
                 'v_prox': ProxSphere(radius=c), #projection on a sphere
                 #'v_prox': ProxId(),
                 'E_prox': ProxL21ForSymmetricCenteredMatrix(solver="cvx"), #not used
                 # 'E_prox': ProxL1ForSymmCentdMatrixAndInequality(solver="cvx", L=L,
                 #                                                 trace_upper_bound=
                 #                                                 1.1 * torch.trace(L)),}
                 'train_v': True, #TODO....
                 'train_E': False, #TODO...
                 'threshold_algo': '1dkmeans', # 'spectral', '1dkmeans', 'smallest'
                 }

    # test_greedy_remove(G, A, part_nodes, ref_spectrum)
    # test_greedy_add(G, A, part_nodes, ref_spectrum)

    subgraph_isomorphism_solver = SubgraphIsomorphismSolver(A, ref_spectrum, problem_params, solver_params)
    v, E = \
        subgraph_isomorphism_solver.solve(max_outer_iters=3,max_inner_iters=500, show_iter=10000, verbose=False)

    Hamiltonian = L + E + torch.diag(v)
    og_spectrum = torch.linalg.eigvalsh(Hamiltonian)

    v_binary, E_binary = subgraph_isomorphism_solver.threshold(v_np=v.detach().numpy())
    
    gt_inidicator = v_gt
    gt_inidicator[gt_inidicator>0]=1 

    idx_smallest=np.argsort(v.detach().numpy())[:n1]
    v_smallest=np.ones((n,1))
    for i in range(n):
        if i in idx_smallest:
            v_smallest[i]=0

    original_accuracy = accur(v_gt, v_binary.clone().detach().numpy())
    original_balanced = balanced_acc(v_gt, v_binary.clone().detach().numpy())
    og_precision, og_recall, og_fscore = prec_recall_fscore(v_gt, v_binary.clone().detach().numpy())

    S = solution_graph(G, v_binary)


    og_spectrum_diff = spectrum_square_diff(ref_spectrum, og_spectrum)

    nodes_in_solution = count_nodes(v_binary)
    # print("Nodes in solution:", nodes_in_solution)

    experiments_to_make = 0

    random_solver = VotingSubgraphIsomorpishmSolver(A, ref_spectrum, problem_params, solver_params, v_gt, A_sub, experiments_to_make=experiments_to_make, edge_removal=edge_removal) # Faked original balanced accuracy, can probably delete anyway
    # v_randomized, _ = random_solver.solve(max_outer_iters=3,max_inner_iters=500, show_iter=10000, verbose=False)
    votes = random_solver.solve(max_outer_iters=3,max_inner_iters=500, show_iter=10000, verbose=False)

    standard_voting_results = []
    standard_voting_results_with_cardinality_constraint = []

    neighborhood_results = []
    neighborhood_results_with_cardinality_constraint = []

    og_results = {
                "acc": original_accuracy,
                "balanced_acc": original_balanced,
                "precision": og_precision[0],
                "recall": og_recall[0],
                "f1": og_fscore[0],
                "graph_edit_distance": og_ged,
                "spectrum": og_spectrum.tolist(),
                "spectrum_diff": og_spectrum_diff
            }

    # Returning original accuracy
    return standard_voting_results, neighborhood_results, condac, og_results, ref_spectrum.tolist(), standard_voting_results_with_cardinality_constraint, neighborhood_results_with_cardinality_constraint, votes, v_gt

def count_nodes(v_binary):
    return len(v_binary) - np.count_nonzero(v_binary)

def find_best_mu(edgefile,part_nodes):
    # print(f'Reading from {edgefile}')
    A1=edgelist_to_adjmatrix(edgefile)
    G=nx.from_numpy_array(A1)
    A = torch.tensor(nx.to_numpy_array(G))

    n1 = len(part_nodes)
    n = len(G.nodes)
    # print(f"|Vq| = {n1}")
    # print(f"|V| = {n}")
    # print(f"|Vq|/|V| = {n1/n}")
    
    condac = nx.conductance(G, part_nodes)
    # print(f"Conductance equals to {condac}")
    # print(f'query nodes {part_nodes}')
    color_map=[]
    for node in G:
        if node in part_nodes:
            color_map.append('blue')
        else: 
            color_map.append('green') 
    
    D = torch.diag(A.sum(dim=1))
    L = D - A

    A_sub = A[0:n1, 0:n1]
    A_sub = A[:,part_nodes]
    A_sub=A_sub[part_nodes,:]
    #print(A_sub)

    D_sub = torch.diag(A_sub.sum(dim=1))
    L_sub = D_sub - A_sub
    ref_spectrum = torch.linalg.eigvalsh(L_sub)

    v_val = float(np.max(ref_spectrum.numpy()))
    c = np.sqrt(n-len(part_nodes)) * v_val
    v_gt = v_val * np.ones(n)

    for i in range(n):
        if(i in part_nodes):
            v_gt[i] = 0.0

    problem_params = {'mu_spectral': 1,
                      'mu_l21': 0,
                      'mu_MS': 0,
                      'mu_split': 0,
                      'mu_trace': 0.0,
                      'trace_val': 0,
                      'weighted_flag': False
                      }

    solver_params = {'lr': 0.02, #learning rate
                 'a_tol': -1, # not used because its negative
                 'r_tol': -1e-5/c**2, # not used because its negative
                 'v_prox': ProxSphere(radius=c), #projection on a sphere
                 #'v_prox': ProxId(),
                 'E_prox': ProxL21ForSymmetricCenteredMatrix(solver="cvx"), #not used
                 # 'E_prox': ProxL1ForSymmCentdMatrixAndInequality(solver="cvx", L=L,
                 #                                                 trace_upper_bound=
                 #                                                 1.1 * torch.trace(L)),}
                 'train_v': True, #TODO....
                 'train_E': False, #TODO...
                 'threshold_algo': '1dkmeans', # 'spectral', '1dkmeans', 'smallest'
                 }


    subgraph_isomorphism_solver = SubgraphIsomorphismSolver(A, ref_spectrum, problem_params, solver_params)
    pp = [i/10.0 for i in range(11)]
    
    best_mu = 0
    best_ba = 0
    for  mu_MS in pp:
        print(f"iter = {iter}, mu_MS = {mu_MS}")
        problem_params = {'mu_spectral': 1,
                          'mu_l21': 0,
                          'mu_MS': mu_MS,# / (c ** 2), #The μ regularizer eq. 11
                          'mu_split': 0,
                          'mu_trace': 0.0,
                          'trace_val': 0,
                          'weighted_flag': False
                          }
        subgraph_isomorphism_solver.set_problem_params(problem_params)
        v, E = \
            subgraph_isomorphism_solver.solve(max_outer_iters=3,max_inner_iters=50, show_iter=10000, verbose=False)
        v_binary, E_binary = subgraph_isomorphism_solver.threshold(v_np=v.detach().numpy())
        for i in range(len(v_gt)):
            if v_gt[i] > 0: v_gt[i] = 1
            else: v_gt[i] = 0
        ba_current = balanced_acc(v_gt, v_binary.clone().detach())
        
        
        if ba_current>best_ba:
            best_ba = ba_current
            best_mu = mu_MS
            counter = 0
        else:
            counter += 1
        # print("Searching for the best balance accuracy...")
        # print(f"Current Balanced Accuracy for {mu_MS} is {ba_current}")
        # print(f"Best Balanced Accuracy is for {best_mu}, equal to {best_ba}")
        if((counter>10) or (best_ba==1.0)): break
    return best_mu

if __name__ == '__main__':

    #graph_names = ['ant', 'football', 'highschool', 'malaria', 'powerlaw_200_50_50', 'renyi_200_50', 'barabasi_200_50']
    dataset = sys.argv[1]
    percentage_lower_bound = int(sys.argv[2])
    percentage_upper_bound = int(sys.argv[3])
    per = float(sys.argv[4])
    edge_removal = float(sys.argv[5])
    folder_number = int(sys.argv[6])
    graph_names = [dataset]


    standard_voting_thresholds = [0.1, 0.2, 0.3, 0.4, 0.5, 0.6]
    neighborhood_thresholds = [0.1, 0.2, 0.3, 0.4, 0.5, 0.6]

    initial_dict_standard = {threshold: [] for threshold in standard_voting_thresholds}
    initial_dict_neighborhood = {threshold: [] for threshold in neighborhood_thresholds}

    graphs = []
    use_global_mu = True
    for graph_name in graph_names:
        
        res_dict={}
        res_dict[graph_name] = {}
        best_mu = {}
        best_m_par = 0
        counter_m_par = 0
        folder_amount = folder_number
        for folder_no in range(folder_amount , folder_amount + 1):
            if use_global_mu and folder_no==0: continue
            # perc = [0.1, 0.2, 0.3]
            clcr = [i/10.0 for i in range(percentage_lower_bound, percentage_upper_bound)]
            if folder_no == 0: 
                best_mu[per] = {}
            res_dict[graph_name][int(per*100)] = {}
            for lr in clcr:   
                
                # Create dictionaries for standard voting
                standard_voting_balanced_accuracies = deepcopy(initial_dict_standard)
                standard_voting_accuracies = deepcopy(initial_dict_standard)
                standard_voting_recalls = deepcopy(initial_dict_standard)
                standard_voting_precisions = deepcopy(initial_dict_standard)
                standard_voting_f1s = deepcopy(initial_dict_standard)
                standard_voting_ged = deepcopy(initial_dict_standard)
                standard_voting_spectrum = deepcopy(initial_dict_standard)
                standard_voting_spectrum_diff = deepcopy(initial_dict_standard)

                # Create dictionaries for standard voting
                cc_standard_voting_balanced_accuracies = deepcopy(initial_dict_standard)
                cc_standard_voting_accuracies = deepcopy(initial_dict_standard)
                cc_standard_voting_recalls = deepcopy(initial_dict_standard)
                cc_standard_voting_precisions = deepcopy(initial_dict_standard)
                cc_standard_voting_f1s = deepcopy(initial_dict_standard)
                cc_standard_voting_ged = deepcopy(initial_dict_standard)
                cc_standard_voting_spectrum = deepcopy(initial_dict_standard)
                cc_standard_voting_spectrum_diff = deepcopy(initial_dict_standard)

                # Create dictionaries for neighborhood
                neighborhood_balanced_accuracies = deepcopy(initial_dict_neighborhood)
                neighborhood_accuracies = deepcopy(initial_dict_neighborhood)
                neighborhood_recalls = deepcopy(initial_dict_neighborhood)   
                neighborhood_precisions = deepcopy(initial_dict_neighborhood)
                neighborhood_f1s = deepcopy(initial_dict_neighborhood)
                neighborhood_ged = deepcopy(initial_dict_neighborhood)
                neighborhood_spectrum = deepcopy(initial_dict_neighborhood)
                neighborhood_spectrum_diff = deepcopy(initial_dict_neighborhood)

                # Create dictionaries for neighborhood
                cc_neighborhood_balanced_accuracies = deepcopy(initial_dict_neighborhood)
                cc_neighborhood_accuracies = deepcopy(initial_dict_neighborhood)
                cc_neighborhood_recalls = deepcopy(initial_dict_neighborhood)   
                cc_neighborhood_precisions = deepcopy(initial_dict_neighborhood)
                cc_neighborhood_f1s = deepcopy(initial_dict_neighborhood)
                cc_neighborhood_ged = deepcopy(initial_dict_neighborhood)
                cc_neighborhood_spectrum = deepcopy(initial_dict_neighborhood)
                cc_neighborhood_spectrum_diff = deepcopy(initial_dict_neighborhood)

                # Lists for original results
                og_balanced_accuracies = []
                og_accuracies = []
                og_recalls = []
                og_precisions = []
                og_f1s = []
                og_ged = []
                og_spectrum = []
                og_spectrum_diff = []

                conductances = []
                edge_removals = []
                all_votes = []
                ground_truth = []

                script_dir = os.path.dirname(__file__)
                rel_path = f'experiments_final{folder_number}/{graph_name}/{per}/{lr*100}'
                Path(rel_path).mkdir(parents=True, exist_ok=True)
                abs_file_path = os.path.join(script_dir, rel_path)
                if folder_no == 0: 
                    best_mu[per][lr] = 0
                ext = str(int(per*100))
                part_file = './data/'+graph_name+'/'+str(int(per*100))+'/'+str(folder_no)+'/'+graph_name+'_'+ext+'_nodes.txt'
                # print(f'Reading subgraph from {part_file}')
                query_nodes=np.loadtxt(part_file)
                # print(query_nodes)
                #print(part_nodes)
                ext = str(int(per*100))+"_"+str(int(lr*100))
                edgefile = './data/'+graph_name+'/'+str(int(per*100))+'/'+str(folder_no)+'/'+graph_name+'_'+ext+'.txt'
                if folder_no == 0:
                    # print('**** Looking for the best m ****')
                    best_mu[per][lr] = find_best_mu(edgefile, query_nodes)
                    best_m_par += best_mu[per][lr]
                    counter_m_par += 1
                else:
                    if use_global_mu:
                        standard_voting_results, neighborhood_results, condac, og_results, ref_spectrum, standard_voting_results_with_cardinality_constraint, neighborhood_results_with_cardinality_constraint, votes, v_gt = run_opt(edgefile,query_nodes, 0.2, standard_voting_thresholds, neighborhood_thresholds, edge_removal)
                        conductances.append(condac)
                        edge_removals.append(edge_removal)
                        all_votes.append(votes)
                        ground_truth.append(v_gt)
                        # res_dict[graph_name][(int(per*100))][condac] = [acc, bal_acc, 0.2]
                        for result in standard_voting_results:
                            threshold = result["threshold"]
                            standard_voting_balanced_accuracies[threshold].append(result["balanced_acc"])   
                            standard_voting_accuracies[threshold].append(result["acc"])
                            standard_voting_recalls[threshold].append(result["recall"])
                            standard_voting_precisions[threshold].append(result["precision"])
                            standard_voting_f1s[threshold].append(result["f1"])
                            # standard_voting_ged[threshold].append(result["graph_edit_distance"])
                            standard_voting_spectrum[threshold].append(result["spectrum"])
                            standard_voting_spectrum_diff[threshold].append(result["spectrum_diff"])
                        for result in standard_voting_results_with_cardinality_constraint:
                            threshold = result["threshold"]
                            cc_standard_voting_balanced_accuracies[threshold].append(result["balanced_acc"])   
                            cc_standard_voting_accuracies[threshold].append(result["acc"])
                            cc_standard_voting_recalls[threshold].append(result["recall"])
                            cc_standard_voting_precisions[threshold].append(result["precision"])
                            cc_standard_voting_f1s[threshold].append(result["f1"])
                            # cc_standard_voting_ged[threshold].append(result["graph_edit_distance"])
                            cc_standard_voting_spectrum[threshold].append(result["spectrum"])
                            cc_standard_voting_spectrum_diff[threshold].append(result["spectrum_diff"])
                        for result in neighborhood_results:
                            threshold = result["threshold"]
                            neighborhood_balanced_accuracies[threshold].append(result["balanced_acc"])   
                            neighborhood_accuracies[threshold].append(result["acc"])
                            neighborhood_recalls[threshold].append(result["recall"])
                            neighborhood_precisions[threshold].append(result["precision"])
                            neighborhood_f1s[threshold].append(result["f1"])
                            # neighborhood_ged[threshold].append(result["graph_edit_distance"])
                            neighborhood_spectrum[threshold].append(result["spectrum"])
                            neighborhood_spectrum_diff[threshold].append(result["spectrum_diff"])
                        for result in neighborhood_results_with_cardinality_constraint:
                            threshold = result["threshold"]
                            cc_neighborhood_balanced_accuracies[threshold].append(result["balanced_acc"])   
                            cc_neighborhood_accuracies[threshold].append(result["acc"])
                            cc_neighborhood_recalls[threshold].append(result["recall"])
                            cc_neighborhood_precisions[threshold].append(result["precision"])
                            cc_neighborhood_f1s[threshold].append(result["f1"])
                            # cc_neighborhood_ged[threshold].append(result["graph_edit_distance"])
                            cc_neighborhood_spectrum[threshold].append(result["spectrum"])
                            cc_neighborhood_spectrum_diff[threshold].append(result["spectrum_diff"])
                        og_balanced_accuracies.append(og_results["balanced_acc"])
                        og_accuracies.append(og_results["acc"])
                        og_precisions.append(og_results["precision"])
                        og_recalls.append(og_results["recall"])
                        og_f1s.append(og_results["f1"])
                        # og_ged.append(og_results["graph_edit_distance"])
                        og_spectrum.append(og_results["spectrum"])
                        og_spectrum_diff.append(og_results["spectrum_diff"])

                    else:
                        standard_voting_results, neighborhood_results, condac, og_results, ref_spectrum, standard_voting_results_with_cardinality_constraint, neighborhood_results_with_cardinality_constraint, votes, v_gt = run_opt(edgefile,query_nodes, best_mu[per][lr], standard_voting_thresholds, neighborhood_thresholds, edge_removal)
                        conductances.append(condac)
                        edge_removals.append(edge_removal)
                        all_votes.append(votes)
                        ground_truth.append(v_gt)
                        # res_dict[graph_name][(int(per*100))][condac] = [acc, bal_acc, 0.2]
                        for result in standard_voting_results:
                            threshold = result["threshold"]
                            standard_voting_balanced_accuracies[threshold].append(result["balanced_acc"])   
                            standard_voting_accuracies[threshold].append(result["acc"])
                            standard_voting_recalls[threshold].append(result["recall"])
                            standard_voting_precisions[threshold].append(result["precision"])
                            standard_voting_f1s[threshold].append(result["f1"])
                            # standard_voting_ged[threshold].append(result["graph_edit_distance"])
                        for result in neighborhood_results:
                            threshold = result["threshold"]
                            neighborhood_balanced_accuracies[threshold].append(result["balanced_acc"])   
                            neighborhood_accuracies[threshold].append(result["acc"])
                            neighborhood_recalls[threshold].append(result["recall"])
                            neighborhood_precisions[threshold].append(result["precision"])
                            neighborhood_f1s[threshold].append(result["f1"])
                            # neighborhood_ged[threshold].append(result["graph_edit_distance"])
                        og_balanced_accuracies.append(og_results["balanced_acc"])
                        og_accuracies.append(og_results["acc"])
                        og_precisions.append(og_results["precision"])
                        og_recalls.append(og_results["recall"])
                        og_f1s.append(og_results["f1"])
                        # og_ged.append(og_results["graph_edit_distance"])

                       # Write results for standard voting 
                rel_path = f'experiments_final{folder_number}/{graph_name}/{per}/{lr*100}'
                Path(rel_path).mkdir(parents=True, exist_ok=True)
                script_dir = os.path.dirname(__file__)
                abs_file_path = os.path.join(script_dir, rel_path)
                
                # Write for original results
                f = open(f'{abs_file_path}/og_spectrum_diff_no_threshold_abs.txt', 'a+')
                f.write(str(og_spectrum_diff))

                f = open(f'{abs_file_path}/og_balanced_accuracy_no_threshold_abs.txt', 'a+')
                f.write(str(og_balanced_accuracies))