import pandas as pd
import numpy as np

def read_connection_matrix(filename):
    """
    Reads the connection matrix from a CSV file and returns it as a DataFrame.
    """
    return pd.read_csv(filename, index_col=0)

def get_edges_from_path(traversal_path):
    """Extracts the directed edges from a given traversal path."""
    return [(traversal_path[i], traversal_path[i + 1]) for i in range(len(traversal_path) - 1)]

def check_if_path_covers_all_edges_exactly_once(matrix, traversal_path):
    """Checks if the given traversal path covers all directed edges in the connection matrix exactly once."""
    # Extract all edges from the traversal path
    path_edges = get_edges_from_path(traversal_path)

    # Extract all edges from the connection matrix
    graph_edges = set()
    for i in matrix.index:
        for j in matrix.columns:
            if matrix.loc[i, j] == 1:
                graph_edges.add((i, j))

    # Check if all graph edges are covered by path edges exactly once
    if len(path_edges) != len(graph_edges):
        return False

    path_edges_count = {edge: path_edges.count(edge) for edge in path_edges}
    if any(count > 1 for count in path_edges_count.values()):
        return False

    return set(path_edges) == graph_edges
  
def dfs_traversal(matrix, start_node='VSS'):
    """
    Performs a DFS traversal on the connection matrix starting from the specified node 
    and returns the traversal path as an array of nodes.
    """
    visited_edges = set()
    traversal_path = []

    def dfs(node):
        traversal_path.append(node)
        for neighbor in matrix.columns:
            if matrix.at[node, neighbor] == 1 and (node, neighbor) not in visited_edges:
                visited_edges.add((node, neighbor))
                visited_edges.add((neighbor, node))  # Since the graph is undirected
                dfs(neighbor)
                traversal_path.append(node)  # Record the path back
    
    # Start DFS from the specified start node
    if start_node in matrix.index:
        dfs(start_node)
    
    # Generate a set of all edges in the graph
    all_edges = set()
    for node in matrix.index:
        for neighbor in matrix.columns:
            if matrix.at[node, neighbor] == 1:
                all_edges.add((node, neighbor))
                all_edges.add((neighbor, node))  # Since the graph is undirected
    
    return traversal_path, check_if_path_covers_all_edges_exactly_once(matrix, traversal_path)

def dfs_traversal_after(matrix, start_node='VSS', visited_edges = {}, traversal_path = []):
    """
    Performs a DFS traversal on the connection matrix starting from the specified node 
    and returns the traversal path as an array of nodes.
    """
    def dfs(node):
        traversal_path.append(node)
        for neighbor in matrix.columns:
            if matrix.at[node, neighbor] == 1 and (node, neighbor) not in visited_edges:
                visited_edges.add((node, neighbor))
                visited_edges.add((neighbor, node))  # Since the graph is undirected
                dfs(neighbor)
                traversal_path.append(node)  # Record the path back
    
    # Start DFS from the specified start node
    if start_node in matrix.index:
        dfs(start_node)

    return traversal_path

def dfs_all_continue(matrix, all_paths, unique_paths, max_solutions=2000):

    if len(all_paths)>max_solutions-1:
        stop = True
    else:
        stop = False
    for path_first in (all_paths):
        if stop == True:
            break
        visited_edges = set()
        for i in range(len(path_first)-1):
            if stop == True:
                break
            visited_edges.add((path_first[i], path_first[i+1]))
            visited_edges.add((path_first[i+1], path_first[i]))
            for neighbor in matrix.columns:
                if matrix.at[path_first[i], neighbor] == 1 and (path_first[i], neighbor) not in visited_edges:
                    visited_edges.add((path_first[i], neighbor))
                    visited_edges.add((neighbor, path_first[i]))
                    new_visited_edges = set()
                    if i!=0:
                        for z in range (i):
                            new_visited_edges.add((path_first[z], path_first[z+1]))
                            new_visited_edges.add((path_first[z+1], path_first[z]))
                    new_visited_edges.add((path_first[i], neighbor))
                    new_visited_edges.add((neighbor, path_first[i]))

                    newpath = []
                    for z in range (i+1):
                        newpath.append(path_first[z])
                    newnewpath = newpath.copy()
                    path = dfs_traversal_after(matrix,neighbor,new_visited_edges,newpath)
                    path.extend(newnewpath[::-1])
                    path_tuple = tuple(path)
                    if check_if_path_covers_all_edges_exactly_once(matrix, path):
                        if path_tuple not in unique_paths:
                            unique_paths.add(path_tuple)
                            all_paths.append(path.copy())
                if len(all_paths)>max_solutions-1:
                    stop = True
                    break
    return all_paths, unique_paths

def dfs_all_paths(matrix, start_node='VSS', max_solutions=2000, run_num = 4):
    """
    Performs a DFS traversal on the connection matrix starting from the specified node 
    and returns up to max_solutions complete traversal paths as a list of arrays of nodes.
    """

    all_paths = []
    unique_paths = set()

    path_first, result = dfs_traversal(matrix, start_node)

    if result == False:
        print('error')
        return None
    path_tuple = tuple(path_first)
    if path_tuple not in unique_paths:
        unique_paths.add(path_tuple)
        all_paths.append(path_first.copy())

    for run in range (run_num):
        all_paths, unique_paths = dfs_all_continue(matrix,all_paths,unique_paths,max_solutions)


    # stop = False
    # visited_edges = set()
    # for i in range(len(path_first)-1):
    #     if stop == True:
    #         break
    #     visited_edges.add((path_first[i], path_first[i+1]))
    #     visited_edges.add((path_first[i+1], path_first[i]))
    #     for neighbor in matrix.columns:
    #         if matrix.at[path_first[i], neighbor] == 1 and (path_first[i], neighbor) not in visited_edges:
    #             visited_edges.add((path_first[i], neighbor))
    #             visited_edges.add((neighbor, path_first[i]))
    #             new_visited_edges = set()
    #             if i!=0:
    #                 for z in range (i):
    #                     new_visited_edges.add((path_first[z], path_first[z+1]))
    #                     new_visited_edges.add((path_first[z+1], path_first[z]))
    #             new_visited_edges.add((path_first[i], neighbor))
    #             new_visited_edges.add((neighbor, path_first[i]))

    #             newpath = []
    #             for z in range (i+1):
    #                 newpath.append(path_first[z])
    #             newnewpath = newpath.copy()
    #             path = dfs_traversal_after(matrix,neighbor,new_visited_edges,newpath)
    #             path.extend(newnewpath[::-1])
    #             path_tuple = tuple(path)
    #             if check_if_path_covers_all_edges_exactly_once(matrix, path):
    #                 if path_tuple not in unique_paths:
    #                     unique_paths.add(path_tuple)
    #                     all_paths.append(path.copy())
    #         if len(all_paths)>max_solutions-1:
    #             stop = True
    #             break

    # if len(all_paths)>max_solutions-1:
    #     stop = True
    # else:
    #     stop = False
    # for path_first in (all_paths):
    #     if stop == True:
    #         break
    #     visited_edges = set()
    #     for i in range(len(path_first)-1):
    #         if stop == True:
    #             break
    #         visited_edges.add((path_first[i], path_first[i+1]))
    #         visited_edges.add((path_first[i+1], path_first[i]))
    #         for neighbor in matrix.columns:
    #             if matrix.at[path_first[i], neighbor] == 1 and (path_first[i], neighbor) not in visited_edges:
    #                 visited_edges.add((path_first[i], neighbor))
    #                 visited_edges.add((neighbor, path_first[i]))
    #                 new_visited_edges = set()
    #                 if i!=0:
    #                     for z in range (i):
    #                         new_visited_edges.add((path_first[z], path_first[z+1]))
    #                         new_visited_edges.add((path_first[z+1], path_first[z]))
    #                 new_visited_edges.add((path_first[i], neighbor))
    #                 new_visited_edges.add((neighbor, path_first[i]))

    #                 newpath = []
    #                 for z in range (i+1):
    #                     newpath.append(path_first[z])
    #                 newnewpath = newpath.copy()
    #                 path = dfs_traversal_after(matrix,neighbor,new_visited_edges,newpath)
    #                 path.extend(newnewpath[::-1])
    #                 path_tuple = tuple(path)
    #                 if check_if_path_covers_all_edges_exactly_once(matrix, path):
    #                     if path_tuple not in unique_paths:
    #                         unique_paths.add(path_tuple)
    #                         all_paths.append(path.copy())
    #             if len(all_paths)>max_solutions-1:
    #                 stop = True
    #                 break
    
    return all_paths


start = 556
end = 567

for i in range (start, end):
    # print('DATA:', i)
    number = str(i)
    # Define the file name of the connection matrix
    connect_dir = number + '/Graph' + number + '.csv'

    # Read the connection matrix
    connection_matrix = read_connection_matrix(connect_dir)

    # Perform DFS traversal starting from VDD, finding up to 20 unique solutions
    all_traversal_paths = dfs_all_paths(connection_matrix, start_node='VSS', max_solutions =100)

    # Check if all paths cover all edges exactly once
    if all(check_if_path_covers_all_edges_exactly_once(connection_matrix, path) for path in all_traversal_paths) == False:
        print('DATA', i, "'s paths do not cover edges exactly once")
        break
    # all_cover_edges_exactly_once = all(check_if_path_covers_all_edges_exactly_once(connection_matrix, path) for path in all_traversal_paths)
    # print("Do all paths cover edges exactly once?", all_cover_edges_exactly_once)

    padded_paths = [path + ['TRUNCATE'] * (1025 - len(path)) for path in all_traversal_paths if len(path) <= 1025]

    # Output the number of complete paths
    print('DATA:', i, "Number of complete paths:", len(padded_paths))

    # Check if all paths are unique
    if len(padded_paths) != len(set(tuple(path) for path in padded_paths)):
        print('DATA', i, "'s paths are not unique")
        break
    # are_all_paths_unique = len(padded_paths) == len(set(tuple(path) for path in padded_paths))
    # print("Are all paths unique?", are_all_paths_unique)

    # Output all traversal paths
    # for i, path in enumerate(all_traversal_paths):
    #     print(len(path))
    #     print(f"Traversal Path {i+1}:")
    #     print(path)
    
    save_dir = number + '/Sequence_total' + number + '.npy'
    # Save the NumPy array to a file
    np.save(save_dir, padded_paths)

    # # Load the array from the file to verify
    # loaded_traversal_result = np.load(save_dir)
    # print("Loaded Traversal Path:")
    # print(loaded_traversal_result)