#include <vector>

#ifdef TIME
    #include <time.hxx>
#endif


namespace preordering 
{

template<class ARC_COSTS, class ADJACENCY>
typename ARC_COSTS::VALUE_TYPE greedy_moving(
    const ARC_COSTS& arc_costs, ADJACENCY& adjacency
){
    typedef typename ARC_COSTS::VALUE_TYPE COST_TYPE;
    size_t n = arc_costs.size();

    assert (adjacency.size() == n);

    enum class MoveType
    {
        UP,
        DOWN,
        NONE,
        OTHER_CLUSTER,
        INSERT_ARC,
        REMOVE_ARC
    };

    struct BestMove
    {
        size_t i;  // node to move
        COST_TYPE cost; // cost of the move
        MoveType move_type;  // type of the move
        size_t target = 0;  // a representative node of the cluster where i is moved (if move_type == OTHER_CLUSTER)
    };

    COST_TYPE objective = 0;
    for (size_t i = 0; i < n; ++i)
    for (size_t j = 0; j < n; ++j)
    {
        if (adjacency(i, j))
            objective += arc_costs(i, j);
    }

    #ifdef TIME
        double t_update = 0;
        double t_move = 0;
        double t_insert = 0;
        double t_remove = 0;
        Clock clock;
    #endif

    while (true)
    {
        #ifdef TIME
            clock.reset();
        #endif
        BestMove best_move = {0, 0, MoveType::NONE};
        std::vector<COST_TYPE> isolate(n, 0);  // cost of isolating a node from a preorder (i.e. remove all incoming and outgoing arcs)
        for (size_t i = 0; i < n; ++i)
        {
            // move i above or below its own cluster
            COST_TYPE move_up_cost = 0;
            COST_TYPE move_down_cost = 0;
            bool is_singleton = true;
            for (size_t j = 0; j < n; ++j)
            {
                if (i == j) continue;
                if (adjacency(i, j) == 1)
                    isolate[i] += arc_costs(i, j);
                if (adjacency(j, i) == 1)
                    isolate[i] += arc_costs(j, i);
                if ((adjacency(i, j) == 1) && ( adjacency(j, i) == 1))
                {
                    is_singleton = false;
                    move_up_cost -= arc_costs(i, j);
                    move_down_cost -= arc_costs(j, i);
                }
            }
            if (is_singleton)
                continue;
            if (move_up_cost > best_move.cost)
                best_move = {i, move_up_cost, MoveType::UP};
            if (move_down_cost > best_move.cost)
                best_move = {i, move_down_cost, MoveType::DOWN};
        }

        ARC_COSTS move(n, 0);  // move(i, j) is the cost for moving i into the cluster of j
        for (size_t j = 0; j < n; ++j)
        {
            for (size_t k = 0; k < n; ++k)
            {
                if (adjacency(j, k))
                {
                    for (size_t i = 0; i < n; ++i)
                        if (i != k)
                            move(i, j) += arc_costs(i, k);
                }
                if (adjacency(k, j))
                {
                    for (size_t i = 0; i < n; ++i)
                        if (i != k)
                            move(i, j) += arc_costs(k, i);
                }
            }
        }
        for (size_t i = 0; i < n; ++i)
        for (size_t j = 0; j < n; ++j)
        {
            COST_TYPE move_ij = move(i, j) - isolate[i];
            if (adjacency(i, j) && adjacency(j, i))
                continue;
            if (move_ij > best_move.cost)
            {
                best_move = {i, move_ij, MoveType::OTHER_CLUSTER, j};
            }
        }
        #ifdef TIME
            t_move += clock.elapsed();
            clock.reset();
        #endif

        // compute clustering
        std::vector<std::vector<size_t>> clusters(n);
        std::vector<bool> visited(n, false);
        for (size_t i = 0; i < n; ++i)
        {
            if (visited[i])
                continue;
            for (size_t j = i; j < n; ++j)
            {
                if (adjacency(i, j) && adjacency(j, i))
                {
                    clusters[i].push_back(j);
                    visited[j] = true;
                }
            }
        }

        // remove arc from i to j
        for (size_t i = 0; i < n; ++i)
        {
            if (clusters[i].empty())
                continue;
            for (size_t j = 0; j < n; ++j)
            {
                if (clusters[j].empty())
                    continue;
                if (!adjacency(i, j) || adjacency(j, i))
                    continue;
                // test if i->j is in transitive reduction
                bool is_implied = false;
                for (size_t k = 0; k < n; ++k)
                {
                    if (clusters[k].empty())
                        continue;
                    if (k == i || k == j)
                        continue;
                    if ((adjacency(i, k) == 1) && (adjacency(k, j) == 1) && !adjacency(k, i) && !adjacency(j, k))
                    {
                        is_implied = true;
                        break;
                    }
                }
                if (is_implied)
                    continue;
                COST_TYPE remove_cost = 0;
                for (size_t cluster_i : clusters[i])
                {
                    for (size_t cluster_j : clusters[j])
                    {
                        remove_cost -= arc_costs(cluster_i, cluster_j);
                    }   
                }
                if (remove_cost > best_move.cost)
                {                    
                    best_move = {i, remove_cost, MoveType::REMOVE_ARC, j};
                }
            }
        }

        #ifdef TIME
            t_remove += clock.elapsed();
            clock.reset();
        #endif
        
        ARC_COSTS outgoing(n, 0);  // outgoing(i, j) is the sum of the costs of all arcs from i to successors of j
        for (size_t j = 0; j < n; ++j)
        {
            for (size_t k = 0; k < n; ++k)
            {
                if (!adjacency(j, k))
                    continue;
                for (size_t i = 0; i < n; ++i)
                {
                    if (adjacency(i, k))
                        continue;
                    outgoing(i, j) += arc_costs(i, k);
                }
            }
        }

        // with this, the change in objective value for setting i->j to 1 is computed as
        // the sum of all outgoing(k, j) for all predecessors k of i
        ARC_COSTS insert_gain(n, 0);
        for (size_t k = 0; k < n; ++k)
        {
            for (size_t i = 0; i < n; ++i)
            {
                if (!adjacency(k, i))
                    continue;
                for (size_t j = 0; j < n; ++j)
                {
                    insert_gain(i, j) += outgoing(k, j);
                }
            }
        }

        for (size_t j = 0; j < n; ++j)
        for (size_t i = 0; i < n; ++i)
        {
            if (insert_gain(i, j) >= best_move.cost && !adjacency(i, j))  // explicitly allow arc insertions with gain 0
                best_move = {i, insert_gain(i, j), MoveType::INSERT_ARC, j};
        }

        #ifdef TIME
            t_insert += clock.elapsed();
            clock.reset();
        #endif
                
        
        if (best_move.move_type == MoveType::NONE)
            break;

        size_t i = best_move.i;
        objective += best_move.cost;

        if (best_move.move_type == MoveType::UP)  // move i above its current cluster
        {
            #ifdef VERBOSE
                std::cout << "Moving node " << i << " above its current cluster with cost " << best_move.cost << "\n";
            #endif
            for (size_t k = 0; k < n; ++k)
            {
                if (k == i)
                    continue;
                if ((adjacency(i, k) == 1) && (adjacency(k, i) == 1))
                {
                    adjacency(i, k) = 0;
                }
            }
        }
        else if (best_move.move_type == MoveType::DOWN)  // move i below its current cluster
        {
            #ifdef VERBOSE
                std::cout << "Moving node " << i << " below its current cluster with cost " << best_move.cost << "\n";
            #endif
            for (size_t k = 0; k < n; ++k)
            {
                if (k == i)
                    continue;
                if ((adjacency(i, k) == 1) && (adjacency(k, i) == 1))
                {
                    adjacency(k, i) = 0;
                }
            }
        }
        else if (best_move.move_type == MoveType::INSERT_ARC)  // insert arc from i to j
        {
            #ifdef VERBOSE
                std::cout << "Inserting arc from node " << i << " to node " << best_move.target << " with cost " << best_move.cost << "\n";
            #endif
            size_t j = best_move.target;
            for (size_t pred_i = 0; pred_i < n; ++pred_i)
            {
                if (adjacency(pred_i, i) == 0)
                    continue;
                for (size_t succ_j = 0; succ_j < n; ++succ_j)
                {
                    if (adjacency(j, succ_j) == 0)
                        continue;
                    adjacency(pred_i, succ_j) = 1;
                }
            }
        }
        else if (best_move.move_type == MoveType::REMOVE_ARC)  // remove arc from i to j
        {
            #ifdef VERBOSE
                std::cout << "Removing arc from node " << i << " to node " << best_move.target << " with cost " << best_move.cost << "\n";
            #endif
            size_t j = best_move.target;
            for (size_t cluster_i = 0; cluster_i < n; ++cluster_i)
            {
                if ((adjacency(cluster_i, i) == 0) || (adjacency(i, cluster_i) == 0))
                    continue;
                for (size_t cluster_j = 0; cluster_j < n; ++cluster_j)
                {
                    if ((adjacency(cluster_j, j) == 0) || (adjacency(j, cluster_j) == 0))
                        continue;
                    adjacency(cluster_i, cluster_j) = 0;
                }
            }
        }
        else if (best_move.move_type == MoveType::OTHER_CLUSTER)  // move i to the cluster of j
        {
            #ifdef VERBOSE
                std::cout << "Moving node " << i << " to cluster of node " << best_move.target << " with cost " << best_move.cost << "\n";
            #endif
            size_t j = best_move.target;
            // move i to the cluster of j
            for (size_t k = 0; k < n; ++k)
            {
                if (k == i)
                    continue;
                adjacency(i, k) = adjacency(j, k);
                adjacency(k, i) = adjacency(k, j);
            }
        }

        #ifdef TIME
            t_update += clock.elapsed();
            clock.reset();
        #endif
    }

    #ifdef TIME
        std::cout << "t_move = " << t_move << "\n";
        std::cout << "t_remove = " << t_remove << "\n";
        std::cout << "t_insert = " << t_insert << "\n";
        std::cout << "t_update = " << t_update << "\n";
    #endif


    return objective;
}

} // namespace preordering