# Author: Botao Yu
'''
[anonymous]: 

Compare to enc_remigen_utils, this version
- Support tempo
- Support newer version of miditoolkit

- [2024.2.7] miditoolkit.containers -> miditoolkit
'''
import miditoolkit

from . import const
from . import enc_basic_utils
from .inst_sorting import get_inst_sorting_method
from .note_sorting import get_note_sorting_method


def convert_remigen_token_to_token_str(token):
    return enc_basic_utils.convert_basic_token_to_token_str(token)


def convert_remigen_token_list_to_token_str_list(token_list):
    return enc_basic_utils.convert_basic_token_list_to_token_str_list(token_list)


def convert_remigen_token_lists_to_token_str_lists(token_lists):
    return enc_basic_utils.convert_token_lists_to_token_str_lists(token_lists)


def convert_remigen_token_str_to_token(token_str):
    return enc_basic_utils.convert_basic_token_str_to_token(token_str)


def convert_token_str_list_to_token_list(token_str_list):
    return enc_basic_utils.convert_basic_token_str_list_to_token_list(token_str_list)


def convert_pos_info_to_token_lists(
    pos_info_id,
    remove_empty_bars=False,
    ignore_inst=False,
    ignore_ts=False,
    ignore_tempo=False,
    ignore_velocity=False,
    sort_insts=None,
    sort_notes=None,
):
    # bar, ts, pos, pitch, duration

    encoding = []

    sort_notes = get_note_sorting_method(sort_notes)
    if not ignore_inst:
        sort_insts = get_inst_sorting_method(sort_insts)

    max_pos = len(pos_info_id)
    cur_bar = None
    cur_ts = None
    cur_tempo = None
    for pos in range(max_pos):
        now_bar, now_ts, now_local_pos, now_tempo, now_insts_notes = pos_info_id[pos]
        # bar: every pos
        # ts: only at pos where it changes, otherwise None
        # local_pos: every pos
        # tempo: only at pos where it changes, otherwise None
        # insts_notes: only at pos where the note starts, otherwise None

        cur_local_pos = now_local_pos

        if now_tempo is not None and cur_tempo != now_tempo:
            cur_tempo = now_tempo

        if now_ts is not None and cur_ts != now_ts:
            cur_ts = now_ts

        # When entering a new bar, add a bar line token, 'b-1'
        if cur_bar != now_bar:
            if cur_bar is not None:
                encoding.append((const.BAR_ABBR, 1))  # bar
            cur_bar = now_bar

            # The first token of each bar is time signature.
            if not ignore_ts:
                encoding.append((const.TS_ABBR, cur_ts))  # ts

            # Second token is tempo
            if not ignore_tempo:
                encoding.append((const.TEMPO_ABBR, cur_tempo))  # tempo

        add_pos = False
        if now_insts_notes is not None:
            add_pos = True

        if add_pos:
            encoding.append((const.POS_ABBR, cur_local_pos))  # local pos

        if now_insts_notes is not None:
            cur_insts_notes = now_insts_notes
            insts_ids = list(cur_insts_notes.keys())

            if ignore_inst:
                inst_notes = []
                for inst_id in insts_ids:
                    inst_notes.extend(cur_insts_notes[inst_id])
                inst_notes = sort_notes(inst_notes)
                for pitch, duration, velocity in inst_notes:
                    encoding.append((const.PITCH_ABBR, pitch))  # pitch
                    encoding.append((const.DURATION_ABBR, duration))  # duration
                    if not ignore_velocity:
                        encoding.append((const.VELOCITY_ABBR, velocity))  # velocity
            else:
                insts_ids = sort_insts(insts_ids)
                for inst_id in insts_ids:
                    encoding.append((const.INST_ABBR, inst_id))  # inst
                    inst_notes = sort_notes(cur_insts_notes[inst_id])
                    for pitch, duration, velocity in inst_notes:
                        encoding.append((const.PITCH_ABBR, pitch))  # pitch
                        encoding.append((const.DURATION_ABBR, duration))  # duration
                        if not ignore_velocity:
                            encoding.append((const.VELOCITY_ABBR, velocity))  # velocity

    # Append a bar line token in the end
    encoding.append((const.BAR_ABBR, 1))  # bar

    if remove_empty_bars:
        encoding = do_remove_empty_bars(encoding, ignore_ts=ignore_ts)

    token_lists = [encoding]

    return token_lists


def do_remove_empty_bars(encoding, ignore_ts=False):
    '''
    [anonymous]: this function is untested. Might be buggy.
    '''
    len_encoding = len(encoding)
    valid_start = None
    valid_end = len_encoding
    for idx in range(len_encoding):
        tag_abbr = encoding[idx][0]
        if tag_abbr == (const.TEMPO_ABBR if ignore_ts else const.TS_ABBR):
            valid_start = idx
        elif tag_abbr in (const.INST_ABBR,
                          const.PITCH_ABBR, const.DURATION_ABBR, const.VELOCITY_ABBR):
            break
    for idx in range(len_encoding - 1, -1, -1):
        tag_abbr = encoding[idx][0]
        if tag_abbr in (const.VELOCITY_ABBR, const.DURATION_ABBR, const.PITCH_ABBR,
                        const.INST_ABBR):
            break
        elif tag_abbr == const.BAR_ABBR:
            valid_end = idx + 1

    assert valid_start is not None
    assert valid_start < valid_end

    encoding = encoding[valid_start: valid_end]

    return encoding


def fix_token_list(token_list):
    token_list = token_list[:]
    return token_list


def generate_midi_obj_from_remigen_token_list(
    token_list,
    vocab_manager,
    ignore_velocity=True,
    ticks_per_beat=const.DEFAULT_TICKS_PER_BEAT,
    ts=const.DEFAULT_TS,
    tempo=const.DEFAULT_TEMPO,
    inst_id=const.DEFAULT_INST_ID,
    velocity=const.DEFAULT_VELOCITY,
):  # Todo: 增加TS
    # Bar, Pos, Pitch, Duration

    beat_note_factor = vocab_manager.beat_note_factor
    pos_resolution = vocab_manager.pos_resolution

    cur_bar_id = 0
    cur_ts_id = None
    cur_local_pos = None
    cur_ts_pos_per_bar = beat_note_factor * pos_resolution * ts[0] // ts[1]
    cur_global_bar_pos = 0
    cur_global_pos = 0

    cur_pitch = None
    cur_duration = None
    cur_velocity = velocity
    cur_tempo_id = None

    max_tick = 0

    midi_obj = miditoolkit.midi.parser.MidiFile(ticks_per_beat=ticks_per_beat)
    midi_obj.instruments = [
        # miditoolkit.containers.Instrument(program=(0 if i == 128 else i), is_drum=(i == 128), name=str(i))
        miditoolkit.Instrument(program=(0 if i == 128 else i), is_drum=(i == 128), name=str(i))
        for i in range(128 + 1)
    ]

    cur_inst = midi_obj.instruments[inst_id]

    last_item_type = None
    for item in token_list:  # Todo: 对错误的结果顺序做处理
        try:
            item_type, item_value = item
        except ValueError:
            print(item)
            raise
        if item_type == const.BAR_ABBR:
            cur_bar_id += 1
            cur_local_pos = None
            cur_global_bar_pos += cur_ts_pos_per_bar
            cur_global_pos = cur_global_bar_pos
        elif item_type == const.TS_ABBR:
            if cur_ts_id != item_value:
                cur_ts_id = item_value
                cur_ts = vocab_manager.convert_id_to_ts(cur_ts_id)
                cur_ts_pos_per_bar = beat_note_factor * pos_resolution * cur_ts[0] // cur_ts[1]
                midi_obj.time_signature_changes.append(
                    miditoolkit.TimeSignature(numerator=cur_ts[0], denominator=cur_ts[1],
                                                         time=vocab_manager.pos_to_time(cur_global_bar_pos,
                                                                                        ticks_per_beat,
                                                                                        pos_resolution=pos_resolution))
                )
        elif item_type == const.POS_ABBR:
            if cur_local_pos != item_value:
                cur_local_pos = item_value
                cur_global_pos = cur_global_bar_pos + cur_local_pos
        elif item_type == const.TEMPO_ABBR:
            if cur_tempo_id != item_value:
                cur_tempo_id = item_value
                cur_tempo = vocab_manager.convert_id_to_tempo(cur_tempo_id)
                midi_obj.tempo_changes.append(
                    miditoolkit.TempoChange(cur_tempo,
                                                       time=vocab_manager.pos_to_time(cur_global_pos,
                                                                                      ticks_per_beat,
                                                                                      pos_resolution=pos_resolution))
                )
        elif item_type == const.INST_ABBR:
            cur_inst = midi_obj.instruments[item_value]
        elif item_type == const.PITCH_ABBR:
            cur_pitch = vocab_manager.convert_id_to_pitch(item_value)
        elif item_type == const.DURATION_ABBR:
            if last_item_type != const.PITCH_ABBR:
                print('Warning: duration token without pitch token')
            # assert last_item_type == const.PITCH_ABBR, 'last item should be {} but is {}'.format(const.PITCH_ABBR, last_item_type)
            cur_duration = vocab_manager.convert_id_to_dur(item_value)

            if ignore_velocity:
                start_pos = cur_global_pos
                end_pos = start_pos + cur_duration
                start_time = vocab_manager.pos_to_time(start_pos, ticks_per_beat, pos_resolution=pos_resolution)
                end_time = vocab_manager.pos_to_time(end_pos, ticks_per_beat, pos_resolution=pos_resolution)
                max_tick = max(end_time, max_tick)
                cur_inst.notes.append(
                    miditoolkit.Note(start=start_time, end=end_time, pitch=cur_pitch, velocity=cur_velocity)
                )
        elif item_type == const.VELOCITY_ABBR:
            if ignore_velocity:
                print('There are velocity token but setting ignor_velocity=True')
                # raise ValueError(
                #     "Invalid token for velocity (%s) while setting ignore_velocity=True" % ('%s-%s' % item)
                # )

            assert last_item_type == const.DURATION_ABBR
            cur_velocity = vocab_manager.convert_id_to_vel(item_value)

            start_pos = cur_global_pos
            end_pos = start_pos + cur_duration
            start_time = vocab_manager.pos_to_time(start_pos, ticks_per_beat, pos_resolution=pos_resolution)
            end_time = vocab_manager.pos_to_time(end_pos, ticks_per_beat, pos_resolution=pos_resolution)
            max_tick = max(end_time, max_tick)
            cur_inst.notes.append(
                miditoolkit.Note(start=start_time, end=end_time, pitch=cur_pitch, velocity=cur_velocity)
            )
        else:
            raise ValueError("Unknown encoding type: %s" % item_type)
        last_item_type = item_type

    if len(midi_obj.tempo_changes) == 0:
        midi_obj.tempo_changes.append(
            miditoolkit.TempoChange(
                tempo,
                time=0
            )
        )

    # If there is no time signature change, add the default one
    if len(midi_obj.time_signature_changes) == 0:
        midi_obj.time_signature_changes.append(
            miditoolkit.TimeSignature(
                ts[0], ts[1], time=0
            )
        )

    midi_obj.max_tick = max_tick

    midi_obj.instruments = [i for i in midi_obj.instruments if len(i.notes) > 0]

    return midi_obj
