midi2pianoroll.py

"""Utility functions for conversion between midi and pianoroll"""

import numpy as np
import pretty_midi
import chord_extraction_test_with_bass
# import music21

key_dict = {'Cmajor': 0, 'C#major': 1, 'D-major': 1, 'Dmajor': 2, 'D#major': 3,
            'E-major': 3, 'Emajor': 4, 'Fmajor': 5, 'F#major': 6,
            'G-major': 6, 'Gmajor': 7, 'G#major': 8,
            'A-major': 8, 'Amajor': 9, 'A#major': 10, 'B-major': 10, 'Bmajor': 11
            }

def merge_dicts(*dict_args):
    """Given any number of dicts, shallow copy and merge into a new dict,
    precedence goes to key value pairs in latter dicts."""
    result = {}
    for dictionary in dict_args:
        result.update(dictionary)
    return result

def get_key_info(pm):
    if len(pm.key_signature_changes) > 0:
        print(pm.key_signature_changes)
        key = pm.key_signature_changes[0].key_number  # ignore key changes
        if key > 11:
            print('Minor key')
        return key

    else:
        print('does not have any key_signature_change')
        return -1

def get_time_signature_info_and_arrays(pm):
    """Given a pretty_midi.PrettyMIDI class instance, return its time signature
    info dictionary and time signature array dictionary."""
    # sort time signature changes by time
    pm.time_signature_changes.sort(key=lambda x: x.time)
    # create a list of time signature changes content and another for the event times
    time_signature_times = [tsc.time for tsc in pm.time_signature_changes]
    time_signature_numerators = [tsc.numerator for tsc in pm.time_signature_changes]
    time_signature_denominators = [tsc.denominator for tsc in pm.time_signature_changes]
    # set time signature if only one time signature change event found
    if len(time_signature_times) == 1:
        time_signature = str(time_signature_numerators[0]) + '/' + str(time_signature_denominators[0])
    else:
        time_signature = None
    # collect variables into dictionaries to return
    time_signature_info = {'num_time_signature_changes': len(time_signature_times),
                           'time_signature': time_signature}
    time_signature_arrays = {'time_signature_numerators': np.array(time_signature_numerators),
                             'time_signature_denominators': np.array(time_signature_denominators),
                             'time_signature_times': np.array(time_signature_times)}
    return time_signature_info, time_signature_arrays

def get_beat_info_and_arrays(pm, beat_resolution=4, sort_tsc=True):
    """Given a pretty_midi.PrettyMIDI class instance, return its beat info
    dictionary and beat array dictionary. If sort_tsc is True(by default), the
    time_signatrue_changes list of the pretty_midi object will first be sorted.
    """
    # sort time signature changes by time
    if sort_tsc:
        pm.time_signature_changes.sort(key=lambda x: x.time)
    # use built-in method in pretty_midi to get beat_start_time, beats and downbeats
    beat_start_time = pm.time_signature_changes[0].time if pm.time_signature_changes else 0.0
    beat_times = pm.get_beats(beat_start_time)
    downbeat_times = pm.get_downbeats(beat_start_time)
    # calculate beats information
    num_beats = len(beat_times)
    incomplete_at_start = bool(downbeat_times[0] > beat_times[0])
    num_bars = len(downbeat_times) + int(incomplete_at_start)
    # create an empty beat array and an empty downbeat array
    beat_array = np.zeros(shape=(beat_resolution*num_beats, 1), dtype=bool)
    downbeat_array = np.zeros(shape=(beat_resolution*num_beats, 1), dtype=bool)
    # fill in the beats array and the downbeats array
    beat_array[0:-1:beat_resolution] = True
    for _, downbeat_time in enumerate(downbeat_times):
        idx_to_fill = np.searchsorted(beat_times, downbeat_time, side='right')
        downbeat_array[idx_to_fill] = True
    # collect variables into dictionaries to return
    beat_info = {'beat_start_time': beat_start_time,
                 'num_beats': num_beats,
                 'num_bars': num_bars,
                 'incomplete_at_start': incomplete_at_start}
    beat_arrays = {'beat_times': beat_times,
                   'downbeat_times': downbeat_times,
                   'beat_array': beat_array,
                   'downbeat_array': downbeat_array}
    return beat_info, beat_arrays

def get_tempo_info_and_arrays(pm, beat_resolution=4, beat_times=None):
    """Given a pretty_midi.PrettyMIDI class instance, return its tempo info
    dictionary and tempo info array dictionary. If no beat_times is given,
    pm.get_beats(beat_start_time) will be first computed to get beat_times."""
    # compute beat_times when it is not given
    if beat_times is None:
        beat_start_time = pm.time_signature_changes[0].time if pm.time_signature_changes else 0.0
        beat_times = pm.get_beats(beat_start_time)
    # create an empty tempo_array
    tempo_array = np.zeros(shape=(beat_resolution*len(beat_times), 1), dtype=float)
    # use built-in method in pretty_midi to get tempo change events
    tempo_change_times, tempi = pm.get_tempo_changes()
    # print 'tempo:', tempo_change_times, tempi, tempo_array.size
    if not tempo_change_times.size:
        # set to default tempo value when no tempo change events
        return None, None
    else:
        # deal with the first tempo change event
        tempo_end_beat = (np.searchsorted(beat_times, tempo_change_times[0], side='right')) * beat_resolution
        tempo_array[0:tempo_end_beat] = tempi[0]
        tempo_start_beat = tempo_end_beat
        # deal with the rest tempo change event
        tempo_id = 0
        while tempo_id+1 < len(tempo_change_times):
            tempo_end_beat = (np.searchsorted(beat_times, tempo_change_times[tempo_id+1], side='right')) * beat_resolution
            tempo_array[tempo_start_beat:tempo_end_beat] = tempi[tempo_id]
            tempo_start_beat = tempo_end_beat
            tempo_id += 1
        # deal with the rest beatscd
        tempo_array[tempo_start_beat:] = tempi[tempo_id]
    # collect variables into dictionaries to return
    tempo_info = {'tempo': tempi[0] if len(tempo_change_times) == 1 else None}
    tempo_arrays = {'tempo_change_times': tempo_change_times,
                    'tempi': tempi,
                    'tempo_array': tempo_array}
    # for i, tempo in enumerate(tempo_array):
    #     print i, tempo
    # print 'tempo size:', tempo_array.size
    return tempo_info, tempo_arrays

def get_midi_info_and_arrays(pm, beat_resolution=4):
    """Given a pretty_midi.PrettyMIDI class instance, return its midi_info_dict
    and midi_array_dict."""
    # get time sigature changes info
    time_signature_info, time_signature_arrays = get_time_signature_info_and_arrays(pm)
    # get beat info dictionary and beats array dictionary
    beat_info, beat_arrays = get_beat_info_and_arrays(pm, beat_resolution=beat_resolution, sort_tsc=False)
    # get tempo info dictionary and tempo array dictionary
    tempo_info, tempo_arrays = get_tempo_info_and_arrays(pm, beat_resolution=beat_resolution,
                                                         beat_times=beat_arrays['beat_times'])
    if tempo_info is None:
        return None, None
    # collect the results into dictionaries to return
    midi_info = merge_dicts(beat_info, time_signature_info, tempo_info)
    midi_arrays = merge_dicts(beat_arrays, time_signature_arrays, tempo_arrays)

    return midi_info, midi_arrays

def get_piano_roll(instrument, beat_resolution=4, beat_times=None, tempo_array=None, pm=None):
    # print '-------------------------------'
    # print 'instrument name:', instrument.name
    """Given a pretty_midi.Instrument class instance, return the pianoroll of
    the instrument. When one of the beat_times and the tempo_array is not given,
    the pretty_midi object should be given."""
    if beat_times is None:
        beat_start_time = pm.time_signature_changes[0].time if pm.time_signature_changes else 0.0
        beat_times = pm.get_beats(beat_start_time)
    if tempo_array is None:
        _, tempo_array = get_tempo_info_and_arrays(pm, beat_times)
    num_beats = len(beat_times)
    # create the piano roll and the onset roll
    piano_roll = np.zeros(shape=(beat_resolution*num_beats, 128), dtype=int)
    onset_roll = np.zeros(shape=(beat_resolution*num_beats, 128), dtype=bool)
    # print beat_times
    # print tempo_array
    # calculate pixel per beat
    ppbeat = beat_resolution
    hppbeat = beat_resolution/2
    # iterate through notes
    for note in instrument.notes:
        if note.end < beat_times[0]:
            continue
        else:
            # print '----------------------------'
            # print 'note start:', note.start, note.pitch
            # find the corresponding index of the note on event
            if note.start >= beat_times[0]:
                start_beat = np.searchsorted(beat_times, note.start, side='right') - 1
                start_loc = (note.start - beat_times[start_beat])
                # print 'start loc1', start_loc
                # print 'tempo array', tempo_array[int(start_beat*ppbeat)]
                start_loc = (tempo_array[int(start_beat*ppbeat)] / 60.0) * start_loc
            else:
                start_beat = 0
                start_loc = [0.0]
            # print 'start beat:', start_beat
            # print 'start loc:', start_loc, start_loc * ppbeat
            # if np.isclose(start_loc, [1], rtol=1e-03):
            #     start_loc = [1]
            start_idx = int(start_beat*ppbeat) + int(round(start_loc*ppbeat))
            # print 'start idx:', start_idx
            # find the corresponding index of the note off event
            if instrument.is_drum:
                # set note length to minimal (32th notes) for drums
                end_idx = start_idx + 1
            else:
                end_beat = np.searchsorted(beat_times, note.end, side='right') - 1
                end_loc = (note.end - beat_times[end_beat])
                end_loc = end_loc * tempo_array[int(end_beat*ppbeat)] / 60.0
                # print 'end loc:', end_loc
                end_idx = int(end_beat*ppbeat) + int(round(end_loc*ppbeat))
                # make sure the note length is larger than minimum note length
                if end_idx - start_idx < 1:
                    end_idx = start_idx + 1

            # print 'end idx:', end_idx
            # set values to the piano-roll and the onset-roll matrix
            piano_roll[start_idx:(end_idx), note.pitch] = note.velocity
            if start_idx < onset_roll.shape[0]:
                onset_roll[start_idx, note.pitch] = True
    return piano_roll, onset_roll

def get_instrument_info(instrument):
    """Given a pretty_midi.Instrument class instance, return the infomation
    dictionary of the instrument."""
    return {'program_num': instrument.program,
            'program_name': pretty_midi.program_to_instrument_name(instrument.program),
            'name': instrument.name.strip(),
            'is_drum': instrument.is_drum,
            'family_num': int(instrument.program)//8,
            'family_name': pretty_midi.program_to_instrument_class(instrument.program)}

def get_piano_rolls_with_estimated_key(pm, beat_resolution=4):
    """
    Convert a midi file to piano-rolls of multiple tracks.

    Parameters
    ----------
    midi_path : str
        The path to the midi file.

    Returns
    -------
    piano_rolls : np.ndarray of int
        The extracted piano-rolls. The value represents the velocity. The first
        dimension is the id of the instrument. The size is (num_instrument,
        num_time_step, num_pitches).
    onset_rolls : np.ndarray of bool
        The extracted onset-rolls. The value indicates the occurence of onset
        events. The first dimension is the id of the instrument. The size is
        (num_instrument, num_time_step, num_pitches).
    info_dict : dict
        A dictionary containing extracted useful information lost during the
        conversion of the midi file.
            midi_arrays : dict
                A dictionary containing informative arrays.
                    beat_times : np.ndarray
                        The time (in sec) of each beat
                    downbeat_times : np.ndarray
                        The time (in sec) of each downbeat
                    tempo_array : np.ndarray
                        The tempo at each time step
                    beat_array : np.ndarray
                        The location (time step) of beats
                    downbeat_array : np.ndarray
                        The location (time step) of downbeats
            midi_info : dict
                Contains information of the midi file, including time_signature,
                beat and tempo info.
            instrument_info: dict
                Contains information of each track
    """

    # create an empty instrument dictionary to store information of each instrument
    instrument_info = {}
    piano_rolls = []
    onset_rolls = []
    # get the midi information and the beat/tempo arrays
    midi_info, midi_arrays = get_midi_info_and_arrays(pm, beat_resolution)
    numerators = midi_arrays['time_signature_numerators']
    denominators = midi_arrays['time_signature_denominators']
    for numerator, denominator in zip(numerators, denominators):
        if numerator != 4 or denominator != 4:
            print("numerator:", numerator)
            print("denominator:", denominator)
            print("not 4/4!!")
            # return None

    # sort instruments by their program numbers
    pm.instruments.sort(key=lambda x: x.program)
    print('instruments:', pm.instruments)

    bass_piano_roll = np.array([])
    # iterate thorugh all instruments
    i = 0
    for idx, instrument in enumerate(pm.instruments):
        # get the piano-roll and the onset-roll of a specific instrument
        piano_roll, onset_roll = get_piano_roll(instrument, beat_resolution=beat_resolution,
                                                beat_times=midi_arrays['beat_times'],
                                                tempo_array=midi_arrays['tempo_array'])
        if np.sum(piano_roll[:, 12:]) == 0:
            continue

        if instrument.is_drum:
            piano_rolls.append(np.zeros(shape = piano_roll.shape, dtype = int))
            onset_rolls.append(np.zeros(shape = onset_roll.shape, dtype = int))

        else:
            piano_rolls.append(piano_roll)
            onset_rolls.append(onset_roll)

        # append information of current instrument to instrument dictionary
        instrument_info[str(i)] = get_instrument_info(instrument)
        if instrument_info[str(i)]['program_num'] > 31 and instrument_info[str(i)]['program_num'] < 40:
            # print('program number: ', instrument_info[str(idx)]['program_num'], instrument_info[str(idx)]['program_name'])
            bass_piano_roll = piano_roll

        i += 1

    total_rolls = np.zeros_like(piano_rolls[0])
    for piano_roll in piano_rolls:
        total_rolls = np.add(total_rolls, piano_roll)


    histo_oct = np.zeros(12)
    histo = np.sum(total_rolls, axis = 0)

    for pitch in range(len(histo)):
        histo_oct[pitch % 12] += histo[pitch]

    print(histo_oct)

    max_n = histo_oct.argsort(axis=0)[-7:]
    max_n.sort()

    print(max_n)

    # get all scales for every root note
    major = np.array([0, 2, 4, 5, 7, 9, 11], dtype=int)
    major_scales = []
    for i in range(0, 12):
        major_scales.append(np.sort((np.array(major) + i) % 12))


    minor = np.array([0, 2, 3, 5, 7, 8, 10], dtype=int)
    minor_scales = []
    for i in range(0, 12):
        minor_scales.append(np.sort((np.array(minor) + i) % 12))

    key = -1
    for i, scale in enumerate(major_scales):
        if np.array_equal(max_n, scale):
            key = i

    for i, scale in enumerate(minor_scales):
        if np.array_equal(max_n, scale):
            if histo_oct[key] < histo_oct[i]:
                key = i + 12


    print('key:', key)
    if key == -1:
        new_key = get_key_info(pm)
        if new_key == -1:
            return None
        else:
            key_pitch = new_key % 12
    else:
        key_pitch = key % 12

    print('key_pitch:', key_pitch)

    # key_pitch = 0


    # new_piano_rolls = []
    # for piano_roll in piano_rolls:
    #     new_piano_roll = np.zeros(shape = piano_roll.shape, dtype = int)
    #     for time_slice in range(piano_roll.shape[0]):
    #         for pitch in range(piano_roll.shape[1]):
    #             if pitch >= key_pitch:
    #                 new_piano_roll[time_slice][pitch-key_pitch] = 1 if piano_roll[time_slice][pitch] != 0 else 0
    #
    #     new_piano_rolls.append(new_piano_roll)

    # new_onset_rolls = []
    # for onset_roll in onset_rolls:
    #     new_onset_roll = np.zeros(shape = onset_roll.shape, dtype = int)
    #     for time_slice in range(onset_roll.shape[0]):
    #         for pitch in range(onset_roll.shape[1]):
    #             if pitch >= key_pitch:
    #                 new_onset_roll[time_slice][pitch - key_pitch] = onset_roll[time_slice][pitch]
    #     new_onset_rolls.append(new_onset_roll)


    # new_total_rolls = np.zeros(shape = total_rolls.shape, dtype = int)
    # for time_slice in range(total_rolls.shape[0]):
    #     for pitch in range(total_rolls.shape[1]):
    #         if pitch >= key_pitch:
    #             new_total_rolls[time_slice][pitch - key_pitch] = 1 if total_rolls[time_slice][pitch] != 0 else 0
    #
    # new_bass_piano_roll = np.zeros(shape=bass_piano_roll.shape, dtype=int)
    # if new_bass_piano_roll.size != 0:
    #     for time_slice in range(total_rolls.shape[0]):
    #         for pitch in range(total_rolls.shape[1]):
    #             if pitch >= key_pitch:
    #                 new_bass_piano_roll[time_slice][pitch - key_pitch] = 1 if bass_piano_roll[time_slice][pitch] != 0 else 0

    # bass_notes_for_chords = []
    #
    # for i in range(0, bass_piano_roll.shape[0], 8):
    #     mini_roll = np.sum(bass_piano_roll[i:(i + 8), :], axis = 0)
    #
    #     if all(mini_roll == 0):
    #         note = -1
    #     else:
    #         note = np.argmax(mini_roll)
    #
    #     bass_notes_for_chords.append(note)

    # print('bass notes:', bass_notes_for_chords)
    # print('len:', len(bass_notes_for_chords))
    key_from_signature = get_key_info(pm)
    print('musegan key:', key_from_signature)

    # chords = []
    # chords = chord_extraction_test_with_bass.find_chord_from_bass_note(0, bass_notes_for_chords)
    chords = chord_extraction_test_with_bass.find_triad_chord_include_nondiatonic(key, total_rolls, bass_piano_roll)

    # print('chords:', chords, type(chords))

    info_dict = {'midi_arrays': midi_arrays,
                 'midi_info': midi_info,
                 'instrument_info': instrument_info}

    return piano_rolls, onset_rolls, info_dict, chords, key, key_from_signature

def get_piano_rolls_with_Krumhansl_key(pm, key, beat_resolution=4):
    """
    Convert a midi file to piano-rolls of multiple tracks.

    Parameters
    ----------
    midi_path : str
        The path to the midi file.

    Returns
    -------
    piano_rolls : np.ndarray of int
        The extracted piano-rolls. The value represents the velocity. The first
        dimension is the id of the instrument. The size is (num_instrument,
        num_time_step, num_pitches).
    onset_rolls : np.ndarray of bool
        The extracted onset-rolls. The value indicates the occurence of onset
        events. The first dimension is the id of the instrument. The size is
        (num_instrument, num_time_step, num_pitches).
    info_dict : dict
        A dictionary containing extracted useful information lost during the
        conversion of the midi file.
            midi_arrays : dict
                A dictionary containing informative arrays.
                    beat_times : np.ndarray
                        The time (in sec) of each beat
                    downbeat_times : np.ndarray
                        The time (in sec) of each downbeat
                    tempo_array : np.ndarray
                        The tempo at each time step
                    beat_array : np.ndarray
                        The location (time step) of beats
                    downbeat_array : np.ndarray
                        The location (time step) of downbeats
            midi_info : dict
                Contains information of the midi file, including time_signature,
                beat and tempo info.
            instrument_info: dict
                Contains information of each track
    """

    if key in key_dict:
        key_pitch = key_dict[key]

    else:
        print('Minor key', key)
        return None


    # create an empty instrument dictionary to store information of each instrument
    instrument_info = {}
    piano_rolls = []
    onset_rolls = []
    # get the midi information and the beat/tempo arrays
    midi_info, midi_arrays = get_midi_info_and_arrays(pm, beat_resolution)
    numerators = midi_arrays['time_signature_numerators']
    denominators = midi_arrays['time_signature_denominators']
    for numerator, denominator in zip(numerators, denominators):
        if numerator != 4 or denominator != 4:
            print("not 4/4")
            # return None

    # sort instruments by their program numbers
    pm.instruments.sort(key=lambda x: x.program)
    print('instruments:', pm.instruments)

    bass_piano_roll = np.array([])
    # iterate thorugh all instruments
    i = 0
    for idx, instrument in enumerate(pm.instruments):
        # get the piano-roll and the onset-roll of a specific instrument
        piano_roll, onset_roll = get_piano_roll(instrument, beat_resolution=beat_resolution,
                                                beat_times=midi_arrays['beat_times'],
                                                tempo_array=midi_arrays['tempo_array'])
        if np.sum(piano_roll[:, 12:]) == 0:
            continue

        if instrument.is_drum:
            piano_rolls.append(np.zeros(shape = piano_roll.shape, dtype = int))
            onset_rolls.append(np.zeros(shape = onset_roll.shape, dtype = int))

        else:
            piano_rolls.append(piano_roll)
            onset_rolls.append(onset_roll)

        # append information of current instrument to instrument dictionary
        instrument_info[str(i)] = get_instrument_info(instrument)
        if instrument_info[str(i)]['program_num'] > 31 and instrument_info[str(i)]['program_num'] < 40:
            # print('program number: ', instrument_info[str(idx)]['program_num'], instrument_info[str(idx)]['program_name'])
            bass_piano_roll = piano_roll

        i += 1

    total_rolls = np.zeros_like(piano_rolls[0])
    for piano_roll in piano_rolls:
        total_rolls = np.add(total_rolls, piano_roll)


    new_piano_rolls = []
    for piano_roll in piano_rolls:
        new_piano_roll = np.zeros(shape = piano_roll.shape, dtype = int)
        for time_slice in range(piano_roll.shape[0]):
            for pitch in range(piano_roll.shape[1]):
                if pitch >= key_pitch:
                    new_piano_roll[time_slice][pitch - key_pitch] = 1 if piano_roll[time_slice][pitch] != 0 else 0

        new_piano_rolls.append(new_piano_roll)

    new_onset_rolls = []
    for onset_roll in onset_rolls:
        new_onset_roll = np.zeros(shape = onset_roll.shape, dtype = int)
        for time_slice in range(onset_roll.shape[0]):
            for pitch in range(onset_roll.shape[1]):
                if pitch >= key_pitch:
                    new_onset_roll[time_slice][pitch - key_pitch] = onset_roll[time_slice][pitch]
        new_onset_rolls.append(new_onset_roll)


    new_total_rolls = np.zeros(shape = total_rolls.shape, dtype = int)
    for time_slice in range(total_rolls.shape[0]):
        for pitch in range(total_rolls.shape[1]):
            if pitch >= key_pitch:
                new_total_rolls[time_slice][pitch - key_pitch] = total_rolls[time_slice][pitch]

    new_bass_piano_roll = np.zeros(shape=bass_piano_roll.shape, dtype=int)
    if new_bass_piano_roll.size != 0:
        for time_slice in range(total_rolls.shape[0]):
            for pitch in range(total_rolls.shape[1]):
                if pitch >= key_pitch:
                    new_bass_piano_roll[time_slice][pitch - key_pitch] = bass_piano_roll[time_slice][pitch]

    # bass_notes_for_chords = []
    #
    # for i in range(0, bass_piano_roll.shape[0], 8):
    #     mini_roll = np.sum(bass_piano_roll[i:(i + 8), :], axis = 0)
    #
    #     if all(mini_roll == 0):
    #         note = -1
    #     else:
    #         note = np.argmax(mini_roll)
    #
    #     bass_notes_for_chords.append(note)

    # print('bass notes:', bass_notes_for_chords)
    # print('len:', len(bass_notes_for_chords))
    key_from_signature = get_key_info(pm)
    print('musegan key:', key_from_signature)

    # chords = []
    # chords = chord_extraction_test_with_bass.find_chord_from_bass_note(0, bass_notes_for_chords)
    chords = chord_extraction_test_with_bass.find_chord_from_bass_note_and_pianorolls(0, new_total_rolls, new_bass_piano_roll)

    # print('chords:', chords, type(chords))

    info_dict = {'midi_arrays': midi_arrays,
                 'midi_info': midi_info,
                 'instrument_info': instrument_info}

    return new_piano_rolls, new_onset_rolls, info_dict, chords, key, key_from_signature


def get_piano_rolls(pm, beat_resolution=4):
    """
    Convert a midi file to piano-rolls of multiple tracks.

    Parameters
    ----------
    midi_path : str
        The path to the midi file.

    Returns
    -------
    piano_rolls : np.ndarray of int
        The extracted piano-rolls. The value represents the velocity. The first
        dimension is the id of the instrument. The size is (num_instrument,
        num_time_step, num_pitches).
    onset_rolls : np.ndarray of bool
        The extracted onset-rolls. The value indicates the occurence of onset
        events. The first dimension is the id of the instrument. The size is
        (num_instrument, num_time_step, num_pitches).
    info_dict : dict
        A dictionary containing extracted useful information lost during the
        conversion of the midi file.
            midi_arrays : dict
                A dictionary containing informative arrays.
                    beat_times : np.ndarray
                        The time (in sec) of each beat
                    downbeat_times : np.ndarray
                        The time (in sec) of each downbeat
                    tempo_array : np.ndarray
                        The tempo at each time step
                    beat_array : np.ndarray
                        The location (time step) of beats
                    downbeat_array : np.ndarray
                        The location (time step) of downbeats
            midi_info : dict
                Contains information of the midi file, including time_signature,
                beat and tempo info.
            instrument_info: dict
                Contains information of each track
    """

    # Get key from key_signature_changes
    # key = get_key_info(pm)
    #
    # if key == -1 or key > 11:
    #     return None

    # create an empty instrument dictionary to store information of each instrument
    instrument_info = {}
    piano_rolls = []
    onset_rolls = []
    # get the midi information and the beat/tempo arrays
    midi_info, midi_arrays = get_midi_info_and_arrays(pm, beat_resolution)
    if midi_info is None:
        return None

    print(midi_arrays['tempi'])
    numerators = midi_arrays['time_signature_numerators']
    denominators = midi_arrays['time_signature_denominators']
    for numerator, denominator in zip(numerators, denominators):
        if numerator != 4 or denominator != 4:
            print("numerator:", numerator, "denominator:", denominator)
            print("not 4/4")
            return None

    # sort instruments by their program numbers
    pm.instruments.sort(key=lambda x: x.program)
    # print('instruments:', pm.instruments)

    key_pitch = 0
    # key_pitch = 5
    # print('original key:', key_pitch)
    bass_piano_roll = []
    # iterate thorugh all instruments
    for idx, instrument in enumerate(pm.instruments):

        # get the piano-roll and the onset-roll of a specific instrument
        piano_roll, onset_roll = get_piano_roll(instrument, beat_resolution=beat_resolution,
                                                beat_times=midi_arrays['beat_times'],
                                                tempo_array=midi_arrays['tempo_array'])

        if not instrument.is_drum:
            # print(instrument)
            # shift piano roll to ckey
            # new_piano_roll = np.zeros(shape = piano_roll.shape, dtype = int)
            # for time_slice in range(piano_roll.shape[0]):
            #     for pitch in range(piano_roll.shape[1]):
            #         if pitch >= key_pitch:
            #             new_piano_roll[time_slice][pitch - key_pitch] = 1 if piano_roll[time_slice][pitch] != 0 else 0
            #
            #
            # new_onset_roll = np.zeros(shape=onset_roll.shape, dtype=int)
            # for time_slice in range(onset_roll.shape[0]):
            #     for pitch in range(onset_roll.shape[1]):
            #         if pitch >= key_pitch:
            #             new_onset_roll[time_slice][pitch - key_pitch] = onset_roll[time_slice][pitch]

            # append the piano-roll to the piano-roll list and the onset-roll list
            piano_rolls.append(piano_roll)
            onset_rolls.append(onset_roll)
        else:
            piano_rolls.append(np.zeros(shape = piano_roll.shape, dtype = int))
            onset_rolls.append(np.zeros(shape = onset_roll.shape, dtype = int))

        # else:
        #     piano_rolls.append(piano_roll)
        #     onset_rolls.append(onset_roll)

        # append information of current instrument to instrument dictionary
        instrument_info[str(idx)] = get_instrument_info(instrument)
        if 'melod' in instrument_info[str(idx)]['name'].lower() and np.count_nonzero(piano_roll) < 15:
            instrument_info[str(idx)]['name'] = ''

        # if instrument_info[str(idx)]['program_num'] > 31 and instrument_info[str(idx)]['program_num'] < 40:
        #     # print('program number: ', instrument_info[str(idx)]['program_num'], instrument_info[str(idx)]['program_name'])
        #     bass_piano_roll = new_piano_roll


    # total_rolls = np.zeros_like(piano_rolls[0])
    # for piano_roll in piano_rolls:
    #     total_rolls = np.add(total_rolls, piano_roll)
    #     #print(total_rolls[100])

    #print('total_rolls[100]:', total_rolls[100])


    # print(total_rolls.shape)
    # for i in range(total_rolls.shape[0]):
    #     print(i, np.nonzero(total_rolls[i]))

    # for i in range(bass_piano_roll.shape[0]):
    #     print(i, np.nonzero(bass_piano_roll[i]))

    # key_pitch = key % 12
    #
    # new_piano_rolls = []
    # for piano_roll in piano_rolls:
    #     new_piano_roll = np.zeros(shape = piano_roll.shape, dtype = int)
    #     for time_slice in range(piano_roll.shape[0]):
    #         for pitch in range(piano_roll.shape[1]):
    #             if pitch >= key_pitch:
    #                 new_piano_roll[time_slice][pitch - key_pitch] = piano_roll[time_slice][pitch]
    #     new_piano_rolls.append(new_piano_roll)
    #
    # new_onset_rolls = []
    # for onset_roll in onset_rolls:
    #     new_onset_roll = np.zeros(shape = onset_roll.shape, dtype = int)
    #     for time_slice in range(onset_roll.shape[0]):
    #         for pitch in range(onset_roll.shape[1]):
    #             if pitch >= key_pitch:
    #                 new_onset_roll[time_slice][pitch - key_pitch] = onset_roll[time_slice][pitch]
    #     new_onset_rolls.append(new_onset_roll)


    # new_bass_piano_roll = np.zeros(shape = bass_piano_roll.shape, dtype = int)
    # for time_slice in range(bass_piano_roll.shape[0]):
    #     for pitch in range(bass_piano_roll.shape[1]):
    #         if pitch >= key_pitch:
    #             new_bass_piano_roll[time_slice][pitch - key_pitch] = bass_piano_roll[time_slice][pitch]

    # print('bass piano roll: ', bass_piano_rolls.shape)


    # bass_notes_for_chords = []
    #
    # for i in range(0, bass_piano_roll.shape[0], 8):
    #     mini_roll = np.sum(bass_piano_roll[i:(i + 8), :], axis = 0)
    #
    #     if all(mini_roll == 0):
    #         note = -1
    #     else:
    #         note = np.argmax(mini_roll)
    #
    #     bass_notes_for_chords.append(note)

    # print('bass notes:', bass_notes_for_chords)
    # print('len:', len(bass_notes_for_chords))
    # print('key:', key)

    # chords = []
    # chords = chord_extraction_test_with_bass.find_chord_from_bass_note(0, bass_notes_for_chords)
    # chords = chord_extraction_test_with_bass.find_chord_from_bass_note_and_pianorolls(0, total_rolls, bass_piano_roll)

    # print('chords:', chords, type(chords))

    info_dict = {'midi_arrays': midi_arrays,
                 'midi_info': midi_info,
                 'instrument_info': instrument_info}

    return piano_rolls, onset_rolls, info_dict, None, 0, 0

def midi_to_pianorolls(midi_path, beat_resolution=4):
    """
    Convert a midi file to piano-rolls of multiple tracks.

    Parameters
    ----------
    midi_path : str
        The path to the midi file.

    Returns
    -------
    piano_rolls : np.ndarray of int
        The extracted piano-rolls. The value represents the velocity. The first
        dimension is the id of the instrument. The size is (num_instrument,
        num_time_step, num_pitches).
    onset_rolls : np.ndarray of bool
        The extracted onset-rolls. The value indicates the occurence of onset
        events. The first dimension is the id of the instrument. The size is
        (num_instrument, num_time_step, num_pitches).
    info_dict : dict
        A dictionary containing extracted useful information lost during the
        conversion of the midi file.
            midi_arrays : dict
                A dictionary containing informative arrays.
                    beatThe time (in sec) of each beat
                    downbeat_times : np.ndarray
                        The time (in sec) of each downbeat
                    tempo_array : np.ndarray
                        _times : np.ndarray
                        The tempo at each time step
                    beat_array : np.ndarray
                        The location (time step) of beats
                    downbeat_array : np.ndarray
                        The location (time step) of downbeats
            midi_info : dict
                Contains information of the midi file, including time_signature,
                beat and tempo info.
            instrument_info: dict
                Contains information of each track
    """
    # load the MIDI file as a pretty_midi
    print('-------------------------------------------------------------------------')
    print(midi_path)
    try:
        # score = music21.converter.parse(midi_path)
        # key = score.analyze('Krumhansl')
        # key_name = key.tonic.name + key.type
        # print('Krumhansl key:', key_name)
        # del score

        pm = pretty_midi.PrettyMIDI(midi_path)
        # result = get_piano_rolls_with_Krumhansl_key(pm, key_name, beat_resolution)
        # result = get_piano_rolls_with_estimated_key(pm, beat_resolution)
        result = get_piano_rolls(pm, beat_resolution)
        # del key

    except Exception as error:
        print("error at ", midi_path)
        print(error)
        result = None
    return result