from src.music.pipeline.url2audio import url2audio
from src.music.pipeline.audio2midi import audio2midi
from src.music.pipeline.midi2processed import midi2processed
from src.music.pipeline.processed2encoded import processed2encoded
from src.music.pipeline.encoded2rep import encoded2rep
from src.music.config import RANDOM_CROP, NB_AUG, FROM_URL_PATH
# from src.music.pipeline.synth2audio import AudioRecorder
# from src.music.pipeline.processed2handcodedrep import processed2handcodedrep
import time
import hashlib

VERBOSE = True
AUGMENTATION, NOISE_INJECTED = False, False
CROP = 10# crop 30s before transcription

# AUDIO_RECORDER = AudioRecorder(place='home')

def encode_music(url=None,
                 audio_path=None,
                 midi_path=None,
                 processed_path=None,
                 record=False,
                 crop=CROP,
                 random_crop=RANDOM_CROP,
                 augmentation=AUGMENTATION,
                 noise_injection=NOISE_INJECTED,
                 apply_filtering=True,
                 nb_aug=NB_AUG,
                 level=0,
                 verbose=VERBOSE):
    if not record:  assert url is not None or audio_path is not None or midi_path is not None or processed_path is not None
    init_time = time.time()
    error = ''
    try:
        if record:
            assert audio_path is None and midi_path is None
            if verbose: print(' ' * level + 'Processing music, recorded from mic.')
            audio_path = AUDIO_RECORDER.record_one()
            error = ''
        if processed_path is None:
            if midi_path is None:
                if audio_path is None:
                    if verbose and not record: print(' ' * level + 'Processing music, from audio source.')
                    init_t = time.time()
                    audio_path, _, error = url2audio(playlist_path=FROM_URL_PATH, video_url=url, verbose=verbose, level=level+2)
                    if verbose: print(' ' * (level + 4) + f'Audio downloaded in {int(time.time() - init_t)} seconds.')
                else:
                    if verbose and not record: print(' ' * level + 'Processing music, from midi source.')
                init_t = time.time()
                midi_path, error = audio2midi(audio_path, crop=crop, random_crop=random_crop, verbose=verbose, level=level+2)
                if verbose: print(' ' * (level + 4) + f'Audio transcribed to midi in {int(time.time() - init_t)} seconds.')
            init_t = time.time()
            processed_path, error = midi2processed(midi_path, apply_filtering=apply_filtering, verbose=verbose, level=level+2)
            if verbose: print(' ' * (level + 4) + f'Midi preprocessed in {int(time.time() - init_t)} seconds.')
        init_t = time.time()
        encoded_path, error = processed2encoded(processed_path, augmentation=augmentation, nb_aug=nb_aug, noise_injection=noise_injection, verbose=verbose, level=level+2)
        if verbose: print(' ' * (level + 4) + f'Midi encoded in {int(time.time() - init_t)} seconds.')
        init_t = time.time()
        representation_path, representation, error = encoded2rep(encoded_path, return_rep=True, level=level+2, verbose=verbose)
        if verbose: print(' ' * (level + 4) + f'Music representation computed in {int(time.time() - init_t)} seconds.')
        init_t = time.time()
        handcoded_rep_path, handcoded_rep, error = None, None, ''
        # handcoded_rep_path, handcoded_rep, error = processed2handcodedrep(processed_path, return_rep=True, level=level+2, verbose=verbose)
        if verbose: print(' ' * (level + 4) + f'Music handcoded representation computed in {int(time.time() - init_t)} seconds.')
        # assert handcoded_rep_path is not None and representation_path is not None
        all_paths = dict(url=url, audio_path=audio_path, midi_path=midi_path, processed_path=processed_path, encoded_path=encoded_path,
                         representation_path=representation_path, handcoded_rep_path=handcoded_rep_path)
        print('audio hash: ', hashlib.md5(open(audio_path, 'rb').read()).hexdigest())
        print('midi hash: ', hashlib.md5(open(midi_path, 'rb').read()).hexdigest())
        print('processed hash: ', hashlib.md5(open(processed_path, 'rb').read()).hexdigest())
        print('encoded hash: ', hashlib.md5(open(encoded_path, 'rb').read()).hexdigest())
        print('rep hash: ', hashlib.md5(open(representation_path, 'rb').read()).hexdigest())
        print("rep:", representation[:10])
        if verbose: print(' ' * (level + 2) + f'Music processed in {int(time.time() - init_time)} seconds.')
    except Exception as err:
        print(err, error)
        if verbose: print(' ' * (level + 2) + f'Music FAILED to process in {int(time.time() - init_time)} seconds.')
        representation = None
        handcoded_rep = None
        all_paths = dict()

    return representation, handcoded_rep, all_paths, error

if __name__ == '__main__':
    representation = encode_music(url="https://www.youtube.com/watch?v=a2LFVWBmoiw")[0]
    # representation = encode_music(record=True)[0]