import logging
import os
import re
import time
from typing import List, Tuple

import librosa
import numpy as np
import requests
import torch
from torch.utils.data import Dataset, DataLoader

from config import *
from training.downloader import Downloader, download_fn


base_dataset_api = "http://kaistore.dcs.fmph.uniba.sk/api"

base_dataset_path = "http://kaistore.dcs.fmph.uniba.sk/beatsaber-map-generator/"

logging.basicConfig(
    level=logging.ERROR,
    format="%(levelname)s - %(asctime)s - %(message)s",
    filename="data_tester.log",
)


def non_collate(batch):
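    """Return the batch of song dicts unchanged instead of stacking tensors."""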
    return batch


class BaseLoader(Dataset):
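    """Streaming dataset of preprocessed songs.

    Fetches the list of song files for the requested split from the dataset
    API, downloads them in the background via `Downloader`, and slices each
    song into fixed-length segments (see `process` / `process_onsets`).
    """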
    def __init__(
        self,
        difficulty: DifficultyName = DifficultyName.ALL,
        object_type: ObjectType = ObjectType.COLOR_NOTES,
        enable_condition: bool = True,
        with_beats: bool = True,
        seq_length: int = 16000,
        skip_step: int = 2000,
        split: Split = Split.TRAIN,
        split_seed: str = "42",
        batch_size: int = 2,
        num_workers: int = 0,
        model_type: str = "onsets",
    ):
        self.difficulty = difficulty
        self.object_type = object_type
        self.enable_condition = enable_condition
        self.with_beats = with_beats
        self.seq_length = seq_length
        self.skip_step = skip_step
        self.split = split
        self.split_seed = split_seed
        self.batch_size = batch_size
        self.num_workers = num_workers
        self.model_type = model_type

        self.downloader = Downloader(
            download_fn, position_start=4 if split == Split.TRAIN else 5
        )
        self.files = []
        self.no_songs = 0

        self._load()

        if self.split == Split.VALIDATION and self.files:
            for f in self.files:
                self.downloader.enqueue(f, f)

    def _load(self):
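        # Ask the dataset API for the list of per-song files in this split.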
        response = requests.post(
            f"{base_dataset_api}/get-list-of-batches",
            json={
                "difficulty": self.difficulty.value.lower(),
                "split_seed": self.split_seed,
                "split": self.split.value,
                "model_type": self.model_type,
            },
        ).json()

        self.files = response.get("files", [])
        self.no_songs = response.get("no_songs", 0)

    def process(self, song):
        # Alias the dict onto itself so downstream helpers can read the raw
        # arrays through song["data"] as well as at the top level.
        song["data"] = song

        # Delegate to onset or note processing
        if self.model_type == "onsets":
            yield from self.process_onsets(song)
        elif self.model_type == "notes":
            raise NotImplementedError(
                "Note processing is not implemented in this base loader."
            )

        else:
            raise ValueError(f"Unsupported mode: {self.model_type}")

    def process_onsets(self, song_meta):
        song_npz = song_meta["data"]
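        # Expected keys in the song dict: "song" (mel spectrogram), "onsets"
        # (dict keyed by difficulty name with "onsets_array" and "condition")
        # and, optionally, "beats_array".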

        if not self.with_beats:
            song_npz.pop("beats_array", None)

        beats_array = song_npz.get("beats_array") if self.with_beats else None

        onsets_raw = song_npz.get("onsets", None)
        if isinstance(onsets_raw, np.ndarray) and onsets_raw.dtype == object:
            onsets_dict = onsets_raw.item()
        elif isinstance(onsets_raw, dict):
            onsets_dict = onsets_raw
        else:
            logging.warning(
                f"Invalid or missing onset data for song {song_meta['song']}"
            )
            return

        for difficulty_name, onset_info in onsets_dict.items():
            if "onsets_array" not in onset_info or "condition" not in onset_info:
                continue

            condition = onset_info["condition"]
            onsets_array = onset_info["onsets_array"]

            batch = []
            for audio, start_index, end_index, params in self.iter_audio(song_meta):
                score_segment = self.cut_segment(
                    onsets_array, start_index, end_index, audio.shape[0]
                )

                data = {
                    "condition": torch.tensor([condition]),
                    "onset": torch.from_numpy(score_segment).float(),
                    "audio": torch.from_numpy(audio).float(),
                }

                if self.with_beats and beats_array is not None:
                    data["beats"] = torch.from_numpy(
                        self.cut_segment(
                            beats_array, start_index, end_index, audio.shape[0]
                        )
                    ).float()

                batch.append(data)
                if len(batch) == self.batch_size:
                    yield self.collate_batch(batch)
                    batch = []

            if batch:
                yield self.collate_batch(batch)

    def collate_batch(self, batch: list[dict]):
        return {key: torch.stack([item[key] for item in batch]) for key in batch[0]}

    def get_dataloader(self):
        return DataLoader(
            self,
            collate_fn=non_collate,
            num_workers=self.num_workers,
        )
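    # Usage sketch (hypothetical driver code; names outside this module are
    # assumptions): the DataLoader yields lists of raw song dicts, and
    # `process` turns each dict into model-ready mini-batches.
    #
    #   loader = BaseLoader(split=Split.TRAIN, model_type="onsets")
    #   for songs in loader.get_dataloader():
    #       for song in songs:
    #           for batch in loader.process(song):
    #               model_step(batch["audio"], batch["onset"], batch["condition"])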

    def iter_audio(self, song: SongIteration):
        """Iterate audio"""
        seq_length = int(round(self.seq_length / FRAME))
        song_mel = song["data"]["song"].T  # type: ignore
        skip_step = int(round(self.skip_step / FRAME))
        for skip in range(0, seq_length, skip_step):
            params = dict(skip=skip, seq_length=seq_length)
            for data_tuple in iter_array(song_mel, seq_length, skip, params):
                yield data_tuple

    def cut_segment(
        self, score_data: np.ndarray, start_index: int, end_index: int, length: int
    ):
        """Ensure the length of data array.

        Parameters
        ----------
        score_data : np.ndarray
            An array containing score data where the length will be adjusted.
        start_index : int
            The start index to cut the array.
        end_index : int
            The end index to cut the array.
        length : length
            The length of the array to be returned.

        Returns
        -------

        """
        # Cut the score data by specified length
        score_segment = score_data[start_index:end_index]
        # Pad if the length is insufficient
        score_segment = assert_length(score_segment, length)
        return score_segment

    def __getitem__(self, idx):
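        # Prefetch: during training, queue the next few files so the background
        # downloader stays ahead of consumption (validation files are queued in
        # __init__).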
        if self.split == Split.TRAIN:
            max_lookahead = 3
            for i in range(idx, min(idx + max_lookahead, len(self.files))):
                file_path = self.files[i]
                self.downloader.enqueue(file_path, file_path)

        current_path = self.files[idx]
        self.downloader.enqueue(current_path, current_path)

        # Block until the background downloader has written the file to disk.
        while not os.path.exists(current_path):
            time.sleep(1)

        try:
            data = np.load(current_path, allow_pickle=True, encoding="latin1")
        except Exception as e:
            raise RuntimeError(f"[Load error] {current_path}: {e}")

        if idx > 0 and self.split == Split.TRAIN:
            prev_path = self.files[idx - 1]
            if os.path.exists(prev_path):
                try:
                    os.remove(prev_path)
                    print(f"[Cleanup] Deleted previous file: {prev_path}")
                except Exception as e:
                    print(f"[Cleanup error] Could not delete {prev_path}: {e}")

        return dict(data)

    def __len__(self):
        return self.no_songs


def iter_array(array, length, skip, params):
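    """Yield fixed-length windows of `array`, starting at index `skip`.

    Each yielded tuple is (window, start_index, end_index, params); trailing
    windows shorter than `length` are dropped.

    Example (toy input): for ``np.arange(12).reshape(-1, 1)`` with
    ``length=4, skip=1`` this yields rows 1-4 and rows 5-8, and drops the
    3-row remainder.
    """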
    max_len = len(array)
    for i in range(skip, max_len, length):
        data = array[i : (i + length)]
        if len(data) == length:
            yield data, i, i + length, params


def get_bpm_info(song):
    raise NotImplementedError
    # The implementation below is currently disabled and unreachable.

    bpm = song["meta"]["bpm"]

    energy = np.sum(song["data"]["mel"], axis=0)
    start_index = np.argmax(energy > 0)

    start_time = librosa.frames_to_time(start_index, sr=sample_rate)

    start = float(start_time * 1000)
    beats = int(4)
    return [(bpm, start, beats)]


def get_onset_array(song: dict, difficulty: DifficultyName = DifficultyName.ALL):
    raise NotImplementedError
    # The implementation below is currently disabled and unreachable.

    def get_onsets_for_beatmap(beatmap, timestamps, bpm):
        onsets_array = np.zeros_like(timestamps, dtype=np.float32)
        for obj in beatmap:
            beat_time = obj[1]
            beat_time_to_sec = beat_time / bpm * 60
            closest_frame_idx = np.argmin(np.abs(timestamps - beat_time_to_sec))
            onsets_array[closest_frame_idx] = 1
        return onsets_array.reshape(-1, 1)

    if not isinstance(song["song"], np.ndarray):
        song["song"] = np.array(song["song"])

    timestamps = librosa.times_like(song["song"], sr=sample_rate)
    onsets = {}

    for key, beatmap in song.items():
        if key in DIFFICULTY_NAMES:
            onsets[key] = {}
            onsets[key]["onsets_array"] = get_onsets_for_beatmap(
                beatmap, timestamps, song["bpm"]
            )
            pascal_key = re.sub(r"([a-z])([A-Z])", r"\1_\2", key).upper()
            onsets[key]["condition"] = DifficultyNumber[pascal_key].value

    return onsets


def process_bpminfo(
    bpm_info: List[Tuple[float, float, int]],
    max_length_ms: float,
    units: TimeUnit = TimeUnit.milliseconds,
) -> Tuple[List, List, List, List]:
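    """Clip each tempo segment of `bpm_info` to the song length.

    Segments that start past `max_length_ms` are dropped.

    Worked example: ``bpm_info=[(120, 0.0, 4), (90, 30000.0, 4)]`` with
    ``max_length_ms=60000`` (milliseconds) returns ``bpms=[120, 90]``,
    ``starts=[0.0, 30000.0]``, ``ends=[30000.0, 60000.0]``, ``beats=[4, 4]``:
    each segment ends where the next one starts, and the last segment ends at
    the song length.
    """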
    bpms, starts, ends, beats = [], [], [], []
    max_length = convert_units(max_length_ms, units)
    for i, (bpm, start, beat) in enumerate(bpm_info):
        start = convert_units(start, units)
        if start > max_length:
            continue
        if i < len(bpm_info) - 1:
            bpms.append(bpm)
            starts.append(start)
            next_start = convert_units(bpm_info[i + 1][1], units)
            ends.append(min(next_start, max_length))
            beats.append(beat)
        else:
            bpms.append(bpm)
            starts.append(start)
            ends.append(max_length)
            beats.append(beat)
    return bpms, starts, ends, beats


def gen_beats_array(
    length: int,
    bpm_info: List[Tuple[float, float, int]],
    mel_length: int,
    distinguish_downbeat: bool = False,
):
    """

    Parameters
    ----------
    length : int
        length of onset label sequence
    bpm_info : List[Tuple[float, float, int]]
        list of tuple (bpm, start(ms), beats)
        If there are tempo changes during the song, bpm_info contains
        more than one tuple.
    mel_length : int
        length of mel spectrogram sequence
    distinguish_downbeat : bool
        If `True`, distinguish downbeat of a measure from other beats.

    Returns
    -------
    np.ndarray
        Array of shape (length, 1) with 1 at beat frames (2 at downbeat frames
        when `distinguish_downbeat` is True) and 0 elsewhere.

    """

    validate(bpm_info, mel_length)
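    # Worked example (FRAME comes from config; assume a 32 ms hop for
    # illustration): bpm_info = [(120.0, 0.0, 4)] gives one beat every
    # 60_000 / 120 = 500 ms, i.e. beats at 0, 500, 1000, ... ms, which map to
    # frames round(0 / 32) = 0, round(500 / 32) = 16, round(1000 / 32) = 31, ...
    # Every 4th beat starting at 0 ms is a downbeat and is written as 2 when
    # distinguish_downbeat=True (otherwise 1).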

    # The time range that nth(>= 0) frame represents is
    #   (n - 0.5) * FRAME < time <= (n + 0.5) * FRAME [ms]
    # , where `FRAME` is a constant for frame length.
    # Set an upper bound of the time for last frame (n = length - 1)
    max_length_ms = max(0, (length - 0.5) * FRAME)
    arr = np.zeros(length)
    bpms, starts, ends, beats = process_bpminfo(bpm_info, max_length_ms)
    for bpm, start, end, beat in zip(bpms, starts, ends, beats):
        # calc beat timing in milliseconds
        interval = 60 * 1000 / bpm  # ms
        beats_timing = np.arange(start, end, interval)

        # convert to array index
        # The conversion method (float -> int) is taking round, which is
        # the same as the preprocessing method for onset.
        # (in preprocessing/onset_converter.py)
        arg_beats = np.round(beats_timing / FRAME).astype("int64")

        # assign flag to beats array
        for b in range(beat):
            if b == 0:  # downbeat (beginning of a measure)
                if distinguish_downbeat:
                    arr[arg_beats[b::beat]] = 2
                else:
                    arr[arg_beats[b::beat]] = 1
            else:  # other beats
                arr[arg_beats[b::beat]] = 1

    return arr.reshape([-1, 1])


def convert_units(ms: float, units: TimeUnit) -> float:
    if units == TimeUnit.milliseconds:
        return float(ms)
    elif units == TimeUnit.seconds:
        return float(ms) / 1000.0
    elif units == TimeUnit.frames:
        return float(ms) / FRAME  # FRAME is the hop length in ms (from config)
    raise ValueError(f"Unsupported time unit: {units}")


def validate(bpm_info: List[Tuple[float, float, int]], mel_length: int):
    for bpm, start, beat in bpm_info:
        assert bpm > 0
        assert start >= 0
        assert beat > 0
        assert (
            np.round(start / FRAME) <= mel_length
        ), f"The start position of bpm_info ({start}) is outside the song length ({mel_length})."


def assert_length(arr: np.ndarray, length: int):
    """Pad with zeros to ensure the array length
    Parameters
    ----------
    arr
    length

    Returns
    -------

    """
    if arr.shape[0] >= length:
        return arr[:length]
    length2 = length - arr.shape[0]
    arr2 = np.zeros((length2, arr.shape[1]), dtype=arr.dtype)
    return np.concatenate([arr, arr2])
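# Example: assert_length(np.ones((3, 1)), 5) pads to a (5, 1) array whose last
# two rows are zeros, while assert_length(np.ones((8, 1)), 5) returns only the
# first five rows.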
