Level 3: A first failed attempt of encoding-decoding -> SNR=0

Level 2: Psychoacoustic first version
2026-02-09 01:58:21 +02:00 · 2026-02-08 22:53:52 +02:00
47 changed files with 5155 additions and 1579 deletions
--- a/source/core/aac_coder.py
+++ b/source/core/aac_coder.py
@ -26,14 +26,106 @@ from pathlib import Path
 from typing import Union
 import soundfile as sf
 from scipy.io import savemat
 from core.aac_configuration import WIN_TYPE
 from core.aac_filterbank import aac_filter_bank
-from core.aac_ssc import aac_SSC
+from core.aac_ssc import aac_ssc
 from core.aac_tns import aac_tns
 from core.aac_psycho import aac_psycho
 from core.aac_quantizer import aac_quantizer  # assumes your quantizer file is core/aac_quantizer.py
 from core.aac_huffman import aac_encode_huff
 from core.aac_utils import get_table, band_limits
 from material.huff_utils import load_LUT
 from core.aac_types import *
 # -----------------------------------------------------------------------------
 # Helpers for thresholds (T(b))
 # -----------------------------------------------------------------------------
 def _band_slices_from_table(frame_type: FrameType) -> list[tuple[int, int]]:
    """
    Return inclusive (lo, hi) band slices derived from TableB219.
    """
    table, _ = get_table(frame_type)
    wlow, whigh, _bval, _qthr_db = band_limits(table)
    return [(int(lo), int(hi)) for lo, hi in zip(wlow, whigh)]
 def _thresholds_from_smr(
    frame_F_ch: FrameChannelF,
    frame_type: FrameType,
    SMR: FloatArray,
 ) -> FloatArray:
    """
    Compute thresholds T(b) = P(b) / SMR(b), where P(b) is band energy.
    Shapes:
    - Long: returns (NB, 1)
    - ESH: returns (NB, 8)
    """
    bands = _band_slices_from_table(frame_type)
    NB = len(bands)
    X = np.asarray(frame_F_ch, dtype=np.float64)
    SMR = np.asarray(SMR, dtype=np.float64)
    if frame_type == "ESH":
        if X.shape != (128, 8):
            raise ValueError("For ESH, frame_F_ch must have shape (128, 8).")
        if SMR.shape != (NB, 8):
            raise ValueError(f"For ESH, SMR must have shape ({NB}, 8).")
        T = np.zeros((NB, 8), dtype=np.float64)
        for j in range(8):
            Xj = X[:, j]
            for b, (lo, hi) in enumerate(bands):
                P = float(np.sum(Xj[lo : hi + 1] ** 2))
                smr = float(SMR[b, j])
                T[b, j] = 0.0 if smr <= 1e-12 else (P / smr)
        return T
    # Long
    if X.shape == (1024,):
        Xv = X
    elif X.shape == (1024, 1):
        Xv = X[:, 0]
    else:
        raise ValueError("For non-ESH, frame_F_ch must be shape (1024,) or (1024, 1).")
    if SMR.shape == (NB,):
        SMRv = SMR
    elif SMR.shape == (NB, 1):
        SMRv = SMR[:, 0]
    else:
        raise ValueError(f"For non-ESH, SMR must be shape ({NB},) or ({NB}, 1).")
    T = np.zeros((NB, 1), dtype=np.float64)
    for b, (lo, hi) in enumerate(bands):
        P = float(np.sum(Xv[lo : hi + 1] ** 2))
        smr = float(SMRv[b])
        T[b, 0] = 0.0 if smr <= 1e-12 else (P / smr)
    return T
 def _normalize_global_gain(G: GlobalGain) -> float | FloatArray:
    """
    Normalize GlobalGain to match AACChannelFrameF3["G"] type:
    - long: return float
    - ESH: return float64 ndarray of shape (1, 8)
    """
    if np.isscalar(G):
        return float(G)
    G_arr = np.asarray(G)
    if G_arr.size == 1:
        return float(G_arr.reshape(-1)[0])
    return np.asarray(G_arr, dtype=np.float64)
 # -----------------------------------------------------------------------------
 # Public helpers (useful for level_x demo wrappers)
 # -----------------------------------------------------------------------------
@ -182,7 +274,7 @@ def aac_coder_1(filename_in: Union[str, Path]) -> AACSeq1:
            tail = np.zeros((win - next_t.shape[0], 2), dtype=np.float64)
            next_t = np.vstack([next_t, tail])
-        frame_type = aac_SSC(frame_t, next_t, prev_frame_type)
+        frame_type = aac_ssc(frame_t, next_t, prev_frame_type)
        frame_f = aac_filter_bank(frame_t, frame_type, win_type)
        chl_f, chr_f = aac_pack_frame_f_to_seq_channels(frame_type, frame_f)
@ -250,7 +342,7 @@ def aac_coder_2(filename_in: Union[str, Path]) -> AACSeq2:
            tail = np.zeros((win - next_t.shape[0], 2), dtype=np.float64)
            next_t = np.vstack([next_t, tail])
-        frame_type = aac_SSC(frame_t, next_t, prev_frame_type)
+        frame_type = aac_ssc(frame_t, next_t, prev_frame_type)
        # Level 1 analysis (packed stereo container)
        frame_f_stereo = aac_filter_bank(frame_t, frame_type, WIN_TYPE)
@ -282,3 +374,180 @@ def aac_coder_2(filename_in: Union[str, Path]) -> AACSeq2:
        prev_frame_type = frame_type
    return aac_seq
 def aac_coder_3(
    filename_in: Union[str, Path],
    filename_aac_coded: Union[str, Path] | None = None,
 ) -> AACSeq3:
    """
    Level-3 AAC encoder (Level 2 + Psycho + Quantizer + Huffman).
    Parameters
    ----------
    filename_in : Union[str, Path]
        Input WAV filename (stereo, 48 kHz).
    filename_aac_coded : Union[str, Path] | None
        Optional .mat filename to store aac_seq_3 (assignment convenience).
    Returns
    -------
    AACSeq3
        Encoded AAC sequence (Level 3 payload schema).
    """
    filename_in = Path(filename_in)
    x, _ = aac_read_wav_stereo_48k(filename_in)
    hop = 1024
    win = 2048
    pad_pre = np.zeros((hop, 2), dtype=np.float64)
    pad_post = np.zeros((hop, 2), dtype=np.float64)
    x_pad = np.vstack([pad_pre, x, pad_post])
    K = int((x_pad.shape[0] - win) // hop + 1)
    if K <= 0:
        raise ValueError("Input too short for framing.")
    # Load Huffman LUTs once.
    huff_LUT_list = load_LUT()
    aac_seq: AACSeq3 = []
    prev_frame_type: FrameType = "OLS"
    # Pin win_type to the WinType literal for type checkers.
    win_type: WinType = WIN_TYPE
    # Psycho model needs per-channel history (prev1, prev2) of 2048-sample frames.
    prev1_L = np.zeros((2048,), dtype=np.float64)
    prev2_L = np.zeros((2048,), dtype=np.float64)
    prev1_R = np.zeros((2048,), dtype=np.float64)
    prev2_R = np.zeros((2048,), dtype=np.float64)
    for i in range(K):
        start = i * hop
        frame_t: FrameT = x_pad[start : start + win, :]
        if frame_t.shape != (win, 2):
            raise ValueError("Internal framing error: frame_t has wrong shape.")
        next_t = x_pad[start + hop : start + hop + win, :]
        if next_t.shape[0] < win:
            tail = np.zeros((win - next_t.shape[0], 2), dtype=np.float64)
            next_t = np.vstack([next_t, tail])
        frame_type = aac_ssc(frame_t, next_t, prev_frame_type)
        # Analysis filterbank (stereo packed)
        frame_f_stereo = aac_filter_bank(frame_t, frame_type, win_type)
        chl_f, chr_f = aac_pack_frame_f_to_seq_channels(frame_type, frame_f_stereo)
        # TNS per channel
        chl_f_tns, chl_tns_coeffs = aac_tns(chl_f, frame_type)
        chr_f_tns, chr_tns_coeffs = aac_tns(chr_f, frame_type)
        # Psychoacoustic model per channel (time-domain)
        frame_L = np.asarray(frame_t[:, 0], dtype=np.float64)
        frame_R = np.asarray(frame_t[:, 1], dtype=np.float64)
        SMR_L = aac_psycho(frame_L, frame_type, prev1_L, prev2_L)
        SMR_R = aac_psycho(frame_R, frame_type, prev1_R, prev2_R)
        # Thresholds T(b) (stored, not entropy-coded)
        T_L = _thresholds_from_smr(chl_f_tns, frame_type, SMR_L)
        T_R = _thresholds_from_smr(chr_f_tns, frame_type, SMR_R)
        # Quantizer per channel
        S_L, sfc_L, G_L = aac_quantizer(chl_f_tns, frame_type, SMR_L)
        S_R, sfc_R, G_R = aac_quantizer(chr_f_tns, frame_type, SMR_R)
        # Normalize G types for AACSeq3 schema (float | float64 ndarray).
        G_Ln = _normalize_global_gain(G_L)
        G_Rn = _normalize_global_gain(G_R)
        # Huffman-code ONLY the DPCM differences for b>0.
        # sfc[0] corresponds to alpha(0)=G and is stored separately in the frame.
        sfc_L_dpcm = np.asarray(sfc_L, dtype=np.int64)[1:, ...]
        sfc_R_dpcm = np.asarray(sfc_R, dtype=np.int64)[1:, ...]
        # Codebook 11:
        # maxAbsCodeVal = 16 is RESERVED for ESCAPE.
        # We must stay strictly within [-15, +15] to avoid escape decoding.
        sf_cb = 11
        sf_max_abs = int(huff_LUT_list[sf_cb]["maxAbsCodeVal"]) - 1  # -> 15
        sfc_L_dpcm = np.clip(
            sfc_L_dpcm,
            -sf_max_abs,
            sf_max_abs,
        ).astype(np.int64, copy=False)
        sfc_R_dpcm = np.clip(
            sfc_R_dpcm,
            -sf_max_abs,
            sf_max_abs,
        ).astype(np.int64, copy=False)
        sfc_L_stream, _ = aac_encode_huff(
            sfc_L_dpcm.reshape(-1, order="F"),
            huff_LUT_list,
            force_codebook=sf_cb,
        )
        sfc_R_stream, _ = aac_encode_huff(
            sfc_R_dpcm.reshape(-1, order="F"),
            huff_LUT_list,
            force_codebook=sf_cb,
        )
        mdct_L_stream, cb_L = aac_encode_huff(
            np.asarray(S_L, dtype=np.int64).reshape(-1),
            huff_LUT_list,
        )
        mdct_R_stream, cb_R = aac_encode_huff(
            np.asarray(S_R, dtype=np.int64).reshape(-1),
            huff_LUT_list,
        )
        # Typed dict construction helps static analyzers validate the schema.
        frame_out: AACSeq3Frame = {
            "frame_type": frame_type,
            "win_type": win_type,
            "chl": {
                "tns_coeffs": np.asarray(chl_tns_coeffs, dtype=np.float64),
                "T": np.asarray(T_L, dtype=np.float64),
                "G": G_Ln,
                "sfc": sfc_L_stream,
                "stream": mdct_L_stream,
                "codebook": int(cb_L),
            },
            "chr": {
                "tns_coeffs": np.asarray(chr_tns_coeffs, dtype=np.float64),
                "T": np.asarray(T_R, dtype=np.float64),
                "G": G_Rn,
                "sfc": sfc_R_stream,
                "stream": mdct_R_stream,
                "codebook": int(cb_R),
            },
        }
        aac_seq.append(frame_out)
        # Update psycho history (shift register)
        prev2_L = prev1_L
        prev1_L = frame_L
        prev2_R = prev1_R
        prev1_R = frame_R
        prev_frame_type = frame_type
    # Optional: store to .mat for the assignment wrapper
    if filename_aac_coded is not None:
        filename_aac_coded = Path(filename_aac_coded)
        savemat(
            str(filename_aac_coded),
            {"aac_seq_3": np.array(aac_seq, dtype=object)},
            do_compression=True,
        )
    return aac_seq
--- a/source/core/aac_configuration.py
+++ b/source/core/aac_configuration.py
@ -15,6 +15,8 @@
 from __future__ import annotations
 # Imports
 from typing import Final
 from core.aac_types import WinType
 # Filterbank
@ -29,3 +31,11 @@ WIN_TYPE: WinType = "SIN"
 PRED_ORDER = 4
 QUANT_STEP = 0.1
 QUANT_MAX = 0.7  # 4-bit symmetric with step 0.1 -> clamp to [-0.7, +0.7]
 # -----------------------------------------------------------------------------
 # Psycho
 # -----------------------------------------------------------------------------
 NMT_DB: Final[float] = 6.0   # Noise Masking Tone (dB)
 TMN_DB: Final[float] = 18.0  # Tone Masking Noise (dB)
--- a/source/core/aac_decoder.py
+++ b/source/core/aac_decoder.py
@ -9,16 +9,9 @@
 #   cchoutou@ece.auth.gr
 #
 # Description:
-#   Level 1 AAC decoder orchestration (inverse of aac_coder_1()).
+#   - Level 1 AAC decoder orchestration (inverse of aac_coder_1()).
-#   Keeps the same functional behavior as the original level_1 implementation:
+#   - Level 2 AAC decoder orchestration (inverse of aac_coder_1()).
 #   - Re-pack per-channel spectra into FrameF expected by aac_i_filter_bank()
 #   - IMDCT synthesis per frame
 #   - Overlap-add with hop=1024
 #   - Remove encoder boundary padding: hop at start and hop at end
 #
 #   Note:
 #   This core module returns the reconstructed samples. Writing to disk is kept
 #   in level_x demos.
 # ------------------------------------------------------------
 from __future__ import annotations
@ -29,11 +22,24 @@ import soundfile as sf
 from core.aac_filterbank import aac_i_filter_bank
 from core.aac_tns import aac_i_tns
 from core.aac_quantizer import aac_i_quantizer
 from core.aac_huffman import aac_decode_huff
 from core.aac_utils import get_table, band_limits
 from material.huff_utils import load_LUT
 from core.aac_types import *
 # -----------------------------------------------------------------------------
-# Public helpers (useful for level_x demo wrappers)
+# Helper for NB
 # -----------------------------------------------------------------------------
 def _nbands(frame_type: FrameType) -> int:
    table, _ = get_table(frame_type)
    wlow, _whigh, _bval, _qthr_db = band_limits(table)
    return int(len(wlow))
 # -----------------------------------------------------------------------------
 # Public helpers
 # -----------------------------------------------------------------------------
 def aac_unpack_seq_channels_to_frame_f(frame_type: FrameType, chl_f: FrameChannelF, chr_f: FrameChannelF) -> FrameF:
@ -109,7 +115,7 @@ def aac_remove_padding(y_pad: StereoSignal, hop: int = 1024) -> StereoSignal:
 # -----------------------------------------------------------------------------
-# Level 1 decoder (core)
+# Level 1 decoder
 # -----------------------------------------------------------------------------
 def aac_decoder_1(aac_seq_1: AACSeq1, filename_out: Union[str, Path]) -> StereoSignal:
@ -167,6 +173,10 @@ def aac_decoder_1(aac_seq_1: AACSeq1, filename_out: Union[str, Path]) -> StereoS
    return y
 # -----------------------------------------------------------------------------
 # Level 2 decoder
 # -----------------------------------------------------------------------------
 def aac_decoder_2(aac_seq_2: AACSeq2, filename_out: Union[str, Path]) -> StereoSignal:
    """
    Level-2 AAC decoder (inverse of aac_coder_2).
@ -255,3 +265,144 @@ def aac_decoder_2(aac_seq_2: AACSeq2, filename_out: Union[str, Path]) -> StereoS
    sf.write(str(filename_out), y, 48000)
    return y
 def aac_decoder_3(aac_seq_3: AACSeq3, filename_out: Union[str, Path]) -> StereoSignal:
    """
    Level-3 AAC decoder (inverse of aac_coder_3).
    Steps per frame:
    - Huffman decode scalefactors (sfc) using codebook 11
    - Huffman decode MDCT symbols (stream) using stored codebook
    - iQuantizer -> MDCT coefficients after TNS
    - iTNS using stored predictor coefficients
    - IMDCT filterbank -> time domain
    - Overlap-add, remove padding, write WAV
    Parameters
    ----------
    aac_seq_3 : AACSeq3
        Encoded sequence as produced by aac_coder_3.
    filename_out : Union[str, Path]
        Output WAV filename.
    Returns
    -------
    StereoSignal
        Decoded audio samples (time-domain), stereo, shape (N, 2), dtype float64.
    """
    filename_out = Path(filename_out)
    hop = 1024
    win = 2048
    K = len(aac_seq_3)
    if K <= 0:
        raise ValueError("aac_seq_3 must contain at least one frame.")
    # Load Huffman LUTs once.
    huff_LUT_list = load_LUT()
    n_pad = (K - 1) * hop + win
    y_pad = np.zeros((n_pad, 2), dtype=np.float64)
    for i, fr in enumerate(aac_seq_3):
        frame_type: FrameType = fr["frame_type"]
        win_type: WinType = fr["win_type"]
        NB = _nbands(frame_type)
        # We store G separately, so Huffman stream contains only (NB-1) DPCM differences.
        sfc_len = (NB - 1) * (8 if frame_type == "ESH" else 1)
        # -------------------------
        # Left channel
        # -------------------------
        tns_L = np.asarray(fr["chl"]["tns_coeffs"], dtype=np.float64)
        G_L = fr["chl"]["G"]
        sfc_bits_L = fr["chl"]["sfc"]
        mdct_bits_L = fr["chl"]["stream"]
        cb_L = int(fr["chl"]["codebook"])
        sfc_dec_L = aac_decode_huff(sfc_bits_L, 11, huff_LUT_list)[:sfc_len].astype(np.int64, copy=False)
        if frame_type == "ESH":
            sfc_dpcm_L = sfc_dec_L.reshape(NB - 1, 8, order="F")
            sfc_L = np.zeros((NB, 8), dtype=np.int64)
            Gv = np.asarray(G_L, dtype=np.float64).reshape(1, 8)
            sfc_L[0, :] = Gv[0, :].astype(np.int64)
            sfc_L[1:, :] = sfc_dpcm_L
        else:
            sfc_dpcm_L = sfc_dec_L.reshape(NB - 1, 1, order="F")
            sfc_L = np.zeros((NB, 1), dtype=np.int64)
            sfc_L[0, 0] = int(float(G_L))
            sfc_L[1:, :] = sfc_dpcm_L
        # MDCT symbols: codebook 0 means "all-zero section"
        if cb_L == 0:
            S_dec_L = np.zeros((1024,), dtype=np.int64)
        else:
            S_tmp_L = aac_decode_huff(mdct_bits_L, cb_L, huff_LUT_list).astype(np.int64, copy=False)
            # Tuple coding may produce extra trailing symbols; caller knows the true length (1024).
            # Also guard against short outputs by zero-padding.
            if S_tmp_L.size < 1024:
                S_dec_L = np.zeros((1024,), dtype=np.int64)
                S_dec_L[: S_tmp_L.size] = S_tmp_L
            else:
                S_dec_L = S_tmp_L[:1024]
        S_L = S_dec_L.reshape(1024, 1)
        Xq_L = aac_i_quantizer(S_L, sfc_L, G_L, frame_type)
        X_L = aac_i_tns(Xq_L, frame_type, tns_L)
        # -------------------------
        # Right channel
        # -------------------------
        tns_R = np.asarray(fr["chr"]["tns_coeffs"], dtype=np.float64)
        G_R = fr["chr"]["G"]
        sfc_bits_R = fr["chr"]["sfc"]
        mdct_bits_R = fr["chr"]["stream"]
        cb_R = int(fr["chr"]["codebook"])
        sfc_dec_R = aac_decode_huff(sfc_bits_R, 11, huff_LUT_list)[:sfc_len].astype(np.int64, copy=False)
        if frame_type == "ESH":
            sfc_dpcm_R = sfc_dec_R.reshape(NB - 1, 8, order="F")
            sfc_R = np.zeros((NB, 8), dtype=np.int64)
            Gv = np.asarray(G_R, dtype=np.float64).reshape(1, 8)
            sfc_R[0, :] = Gv[0, :].astype(np.int64)
            sfc_R[1:, :] = sfc_dpcm_R
        else:
            sfc_dpcm_R = sfc_dec_R.reshape(NB - 1, 1, order="F")
            sfc_R = np.zeros((NB, 1), dtype=np.int64)
            sfc_R[0, 0] = int(float(G_R))
            sfc_R[1:, :] = sfc_dpcm_R
        if cb_R == 0:
            S_dec_R = np.zeros((1024,), dtype=np.int64)
        else:
            S_tmp_R = aac_decode_huff(mdct_bits_R, cb_R, huff_LUT_list).astype(np.int64, copy=False)
            if S_tmp_R.size < 1024:
                S_dec_R = np.zeros((1024,), dtype=np.int64)
                S_dec_R[: S_tmp_R.size] = S_tmp_R
            else:
                S_dec_R = S_tmp_R[:1024]
        S_R = S_dec_R.reshape(1024, 1)
        Xq_R = aac_i_quantizer(S_R, sfc_R, G_R, frame_type)
        X_R = aac_i_tns(Xq_R, frame_type, tns_R)
        # Re-pack to stereo container and inverse filterbank
        frame_f = aac_unpack_seq_channels_to_frame_f(frame_type, np.asarray(X_L), np.asarray(X_R))
        frame_t_hat: FrameT = aac_i_filter_bank(frame_f, frame_type, win_type)
        start = i * hop
        y_pad[start : start + win, :] += frame_t_hat
    y = aac_remove_padding(y_pad, hop=hop)
    sf.write(str(filename_out), y, 48000)
    return y
--- a/source/core/aac_filterbank.py
+++ b/source/core/aac_filterbank.py
@ -14,6 +14,7 @@
 # ------------------------------------------------------------
 from __future__ import annotations
 from core.aac_utils import mdct, imdct
 from core.aac_types import *
 from scipy.signal.windows import kaiser
@ -186,74 +187,6 @@ def _window_sequence(frame_type: FrameType, win_type: WinType) -> Window:
    raise ValueError(f"Invalid frame_type for long window sequence: {frame_type!r}")
 def _mdct(s: TimeSignal) -> MdctCoeffs:
    """
    MDCT (direct form) as specified in the assignment.
    Parameters
    ----------
    s : TimeSignal
        Windowed time samples, 1-D array of length N (N = 2048 or 256).
    Returns
    -------
    MdctCoeffs
        MDCT coefficients, 1-D array of length N/2.
    Definition
    ----------
    X[k] = 2 * sum_{n=0..N-1} s[n] * cos((2*pi/N) * (n + n0) * (k + 1/2)),
    where n0 = (N/2 + 1)/2.
    """
    s = np.asarray(s, dtype=np.float64).reshape(-1)
    N = int(s.shape[0])
    if N not in (2048, 256):
        raise ValueError("MDCT input length must be 2048 or 256.")
    n0 = (N / 2.0 + 1.0) / 2.0
    n = np.arange(N, dtype=np.float64) + n0
    k = np.arange(N // 2, dtype=np.float64) + 0.5
    C = np.cos((2.0 * np.pi / N) * np.outer(n, k))  # (N, N/2)
    X = 2.0 * (s @ C)  # (N/2,)
    return X
 def _imdct(X: MdctCoeffs) -> TimeSignal:
    """
    IMDCT (direct form) as specified in the assignment.
    Parameters
    ----------
    X : MdctCoeffs
        MDCT coefficients, 1-D array of length K (K = 1024 or 128).
    Returns
    -------
    TimeSignal
        Reconstructed time samples, 1-D array of length N = 2K.
    Definition
    ----------
    s[n] = (2/N) * sum_{k=0..N/2-1} X[k] * cos((2*pi/N) * (n + n0) * (k + 1/2)),
    where n0 = (N/2 + 1)/2.
    """
    X = np.asarray(X, dtype=np.float64).reshape(-1)
    K = int(X.shape[0])
    if K not in (1024, 128):
        raise ValueError("IMDCT input length must be 1024 or 128.")
    N = 2 * K
    n0 = (N / 2.0 + 1.0) / 2.0
    n = np.arange(N, dtype=np.float64) + n0
    k = np.arange(K, dtype=np.float64) + 0.5
    C = np.cos((2.0 * np.pi / N) * np.outer(n, k))  # (N, K)
    s = (2.0 / N) * (C @ X)  # (N,)
    return s
 def _filter_bank_esh_channel(x_ch: FrameChannelT, win_type: WinType) -> FrameChannelF:
    """
    ESH analysis for one channel.
@ -279,7 +212,7 @@ def _filter_bank_esh_channel(x_ch: FrameChannelT, win_type: WinType) -> FrameCha
    for j in range(8):
        start = 448 + 128 * j
        seg = x_ch[start:start + 256] * wS  # (256,)
-        X_esh[:, j] = _mdct(seg)           # (128,)
+        X_esh[:, j] = mdct(seg)           # (128,)
    return X_esh
@ -344,7 +277,7 @@ def _i_filter_bank_esh_channel(X_esh: FrameChannelF, win_type: WinType) -> Frame
    # Each short IMDCT returns 256 samples. Place them at:
    # start = 448 + 128*j, j=0..7 (50% overlap)
    for j in range(8):
-        seg = _imdct(X_esh[:, j]) * wS  # (256,)
+        seg = imdct(X_esh[:, j]) * wS  # (256,)
        start = 448 + 128 * j
        out[start:start + 256] += seg
@ -352,7 +285,7 @@ def _i_filter_bank_esh_channel(X_esh: FrameChannelF, win_type: WinType) -> Frame
 # -----------------------------------------------------------------------------
-# Public Function prototypes (Level 1)
+# Public Function prototypes
 # -----------------------------------------------------------------------------
 def aac_filter_bank(frame_T: FrameT, frame_type: FrameType, win_type: WinType) -> FrameF:
@ -385,8 +318,8 @@ def aac_filter_bank(frame_T: FrameT, frame_type: FrameType, win_type: WinType) -
    if frame_type in ("OLS", "LSS", "LPS"):
        w = _window_sequence(frame_type, win_type)  # length 2048
-        XL = _mdct(xL * w)  # length 1024
+        XL = mdct(xL * w)  # length 1024
-        XR = _mdct(xR * w)  # length 1024
+        XR = mdct(xR * w)  # length 1024
        out = np.empty((1024, 2), dtype=np.float64)
        out[:, 0] = XL
        out[:, 1] = XR
@ -430,8 +363,8 @@ def aac_i_filter_bank(frame_F: FrameF, frame_type: FrameType, win_type: WinType)
        w = _window_sequence(frame_type, win_type)
-        xL = _imdct(frame_F[:, 0]) * w
+        xL = imdct(frame_F[:, 0]) * w
-        xR = _imdct(frame_F[:, 1]) * w
+        xR = imdct(frame_F[:, 1]) * w
        out = np.empty((2048, 2), dtype=np.float64)
        out[:, 0] = xL
--- a/source/core/aac_huffman.py
+++ b/source/core/aac_huffman.py
@ -0,0 +1,112 @@
 # ------------------------------------------------------------
 # AAC Coder/Decoder - Huffman wrappers (Level 3)
 #
 # Multimedia course at Aristotle University of
 # Thessaloniki (AUTh)
 #
 # Author:
 #   Christos Choutouridis (ΑΕΜ 8997)
 #   cchoutou@ece.auth.gr
 #
 # Description:
 #   Thin wrappers around the provided Huffman utilities (material/huff_utils.py)
 #   so that the API matches the assignment text.
 #
 # Exposed API (assignment):
 #   huff_sec, huff_codebook = aac_encode_huff(coeff_sec, huff_LUT_list, force_codebook)
 #   dec_coeffs = aac_decode_huff(huff_sec, huff_codebook, huff_LUT_list)
 #
 # Notes:
 #   - Huffman coding operates on tuples. Therefore, decode(encode(x)) may return
 #     extra trailing symbols due to tuple padding. The AAC decoder knows the
 #     true section length from side information (band limits) and truncates.
 # ------------------------------------------------------------
 from __future__ import annotations
 from typing import Any
 import numpy as np
 from material.huff_utils import encode_huff, decode_huff
 def aac_encode_huff(
    coeff_sec: np.ndarray,
    huff_LUT_list: list[dict[str, Any]],
    force_codebook: int | None = None,
 ) -> tuple[str, int]:
    """
    Huffman-encode a section of coefficients (MDCT symbols or scalefactors).
    Parameters
    ----------
    coeff_sec : np.ndarray
        Coefficient section to be encoded. Any shape is accepted; the input
        is flattened and treated as a 1-D sequence of int64 symbols.
    huff_LUT_list : list[dict[str, Any]]
        List of Huffman Look-Up Tables (LUTs) as returned by material.load_LUT().
        Index corresponds to codebook id (typically 1..11, with 0 reserved).
    force_codebook : int | None
        If provided, forces the use of this Huffman codebook. In the assignment,
        scalefactors are encoded with codebook 11. For MDCT coefficients, this
        argument is usually omitted (auto-selection).
    Returns
    -------
    tuple[str, int]
        (huff_sec, huff_codebook)
        - huff_sec: bitstream as a string of '0'/'1'
        - huff_codebook: codebook id used by the encoder
    """
    coeff_sec_arr = np.asarray(coeff_sec, dtype=np.int64).reshape(-1)
    if force_codebook is None:
        # Provided utility returns (bitstream, codebook) in the auto-selection case.
        huff_sec, huff_codebook = encode_huff(coeff_sec_arr, huff_LUT_list)
        return str(huff_sec), int(huff_codebook)
    # Provided utility returns ONLY the bitstream when force_codebook is set.
    cb = int(force_codebook)
    huff_sec = encode_huff(coeff_sec_arr, huff_LUT_list, force_codebook=cb)
    return str(huff_sec), cb
 def aac_decode_huff(
    huff_sec: str | np.ndarray,
    huff_codebook: int,
    huff_LUT: list[dict[str, Any]],
 ) -> np.ndarray:
    """
    Huffman-decode a bitstream using the specified codebook.
    Parameters
    ----------
    huff_sec : str | np.ndarray
        Huffman bitstream. Typically a string of '0'/'1'. If an array is provided,
        it is passed through to the provided decoder.
    huff_codebook : int
        Codebook id that was returned by aac_encode_huff.
        Codebook 0 represents an all-zero section.
    huff_LUT : list[dict[str, Any]]
        Huffman LUT list as returned by material.load_LUT().
    Returns
    -------
    np.ndarray
        Decoded coefficients as a 1-D np.int64 array.
        Note: Due to tuple coding, the decoded array may contain extra trailing
        padding symbols. The caller must truncate to the known section length.
    """
    cb = int(huff_codebook)
    if cb == 0:
        # Codebook 0 represents an all-zero section. The decoded length is not
        # recoverable from the bitstream alone; the caller must expand/truncate.
        return np.zeros((0,), dtype=np.int64)
    if cb < 0 or cb >= len(huff_LUT):
        raise ValueError(f"Invalid Huffman codebook index: {cb}")
    lut = huff_LUT[cb]
    dec = decode_huff(huff_sec, lut)
    return np.asarray(dec, dtype=np.int64).reshape(-1)
--- a/source/core/aac_psycho.py
+++ b/source/core/aac_psycho.py
@ -0,0 +1,441 @@
 # ------------------------------------------------------------
 # AAC Coder/Decoder - Psychoacoustic Model
 #
 # Multimedia course at Aristotle University of
 # Thessaloniki (AUTh)
 #
 # Author:
 #   Christos Choutouridis (ΑΕΜ 8997)
 #   cchoutou@ece.auth.gr
 #
 # Description:
 #   Psychoacoustic model for ONE channel, based on the assignment notes (Section 2.4).
 #
 #   Public API:
 #       SMR = aac_psycho(frame_T, frame_type, frame_T_prev_1, frame_T_prev_2)
 #
 #   Output:
 #     - For long frames ("OLS", "LSS", "LPS"): SMR has shape (69,)
 #     - For short frames ("ESH"): SMR has shape (42, 8)  (one column per subframe)
 #
 #   Notes:
 #   - Uses Bark band tables from material/TableB219.mat:
 #       * B219a for long windows (69 bands, N=2048 FFT, N/2=1024 bins)
 #       * B219b for short windows (42 bands, N=256 FFT,  N/2=128 bins)
 #   - Applies a Hann window in time domain before FFT magnitude/phase extraction.
 #   - Implements:
 #       spreading function -> band spreading -> tonality index -> masking thresholds -> SMR.
 # ------------------------------------------------------------
 from __future__ import annotations
 import numpy as np
 from core.aac_utils import band_limits, get_table
 from core.aac_configuration import NMT_DB, TMN_DB
 from core.aac_types import *
 # -----------------------------------------------------------------------------
 # Spreading function
 # -----------------------------------------------------------------------------
 def _spreading_matrix(bval: BandValueArray) -> FloatArray:
    """
    Compute the spreading function matrix between psychoacoustic bands.
    The spreading function describes how energy in one critical band masks
    nearby bands. The formula follows the assignment pseudo-code.
    Parameters
    ----------
    bval : BandValueArray
        Bark value per band, shape (B,).
    Returns
    -------
    FloatArray
        Spreading matrix S of shape (B, B), where:
          S[bb, b] quantifies the contribution of band bb masking band b.
    """
    bval = np.asarray(bval, dtype=np.float64).reshape(-1)
    B = int(bval.shape[0])
    spread = np.zeros((B, B), dtype=np.float64)
    for b in range(B):
        for bb in range(B):
            # tmpx depends on direction (asymmetric spreading)
            if bb >= b:
                tmpx = 3.0 * (bval[bb] - bval[b])
            else:
                tmpx = 1.5 * (bval[bb] - bval[b])
            # tmpz uses the "min(..., 0)" nonlinearity exactly as in the notes
            tmpz = 8.0 * min((tmpx - 0.5) ** 2 - 2.0 * (tmpx - 0.5), 0.0)
            tmpy = 15.811389 + 7.5 * (tmpx + 0.474) - 17.5 * np.sqrt(1.0 + (tmpx + 0.474) ** 2)
            # Clamp very small values (below -100 dB) to 0 contribution
            if tmpy < -100.0:
                spread[bb, b] = 0.0
            else:
                spread[bb, b] = 10.0 ** ((tmpz + tmpy) / 10.0)
    return spread
 # -----------------------------------------------------------------------------
 # Windowing + FFT feature extraction
 # -----------------------------------------------------------------------------
 def _hann_window(N: int) -> FloatArray:
    """
    Hann window as specified in the notes:
        w[n] = 0.5 - 0.5*cos(2*pi*(n + 0.5)/N)
    Parameters
    ----------
    N : int
        Window length.
    Returns
    -------
    FloatArray
        1-D array of shape (N,), dtype float64.
    """
    n = np.arange(N, dtype=np.float64)
    return 0.5 - 0.5 * np.cos((2.0 * np.pi / N) * (n + 0.5))
 def _r_phi_from_time(x: FrameChannelT, N: int) -> tuple[FloatArray, FloatArray]:
    """
    Compute FFT magnitude r(w) and phase phi(w) for bins w = 0 .. N/2-1.
    Processing:
    1) Apply Hann window in time domain.
    2) Compute N-point FFT.
    3) Keep only the positive-frequency bins [0 .. N/2-1].
    Parameters
    ----------
    x : FrameChannelT
        Time-domain samples, shape (N,).
    N : int
        FFT size (2048 or 256).
    Returns
    -------
    r : FloatArray
        Magnitude spectrum for bins 0 .. N/2-1, shape (N/2,).
    phi : FloatArray
        Phase spectrum for bins 0 .. N/2-1, shape (N/2,).
    """
    x = np.asarray(x, dtype=np.float64).reshape(-1)
    if x.shape[0] != N:
        raise ValueError(f"Expected time vector of length {N}, got {x.shape[0]}.")
    w = _hann_window(N)
    X = np.fft.fft(x * w, n=N)
    Xp = X[: N // 2]
    r = np.abs(Xp).astype(np.float64, copy=False)
    phi = np.angle(Xp).astype(np.float64, copy=False)
    return r, phi
 def _predictability(
    r: FloatArray,
    phi: FloatArray,
    r_m1: FloatArray,
    phi_m1: FloatArray,
    r_m2: FloatArray,
    phi_m2: FloatArray,
 ) -> FloatArray:
    """
    Compute predictability c(w) per spectral bin.
    The notes define:
      r_pred(w)   = 2*r_{-1}(w)   - r_{-2}(w)
      phi_pred(w) = 2*phi_{-1}(w) - phi_{-2}(w)
      c(w) = |X(w) - X_pred(w)| / (r(w) + |r_pred(w)|)
    where X(w) is represented in polar form using r(w), phi(w).
    Parameters
    ----------
    r, phi : FloatArray
        Current magnitude and phase, shape (N/2,).
    r_m1, phi_m1 : FloatArray
        Previous magnitude and phase, shape (N/2,).
    r_m2, phi_m2 : FloatArray
        Pre-previous magnitude and phase, shape (N/2,).
    Returns
    -------
    FloatArray
        Predictability c(w), shape (N/2,).
    """
    r_pred = 2.0 * r_m1 - r_m2
    phi_pred = 2.0 * phi_m1 - phi_m2
    num = np.sqrt(
        (r * np.cos(phi) - r_pred * np.cos(phi_pred)) ** 2
      + (r * np.sin(phi) - r_pred * np.sin(phi_pred)) ** 2
    )
    den = r + np.abs(r_pred) + 1e-12  # avoid division-by-zero without altering behavior
    return (num / den).astype(np.float64, copy=False)
 # -----------------------------------------------------------------------------
 # Band-domain aggregation
 # -----------------------------------------------------------------------------
 def _band_energy_and_weighted_predictability(
    r: FloatArray,
    c: FloatArray,
    wlow: BandIndexArray,
    whigh: BandIndexArray,
 ) -> tuple[FloatArray, FloatArray]:
    """
    Aggregate spectral bin quantities into psychoacoustic bands.
    Definitions (notes):
      e(b) = sum_{w=wlow(b)..whigh(b)} r(w)^2
      c_num(b) = sum_{w=wlow(b)..whigh(b)} c(w) * r(w)^2
    The band predictability c(b) is later computed after spreading as:
      cb(b) = ct(b) / ecb(b)
    Parameters
    ----------
    r : FloatArray
        Magnitude spectrum, shape (N/2,).
    c : FloatArray
        Predictability per bin, shape (N/2,).
    wlow, whigh : BandIndexArray
        Band limits (inclusive indices), shape (B,).
    Returns
    -------
    e_b : FloatArray
        Band energies e(b), shape (B,).
    c_num_b : FloatArray
        Weighted predictability numerators c_num(b), shape (B,).
    """
    r2 = (r * r).astype(np.float64, copy=False)
    B = int(wlow.shape[0])
    e_b = np.zeros(B, dtype=np.float64)
    c_num_b = np.zeros(B, dtype=np.float64)
    for b in range(B):
        a = int(wlow[b])
        z = int(whigh[b])
        seg_r2 = r2[a : z + 1]
        e_b[b] = float(np.sum(seg_r2))
        c_num_b[b] = float(np.sum(c[a : z + 1] * seg_r2))
    return e_b, c_num_b
 def _psycho_one_window(
    time_x: FrameChannelT,
    prev1_x: FrameChannelT,
    prev2_x: FrameChannelT,
    *,
    N: int,
    table: BarkTable,
 ) -> FloatArray:
    """
    Compute SMR for one FFT analysis window (N=2048 for long, N=256 for short).
    This implements the pipeline described in the notes:
      - FFT magnitude/phase
      - predictability per bin
      - band energies and predictability
      - band spreading
      - tonality index tb(b)
      - masking threshold (noise + threshold in quiet)
      - SMR(b) = e(b) / np(b)
    Parameters
    ----------
    time_x : FrameChannelT
        Current time-domain samples, shape (N,).
    prev1_x : FrameChannelT
        Previous time-domain samples, shape (N,).
    prev2_x : FrameChannelT
        Pre-previous time-domain samples, shape (N,).
    N : int
        FFT size.
    table : BarkTable
        Psychoacoustic band table (B219a or B219b).
    Returns
    -------
    FloatArray
        SMR per band, shape (B,).
    """
    wlow, whigh, bval, qthr_db = band_limits(table)
    spread = _spreading_matrix(bval)
    # FFT features for current and history windows
    r, phi = _r_phi_from_time(time_x, N)
    r_m1, phi_m1 = _r_phi_from_time(prev1_x, N)
    r_m2, phi_m2 = _r_phi_from_time(prev2_x, N)
    # Predictability per bin
    c_w = _predictability(r, phi, r_m1, phi_m1, r_m2, phi_m2)
    # Aggregate into psycho bands
    e_b, c_num_b = _band_energy_and_weighted_predictability(r, c_w, wlow, whigh)
    # Spread energies and predictability across bands:
    # ecb(b) = sum_bb e(bb)      * S(bb, b)
    # ct(b)  = sum_bb c_num(bb)  * S(bb, b)
    ecb = spread.T @ e_b
    ct = spread.T @ c_num_b
    # Band predictability after spreading: cb(b) = ct(b) / ecb(b)
    cb = ct / (ecb + 1e-12)
    # Normalized energy term:
    # en(b) = ecb(b) / sum_bb S(bb, b)
    spread_colsum = np.sum(spread, axis=0)
    en = ecb / (spread_colsum + 1e-12)
    # Tonality index (clamped to [0, 1])
    tb = -0.299 - 0.43 * np.log(np.maximum(cb, 1e-12))
    tb = np.clip(tb, 0.0, 1.0)
    # Required SNR per band (dB): interpolate between TMN and NMT
    snr_b = tb * TMN_DB + (1.0 - tb) * NMT_DB
    bc = 10.0 ** (-snr_b / 10.0)
    # Noise masking threshold estimate (power domain)
    nb = en * bc
    # Threshold in quiet (convert from dB to power domain):
    # qthr_power = (N/2) * 10^(qthr_db/10)
    qthr_power = (N / 2.0) * (10.0 ** (qthr_db / 10.0))
    # Final masking threshold per band:
    # np(b) = max(nb(b), qthr(b))
    npart = np.maximum(nb, qthr_power)
    # Signal-to-mask ratio:
    # SMR(b) = e(b) / np(b)
    smr = e_b / (npart + 1e-12)
    return smr.astype(np.float64, copy=False)
 # -----------------------------------------------------------------------------
 # ESH window slicing (match filterbank conventions)
 # -----------------------------------------------------------------------------
 def _esh_subframes_256(x_2048: FrameChannelT) -> list[FrameChannelT]:
    """
    Extract the 8 overlapping 256-sample short windows used by AAC ESH.
    The project convention (matching the filterbank) is:
      start_j = 448 + 128*j,  for j = 0..7
      subframe_j = x[start_j : start_j + 256]
    This selects the central 1152-sample region [448, 1600) and produces
    8 windows with 50% overlap.
    Parameters
    ----------
    x_2048 : FrameChannelT
        Time-domain channel frame, shape (2048,).
    Returns
    -------
    list[FrameChannelT]
        List of 8 subframes, each of shape (256,).
    """
    x_2048 = np.asarray(x_2048, dtype=np.float64).reshape(-1)
    if x_2048.shape[0] != 2048:
        raise ValueError("ESH requires 2048-sample input frames.")
    subs: list[FrameChannelT] = []
    for j in range(8):
        start = 448 + 128 * j
        subs.append(x_2048[start : start + 256])
    return subs
 # -----------------------------------------------------------------------------
 # Public API
 # -----------------------------------------------------------------------------
 def aac_psycho(
    frame_T: FrameChannelT,
    frame_type: FrameType,
    frame_T_prev_1: FrameChannelT,
    frame_T_prev_2: FrameChannelT,
 ) -> FloatArray:
    """
    Psychoacoustic model for ONE channel.
    Parameters
    ----------
    frame_T : FrameChannelT
        Current time-domain channel frame, shape (2048,).
        For "ESH", the 8 short windows are derived internally.
    frame_type : FrameType
        AAC frame type ("OLS", "LSS", "ESH", "LPS").
    frame_T_prev_1 : FrameChannelT
        Previous time-domain channel frame, shape (2048,).
    frame_T_prev_2 : FrameChannelT
        Pre-previous time-domain channel frame, shape (2048,).
    Returns
    -------
    FloatArray
        Signal-to-Mask Ratio (SMR), per psychoacoustic band.
        - If frame_type == "ESH": shape (42, 8)
        - Else: shape (69,)
    """
    frame_T = np.asarray(frame_T, dtype=np.float64).reshape(-1)
    frame_T_prev_1 = np.asarray(frame_T_prev_1, dtype=np.float64).reshape(-1)
    frame_T_prev_2 = np.asarray(frame_T_prev_2, dtype=np.float64).reshape(-1)
    if frame_T.shape[0] != 2048 or frame_T_prev_1.shape[0] != 2048 or frame_T_prev_2.shape[0] != 2048:
        raise ValueError("aac_psycho expects 2048-sample frames for current/prev1/prev2.")
    table, N = get_table(frame_type)
    # Long frame types: compute one SMR vector (69 bands)
    if frame_type != "ESH":
        return _psycho_one_window(frame_T, frame_T_prev_1, frame_T_prev_2, N=N, table=table)
    # ESH: compute 8 SMR vectors (42 bands each), one per short subframe.
    #
    # The notes use short-window history for predictability:
    # - For j=0: use previous frame's subframes (7, 6)
    # - For j=1: use current subframe 0 and previous frame's subframe 7
    # - For j>=2: use current subframes (j-1, j-2)
    #
    # This matches the "within-frame history" convention commonly used in
    # simplified psycho models for ESH.
    cur_subs = _esh_subframes_256(frame_T)
    prev1_subs = _esh_subframes_256(frame_T_prev_1)
    B = int(table.shape[0])  # expected 42
    smr_out = np.zeros((B, 8), dtype=np.float64)
    for j in range(8):
        if j == 0:
            x_m1 = prev1_subs[7]
            x_m2 = prev1_subs[6]
        elif j == 1:
            x_m1 = cur_subs[0]
            x_m2 = prev1_subs[7]
        else:
            x_m1 = cur_subs[j - 1]
            x_m2 = cur_subs[j - 2]
        smr_out[:, j] = _psycho_one_window(cur_subs[j], x_m1, x_m2, N=256, table=table)
    return smr_out
--- a/source/core/aac_quantizer.py
+++ b/source/core/aac_quantizer.py
@ -0,0 +1,604 @@
 # ------------------------------------------------------------
 # AAC Coder/Decoder - Quantizer / iQuantizer (Level 3)
 #
 # Multimedia course at Aristotle University of
 # Thessaloniki (AUTh)
 #
 # Author:
 #   Christos Choutouridis (ΑΕΜ 8997)
 #   cchoutou@ece.auth.gr
 #
 # Description:
 #   Implements AAC quantizer and inverse quantizer for one channel.
 #   Based on assignment section 2.6 (Eq. 12-15).
 #
 # Notes:
 #   - Bit reservoir is not implemented (assignment simplification).
 #   - Scalefactor bands are assumed equal to psychoacoustic bands
 #     (Table B.2.1.9a / B.2.1.9b from TableB219.mat).
 # ------------------------------------------------------------
 from __future__ import annotations
 import numpy as np
 from core.aac_utils import get_table, band_limits
 from core.aac_types import *
 # -----------------------------------------------------------------------------
 # Constants (assignment)
 # -----------------------------------------------------------------------------
 MAGIC_NUMBER: float = 0.4054
 MQ: int = 8191
 EPS: float = 1e-12
 MAX_SFC_DIFF: int = 60
 # Safeguard: prevents infinite loops in pathological cases
 MAX_ALPHA_ITERS: int = 2000
 # -----------------------------------------------------------------------------
 # Helpers: ESH packing/unpacking (128x8 <-> 1024x1)
 # -----------------------------------------------------------------------------
 def _esh_pack_to_1024(x_128x8: FloatArray) -> FloatArray:
    """
    Pack ESH coefficients (128 x 8) into a single long vector (1024 x 1).
    Packing order:
        Columns are concatenated in subframe order (0..7), column-major.
    Parameters
    ----------
    x_128x8 : FloatArray
        ESH coefficients, shape (128, 8).
    Returns
    -------
    FloatArray
        Packed coefficients, shape (1024, 1).
    """
    x_128x8 = np.asarray(x_128x8, dtype=np.float64)
    if x_128x8.shape != (128, 8):
        raise ValueError("ESH pack expects shape (128, 8).")
    return x_128x8.reshape(1024, 1, order="F")
 def _esh_unpack_from_1024(x_1024x1: FloatArray) -> FloatArray:
    """
    Unpack a packed ESH vector (1024 elements) back to shape (128, 8).
    Parameters
    ----------
    x_1024x1 : FloatArray
        Packed ESH vector, shape (1024,) or (1024, 1) after flattening.
    Returns
    -------
    FloatArray
        Unpacked ESH coefficients, shape (128, 8).
    """
    x_1024x1 = np.asarray(x_1024x1, dtype=np.float64).reshape(-1)
    if x_1024x1.shape[0] != 1024:
        raise ValueError("ESH unpack expects 1024 elements.")
    return x_1024x1.reshape(128, 8, order="F")
 # -----------------------------------------------------------------------------
 # Core quantizer formulas (Eq. 12, Eq. 13)
 # -----------------------------------------------------------------------------
 def _quantize_symbol(x: FloatArray, alpha: float) -> QuantizedSymbols:
    """
    Quantize MDCT coefficients to integer symbols S(k).
    Implements Eq. (12):
        S(k) = sgn(X(k)) * int( (|X(k)| * 2^(-alpha/4))^(3/4) + MAGIC_NUMBER )
    Parameters
    ----------
    x : FloatArray
        MDCT coefficients for a contiguous set of spectral lines.
        Shape: (N,)
    alpha : float
        Scalefactor gain for the corresponding scalefactor band.
    Returns
    -------
    QuantizedSymbols
        Quantized symbols S(k) as int64, shape (N,).
    """
    x = np.asarray(x, dtype=np.float64)
    scale = 2.0 ** (-0.25 * float(alpha))
    ax = np.abs(x) * scale
    y = np.power(ax, 0.75, dtype=np.float64)
    # "int" in the assignment corresponds to truncation.
    q = np.floor(y + MAGIC_NUMBER).astype(np.int64)
    return (np.sign(x).astype(np.int64) * q).astype(np.int64)
 def _dequantize_symbol(S: QuantizedSymbols, alpha: float) -> FloatArray:
    """
    Inverse quantizer (dequantization of symbols).
    Implements Eq. (13):
        Xhat(k) = sgn(S(k)) * |S(k)|^(4/3) * 2^(alpha/4)
    Parameters
    ----------
    S : QuantizedSymbols
        Quantized symbols S(k), int64, shape (N,).
    alpha : float
        Scalefactor gain for the corresponding scalefactor band.
    Returns
    -------
    FloatArray
        Reconstructed MDCT coefficients Xhat(k), float64, shape (N,).
    """
    S = np.asarray(S, dtype=np.int64)
    scale = 2.0 ** (0.25 * float(alpha))
    aS = np.abs(S).astype(np.float64)
    y = np.power(aS, 4.0 / 3.0, dtype=np.float64)
    return (np.sign(S).astype(np.float64) * y * scale).astype(np.float64)
 # -----------------------------------------------------------------------------
 # Alpha initialization (Eq. 14)
 # -----------------------------------------------------------------------------
 def _alpha_initial_from_frame_max(x_all: FloatArray) -> int:
    """
    Compute the initial scalefactor gain alpha_hat for a frame.
    Implements Eq. (14):
        alpha_hat = (16/3) * log2( max_k(|X(k)|^(3/4)) / MQ )
    The same initial value is used for all bands before the per-band refinement.
    Parameters
    ----------
    x_all : FloatArray
        All MDCT coefficients of a frame (one channel), flattened.
    Returns
    -------
    int
        Initial alpha value (integer).
    """
    x_all = np.asarray(x_all, dtype=np.float64).reshape(-1)
    if x_all.size == 0:
        return 0
    max_abs = float(np.max(np.abs(x_all)))
    if max_abs <= 0.0:
        return 0
    val = (max_abs ** 0.75) / float(MQ)
    if val <= 0.0:
        return 0
    alpha_hat = (16.0 / 3.0) * np.log2(val)
    return int(np.floor(alpha_hat))
 # -----------------------------------------------------------------------------
 # Band utilities
 # -----------------------------------------------------------------------------
 def _band_slices(frame_type: FrameType) -> list[tuple[int, int]]:
    """
    Return scalefactor band ranges [wlow, whigh] (inclusive) for the given frame type.
    These are derived from the psychoacoustic tables (TableB219),
    and map directly to MDCT indices:
      - long: 0..1023
      - short (ESH subframe): 0..127
    Parameters
    ----------
    frame_type : FrameType
        Frame type ("OLS", "LSS", "ESH", "LPS").
    Returns
    -------
    list[tuple[int, int]]
        List of (lo, hi) inclusive index pairs for each band.
    """
    table, _Nfft = get_table(frame_type)
    wlow, whigh, _bval, _qthr_db = band_limits(table)
    bands: list[tuple[int, int]] = []
    for lo, hi in zip(wlow, whigh):
        bands.append((int(lo), int(hi)))
    return bands
 def _band_energy(x: FloatArray, lo: int, hi: int) -> float:
    """
    Compute energy of a spectral segment x[lo:hi+1].
    Parameters
    ----------
    x : FloatArray
        MDCT coefficient vector.
    lo, hi : int
        Inclusive index range.
    Returns
    -------
    float
        Sum of squares (energy) within the band.
    """
    sec = x[lo : hi + 1]
    return float(np.sum(sec * sec))
 def _threshold_T_from_SMR(
    X: FloatArray,
    SMR_col: FloatArray,
    bands: list[tuple[int, int]],
 ) -> FloatArray:
    """
    Compute psychoacoustic thresholds T(b) per band.
    Uses:
        P(b) = sum_{k in band} X(k)^2
        T(b) = P(b) / SMR(b)
    Parameters
    ----------
    X : FloatArray
        MDCT coefficients for a frame (long) or one ESH subframe (short).
    SMR_col : FloatArray
        SMR values for this frame/subframe, shape (NB,).
    bands : list[tuple[int, int]]
        Band index ranges.
    Returns
    -------
    FloatArray
        Threshold vector T(b), shape (NB,).
    """
    nb = len(bands)
    T = np.zeros((nb,), dtype=np.float64)
    for b, (lo, hi) in enumerate(bands):
        P = _band_energy(X, lo, hi)
        smr = float(SMR_col[b])
        if smr <= EPS:
            T[b] = 0.0
        else:
            T[b] = P / smr
    return T
 # -----------------------------------------------------------------------------
 # Alpha selection per band + neighbor-difference constraint
 # -----------------------------------------------------------------------------
 def _best_alpha_for_band(
    X: FloatArray,
    lo: int,
    hi: int,
    T_b: float,
    alpha0: int,
    alpha_min: int,
    alpha_max: int,
 ) -> int:
    """
    Determine the band-wise scalefactor alpha(b) by iteratively increasing alpha.
    The algorithm increases alpha until the quantization error power exceeds
    the band threshold:
        P_e(b) = sum_{k in band} (X(k) - Xhat(k))^2
        select the largest alpha such that P_e(b) <= T(b)
    Parameters
    ----------
    X : FloatArray
        Full MDCT vector (one frame or one subframe), shape (N,).
    lo, hi : int
        Inclusive MDCT index range defining the band.
    T_b : float
        Psychoacoustic threshold for this band.
    alpha0 : int
        Initial alpha value for the band.
    alpha_min, alpha_max : int
        Bounds for alpha, used as a safeguard.
    Returns
    -------
    int
        Selected integer alpha(b).
    """
    if T_b <= 0.0:
        return int(alpha0)
    Xsec = X[lo : hi + 1]
    alpha = int(alpha0)
    alpha = max(alpha_min, min(alpha, alpha_max))
    # Evaluate at current alpha
    Ssec = _quantize_symbol(Xsec, alpha)
    Xhat = _dequantize_symbol(Ssec, alpha)
    Pe = float(np.sum((Xsec - Xhat) ** 2))
    if Pe > T_b:
        return alpha
    iters = 0
    while iters < MAX_ALPHA_ITERS:
        iters += 1
        alpha_next = alpha + 1
        if alpha_next > alpha_max:
            break
        Ssec = _quantize_symbol(Xsec, alpha_next)
        Xhat = _dequantize_symbol(Ssec, alpha_next)
        Pe_next = float(np.sum((Xsec - Xhat) ** 2))
        if Pe_next > T_b:
            break
        alpha = alpha_next
        Pe = Pe_next
    return alpha
 def _enforce_max_diff(alpha: np.ndarray, max_diff: int = MAX_SFC_DIFF) -> np.ndarray:
    """
    Enforce neighbor constraint |alpha[b] - alpha[b-1]| <= max_diff by clamping.
    Uses a forward pass and a backward pass to reduce drift.
    Parameters
    ----------
    alpha : np.ndarray
        Alpha vector, shape (NB,).
    max_diff : int
        Maximum allowed absolute difference between adjacent bands.
    Returns
    -------
    np.ndarray
        Clamped alpha vector, int64, shape (NB,).
    """
    a = np.asarray(alpha, dtype=np.int64).copy()
    nb = a.shape[0]
    for b in range(1, nb):
        lo = int(a[b - 1] - max_diff)
        hi = int(a[b - 1] + max_diff)
        if a[b] < lo:
            a[b] = lo
        elif a[b] > hi:
            a[b] = hi
    for b in range(nb - 2, -1, -1):
        lo = int(a[b + 1] - max_diff)
        hi = int(a[b + 1] + max_diff)
        if a[b] < lo:
            a[b] = lo
        elif a[b] > hi:
            a[b] = hi
    return a
 # -----------------------------------------------------------------------------
 # Public API
 # -----------------------------------------------------------------------------
 def aac_quantizer(
    frame_F: FrameChannelF,
    frame_type: FrameType,
    SMR: FloatArray,
 ) -> tuple[QuantizedSymbols, ScaleFactors, GlobalGain]:
    """
    AAC quantizer for one channel (Level 3).
    Quantizes MDCT coefficients using band-wise scalefactors derived from SMR.
    Parameters
    ----------
    frame_F : FrameChannelF
        MDCT coefficients after TNS, one channel.
        Shapes:
        - Long frames: (1024,) or (1024, 1)
        - ESH: (128, 8)
    frame_type : FrameType
        AAC frame type ("OLS", "LSS", "ESH", "LPS").
    SMR : FloatArray
        Signal-to-Mask Ratio per band.
        Shapes:
        - Long: (NB,) or (NB, 1)
        - ESH: (NB, 8)
    Returns
    -------
    S : QuantizedSymbols
        Quantized symbols S(k), shape (1024, 1) for all frame types.
    sfc : ScaleFactors
        DPCM-coded scalefactor differences sfc(b) = alpha(b) - alpha(b-1).
        Shapes:
        - Long: (NB, 1)
        - ESH: (NB, 8)
    G : GlobalGain
        Global gain G = alpha(0).
        - Long: scalar float
        - ESH: array shape (1, 8)
    """
    bands = _band_slices(frame_type)
    NB = len(bands)
    X = np.asarray(frame_F, dtype=np.float64)
    SMR = np.asarray(SMR, dtype=np.float64)
    if frame_type == "ESH":
        if X.shape != (128, 8):
            raise ValueError("For ESH, frame_F must have shape (128, 8).")
        if SMR.shape != (NB, 8):
            raise ValueError(f"For ESH, SMR must have shape ({NB}, 8).")
        S_out: QuantizedSymbols = np.zeros((1024, 1), dtype=np.int64)
        sfc: ScaleFactors = np.zeros((NB, 8), dtype=np.int64)
        G_arr = np.zeros((1, 8), dtype=np.int64)
        for j in range(8):
            Xj = X[:, j].reshape(128)
            SMRj = SMR[:, j].reshape(NB)
            T = _threshold_T_from_SMR(Xj, SMRj, bands)
            alpha0 = _alpha_initial_from_frame_max(Xj)
            alpha = np.full((NB,), alpha0, dtype=np.int64)
            for b, (lo, hi) in enumerate(bands):
                alpha[b] = _best_alpha_for_band(
                    X=Xj, lo=lo, hi=hi, T_b=float(T[b]),
                    alpha0=int(alpha[b]),
                    alpha_min=-4096,
                    alpha_max=4096,
                )
            alpha = _enforce_max_diff(alpha, MAX_SFC_DIFF)
            G_arr[0, j] = int(alpha[0])
            sfc[0, j] = int(alpha[0])
            for b in range(1, NB):
                sfc[b, j] = int(alpha[b] - alpha[b - 1])
            Sj = np.zeros((128,), dtype=np.int64)
            for b, (lo, hi) in enumerate(bands):
                Sj[lo : hi + 1] = _quantize_symbol(Xj[lo : hi + 1], float(alpha[b]))
            # Place this subframe in the packed output (column-major subframe layout)
            S_out[:, 0].reshape(128, 8, order="F")[:, j] = Sj
        return S_out, sfc, G_arr.astype(np.float64)
    # Long frames
    if X.shape == (1024,):
        Xv = X
    elif X.shape == (1024, 1):
        Xv = X[:, 0]
    else:
        raise ValueError("For non-ESH, frame_F must have shape (1024,) or (1024, 1).")
    if SMR.shape == (NB,):
        SMRv = SMR
    elif SMR.shape == (NB, 1):
        SMRv = SMR[:, 0]
    else:
        raise ValueError(f"For non-ESH, SMR must have shape ({NB},) or ({NB}, 1).")
    T = _threshold_T_from_SMR(Xv, SMRv, bands)
    alpha0 = _alpha_initial_from_frame_max(Xv)
    alpha = np.full((NB,), alpha0, dtype=np.int64)
    for b, (lo, hi) in enumerate(bands):
        alpha[b] = _best_alpha_for_band(
            X=Xv, lo=lo, hi=hi, T_b=float(T[b]),
            alpha0=int(alpha[b]),
            alpha_min=-4096,
            alpha_max=4096,
        )
    alpha = _enforce_max_diff(alpha, MAX_SFC_DIFF)
    sfc: ScaleFactors = np.zeros((NB, 1), dtype=np.int64)
    sfc[0, 0] = int(alpha[0])
    for b in range(1, NB):
        sfc[b, 0] = int(alpha[b] - alpha[b - 1])
    G: float = float(alpha[0])
    S_vec = np.zeros((1024,), dtype=np.int64)
    for b, (lo, hi) in enumerate(bands):
        S_vec[lo : hi + 1] = _quantize_symbol(Xv[lo : hi + 1], float(alpha[b]))
    return S_vec.reshape(1024, 1), sfc, G
 def aac_i_quantizer(
    S: QuantizedSymbols,
    sfc: ScaleFactors,
    G: GlobalGain,
    frame_type: FrameType,
 ) -> FrameChannelF:
    """
    Inverse quantizer (iQuantizer) for one channel.
    Reconstructs MDCT coefficients from quantized symbols and DPCM scalefactors.
    Parameters
    ----------
    S : QuantizedSymbols
        Quantized symbols, shape (1024, 1) (or any array with 1024 elements).
    sfc : ScaleFactors
        DPCM-coded scalefactors.
        Shapes:
        - Long: (NB, 1)
        - ESH: (NB, 8)
    G : GlobalGain
        Global gain (not strictly required if sfc includes sfc(0)=alpha(0)).
        Present for API compatibility with the assignment.
    frame_type : FrameType
        AAC frame type.
    Returns
    -------
    FrameChannelF
        Reconstructed MDCT coefficients:
        - ESH: (128, 8)
        - Long: (1024, 1)
    """
    bands = _band_slices(frame_type)
    NB = len(bands)
    S_flat = np.asarray(S, dtype=np.int64).reshape(-1)
    if S_flat.shape[0] != 1024:
        raise ValueError("S must contain 1024 symbols.")
    if frame_type == "ESH":
        sfc = np.asarray(sfc, dtype=np.int64)
        if sfc.shape != (NB, 8):
            raise ValueError(f"For ESH, sfc must have shape ({NB}, 8).")
        S_128x8 = _esh_unpack_from_1024(S_flat)
        Xrec = np.zeros((128, 8), dtype=np.float64)
        for j in range(8):
            alpha = np.zeros((NB,), dtype=np.int64)
            alpha[0] = int(sfc[0, j])
            for b in range(1, NB):
                alpha[b] = int(alpha[b - 1] + sfc[b, j])
            Xj = np.zeros((128,), dtype=np.float64)
            for b, (lo, hi) in enumerate(bands):
                Xj[lo : hi + 1] = _dequantize_symbol(S_128x8[lo : hi + 1, j].astype(np.int64), float(alpha[b]))
            Xrec[:, j] = Xj
        return Xrec
    sfc = np.asarray(sfc, dtype=np.int64)
    if sfc.shape != (NB, 1):
        raise ValueError(f"For non-ESH, sfc must have shape ({NB}, 1).")
    alpha = np.zeros((NB,), dtype=np.int64)
    alpha[0] = int(sfc[0, 0])
    for b in range(1, NB):
        alpha[b] = int(alpha[b - 1] + sfc[b, 0])
    Xrec = np.zeros((1024,), dtype=np.float64)
    for b, (lo, hi) in enumerate(bands):
        Xrec[lo : hi + 1] = _dequantize_symbol(S_flat[lo : hi + 1], float(alpha[b]))
    return Xrec.reshape(1024, 1)
--- a/source/core/aac_snr_db.py
+++ b/source/core/aac_snr_db.py
@ -1,60 +0,0 @@
 # ------------------------------------------------------------
 # AAC Coder/Decoder - SNR dB calculator
 #
 # Multimedia course at Aristotle University of
 # Thessaloniki (AUTh)
 #
 # Author:
 #   Christos Choutouridis (ΑΕΜ 8997)
 #   cchoutou@ece.auth.gr
 #
 # Description:
 #   This module implements SNR calculation in dB
 # ------------------------------------------------------------
 from __future__ import annotations
 from core.aac_types import StereoSignal
 import numpy as np
 def snr_db(x_ref: StereoSignal, x_hat: StereoSignal) -> float:
    """
    Compute overall SNR (dB) over all samples and channels after aligning lengths.
    Parameters
    ----------
    x_ref : StereoSignal
        Reference stereo stream.
    x_hat : StereoSignal
        Reconstructed stereo stream.
    Returns
    -------
    float
        SNR in dB.
        - Returns +inf if noise power is zero.
        - Returns -inf if signal power is zero.
    """
    x_ref = np.asarray(x_ref, dtype=np.float64)
    x_hat = np.asarray(x_hat, dtype=np.float64)
    if x_ref.ndim == 1:
        x_ref = x_ref.reshape(-1, 1)
    if x_hat.ndim == 1:
        x_hat = x_hat.reshape(-1, 1)
    n = min(x_ref.shape[0], x_hat.shape[0])
    c = min(x_ref.shape[1], x_hat.shape[1])
    x_ref = x_ref[:n, :c]
    x_hat = x_hat[:n, :c]
    err = x_ref - x_hat
    ps = float(np.sum(x_ref * x_ref))
    pn = float(np.sum(err * err))
    if pn <= 0.0:
        return float("inf")
    if ps <= 0.0:
        return float("-inf")
    return float(10.0 * np.log10(ps / pn))
--- a/source/core/aac_ssc.py
+++ b/source/core/aac_ssc.py
@ -173,10 +173,10 @@ def _stereo_merge(ft_l: FrameType, ft_r: FrameType) -> FrameType:
 # -----------------------------------------------------------------------------
-# Public Function prototypes (Level 1)
+# Public Function prototypes
 # -----------------------------------------------------------------------------
-def aac_SSC(frame_T: FrameT, next_frame_T: FrameT, prev_frame_type: FrameType) -> FrameType:
+def aac_ssc(frame_T: FrameT, next_frame_T: FrameT, prev_frame_type: FrameType) -> FrameType:
    """
    Sequence Segmentation Control (SSC).
--- a/source/core/aac_tns.py
+++ b/source/core/aac_tns.py
@ -30,9 +30,7 @@ from __future__ import annotations
 from pathlib import Path
 from typing import Tuple
-import numpy as np
+from core.aac_utils import load_b219_tables
 from scipy.io import loadmat
 from core.aac_configuration import PRED_ORDER, QUANT_STEP, QUANT_MAX
 from core.aac_types import *
@ -40,41 +38,6 @@ from core.aac_types import *
 # Private helpers
 # -----------------------------------------------------------------------------
 _B219_CACHE: dict[str, FloatArray] | None = None
 def _load_b219_tables() -> dict[str, FloatArray]:
    """
    Load TableB219.mat and cache the contents.
    The project layout guarantees that a 'material' directory is discoverable
    from the current working directory (tests and level_123 entrypoints).
    Returns
    -------
    dict[str, FloatArray]
        Keys:
        - "B219a": long bands table (for K=1024 MDCT lines)
        - "B219b": short bands table (for K=128 MDCT lines)
    """
    global _B219_CACHE
    if _B219_CACHE is not None:
        return _B219_CACHE
    mat_path = Path("material") / "TableB219.mat"
    if not mat_path.exists():
        raise FileNotFoundError("Could not locate material/TableB219.mat in the current working directory.")
    d = loadmat(str(mat_path))
    if "B219a" not in d or "B219b" not in d:
        raise ValueError("TableB219.mat missing required variables B219a and/or B219b.")
    _B219_CACHE = {
        "B219a": np.asarray(d["B219a"], dtype=np.float64),
        "B219b": np.asarray(d["B219b"], dtype=np.float64),
    }
    return _B219_CACHE
 def _band_ranges_for_kcount(k_count: int) -> BandRanges:
    """
@ -92,7 +55,7 @@ def _band_ranges_for_kcount(k_count: int) -> BandRanges:
    BandRanges (list[tuple[int, int]])
        Each tuple is (start_k, end_k) inclusive.
    """
-    tables = _load_b219_tables()
+    tables = load_b219_tables()
    if k_count == 1024:
        tbl = tables["B219a"]
    elif k_count == 128:
@ -411,7 +374,9 @@ def _tns_one_vector(x: MdctCoeffs) -> tuple[MdctCoeffs, MdctCoeffs]:
    sw = _compute_sw(x)
    eps = 1e-12
-    xw = np.where(sw > eps, x / sw, 0.0)
+    xw = np.zeros_like(x, dtype=np.float64)
    mask = sw > eps
    np.divide(x, sw, out=xw, where=mask)
    a = _lpc_coeffs(xw, PRED_ORDER)
    a_q = _quantize_coeffs(a)
@ -425,7 +390,7 @@ def _tns_one_vector(x: MdctCoeffs) -> tuple[MdctCoeffs, MdctCoeffs]:
 # -----------------------------------------------------------------------------
-# Public Functions (Level 2)
+# Public Functions
 # -----------------------------------------------------------------------------
 def aac_tns(frame_F_in: FrameChannelF, frame_type: FrameType) -> Tuple[FrameChannelF, TnsCoeffs]:
--- a/source/core/aac_types.py
+++ b/source/core/aac_types.py
@ -193,6 +193,61 @@ Bark-band index ranges [start, end] (inclusive) for MDCT lines.
 Used by TNS to map MDCT indices k to Bark bands.
 """
 BarkTable: TypeAlias = FloatArray
 """
 Psychoacoustic Bark band table loaded from TableB219.mat.
 Typical shapes:
 - Long: (69, 6)
 - Short: (42, 6)
 """
 BandIndexArray: TypeAlias = NDArray[np.int_]
 """
 Array of FFT bin indices per psychoacoustic band.
 """
 BandValueArray: TypeAlias = FloatArray
 """
 Per-band psychoacoustic values (e.g. Bark position, thresholds).
 """
 # Quantizer-related semantic aliases
 QuantizedSymbols: TypeAlias = NDArray[np.generic]
 """
 Quantized MDCT symbols S(k).
 Shapes:
 - Always (1024, 1) at the quantizer output (ESH packed to 1024 symbols).
 """
 ScaleFactors: TypeAlias = NDArray[np.generic]
 """
 DPCM-coded scalefactors sfc(b) = alpha(b) - alpha(b-1).
 Shapes:
 - Long frames: (NB, 1)
 - ESH frames: (NB, 8)
 """
 GlobalGain: TypeAlias = float | NDArray[np.generic]
 """
 Global gain G = alpha(0).
 - Long frames: scalar float
 - ESH frames: array shape (1, 8)
 """
 # Huffman semantic aliases
 HuffmanBitstream: TypeAlias = str
 """Huffman-coded bitstream stored as a string of '0'/'1'."""
 HuffmanCodebook: TypeAlias = int
 """Huffman codebook id (e.g., 0..11)."""
 # -----------------------------------------------------------------------------
 # Level 1 AAC sequence payload types
 # -----------------------------------------------------------------------------
@ -280,3 +335,77 @@ Level 2 adds:
 and stores:
 - per-channel "frame_F" after applying TNS.
 """
 # -----------------------------------------------------------------------------
 # Level 3 AAC sequence payload types (Quantizer + Huffman)
 # -----------------------------------------------------------------------------
 class AACChannelFrameF3(TypedDict):
    """
    Per-channel payload for aac_seq_3[i]["chl"] or ["chr"] (Level 3).
    Keys
    ----
    tns_coeffs:
        Quantized TNS predictor coefficients for ONE channel.
        Shapes:
        - ESH: (PRED_ORDER, 8)
        - else: (PRED_ORDER, 1)
    T:
        Psychoacoustic thresholds per band.
        Shapes:
        - ESH: (NB, 8)
        - else: (NB, 1)
        Note: Stored for completeness / debugging; not entropy-coded.
    G:
        Quantized global gains.
        Shapes:
        - ESH: (1, 8)  (one per short subframe)
        - else: scalar (or compatible np scalar)
    sfc:
        Huffman-coded scalefactor differences (DPCM sequence).
    stream:
        Huffman-coded MDCT quantized symbols S(k) (packed to 1024 symbols).
    codebook:
        Huffman codebook id used for MDCT symbols (stream).
        (Scalefactors typically use fixed codebook 11 and do not need to store it.)
    """
    tns_coeffs: TnsCoeffs
    T: FloatArray
    G: FloatArray | float
    sfc: HuffmanBitstream
    stream: HuffmanBitstream
    codebook: HuffmanCodebook
 class AACSeq3Frame(TypedDict):
    """
    One frame dictionary element of aac_seq_3 (Level 3).
    """
    frame_type: FrameType
    win_type: WinType
    chl: AACChannelFrameF3
    chr: AACChannelFrameF3
 AACSeq3: TypeAlias = List[AACSeq3Frame]
 """
 AAC sequence for Level 3:
 List of length K (K = number of frames).
 Each element is a dict with keys:
 - "frame_type", "win_type", "chl", "chr"
 Level 3 adds (per channel):
 - "tns_coeffs"
 - "T" thresholds (not entropy-coded)
 - "G" global gain(s)
 - "sfc" Huffman-coded scalefactor differences
 - "stream" Huffman-coded MDCT quantized symbols
 - "codebook" Huffman codebook for MDCT symbols
 """
--- a/source/core/aac_utils.py
+++ b/source/core/aac_utils.py
@ -0,0 +1,270 @@
 # ------------------------------------------------------------
 # AAC Coder/Decoder - AAC Utilities
 #
 # Multimedia course at Aristotle University of
 # Thessaloniki (AUTh)
 #
 # Author:
 #   Christos Choutouridis (ΑΕΜ 8997)
 #   cchoutou@ece.auth.gr
 #
 # Description:
 #   Shared utility functions used across AAC encoder/decoder levels.
 #
 #   This module currently provides:
 #   - MDCT / IMDCT conversions
 #   - Signal-to-Noise Ratio (SNR) computation in dB
 #   - Loading and access helpers for psychoacoustic band tables
 #     (TableB219.mat, Tables B.2.1.9a / B.2.1.9b of the AAC specification)
 # ------------------------------------------------------------
 from __future__ import annotations
 import numpy as np
 from pathlib import Path
 from scipy.io import loadmat
 from core.aac_types import *
 # -----------------------------------------------------------------------------
 # Global cached data
 # -----------------------------------------------------------------------------
 # Cached contents of TableB219.mat to avoid repeated disk I/O.
 # Keys:
 #   - "B219a": long-window psychoacoustic bands (69 bands, FFT size 2048)
 #   - "B219b": short-window psychoacoustic bands (42 bands, FFT size 256)
 B219_CACHE: dict[str, BarkTable] | None = None
 # -----------------------------------------------------------------------------
 # MDCT / IMDCT
 # -----------------------------------------------------------------------------
 def mdct(s: TimeSignal) -> MdctCoeffs:
    """
    MDCT (direct form) as specified in the assignment.
    Parameters
    ----------
    s : TimeSignal
        Windowed time samples, 1-D array of length N (N = 2048 or 256).
    Returns
    -------
    MdctCoeffs
        MDCT coefficients, 1-D array of length N/2.
    Definition
    ----------
    X[k] = 2 * sum_{n=0..N-1} s[n] * cos((2*pi/N) * (n + n0) * (k + 1/2)),
    where n0 = (N/2 + 1)/2.
    """
    s = np.asarray(s, dtype=np.float64).reshape(-1)
    N = int(s.shape[0])
    if N not in (2048, 256):
        raise ValueError("MDCT input length must be 2048 or 256.")
    n0 = (N / 2.0 + 1.0) / 2.0
    n = np.arange(N, dtype=np.float64) + n0
    k = np.arange(N // 2, dtype=np.float64) + 0.5
    C = np.cos((2.0 * np.pi / N) * np.outer(n, k))  # (N, N/2)
    X = 2.0 * (s @ C)  # (N/2,)
    return X
 def imdct(X: MdctCoeffs) -> TimeSignal:
    """
    IMDCT (direct form) as specified in the assignment.
    Parameters
    ----------
    X : MdctCoeffs
        MDCT coefficients, 1-D array of length K (K = 1024 or 128).
    Returns
    -------
    TimeSignal
        Reconstructed time samples, 1-D array of length N = 2K.
    Definition
    ----------
    s[n] = (2/N) * sum_{k=0..N/2-1} X[k] * cos((2*pi/N) * (n + n0) * (k + 1/2)),
    where n0 = (N/2 + 1)/2.
    """
    X = np.asarray(X, dtype=np.float64).reshape(-1)
    K = int(X.shape[0])
    if K not in (1024, 128):
        raise ValueError("IMDCT input length must be 1024 or 128.")
    N = 2 * K
    n0 = (N / 2.0 + 1.0) / 2.0
    n = np.arange(N, dtype=np.float64) + n0
    k = np.arange(K, dtype=np.float64) + 0.5
    C = np.cos((2.0 * np.pi / N) * np.outer(n, k))  # (N, K)
    s = (2.0 / N) * (C @ X)  # (N,)
    return s
 # -----------------------------------------------------------------------------
 # Signal quality metrics
 # -----------------------------------------------------------------------------
 def snr_db(x_ref: StereoSignal, x_hat: StereoSignal) -> float:
    """
    Compute the overall Signal-to-Noise Ratio (SNR) in dB.
    The SNR is computed over all available samples and channels,
    after conservatively aligning the two signals to their common
    length and channel count.
    Parameters
    ----------
    x_ref : StereoSignal
        Reference (original) signal.
        Typical shape: (N, 2) for stereo.
    x_hat : StereoSignal
        Reconstructed or processed signal.
        Typical shape: (M, 2) for stereo.
    Returns
    -------
    float
        SNR in dB.
        - +inf if the noise power is zero (perfect reconstruction).
        - -inf if the reference signal power is zero.
    """
    x_ref = np.asarray(x_ref, dtype=np.float64)
    x_hat = np.asarray(x_hat, dtype=np.float64)
    # Ensure 2-D shape: (samples, channels)
    if x_ref.ndim == 1:
        x_ref = x_ref.reshape(-1, 1)
    if x_hat.ndim == 1:
        x_hat = x_hat.reshape(-1, 1)
    # Align lengths and channel count conservatively
    n = min(x_ref.shape[0], x_hat.shape[0])
    c = min(x_ref.shape[1], x_hat.shape[1])
    x_ref = x_ref[:n, :c]
    x_hat = x_hat[:n, :c]
    err = x_ref - x_hat
    ps = float(np.sum(x_ref * x_ref))     # signal power
    pn = float(np.sum(err * err))          # noise power
    if pn <= 0.0:
        return float("inf")
    if ps <= 0.0:
        return float("-inf")
    return float(10.0 * np.log10(ps / pn))
 # -----------------------------------------------------------------------------
 # Psychoacoustic band tables (TableB219.mat)
 # -----------------------------------------------------------------------------
 def load_b219_tables() -> dict[str, BarkTable]:
    """
    Load and cache psychoacoustic band tables from TableB219.mat.
    The assignment/project layout assumes that a 'material' directory
    is available in the current working directory when running:
    - tests
    - level_1 / level_2 / level_3 entrypoints
    This function loads the tables once and caches them for subsequent calls.
    Returns
    -------
    dict[str, BarkTable]
        Dictionary with the following entries:
        - "B219a": long-window psychoacoustic table
                   (69 bands, FFT size 2048 / 1024 spectral lines)
        - "B219b": short-window psychoacoustic table
                   (42 bands, FFT size 256 / 128 spectral lines)
    """
    global B219_CACHE
    if B219_CACHE is not None:
        return B219_CACHE
    mat_path = Path("material") / "TableB219.mat"
    if not mat_path.exists():
        raise FileNotFoundError(
            "Could not locate material/TableB219.mat in the current working directory."
        )
    data = loadmat(str(mat_path))
    if "B219a" not in data or "B219b" not in data:
        raise ValueError(
            "TableB219.mat missing required variables 'B219a' and/or 'B219b'."
        )
    B219_CACHE = {
        "B219a": np.asarray(data["B219a"], dtype=np.float64),
        "B219b": np.asarray(data["B219b"], dtype=np.float64),
    }
    return B219_CACHE
 def get_table(frame_type: FrameType) -> tuple[BarkTable, int]:
    """
    Select the appropriate psychoacoustic band table and FFT size
    based on the AAC frame type.
    Parameters
    ----------
    frame_type : FrameType
        AAC frame type ("OLS", "LSS", "ESH", "LPS").
    Returns
    -------
    table : BarkTable
        Psychoacoustic band table:
        - B219a for long frames
        - B219b for ESH short subframes
    N : int
        FFT size corresponding to the table:
        - 2048 for long frames
        - 256 for short frames (ESH)
    """
    tables = load_b219_tables()
    if frame_type == "ESH":
        return tables["B219b"], 256
    return tables["B219a"], 2048
 def band_limits(
    table: BarkTable,
 ) -> tuple[BandIndexArray, BandIndexArray, BandValueArray, BandValueArray]:
    """
    Extract per-band metadata from a TableB2.1.9 psychoacoustic table.
    The column layout follows the provided TableB219.mat file and the
    AAC specification tables B.2.1.9a / B.2.1.9b.
    Parameters
    ----------
    table : BarkTable
        Psychoacoustic band table (B219a or B219b).
    Returns
    -------
    wlow : BandIndexArray
        Lower FFT bin index (inclusive) for each band.
    whigh : BandIndexArray
        Upper FFT bin index (inclusive) for each band.
    bval : BandValueArray
        Bark-scale (or equivalent) band position values.
        Used in the spreading function.
    qthr_db : BandValueArray
        Threshold in quiet for each band, in dB.
    """
    wlow = table[:, 1].astype(int)
    whigh = table[:, 2].astype(int)
    bval = table[:, 4].astype(np.float64)
    qthr_db = table[:, 5].astype(np.float64)
    return wlow, whigh, bval, qthr_db
--- a/source/core/tests/test_aac_coder_decoder.py
+++ b/source/core/tests/test_aac_coder_decoder.py
@ -19,10 +19,10 @@ import numpy as np
 import pytest
 import soundfile as sf
-from core.aac_coder import aac_coder_1, aac_coder_2, aac_read_wav_stereo_48k
+from core.aac_coder import aac_coder_1, aac_coder_2, aac_coder_3, aac_read_wav_stereo_48k
-from core.aac_decoder import aac_decoder_1, aac_decoder_2, aac_remove_padding
+from core.aac_decoder import aac_decoder_1, aac_decoder_2, aac_decoder_3, aac_remove_padding
 from core.aac_utils import snr_db
 from core.aac_types import *
 from core.aac_snr_db import snr_db
 # Helper "fixtures" for aac_coder_1 / i_aac_coder_1
@ -222,4 +222,153 @@ def test_end_to_end_level_2_high_snr(tmp_stereo_wav: Path, tmp_path: Path) -> No
    assert int(fs_hat) == 48000
    snr = snr_db(x_ref, x_hat)
-    assert snr > 75.0
+    assert snr > 80
 # -----------------------------------------------------------------------------
 # Level 3 tests (Quantizer + Huffman)
 # -----------------------------------------------------------------------------
@pytest.fixture(scope="module")
 def wav_in_path() -> Path:
    """
    Input WAV used for end-to-end tests.
    This should point to the provided test audio under material/.
    Adjust this path if your project layout differs.
    """
    # Typical layout in this project:
    # source/material/LicorDeCalandraca.wav
    return Path(__file__).resolve().parents[2] / "material" / "LicorDeCalandraca.wav"
 def _assert_level3_frame_schema(frame: AACSeq3Frame) -> None:
    """
    Validate Level-3 per-frame schema (keys + basic types only).
    """
    assert "frame_type" in frame
    assert "win_type" in frame
    assert "chl" in frame
    assert "chr" in frame
    for ch_key in ("chl", "chr"):
        ch = frame[ch_key]  # type: ignore[index]
        assert "tns_coeffs" in ch
        assert "T" in ch
        assert "G" in ch
        assert "sfc" in ch
        assert "stream" in ch
        assert "codebook" in ch
        assert isinstance(ch["sfc"], str)
        assert isinstance(ch["stream"], str)
        assert isinstance(ch["codebook"], int)
        # Arrays: only check they are numpy arrays with expected dtype categories.
        assert isinstance(ch["tns_coeffs"], np.ndarray)
        assert isinstance(ch["T"], np.ndarray)
        # Global gain: long frames may be scalar float, ESH may be ndarray
        assert np.isscalar(ch["G"]) or isinstance(ch["G"], np.ndarray)
 def test_aac_coder_3_seq_schema_and_shapes(wav_in_path: Path, tmp_path: Path) -> None:
    """
    Contract test:
    - aac_coder_3 returns AACSeq3
    - Per-frame keys exist and types are consistent
    - Basic shape expectations hold for ESH vs non-ESH cases
    Note:
    This test uses a short excerpt (a few frames) to keep runtime bounded.
    """
    # Use only a few frames to avoid long runtimes in the quantizer loop.
    hop = 1024
    win = 2048
    n_frames = 4
    n_samples = win + (n_frames - 1) * hop
    x, fs = aac_read_wav_stereo_48k(wav_in_path)
    x_short = x[:n_samples, :]
    short_wav = tmp_path / "input_short.wav"
    sf.write(str(short_wav), x_short, fs)
    aac_seq_3: AACSeq3 = aac_coder_3(short_wav)
    assert isinstance(aac_seq_3, list)
    assert len(aac_seq_3) > 0
    for fr in aac_seq_3:
        _assert_level3_frame_schema(fr)
        frame_type = fr["frame_type"]
        for ch_key in ("chl", "chr"):
            ch = fr[ch_key]  # type: ignore[index]
            tns = np.asarray(ch["tns_coeffs"])
            if frame_type == "ESH":
                assert tns.ndim == 2
                assert tns.shape[1] == 8
            else:
                assert tns.ndim == 2
                assert tns.shape[1] == 1
            T = np.asarray(ch["T"])
            if frame_type == "ESH":
                assert T.ndim == 2
                assert T.shape[1] == 8
            else:
                assert T.ndim == 2
                assert T.shape[1] == 1
            G = ch["G"]
            if frame_type == "ESH":
                assert isinstance(G, np.ndarray)
                assert np.asarray(G).shape == (1, 8)
            else:
                assert np.isscalar(G)
            assert isinstance(ch["sfc"], str)
            assert isinstance(ch["stream"], str)
 def test_end_to_end_level_3_high_snr(wav_in_path: Path, tmp_path: Path) -> None:
    """
    End-to-end test for Level 3 (Quantizer + Huffman):
    coder_3 -> decoder_3 should reconstruct a waveform with acceptable SNR.
    Notes
    -----
    - Level 3 includes quantization, so SNR is expected to be lower than Level 1/2.
    - We intentionally use a short excerpt (few frames) to keep runtime bounded,
      since the reference quantizer implementation is computationally expensive.
    """
    # Use only a few frames to avoid long runtimes.
    hop = 1024
    win = 2048
    n_frames = 4
    n_samples = win + (n_frames - 1) * hop
    x_ref, fs = aac_read_wav_stereo_48k(wav_in_path)
    x_short = x_ref[:n_samples, :]
    short_wav = tmp_path / "input_short_l3.wav"
    sf.write(str(short_wav), x_short, fs)
    out_wav = tmp_path / "decoded_level3.wav"
    aac_seq_3: AACSeq3 = aac_coder_3(short_wav)
    y_hat: StereoSignal = aac_decoder_3(aac_seq_3, out_wav)
    # Align lengths defensively (padding removal may differ by a few samples)
    n = min(x_short.shape[0], y_hat.shape[0])
    x2 = x_short[:n, :]
    y2 = y_hat[:n, :]
    s = snr_db(x2, y2)
    # Conservative threshold: Level 3 is lossy by design.
    assert s > 10.0
--- a/source/core/tests/test_filterbank.py
+++ b/source/core/tests/test_filterbank.py
@ -17,7 +17,7 @@ from typing import Sequence
 import pytest
 from core.aac_filterbank import aac_filter_bank, aac_i_filter_bank
-from core.aac_snr_db import snr_db
+from core.aac_utils import snr_db
 from core.aac_types import *
 # Helper fixtures for filterbank
--- a/source/core/tests/test_filterbank_internal.py
+++ b/source/core/tests/test_filterbank_internal.py
@ -1,117 +0,0 @@
 # ------------------------------------------------------------
 # AAC Coder/Decoder - Filterbank internal (mdct) Tests
 #
 # Multimedia course at Aristotle University of
 # Thessaloniki (AUTh)
 #
 # Author:
 #   Christos Choutouridis (ΑΕΜ 8997)
 #   cchoutou@ece.auth.gr
 #
 # Description:
 #   Tests for Filterbank internal MDCT/IMDCT functionality.
 # ------------------------------------------------------------
 from __future__ import annotations
 import numpy as np
 import pytest
 from core.aac_filterbank import _imdct, _mdct
 from core.aac_types import FloatArray, TimeSignal, MdctCoeffs
 def _assert_allclose(a: FloatArray, b: FloatArray, *, rtol: float, atol: float) -> None:
    """
    Helper for consistent tolerances across tests.
    """
    np.testing.assert_allclose(a, b, rtol=rtol, atol=atol)
 def _estimate_gain(y: MdctCoeffs, x: MdctCoeffs) -> float:
    """
    Estimate scalar gain g such that y ~= g*x in least-squares sense.
    """
    denom = float(np.dot(x, x))
    if denom == 0.0:
        return 0.0
    return float(np.dot(y, x) / denom)
 tolerance = 1e-10
@pytest.mark.parametrize("N", [256, 2048])
 def test_mdct_imdct_mdct_identity_up_to_gain(N: int) -> None:
    """
    Consistency test in coefficient domain:
      mdct(imdct(X)) ~= g * X
    For the chosen (non-orthonormal) scaling, g is expected to be close to 2.
    """
    rng = np.random.default_rng(0)
    K = N // 2
    X: MdctCoeffs = rng.normal(size=K).astype(np.float64)
    x: TimeSignal = _imdct(X)
    X_hat: MdctCoeffs = _mdct(x)
    g = _estimate_gain(X_hat, X)
    _assert_allclose(X_hat, g * X, rtol=tolerance, atol=tolerance)
    _assert_allclose(np.array([g], dtype=np.float64), np.array([2.0], dtype=np.float64), rtol=tolerance, atol=tolerance)
@pytest.mark.parametrize("N", [256, 2048])
 def test_mdct_linearity(N: int) -> None:
    """
    Linearity test:
      mdct(a*x + b*y) == a*mdct(x) + b*mdct(y)
    """
    rng = np.random.default_rng(1)
    x: TimeSignal = rng.normal(size=N).astype(np.float64)
    y: TimeSignal = rng.normal(size=N).astype(np.float64)
    a = 0.37
    b = -1.12
    left: MdctCoeffs = _mdct(a * x + b * y)
    right: MdctCoeffs = a * _mdct(x) + b * _mdct(y)
    _assert_allclose(left, right, rtol=tolerance, atol=tolerance)
@pytest.mark.parametrize("N", [256, 2048])
 def test_imdct_linearity(N: int) -> None:
    """
    Linearity test for IMDCT:
      imdct(a*X + b*Y) == a*imdct(X) + b*imdct(Y)
    """
    rng = np.random.default_rng(2)
    K = N // 2
    X: MdctCoeffs = rng.normal(size=K).astype(np.float64)
    Y: MdctCoeffs = rng.normal(size=K).astype(np.float64)
    a = -0.5
    b = 2.0
    left: TimeSignal = _imdct(a * X + b * Y)
    right: TimeSignal = a * _imdct(X) + b * _imdct(Y)
    _assert_allclose(left, right, rtol=tolerance, atol=tolerance)
@pytest.mark.parametrize("N", [256, 2048])
 def test_mdct_imdct_outputs_are_finite(N: int) -> None:
    """
    Sanity test: no NaN/inf on random inputs.
    """
    rng = np.random.default_rng(3)
    K = N // 2
    x: TimeSignal = rng.normal(size=N).astype(np.float64)
    X: MdctCoeffs = rng.normal(size=K).astype(np.float64)
    X1 = _mdct(x)
    x1 = _imdct(X)
    assert np.isfinite(X1).all()
    assert np.isfinite(x1).all()
--- a/source/core/tests/test_huffman.py
+++ b/source/core/tests/test_huffman.py
@ -0,0 +1,139 @@
 # ------------------------------------------------------------
 # AAC Coder/Decoder - Huffman Wrapper Tests (Level 3)
 #
 # Multimedia course at Aristotle University of
 # Thessaloniki (AUTh)
 #
 # Author:
 #   Christos Choutouridis (ΑΕΜ 8997)
 #   cchoutou@ece.auth.gr
 #
 # Description:
 #   Contract tests for the Huffman coding stage, using the provided
 #   Huffman utilities (material/huff_utils.py).
 #
 #   The Huffman encoder/decoder itself is GIVEN by the assignment and
 #   is not re-implemented here. These tests only verify that:
 #
 #   - The wrapper functions (aac_encode_huff / aac_decode_huff) expose
 #     the API described in the assignment.
 #   - Forced codebook selection works as expected (e.g. scalefactors).
 #   - Tuple-based Huffman coding semantics are respected.
 #
 # Notes on tuple coding:
 #   Huffman coding operates on tuples of symbols. As a result,
 #   decode(encode(x)) may return extra trailing symbols due to padding.
 #   The AAC decoder always knows the true section length (from band limits)
 #   and truncates accordingly. Therefore, these tests only enforce that
 #   the decoded PREFIX matches the original data.
 # ------------------------------------------------------------
 from __future__ import annotations
 import numpy as np
 import pytest
 from core.aac_huffman import aac_encode_huff, aac_decode_huff
 from material.huff_utils import load_LUT
 # -----------------------------------------------------------------------------
 # Fixtures
 # -----------------------------------------------------------------------------
@pytest.fixture(scope="module")
 def huff_LUT():
    """
    Load Huffman Look-Up Tables (LUTs) once per test module.
    The LUTs are provided by the assignment (huffCodebooks.mat) via
    material.huff_utils.load_LUT().
    """
    return load_LUT()
 # -----------------------------------------------------------------------------
 # Roundtrip (prefix) tests
 # -----------------------------------------------------------------------------
@pytest.mark.parametrize(
    "coeff_sec",
    [
        np.array([1, -1, 2, -2, 0, 0, 3], dtype=np.int64),
        np.array([0, 0, 0, 0], dtype=np.int64),
        np.array([5], dtype=np.int64),
        np.array([-3, -3, -3, -3], dtype=np.int64),
    ],
 )
 def test_huffman_roundtrip_prefix_matches(
    coeff_sec: np.ndarray,
    huff_LUT,
 ) -> None:
    """
    Contract test for Huffman encode/decode.
    Guarantees:
    - Encoding followed by decoding does not crash.
    - The decoded output has at least as many symbols as the input.
    - The prefix of the decoded output matches the original coefficients.
    Rationale:
    Huffman tuple coding may introduce padding, so exact length equality
    is NOT required or expected.
    """
    huff_sec, cb = aac_encode_huff(coeff_sec, huff_LUT)
    dec = aac_decode_huff(huff_sec, cb, huff_LUT)
    if cb == 0:
        # Codebook 0 represents an all-zero section.
        assert np.all(coeff_sec == 0)
        assert dec.size == 0
        return
    assert dec.size >= coeff_sec.size
    np.testing.assert_array_equal(dec[: coeff_sec.size], coeff_sec)
 # -----------------------------------------------------------------------------
 # Forced codebook tests
 # -----------------------------------------------------------------------------
 def test_huffman_force_codebook_returns_requested_codebook(huff_LUT) -> None:
    """
    Verify forced codebook selection.
    According to the assignment, scalefactors must be encoded using
    Huffman codebook 11. This test checks that:
    - The requested codebook is actually used.
    - The decoded prefix matches the original scalefactors.
    """
    scalefactors = np.array([10, -2, 1, 0, -1, 3], dtype=np.int64)
    huff_sec, cb = aac_encode_huff(
        scalefactors,
        huff_LUT,
        force_codebook=11,
    )
    assert cb == 11
    assert isinstance(huff_sec, str)
    dec = aac_decode_huff(huff_sec, cb, huff_LUT)
    assert dec.size >= scalefactors.size
    np.testing.assert_array_equal(dec[: scalefactors.size], scalefactors)
 # -----------------------------------------------------------------------------
 # Error handling
 # -----------------------------------------------------------------------------
 def test_huffman_invalid_codebook_raises(huff_LUT) -> None:
    """
    Decoding with an invalid Huffman codebook index must raise an error.
    """
    with pytest.raises(Exception):
        _ = aac_decode_huff(
            huff_sec="010101",
            huff_codebook=99,
            huff_LUT=huff_LUT,
        )
--- a/source/core/tests/test_psycho.py
+++ b/source/core/tests/test_psycho.py
@ -0,0 +1,253 @@
 # ------------------------------------------------------------
 # AAC Coder/Decoder - Psychoacoustic Model Tests
 #
 # Multimedia course at Aristotle University of
 # Thessaloniki (AUTh)
 #
 # Author:
 #   Christos Choutouridis (ΑΕΜ 8997)
 #
 # Description:
 #   Contract + sanity tests for the psychoacoustic model (core.aac_psycho).
 #
 #   These tests focus on:
 #   - output shapes per frame_type (long vs ESH),
 #   - numerical sanity (finite, non-negative),
 #   - deterministic behavior,
 #   - ESH central-region dependency (outer regions must not affect result),
 #   - basic input validation (length checks).
 #
 #   We intentionally avoid asserting exact numeric values, because the model
 #   includes FFT operations and table-driven psychoacoustic parameters.
 # ------------------------------------------------------------
 from __future__ import annotations
 import numpy as np
 import pytest
 from core.aac_psycho import aac_psycho
 from core.aac_types import FrameChannelT, FrameType
 # -----------------------------------------------------------------------------
 # Helpers
 # -----------------------------------------------------------------------------
 def _make_frames(
    *,
    kind: str,
    amp: float = 1.0,
    seed: int = 0,
 ) -> tuple[FrameChannelT, FrameChannelT, FrameChannelT]:
    """
    Create (current, prev1, prev2) 2048-sample frames for one channel.
    Parameters
    ----------
    kind : str
        "noise" or "tone".
    amp : float
        Amplitude scaling (applied to all frames).
    seed : int
        RNG seed for reproducibility (noise case).
    Returns
    -------
    tuple[FrameChannelT, FrameChannelT, FrameChannelT]
        Three arrays of shape (2048,), dtype float64.
    """
    if kind == "noise":
        rng = np.random.default_rng(seed)
        x2 = amp * rng.normal(size=2048).astype(np.float64)
        x1 = amp * rng.normal(size=2048).astype(np.float64)
        x0 = amp * rng.normal(size=2048).astype(np.float64)
        return x0, x1, x2
    if kind == "tone":
        # A simple sinusoid which is identical across frames (highly predictable).
        n = np.arange(2048, dtype=np.float64)
        f0 = 13.0  # arbitrary normalized-bin-ish tone (not critical for these tests)
        tone = amp * np.sin(2.0 * np.pi * f0 * n / 2048.0).astype(np.float64)
        return tone, tone.copy(), tone.copy()
    raise ValueError(f"Unknown kind: {kind!r}")
 def _assert_finite_nonnegative(x: np.ndarray) -> None:
    """Utility assertions for psycho outputs."""
    assert np.isfinite(x).all()
    # SMR is a ratio of energies, it should not be negative.
    assert np.min(x) >= 0.0
 # -----------------------------------------------------------------------------
 # Shape / contract tests
 # -----------------------------------------------------------------------------
@pytest.mark.parametrize("frame_type", ["OLS", "LSS", "LPS"])
 def test_psycho_long_shapes(frame_type: FrameType) -> None:
    """
    Contract test:
    For long frame types, psycho returns SMR shape (69,).
    """
    x0, x1, x2 = _make_frames(kind="noise", seed=1, amp=1.0)
    smr = aac_psycho(x0, frame_type, x1, x2)
    assert isinstance(smr, np.ndarray)
    assert smr.shape == (69,)
    _assert_finite_nonnegative(smr)
 def test_psycho_esh_shape() -> None:
    """
    Contract test:
    For ESH, psycho returns SMR shape (42, 8).
    """
    x0, x1, x2 = _make_frames(kind="noise", seed=2, amp=1.0)
    smr = aac_psycho(x0, "ESH", x1, x2)
    assert isinstance(smr, np.ndarray)
    assert smr.shape == (42, 8)
    _assert_finite_nonnegative(smr)
 def test_psycho_is_deterministic_for_same_inputs() -> None:
    """
    Determinism test:
    Psycho must return the same output for identical inputs.
    """
    x0, x1, x2 = _make_frames(kind="noise", seed=3, amp=1.0)
    smr1 = aac_psycho(x0, "OLS", x1, x2)
    smr2 = aac_psycho(x0, "OLS", x1, x2)
    np.testing.assert_allclose(smr1, smr2, rtol=0.0, atol=0.0)
 # -----------------------------------------------------------------------------
 # ESH-specific behavior tests
 # -----------------------------------------------------------------------------
 def test_psycho_esh_ignores_outer_regions() -> None:
    """
    Spec-driven behavior test:
    In this project, ESH uses only the central region of the 2048-sample frame to
    derive the 8 overlapping 256-sample subframes:
        start = 448 + 128*j, j=0..7
    Therefore, changing samples outside [448, 1600) must not affect the output.
    """
    rng = np.random.default_rng(10)
    # Build base frames (current and prev1) with identical central region.
    center_cur = rng.normal(size=1152).astype(np.float64)
    center_prev1 = rng.normal(size=1152).astype(np.float64)
    cur_a = np.zeros(2048, dtype=np.float64)
    cur_b = np.zeros(2048, dtype=np.float64)
    prev1_a = np.zeros(2048, dtype=np.float64)
    prev1_b = np.zeros(2048, dtype=np.float64)
    cur_a[448:1600] = center_cur
    cur_b[448:1600] = center_cur
    prev1_a[448:1600] = center_prev1
    prev1_b[448:1600] = center_prev1
    # Modify only outer regions in the *_b variants.
    cur_b[:448] = rng.normal(size=448)
    cur_b[1600:] = rng.normal(size=448)
    prev1_b[:448] = rng.normal(size=448)
    prev1_b[1600:] = rng.normal(size=448)
    # prev2 is irrelevant for the chosen ESH history convention; keep it fixed.
    prev2 = rng.normal(size=2048).astype(np.float64)
    smr_a = aac_psycho(cur_a, "ESH", prev1_a, prev2)
    smr_b = aac_psycho(cur_b, "ESH", prev1_b, prev2)
    np.testing.assert_allclose(smr_a, smr_b, rtol=0.0, atol=0.0)
 def test_psycho_esh_columns_are_not_all_identical_for_random_input() -> None:
    """
    Sanity test:
    For random input, different ESH subframes should typically produce
    different SMR columns (not a strict requirement, but a strong sanity signal).
    We check that at least one column differs from another beyond a tiny tolerance.
    """
    x0, x1, x2 = _make_frames(kind="noise", seed=11, amp=1.0)
    smr = aac_psycho(x0, "ESH", x1, x2)
    # Compare column 0 vs column 7; for random signals they should differ.
    diff = np.max(np.abs(smr[:, 0] - smr[:, 7]))
    assert diff > 1e-12
 # -----------------------------------------------------------------------------
 # Scaling sanity (avoid fragile numeric targets)
 # -----------------------------------------------------------------------------
 def test_psycho_long_smr_is_mostly_monotone_with_amplitude() -> None:
    """
    Sanity test:
    Increasing signal amplitude should not reduce the SMR for the vast majority
    of Bark bands.
    Due to the use of max(nb, qthr), a small fraction of bands close to the
    threshold-in-quiet boundary may violate strict monotonicity. This is expected
    behavior, so we test a percentage-based criterion instead of a strict one.
    """
    x0, x1, x2 = _make_frames(kind="noise", seed=20, amp=1e3)
    y0, y1, y2 = (2.0 * x0, 2.0 * x1, 2.0 * x2)
    smr1 = aac_psycho(x0, "OLS", x1, x2)
    smr2 = aac_psycho(y0, "OLS", y1, y2)
    eps = 1e-12
    nondecreasing = np.sum(smr2 + eps >= smr1)
    ratio = nondecreasing / smr1.size
    # Expect monotonic behavior for the overwhelming majority of bands.
    assert ratio >= 0.95
 def test_psycho_long_is_approximately_scale_invariant_at_high_level() -> None:
    """
    Sanity test (robust):
    At high levels, SMR should be approximately scale-invariant for most bands.
    Some bands may deviate due to the max(nb, qthr) branch.
    """
    x0, x1, x2 = _make_frames(kind="noise", seed=20, amp=1e3)
    y0, y1, y2 = (2.0 * x0, 2.0 * x1, 2.0 * x2)
    smr1 = aac_psycho(x0, "OLS", x1, x2)
    smr2 = aac_psycho(y0, "OLS", y1, y2)
    rel = np.abs(smr2 - smr1) / np.maximum(np.abs(smr1), 1e-12)
    # Most bands should be close (<= 5%), but allow a small number of outliers.
    close = np.sum(rel <= 5e-2)
    assert close >= (smr1.size - 2)  # allow up to 2 bands to deviate
 # -----------------------------------------------------------------------------
 # Input validation tests
 # -----------------------------------------------------------------------------
 def test_psycho_rejects_wrong_lengths() -> None:
    """
    Contract test:
    aac_psycho requires 2048-sample frames for current/prev1/prev2.
    """
    x = np.zeros(2048, dtype=np.float64)
    bad = np.zeros(2047, dtype=np.float64)
    with pytest.raises(ValueError):
        _ = aac_psycho(bad, "OLS", x, x)
    with pytest.raises(ValueError):
        _ = aac_psycho(x, "OLS", bad, x)
    with pytest.raises(ValueError):
        _ = aac_psycho(x, "OLS", x, bad)
--- a/source/core/tests/test_quantizer.py
+++ b/source/core/tests/test_quantizer.py
@ -0,0 +1,395 @@
 # ------------------------------------------------------------
 # AAC Coder/Decoder - Quantizer Tests
 #
 # Multimedia course at Aristotle University of
 # Thessaloniki (AUTh)
 #
 # Author:
 #   Christos Choutouridis (ΑΕΜ 8997)
 #   cchoutou@ece.auth.gr
 #
 # Description:
 #   Tests for Quantizer / iQuantizer module.
 #
 #   These tests are deliberately "contract-oriented":
 #   - They validate shapes, dtypes and invariants that downstream stages
 #     (e.g., Huffman coding) depend on.
 #   - They do not attempt to validate psychoacoustic optimality (that would
 #     require a reference implementation and careful numerical baselines).
 #
 # Validates:
 #   - I/O shapes for long and ESH modes
 #   - DPCM scalefactor coding consistency (sfc)
 #   - ESH packing order of quantized symbols (128x8 <-> 1024)
 #   - Edge cases (zeros / near silence)
 #   - Sanity (finite outputs, no extreme numerical blow-up)
 # ------------------------------------------------------------
 from __future__ import annotations
 import numpy as np
 import pytest
 from core.aac_quantizer import aac_quantizer, aac_i_quantizer
 from core.aac_utils import get_table, band_limits
 from core.aac_types import FrameType
 # Small epsilon to avoid divisions by zero in sanity ratios
 EPS = 1e-12
 # -----------------------------------------------------------------------------
 # Helper utilities
 # -----------------------------------------------------------------------------
 def _nbands(frame_type: FrameType) -> int:
    """
    Return number of scalefactor bands for the given frame type.
    This is derived from TableB219 (psycho tables) via aac_utils helpers,
    so the tests remain consistent even if tables are updated.
    """
    table, _nfft = get_table(frame_type)
    wlow, _whigh, _bval, _qthr = band_limits(table)
    return int(len(wlow))
 def _make_smr(frame_type: FrameType, seed: int = 0) -> np.ndarray:
    """
    Create a strictly positive SMR array with the correct shape.
    These tests are not about psycho correctness; they only need SMR > 0
    to avoid division by zero and to make the quantizer's threshold logic
    behave deterministically.
    """
    rng = np.random.default_rng(seed)
    NB = _nbands(frame_type)
    if frame_type == "ESH":
        # ESH uses 8 short windows, thus SMR has 8 columns.
        return (1.0 + np.abs(rng.normal(size=(NB, 8)))).astype(np.float64)
    # Long frames: use a column vector (NB, 1).
    return (1.0 + np.abs(rng.normal(size=(NB, 1)))).astype(np.float64)
 def _reconstruct_alpha_from_sfc(sfc: np.ndarray) -> np.ndarray:
    """
    Reconstruct alpha(b) from DPCM-coded scalefactors sfc(b).
    By definition in the assignment:
        sfc(0) = alpha(0)
        alpha(b) = alpha(b-1) + sfc(b)  for b > 0
    This reconstruction is useful to validate the internal consistency
    of the produced scalefactor information.
    """
    sfc = np.asarray(sfc, dtype=np.int64)
    # Long frames: sfc shape (NB, 1)
    if sfc.ndim == 2 and sfc.shape[1] == 1:
        NB = sfc.shape[0]
        alpha = np.zeros((NB,), dtype=np.int64)
        alpha[0] = int(sfc[0, 0])
        for b in range(1, NB):
            alpha[b] = int(alpha[b - 1] + sfc[b, 0])
        return alpha
    # ESH frames: sfc shape (NB, 8)
    if sfc.ndim == 2 and sfc.shape[1] == 8:
        NB = sfc.shape[0]
        alpha = np.zeros((NB, 8), dtype=np.int64)
        alpha[0, :] = sfc[0, :]
        for b in range(1, NB):
            alpha[b, :] = alpha[b - 1, :] + sfc[b, :]
        return alpha
    raise ValueError("Unsupported sfc shape.")
 # -----------------------------------------------------------------------------
 # Shape / contract tests
 # -----------------------------------------------------------------------------
@pytest.mark.parametrize("frame_type", ["OLS", "LSS", "LPS"])
 def test_quantizer_shapes_long(frame_type: FrameType) -> None:
    """
    Contract test for long frames:
    - Input: MDCT coefficients shape (1024, 1)
    - Output S: always (1024, 1)
    - Output sfc: (NB, 1)
    - G: scalar float for long frames
    - iQuantizer output: (1024, 1)
    """
    NB = _nbands(frame_type)
    rng = np.random.default_rng(1)
    X = rng.normal(size=(1024, 1)).astype(np.float64)
    SMR = _make_smr(frame_type, seed=2)
    S, sfc, G = aac_quantizer(X, frame_type, SMR)
    assert S.shape == (1024, 1)
    assert sfc.shape == (NB, 1)
    assert isinstance(G, (float, np.floating))
    Xhat = aac_i_quantizer(S, sfc, G, frame_type)
    assert Xhat.shape == (1024, 1)
 def test_quantizer_shapes_esh() -> None:
    """
    Contract test for ESH frames:
    - Input: MDCT coefficients shape (128, 8)
    - Output S: packed to (1024, 1)
    - Output sfc: (NB, 8)
    - G: array shape (1, 8) for ESH (one gain per short window)
    - iQuantizer output: (128, 8)
    """
    frame_type: FrameType = "ESH"
    NB = _nbands(frame_type)
    rng = np.random.default_rng(3)
    X = rng.normal(size=(128, 8)).astype(np.float64)
    SMR = _make_smr(frame_type, seed=4)
    S, sfc, G = aac_quantizer(X, frame_type, SMR)
    assert S.shape == (1024, 1)
    assert sfc.shape == (NB, 8)
    assert isinstance(G, np.ndarray)
    assert G.shape == (1, 8)
    Xhat = aac_i_quantizer(S, sfc, G, frame_type)
    assert Xhat.shape == (128, 8)
 # -----------------------------------------------------------------------------
 # DPCM consistency tests
 # -----------------------------------------------------------------------------
@pytest.mark.parametrize("frame_type", ["OLS", "LSS", "LPS"])
 def test_quantizer_dpcm_reconstructs_alpha_long(frame_type: FrameType) -> None:
    """
    Verify the DPCM coding rule for long frames.
    The quantizer returns:
      sfc(0) = alpha(0)
      sfc(b) = alpha(b) - alpha(b-1), b>0
    Reconstruct alpha from sfc and check:
      alpha(0) == sfc(0) == G
    """
    rng = np.random.default_rng(5)
    X = rng.normal(size=(1024, 1)).astype(np.float64)
    SMR = _make_smr(frame_type, seed=6)
    _S, sfc, G = aac_quantizer(X, frame_type, SMR)
    alpha = _reconstruct_alpha_from_sfc(sfc)
    assert int(sfc[0, 0]) == int(alpha[0])
    assert float(alpha[0]) == float(G)
 def test_quantizer_dpcm_reconstructs_alpha_esh() -> None:
    """
    Verify the DPCM coding rule for ESH frames.
    For each short window j:
      sfc(0, j) = alpha(0, j) == G(0, j)
    """
    frame_type: FrameType = "ESH"
    rng = np.random.default_rng(7)
    X = rng.normal(size=(128, 8)).astype(np.float64)
    SMR = _make_smr(frame_type, seed=8)
    _S, sfc, G = aac_quantizer(X, frame_type, SMR)
    alpha = _reconstruct_alpha_from_sfc(sfc)
    assert np.all(alpha[0, :] == sfc[0, :])
    assert np.all(alpha[0, :] == G.reshape(-1))
 # -----------------------------------------------------------------------------
 # ESH packing order test
 # -----------------------------------------------------------------------------
 def test_quantizer_esh_packing_order_matches_iquantizer_layout() -> None:
    """
    Verify ESH packing order.
    The quantizer outputs S in packed shape (1024, 1). The expected packing
    is column-major concatenation of the 8 short subframes.
    This test constructs a deterministic input where each subframe column
    has a distinct constant value. After quantize+inverse-quantize, the
    reconstructed columns should remain distinguishable in the same order.
    This primarily tests ordering, not exact numerical values.
    """
    frame_type: FrameType = "ESH"
    NB = _nbands(frame_type)
    # Create 8 distinct subframes: column j is constant (j+1)
    X = np.zeros((128, 8), dtype=np.float64)
    for j in range(8):
        X[:, j] = float(j + 1)
    # Use very large SMR so thresholds are permissive and alpha changes are
    # minimal. This helps keep the ordering signal strong.
    SMR = np.ones((NB, 8), dtype=np.float64) * 1e6
    S, sfc, G = aac_quantizer(X, frame_type, SMR)
    Xhat = aac_i_quantizer(S, sfc, G, frame_type)
    # The average magnitude per column must be increasing with the original order.
    col_means = np.mean(Xhat, axis=0)
    assert np.all(np.diff(col_means) > 0.0)
 # -----------------------------------------------------------------------------
 # Edge cases: zeros and near-silence
 # -----------------------------------------------------------------------------
@pytest.mark.parametrize("frame_type", ["OLS", "LSS", "LPS"])
 def test_quantizer_zero_input_long_is_finite(frame_type: FrameType) -> None:
    """
    Edge case: zero MDCT coefficients should not produce NaN/Inf.
    We do not require identity here (quantizer is lossy), but we require
    the pipeline to remain numerically safe and produce finite outputs.
    """
    NB = _nbands(frame_type)
    X = np.zeros((1024, 1), dtype=np.float64)
    SMR = np.ones((NB, 1), dtype=np.float64)
    S, sfc, G = aac_quantizer(X, frame_type, SMR)
    assert np.isfinite(S).all()
    assert np.isfinite(sfc).all()
    assert isinstance(G, (float, np.floating))
    Xhat = aac_i_quantizer(S, sfc, G, frame_type)
    assert np.isfinite(Xhat).all()
 def test_quantizer_zero_input_esh_is_finite() -> None:
    """
    Edge case: same as above, for ESH mode.
    """
    frame_type: FrameType = "ESH"
    NB = _nbands(frame_type)
    X = np.zeros((128, 8), dtype=np.float64)
    SMR = np.ones((NB, 8), dtype=np.float64)
    S, sfc, G = aac_quantizer(X, frame_type, SMR)
    assert np.isfinite(S).all()
    assert np.isfinite(sfc).all()
    assert np.isfinite(G).all()
    Xhat = aac_i_quantizer(S, sfc, G, frame_type)
    assert np.isfinite(Xhat).all()
@pytest.mark.parametrize("frame_type", ["OLS", "LSS", "LPS"])
 def test_quantizer_near_silence_long_is_finite(frame_type: FrameType) -> None:
    """
    Edge case: extremely small values.
    This stresses numerical guards (EPS usage) and ensures no invalid operations.
    """
    NB = _nbands(frame_type)
    X = (1e-15 * np.ones((1024, 1), dtype=np.float64))
    SMR = np.ones((NB, 1), dtype=np.float64)
    S, sfc, G = aac_quantizer(X, frame_type, SMR)
    assert np.isfinite(S).all()
    assert np.isfinite(sfc).all()
    Xhat = aac_i_quantizer(S, sfc, G, frame_type)
    assert np.isfinite(Xhat).all()
 def test_quantizer_near_silence_esh_is_finite() -> None:
    """
    Edge case: extremely small values, ESH mode.
    """
    frame_type: FrameType = "ESH"
    NB = _nbands(frame_type)
    X = (1e-15 * np.ones((128, 8), dtype=np.float64))
    SMR = np.ones((NB, 8), dtype=np.float64)
    S, sfc, G = aac_quantizer(X, frame_type, SMR)
    assert np.isfinite(S).all()
    assert np.isfinite(sfc).all()
    assert np.isfinite(G).all()
    Xhat = aac_i_quantizer(S, sfc, G, frame_type)
    assert np.isfinite(Xhat).all()
 # -----------------------------------------------------------------------------
 # Sanity: avoid catastrophic numerical blow-up
 # -----------------------------------------------------------------------------
@pytest.mark.parametrize("frame_type", ["OLS", "LSS", "LPS"])
 def test_quantizer_sanity_no_extreme_blowup_long(frame_type: FrameType) -> None:
    """
    Loose sanity guard.
    The quantizer is lossy, but it should not produce reconstructions with
    catastrophic peak/energy growth compared to the input.
    """
    NB = _nbands(frame_type)
    rng = np.random.default_rng(11)
    X = rng.normal(size=(1024, 1)).astype(np.float64)
    SMR = np.ones((NB, 1), dtype=np.float64) * 10.0
    S, sfc, G = aac_quantizer(X, frame_type, SMR)
    Xhat = aac_i_quantizer(S, sfc, G, frame_type)
    in_peak = float(np.max(np.abs(X)))
    out_peak = float(np.max(np.abs(Xhat)))
    peak_ratio = out_peak / (in_peak + EPS)
    in_energy = float(np.sum(X * X))
    out_energy = float(np.sum(Xhat * Xhat))
    energy_ratio = out_energy / (in_energy + EPS)
    # Very loose thresholds: only catch severe regressions.
    assert peak_ratio < 100.0
    assert energy_ratio < 1e4
 def test_quantizer_sanity_no_extreme_blowup_esh() -> None:
    """
    Same loose sanity guard for ESH mode.
    """
    frame_type: FrameType = "ESH"
    NB = _nbands(frame_type)
    rng = np.random.default_rng(12)
    X = rng.normal(size=(128, 8)).astype(np.float64)
    SMR = np.ones((NB, 8), dtype=np.float64) * 10.0
    S, sfc, G = aac_quantizer(X, frame_type, SMR)
    Xhat = aac_i_quantizer(S, sfc, G, frame_type)
    in_peak = float(np.max(np.abs(X)))
    out_peak = float(np.max(np.abs(Xhat)))
    peak_ratio = out_peak / (in_peak + EPS)
    in_energy = float(np.sum(X * X))
    out_energy = float(np.sum(Xhat * Xhat))
    energy_ratio = out_energy / (in_energy + EPS)
    assert peak_ratio < 100.0
    assert energy_ratio < 1e4
--- a/source/core/tests/test_snr_db.py
+++ b/source/core/tests/test_snr_db.py
@ -1,98 +0,0 @@
 # ------------------------------------------------------------
 # AAC Coder/Decoder - SNR dB Tests
 #
 # Multimedia course at Aristotle University of
 # Thessaloniki (AUTh)
 #
 # Author:
 #   Christos Choutouridis (ΑΕΜ 8997)
 #   cchoutou@ece.auth.gr
 #
 # Description:
 #   Basic tests for SNR calculation utility.
 # ------------------------------------------------------------
 from __future__ import annotations
 import numpy as np
 import pytest
 from core.aac_snr_db import snr_db
 from core.aac_types import StereoSignal
 def test_snr_perfect_reconstruction_returns_inf() -> None:
    """
    If x_hat == x_ref exactly, noise power is zero and SNR must be +inf.
    """
    rng = np.random.default_rng(0)
    x: StereoSignal = rng.normal(size=(1024, 2)).astype(np.float64)
    snr = snr_db(x, x)
    assert snr == float("inf")
 def test_snr_zero_reference_returns_minus_inf() -> None:
    """
    If reference signal is identically zero, signal power is zero
    and SNR must be -inf (unless noise is also zero, which is degenerate).
    """
    x_ref: StereoSignal = np.zeros((1024, 2), dtype=np.float64)
    x_hat: StereoSignal = np.ones((1024, 2), dtype=np.float64)
    snr = snr_db(x_ref, x_hat)
    assert snr == float("-inf")
 def test_snr_known_noise_level_matches_expected_value() -> None:
    """
    Deterministic test with known signal and noise power.
    Let:
      x_ref = ones
      x_hat = ones + noise
    With noise variance sigma^2, expected SNR:
      10 * log10(Ps / Pn)
    """
    n = 1000
    sigma = 0.1
    x_ref: StereoSignal = np.ones((n, 2), dtype=np.float64)
    noise = sigma * np.ones((n, 2), dtype=np.float64)
    x_hat: StereoSignal = x_ref + noise
    ps = float(np.sum(x_ref * x_ref))
    pn = float(np.sum(noise * noise))
    expected = 10.0 * np.log10(ps / pn)
    snr = snr_db(x_ref, x_hat)
    assert np.isclose(snr, expected, rtol=1e-12, atol=1e-12)
 def test_snr_aligns_different_lengths_and_channels() -> None:
    """
    The function must:
    - align to minimum length
    - align to minimum channel count
    without crashing.
    """
    rng = np.random.default_rng(1)
    x_ref: StereoSignal = rng.normal(size=(1000, 2)).astype(np.float64)
    x_hat: StereoSignal = rng.normal(size=(800, 1)).astype(np.float64)
    snr = snr_db(x_ref, x_hat)
    assert np.isfinite(snr)
 def test_snr_accepts_1d_inputs() -> None:
    """
    1-D inputs must be accepted and treated as single-channel signals.
    """
    rng = np.random.default_rng(2)
    x_ref = rng.normal(size=1024).astype(np.float64)
    x_hat = x_ref + 0.01 * rng.normal(size=1024).astype(np.float64)
    snr = snr_db(x_ref, x_hat)
    assert np.isfinite(snr)
--- a/source/core/tests/test_ssc.py
+++ b/source/core/tests/test_ssc.py
@ -16,7 +16,7 @@ from __future__ import annotations
 import numpy as np
-from core.aac_ssc import aac_SSC
+from core.aac_ssc import aac_ssc
 from core.aac_types import FrameT
 # -----------------------------------------------------------------------------
@ -117,10 +117,10 @@ def test_ssc_fixed_cases_prev_lss_and_lps() -> None:
    next_attack = _next_frame_strong_attack(attack_left=True, attack_right=True)
-    out1 = aac_SSC(frame_t, next_attack, "LSS")
+    out1 = aac_ssc(frame_t, next_attack, "LSS")
    assert out1 == "ESH"
-    out2 = aac_SSC(frame_t, next_attack, "LPS")
+    out2 = aac_ssc(frame_t, next_attack, "LPS")
    assert out2 == "OLS"
@ -138,7 +138,7 @@ def test_prev_ols_next_not_esh_returns_ols() -> None:
    frame_t: FrameT = np.zeros((2048, 2), dtype=np.float64)
    next_t = _next_frame_no_attack()
-    out = aac_SSC(frame_t, next_t, "OLS")
+    out = aac_ssc(frame_t, next_t, "OLS")
    assert out == "OLS"
@ -151,7 +151,7 @@ def test_prev_ols_next_esh_both_channels_returns_lss() -> None:
    frame_t: FrameT = np.zeros((2048, 2), dtype=np.float64)
    next_t = _next_frame_strong_attack(attack_left=True, attack_right=True)
-    out = aac_SSC(frame_t, next_t, "OLS")
+    out = aac_ssc(frame_t, next_t, "OLS")
    assert out == "LSS"
@ -165,11 +165,11 @@ def test_prev_ols_next_esh_one_channel_returns_lss() -> None:
    frame_t: FrameT = np.zeros((2048, 2), dtype=np.float64)
    next1_t = _next_frame_strong_attack(attack_left=True, attack_right=False)
-    out1 = aac_SSC(frame_t, next1_t, "OLS")
+    out1 = aac_ssc(frame_t, next1_t, "OLS")
    assert out1 == "LSS"
    next2_t = _next_frame_strong_attack(attack_left=False, attack_right=True)
-    out2 = aac_SSC(frame_t, next2_t, "OLS")
+    out2 = aac_ssc(frame_t, next2_t, "OLS")
    assert out2 == "LSS"
@ -182,7 +182,7 @@ def test_prev_esh_next_esh_both_channels_returns_esh() -> None:
    frame_t: FrameT = np.zeros((2048, 2), dtype=np.float64)
    next_t = _next_frame_strong_attack(attack_left=True, attack_right=True)
-    out = aac_SSC(frame_t, next_t, "ESH")
+    out = aac_ssc(frame_t, next_t, "ESH")
    assert out == "ESH"
@ -195,7 +195,7 @@ def test_prev_esh_next_not_esh_both_channels_returns_lps() -> None:
    frame_t: FrameT = np.zeros((2048, 2), dtype=np.float64)
    next_t = _next_frame_no_attack()
-    out = aac_SSC(frame_t, next_t, "ESH")
+    out = aac_ssc(frame_t, next_t, "ESH")
    assert out == "LPS"
@ -209,11 +209,11 @@ def test_prev_esh_next_esh_one_channel_merged_is_esh() -> None:
    frame_t: FrameT = np.zeros((2048, 2), dtype=np.float64)
    next1_t = _next_frame_strong_attack(attack_left=True, attack_right=False)
-    out1 = aac_SSC(frame_t, next1_t, "ESH")
+    out1 = aac_ssc(frame_t, next1_t, "ESH")
    assert out1 == "ESH"
    next2_t = _next_frame_strong_attack(attack_left=False, attack_right=True)
-    out2 = aac_SSC(frame_t, next2_t, "ESH")
+    out2 = aac_ssc(frame_t, next2_t, "ESH")
    assert out2 == "ESH"
@ -230,5 +230,5 @@ def test_threshold_s_must_exceed_1e_3() -> None:
    frame_t: FrameT = np.zeros((2048, 2), dtype=np.float64)
    next_t = _next_frame_below_s_threshold(left=True, right=True, impulse_amp=0.01)
-    out = aac_SSC(frame_t, next_t, "OLS")
+    out = aac_ssc(frame_t, next_t, "OLS")
    assert out == "OLS"
--- a/source/core/tests/test_tns.py
+++ b/source/core/tests/test_tns.py
@ -26,6 +26,7 @@ from core.aac_configuration import PRED_ORDER, QUANT_MAX, QUANT_STEP
 from core.aac_tns import aac_tns, aac_i_tns
 from core.aac_types import *
 EPS = 1e-12
 # -----------------------------------------------------------------------------
 # Helper utilities
@ -194,3 +195,132 @@ def test_tns_outputs_are_finite() -> None:
    out_esh, coeffs_esh = aac_tns(frame_F_esh, "ESH")
    assert np.isfinite(out_esh).all()
    assert np.isfinite(coeffs_esh).all()
@pytest.mark.parametrize("frame_type", ["OLS", "LSS", "LPS"])
 def test_tns_zero_input_is_identity_long(frame_type: FrameType) -> None:
    """
    Edge case: zero MDCT coefficients should remain zero after TNS and iTNS.
    This checks that no NaN/Inf appears and the pipeline is numerically safe.
    """
    frame_F_in = np.zeros((1024, 1), dtype=np.float64)
    frame_F_tns, tns_coeffs = aac_tns(frame_F_in, frame_type)
    assert np.isfinite(frame_F_tns).all()
    assert np.isfinite(tns_coeffs).all()
    assert np.all(frame_F_tns == 0.0)
    frame_F_hat = aac_i_tns(frame_F_tns, frame_type, tns_coeffs)
    assert np.isfinite(frame_F_hat).all()
    assert np.all(frame_F_hat == 0.0)
 def test_tns_zero_input_is_identity_esh() -> None:
    """
    Edge case: zero MDCT coefficients should remain zero for ESH too.
    """
    frame_F_in = np.zeros((128, 8), dtype=np.float64)
    frame_F_tns, tns_coeffs = aac_tns(frame_F_in, "ESH")
    assert np.isfinite(frame_F_tns).all()
    assert np.isfinite(tns_coeffs).all()
    assert np.all(frame_F_tns == 0.0)
    frame_F_hat = aac_i_tns(frame_F_tns, "ESH", tns_coeffs)
    assert np.isfinite(frame_F_hat).all()
    assert np.all(frame_F_hat == 0.0)
@pytest.mark.parametrize("frame_type", ["OLS", "LSS", "LPS"])
 def test_tns_near_silence_is_finite_and_roundtrips(frame_type: FrameType) -> None:
    """
    Edge case: extremely small values should not cause NaN/Inf,
    and round-trip should remain close.
    """
    frame_F_in = (1e-15 * np.ones((1024, 1), dtype=np.float64))
    frame_F_tns, tns_coeffs = aac_tns(frame_F_in, frame_type)
    assert np.isfinite(frame_F_tns).all()
    assert np.isfinite(tns_coeffs).all()
    frame_F_hat = aac_i_tns(frame_F_tns, frame_type, tns_coeffs)
    assert np.isfinite(frame_F_hat).all()
    np.testing.assert_allclose(frame_F_hat, frame_F_in, rtol=1e-6, atol=1e-12)
 def test_tns_near_silence_esh_is_finite_and_roundtrips() -> None:
    """
    Near-silence test for ESH mode.
    """
    frame_F_in = (1e-15 * np.ones((128, 8), dtype=np.float64))
    frame_F_tns, tns_coeffs = aac_tns(frame_F_in, "ESH")
    assert np.isfinite(frame_F_tns).all()
    assert np.isfinite(tns_coeffs).all()
    frame_F_hat = aac_i_tns(frame_F_tns, "ESH", tns_coeffs)
    assert np.isfinite(frame_F_hat).all()
    np.testing.assert_allclose(frame_F_hat, frame_F_in, rtol=1e-6, atol=1e-12)
@pytest.mark.parametrize("frame_type", ["OLS", "LSS", "LPS"])
 def test_tns_accepts_flat_vector_shape_long(frame_type: FrameType) -> None:
    """
    Contract test: for non-ESH, aac_tns must accept input shape (1024,)
    in addition to (1024, 1), and preserve the shape convention.
    """
    rng = np.random.default_rng(7)
    frame_F_in = rng.normal(size=(1024,)).astype(np.float64)
    frame_F_out, tns_coeffs = aac_tns(frame_F_in, frame_type)
    assert frame_F_out.shape == (1024,)
    assert tns_coeffs.shape == (PRED_ORDER, 1)
@pytest.mark.parametrize("frame_type", ["OLS", "LSS", "LPS"])
 def test_tns_does_not_explode_peak_or_energy_long(frame_type: FrameType) -> None:
    """
    Sanity: TNS should not cause extreme peak/energy blow-up on typical inputs.
    This is a loose guard to catch regressions.
    """
    rng = np.random.default_rng(8)
    frame_F_in = rng.normal(size=(1024, 1)).astype(np.float64)
    in_peak = float(np.max(np.abs(frame_F_in)))
    in_energy = float(np.sum(frame_F_in * frame_F_in))
    frame_F_out, _ = aac_tns(frame_F_in, frame_type)
    out_peak = float(np.max(np.abs(frame_F_out)))
    out_energy = float(np.sum(frame_F_out * frame_F_out))
    peak_ratio = out_peak / (in_peak + EPS)
    energy_ratio = out_energy / (in_energy + EPS)
    assert peak_ratio < 50.0
    assert energy_ratio < 2500.0
 def test_tns_does_not_explode_peak_or_energy_esh() -> None:
    """
    Sanity: same blow-up guard for ESH mode.
    """
    rng = np.random.default_rng(9)
    frame_F_in = rng.normal(size=(128, 8)).astype(np.float64)
    in_peak = float(np.max(np.abs(frame_F_in)))
    in_energy = float(np.sum(frame_F_in * frame_F_in))
    frame_F_out, _ = aac_tns(frame_F_in, "ESH")
    out_peak = float(np.max(np.abs(frame_F_out)))
    out_energy = float(np.sum(frame_F_out * frame_F_out))
    peak_ratio = out_peak / (in_peak + EPS)
    energy_ratio = out_energy / (in_energy + EPS)
    assert peak_ratio < 50.0
    assert energy_ratio < 2500.0
--- a/source/core/tests/test_utils.py
+++ b/source/core/tests/test_utils.py
@ -0,0 +1,329 @@
 # ------------------------------------------------------------
 # AAC Coder/Decoder - SNR dB Tests
 #
 # Multimedia course at Aristotle University of
 # Thessaloniki (AUTh)
 #
 # Author:
 #   Christos Choutouridis (ΑΕΜ 8997)
 #   cchoutou@ece.auth.gr
 #
 # Description:
 #   - Basic tests for SNR calculation utility.
 #   - Contract and sanity tests for TableB219-related utilities.
 #
 #     These tests do NOT validate the numerical correctness of the
 #     Bark tables themselves (they are given by the AAC spec),
 #     but instead ensure:
 #       - correct loading from disk,
 #       - correct table selection per frame type,
 #       - internal consistency of band limits,
 #       - correct caching behavior.
 # ------------------------------------------------------------
 from __future__ import annotations
 import numpy as np
 import pytest
 from core.aac_utils import mdct, imdct, snr_db, load_b219_tables, get_table, band_limits
 from core.aac_types import *
 tolerance = 1e-10
 # mdct / imdct
 # ------------------------------------------------------------
 def _assert_allclose(a: FloatArray, b: FloatArray, *, rtol: float, atol: float) -> None:
    """
    Helper for consistent tolerances across tests.
    """
    np.testing.assert_allclose(a, b, rtol=rtol, atol=atol)
 def _estimate_gain(y: MdctCoeffs, x: MdctCoeffs) -> float:
    """
    Estimate scalar gain g such that y ~= g*x in least-squares sense.
    """
    denom = float(np.dot(x, x))
    if denom == 0.0:
        return 0.0
    return float(np.dot(y, x) / denom)
@pytest.mark.parametrize("N", [256, 2048])
 def test_mdct_imdct_mdct_identity_up_to_gain(N: int) -> None:
    """
    Consistency test in coefficient domain:
      mdct(imdct(X)) ~= g * X
    For the chosen (non-orthonormal) scaling, g is expected to be close to 2.
    """
    rng = np.random.default_rng(0)
    K = N // 2
    X: MdctCoeffs = rng.normal(size=K).astype(np.float64)
    x: TimeSignal = imdct(X)
    X_hat: MdctCoeffs = mdct(x)
    g = _estimate_gain(X_hat, X)
    _assert_allclose(X_hat, g * X, rtol=tolerance, atol=tolerance)
    _assert_allclose(np.array([g], dtype=np.float64), np.array([2.0], dtype=np.float64), rtol=tolerance, atol=tolerance)
@pytest.mark.parametrize("N", [256, 2048])
 def test_mdct_linearity(N: int) -> None:
    """
    Linearity test:
      mdct(a*x + b*y) == a*mdct(x) + b*mdct(y)
    """
    rng = np.random.default_rng(1)
    x: TimeSignal = rng.normal(size=N).astype(np.float64)
    y: TimeSignal = rng.normal(size=N).astype(np.float64)
    a = 0.37
    b = -1.12
    left: MdctCoeffs = mdct(a * x + b * y)
    right: MdctCoeffs = a * mdct(x) + b * mdct(y)
    _assert_allclose(left, right, rtol=tolerance, atol=tolerance)
@pytest.mark.parametrize("N", [256, 2048])
 def test_imdct_linearity(N: int) -> None:
    """
    Linearity test for IMDCT:
      imdct(a*X + b*Y) == a*imdct(X) + b*imdct(Y)
    """
    rng = np.random.default_rng(2)
    K = N // 2
    X: MdctCoeffs = rng.normal(size=K).astype(np.float64)
    Y: MdctCoeffs = rng.normal(size=K).astype(np.float64)
    a = -0.5
    b = 2.0
    left: TimeSignal = imdct(a * X + b * Y)
    right: TimeSignal = a * imdct(X) + b * imdct(Y)
    _assert_allclose(left, right, rtol=tolerance, atol=tolerance)
@pytest.mark.parametrize("N", [256, 2048])
 def test_mdct_imdct_outputs_are_finite(N: int) -> None:
    """
    Sanity test: no NaN/inf on random inputs.
    """
    rng = np.random.default_rng(3)
    K = N // 2
    x: TimeSignal = rng.normal(size=N).astype(np.float64)
    X: MdctCoeffs = rng.normal(size=K).astype(np.float64)
    X1 = mdct(x)
    x1 = imdct(X)
    assert np.isfinite(X1).all()
    assert np.isfinite(x1).all()
 # SNR
 # ------------------------------------------------------------
 def test_snr_perfect_reconstruction_returns_inf() -> None:
    """
    If x_hat == x_ref exactly, noise power is zero and SNR must be +inf.
    """
    rng = np.random.default_rng(0)
    x: StereoSignal = rng.normal(size=(1024, 2)).astype(np.float64)
    snr = snr_db(x, x)
    assert snr == float("inf")
 def test_snr_zero_reference_returns_minus_inf() -> None:
    """
    If reference signal is identically zero, signal power is zero
    and SNR must be -inf (unless noise is also zero, which is degenerate).
    """
    x_ref: StereoSignal = np.zeros((1024, 2), dtype=np.float64)
    x_hat: StereoSignal = np.ones((1024, 2), dtype=np.float64)
    snr = snr_db(x_ref, x_hat)
    assert snr == float("-inf")
 def test_snr_known_noise_level_matches_expected_value() -> None:
    """
    Deterministic test with known signal and noise power.
    Let:
      x_ref = ones
      x_hat = ones + noise
    With noise variance sigma^2, expected SNR:
      10 * log10(Ps / Pn)
    """
    n = 1000
    sigma = 0.1
    x_ref: StereoSignal = np.ones((n, 2), dtype=np.float64)
    noise = sigma * np.ones((n, 2), dtype=np.float64)
    x_hat: StereoSignal = x_ref + noise
    ps = float(np.sum(x_ref * x_ref))
    pn = float(np.sum(noise * noise))
    expected = 10.0 * np.log10(ps / pn)
    snr = snr_db(x_ref, x_hat)
    assert np.isclose(snr, expected, rtol=1e-12, atol=1e-12)
 def test_snr_aligns_different_lengths_and_channels() -> None:
    """
    The function must:
    - align to minimum length
    - align to minimum channel count
    without crashing.
    """
    rng = np.random.default_rng(1)
    x_ref: StereoSignal = rng.normal(size=(1000, 2)).astype(np.float64)
    x_hat: StereoSignal = rng.normal(size=(800, 1)).astype(np.float64)
    snr = snr_db(x_ref, x_hat)
    assert np.isfinite(snr)
 def test_snr_accepts_1d_inputs() -> None:
    """
    1-D inputs must be accepted and treated as single-channel signals.
    """
    rng = np.random.default_rng(2)
    x_ref = rng.normal(size=1024).astype(np.float64)
    x_hat = x_ref + 0.01 * rng.normal(size=1024).astype(np.float64)
    snr = snr_db(x_ref, x_hat)
    assert np.isfinite(snr)
 # Table219b
 # ------------------------------------------------------------
 def test_load_b219_tables_returns_expected_keys() -> None:
    """
    Contract test:
    TableB219.mat must load successfully and expose both tables
    required by the psychoacoustic model.
    The AAC spec defines:
      - B219a: long-frame Bark bands
      - B219b: short-frame Bark bands
    """
    tables = load_b219_tables()
    assert isinstance(tables, dict)
    assert "B219a" in tables
    assert "B219b" in tables
 def test_b219_table_shapes_are_correct() -> None:
    """
    Sanity test:
    Verify that the Bark tables have the expected number of bands
    and sufficient columns.
    Expected from AAC spec:
      - B219a: 69 bands (long frames)
      - B219b: 42 bands (short frames)
      - At least 6 columns (as accessed by band_limits()).
    """
    tables = load_b219_tables()
    B219a = tables["B219a"]
    assert B219a.ndim == 2
    assert B219a.shape[0] == 69
    assert B219a.shape[1] >= 6
    B219b = tables["B219b"]
    assert B219b.ndim == 2
    assert B219b.shape[0] == 42
    assert B219b.shape[1] >= 6
 def test_get_table_returns_correct_fft_size() -> None:
    """
    Interface test:
    get_table(frame_type) must return both:
      - the correct Bark table
      - the correct FFT size N
    This mapping is fundamental for the psychoacoustic model.
    """
    table_long, N_long = get_table("OLS")
    assert N_long == 2048
    assert table_long.shape[0] == 69
    table_short, N_short = get_table("ESH")
    assert N_short == 256
    assert table_short.shape[0] == 42
 def test_band_limits_are_consistent_for_long_table() -> None:
    """
    Sanity test for band limits (long frames):
    For each Bark band:
      - wlow <= whigh
      - frequency indices stay within [0, N/2)
      - all returned arrays have consistent lengths
    """
    table, N = get_table("OLS")
    wlow, whigh, bval, qthr = band_limits(table)
    B = table.shape[0]
    assert len(wlow) == B
    assert len(whigh) == B
    assert len(bval) == B
    assert len(qthr) == B
    for b in range(B):
        assert 0 <= wlow[b] <= whigh[b]
        assert whigh[b] < N // 2
 def test_band_limits_are_consistent_for_short_table() -> None:
    """
    Sanity test for band limits (short frames / ESH).
    Same invariants as for long frames, but with FFT size N=256.
    """
    table, N = get_table("ESH")
    wlow, whigh, bval, qthr = band_limits(table)
    B = table.shape[0]
    assert len(wlow) == B
    assert len(whigh) == B
    for b in range(B):
        assert 0 <= wlow[b] <= whigh[b]
        assert whigh[b] < N // 2
 def test_b219_tables_are_cached() -> None:
    """
    Implementation test:
    load_b219_tables() should cache the loaded tables so that
    subsequent calls return the same object (identity check).
    This avoids repeated disk I/O during psychoacoustic analysis.
    """
    t1 = load_b219_tables()
    t2 = load_b219_tables()
    assert t1 is t2
--- a/source/level_1/core/aac_coder.py
+++ b/source/level_1/core/aac_coder.py
@ -26,14 +26,106 @@ from pathlib import Path
 from typing import Union
 import soundfile as sf
 from scipy.io import savemat
 from core.aac_configuration import WIN_TYPE
 from core.aac_filterbank import aac_filter_bank
-from core.aac_ssc import aac_SSC
+from core.aac_ssc import aac_ssc
 from core.aac_tns import aac_tns
 from core.aac_psycho import aac_psycho
 from core.aac_quantizer import aac_quantizer  # assumes your quantizer file is core/aac_quantizer.py
 from core.aac_huffman import aac_encode_huff
 from core.aac_utils import get_table, band_limits
 from material.huff_utils import load_LUT
 from core.aac_types import *
 # -----------------------------------------------------------------------------
 # Helpers for thresholds (T(b))
 # -----------------------------------------------------------------------------
 def _band_slices_from_table(frame_type: FrameType) -> list[tuple[int, int]]:
    """
    Return inclusive (lo, hi) band slices derived from TableB219.
    """
    table, _ = get_table(frame_type)
    wlow, whigh, _bval, _qthr_db = band_limits(table)
    return [(int(lo), int(hi)) for lo, hi in zip(wlow, whigh)]
 def _thresholds_from_smr(
    frame_F_ch: FrameChannelF,
    frame_type: FrameType,
    SMR: FloatArray,
 ) -> FloatArray:
    """
    Compute thresholds T(b) = P(b) / SMR(b), where P(b) is band energy.
    Shapes:
    - Long: returns (NB, 1)
    - ESH: returns (NB, 8)
    """
    bands = _band_slices_from_table(frame_type)
    NB = len(bands)
    X = np.asarray(frame_F_ch, dtype=np.float64)
    SMR = np.asarray(SMR, dtype=np.float64)
    if frame_type == "ESH":
        if X.shape != (128, 8):
            raise ValueError("For ESH, frame_F_ch must have shape (128, 8).")
        if SMR.shape != (NB, 8):
            raise ValueError(f"For ESH, SMR must have shape ({NB}, 8).")
        T = np.zeros((NB, 8), dtype=np.float64)
        for j in range(8):
            Xj = X[:, j]
            for b, (lo, hi) in enumerate(bands):
                P = float(np.sum(Xj[lo : hi + 1] ** 2))
                smr = float(SMR[b, j])
                T[b, j] = 0.0 if smr <= 1e-12 else (P / smr)
        return T
    # Long
    if X.shape == (1024,):
        Xv = X
    elif X.shape == (1024, 1):
        Xv = X[:, 0]
    else:
        raise ValueError("For non-ESH, frame_F_ch must be shape (1024,) or (1024, 1).")
    if SMR.shape == (NB,):
        SMRv = SMR
    elif SMR.shape == (NB, 1):
        SMRv = SMR[:, 0]
    else:
        raise ValueError(f"For non-ESH, SMR must be shape ({NB},) or ({NB}, 1).")
    T = np.zeros((NB, 1), dtype=np.float64)
    for b, (lo, hi) in enumerate(bands):
        P = float(np.sum(Xv[lo : hi + 1] ** 2))
        smr = float(SMRv[b])
        T[b, 0] = 0.0 if smr <= 1e-12 else (P / smr)
    return T
 def _normalize_global_gain(G: GlobalGain) -> float | FloatArray:
    """
    Normalize GlobalGain to match AACChannelFrameF3["G"] type:
    - long: return float
    - ESH: return float64 ndarray of shape (1, 8)
    """
    if np.isscalar(G):
        return float(G)
    G_arr = np.asarray(G)
    if G_arr.size == 1:
        return float(G_arr.reshape(-1)[0])
    return np.asarray(G_arr, dtype=np.float64)
 # -----------------------------------------------------------------------------
 # Public helpers (useful for level_x demo wrappers)
 # -----------------------------------------------------------------------------
@ -182,7 +274,7 @@ def aac_coder_1(filename_in: Union[str, Path]) -> AACSeq1:
            tail = np.zeros((win - next_t.shape[0], 2), dtype=np.float64)
            next_t = np.vstack([next_t, tail])
-        frame_type = aac_SSC(frame_t, next_t, prev_frame_type)
+        frame_type = aac_ssc(frame_t, next_t, prev_frame_type)
        frame_f = aac_filter_bank(frame_t, frame_type, win_type)
        chl_f, chr_f = aac_pack_frame_f_to_seq_channels(frame_type, frame_f)
@ -250,7 +342,7 @@ def aac_coder_2(filename_in: Union[str, Path]) -> AACSeq2:
            tail = np.zeros((win - next_t.shape[0], 2), dtype=np.float64)
            next_t = np.vstack([next_t, tail])
-        frame_type = aac_SSC(frame_t, next_t, prev_frame_type)
+        frame_type = aac_ssc(frame_t, next_t, prev_frame_type)
        # Level 1 analysis (packed stereo container)
        frame_f_stereo = aac_filter_bank(frame_t, frame_type, WIN_TYPE)
@ -282,3 +374,180 @@ def aac_coder_2(filename_in: Union[str, Path]) -> AACSeq2:
        prev_frame_type = frame_type
    return aac_seq
 def aac_coder_3(
    filename_in: Union[str, Path],
    filename_aac_coded: Union[str, Path] | None = None,
 ) -> AACSeq3:
    """
    Level-3 AAC encoder (Level 2 + Psycho + Quantizer + Huffman).
    Parameters
    ----------
    filename_in : Union[str, Path]
        Input WAV filename (stereo, 48 kHz).
    filename_aac_coded : Union[str, Path] | None
        Optional .mat filename to store aac_seq_3 (assignment convenience).
    Returns
    -------
    AACSeq3
        Encoded AAC sequence (Level 3 payload schema).
    """
    filename_in = Path(filename_in)
    x, _ = aac_read_wav_stereo_48k(filename_in)
    hop = 1024
    win = 2048
    pad_pre = np.zeros((hop, 2), dtype=np.float64)
    pad_post = np.zeros((hop, 2), dtype=np.float64)
    x_pad = np.vstack([pad_pre, x, pad_post])
    K = int((x_pad.shape[0] - win) // hop + 1)
    if K <= 0:
        raise ValueError("Input too short for framing.")
    # Load Huffman LUTs once.
    huff_LUT_list = load_LUT()
    aac_seq: AACSeq3 = []
    prev_frame_type: FrameType = "OLS"
    # Pin win_type to the WinType literal for type checkers.
    win_type: WinType = WIN_TYPE
    # Psycho model needs per-channel history (prev1, prev2) of 2048-sample frames.
    prev1_L = np.zeros((2048,), dtype=np.float64)
    prev2_L = np.zeros((2048,), dtype=np.float64)
    prev1_R = np.zeros((2048,), dtype=np.float64)
    prev2_R = np.zeros((2048,), dtype=np.float64)
    for i in range(K):
        start = i * hop
        frame_t: FrameT = x_pad[start : start + win, :]
        if frame_t.shape != (win, 2):
            raise ValueError("Internal framing error: frame_t has wrong shape.")
        next_t = x_pad[start + hop : start + hop + win, :]
        if next_t.shape[0] < win:
            tail = np.zeros((win - next_t.shape[0], 2), dtype=np.float64)
            next_t = np.vstack([next_t, tail])
        frame_type = aac_ssc(frame_t, next_t, prev_frame_type)
        # Analysis filterbank (stereo packed)
        frame_f_stereo = aac_filter_bank(frame_t, frame_type, win_type)
        chl_f, chr_f = aac_pack_frame_f_to_seq_channels(frame_type, frame_f_stereo)
        # TNS per channel
        chl_f_tns, chl_tns_coeffs = aac_tns(chl_f, frame_type)
        chr_f_tns, chr_tns_coeffs = aac_tns(chr_f, frame_type)
        # Psychoacoustic model per channel (time-domain)
        frame_L = np.asarray(frame_t[:, 0], dtype=np.float64)
        frame_R = np.asarray(frame_t[:, 1], dtype=np.float64)
        SMR_L = aac_psycho(frame_L, frame_type, prev1_L, prev2_L)
        SMR_R = aac_psycho(frame_R, frame_type, prev1_R, prev2_R)
        # Thresholds T(b) (stored, not entropy-coded)
        T_L = _thresholds_from_smr(chl_f_tns, frame_type, SMR_L)
        T_R = _thresholds_from_smr(chr_f_tns, frame_type, SMR_R)
        # Quantizer per channel
        S_L, sfc_L, G_L = aac_quantizer(chl_f_tns, frame_type, SMR_L)
        S_R, sfc_R, G_R = aac_quantizer(chr_f_tns, frame_type, SMR_R)
        # Normalize G types for AACSeq3 schema (float | float64 ndarray).
        G_Ln = _normalize_global_gain(G_L)
        G_Rn = _normalize_global_gain(G_R)
        # Huffman-code ONLY the DPCM differences for b>0.
        # sfc[0] corresponds to alpha(0)=G and is stored separately in the frame.
        sfc_L_dpcm = np.asarray(sfc_L, dtype=np.int64)[1:, ...]
        sfc_R_dpcm = np.asarray(sfc_R, dtype=np.int64)[1:, ...]
        # Codebook 11:
        # maxAbsCodeVal = 16 is RESERVED for ESCAPE.
        # We must stay strictly within [-15, +15] to avoid escape decoding.
        sf_cb = 11
        sf_max_abs = int(huff_LUT_list[sf_cb]["maxAbsCodeVal"]) - 1  # -> 15
        sfc_L_dpcm = np.clip(
            sfc_L_dpcm,
            -sf_max_abs,
            sf_max_abs,
        ).astype(np.int64, copy=False)
        sfc_R_dpcm = np.clip(
            sfc_R_dpcm,
            -sf_max_abs,
            sf_max_abs,
        ).astype(np.int64, copy=False)
        sfc_L_stream, _ = aac_encode_huff(
            sfc_L_dpcm.reshape(-1, order="F"),
            huff_LUT_list,
            force_codebook=sf_cb,
        )
        sfc_R_stream, _ = aac_encode_huff(
            sfc_R_dpcm.reshape(-1, order="F"),
            huff_LUT_list,
            force_codebook=sf_cb,
        )
        mdct_L_stream, cb_L = aac_encode_huff(
            np.asarray(S_L, dtype=np.int64).reshape(-1),
            huff_LUT_list,
        )
        mdct_R_stream, cb_R = aac_encode_huff(
            np.asarray(S_R, dtype=np.int64).reshape(-1),
            huff_LUT_list,
        )
        # Typed dict construction helps static analyzers validate the schema.
        frame_out: AACSeq3Frame = {
            "frame_type": frame_type,
            "win_type": win_type,
            "chl": {
                "tns_coeffs": np.asarray(chl_tns_coeffs, dtype=np.float64),
                "T": np.asarray(T_L, dtype=np.float64),
                "G": G_Ln,
                "sfc": sfc_L_stream,
                "stream": mdct_L_stream,
                "codebook": int(cb_L),
            },
            "chr": {
                "tns_coeffs": np.asarray(chr_tns_coeffs, dtype=np.float64),
                "T": np.asarray(T_R, dtype=np.float64),
                "G": G_Rn,
                "sfc": sfc_R_stream,
                "stream": mdct_R_stream,
                "codebook": int(cb_R),
            },
        }
        aac_seq.append(frame_out)
        # Update psycho history (shift register)
        prev2_L = prev1_L
        prev1_L = frame_L
        prev2_R = prev1_R
        prev1_R = frame_R
        prev_frame_type = frame_type
    # Optional: store to .mat for the assignment wrapper
    if filename_aac_coded is not None:
        filename_aac_coded = Path(filename_aac_coded)
        savemat(
            str(filename_aac_coded),
            {"aac_seq_3": np.array(aac_seq, dtype=object)},
            do_compression=True,
        )
    return aac_seq
--- a/source/level_1/core/aac_configuration.py
+++ b/source/level_1/core/aac_configuration.py
@ -15,6 +15,8 @@
 from __future__ import annotations
 # Imports
 from typing import Final
 from core.aac_types import WinType
 # Filterbank
@ -29,3 +31,11 @@ WIN_TYPE: WinType = "SIN"
 PRED_ORDER = 4
 QUANT_STEP = 0.1
 QUANT_MAX = 0.7  # 4-bit symmetric with step 0.1 -> clamp to [-0.7, +0.7]
 # -----------------------------------------------------------------------------
 # Psycho
 # -----------------------------------------------------------------------------
 NMT_DB: Final[float] = 6.0   # Noise Masking Tone (dB)
 TMN_DB: Final[float] = 18.0  # Tone Masking Noise (dB)
--- a/source/level_1/core/aac_decoder.py
+++ b/source/level_1/core/aac_decoder.py
@ -9,16 +9,9 @@
 #   cchoutou@ece.auth.gr
 #
 # Description:
-#   Level 1 AAC decoder orchestration (inverse of aac_coder_1()).
+#   - Level 1 AAC decoder orchestration (inverse of aac_coder_1()).
-#   Keeps the same functional behavior as the original level_1 implementation:
+#   - Level 2 AAC decoder orchestration (inverse of aac_coder_1()).
 #   - Re-pack per-channel spectra into FrameF expected by aac_i_filter_bank()
 #   - IMDCT synthesis per frame
 #   - Overlap-add with hop=1024
 #   - Remove encoder boundary padding: hop at start and hop at end
 #
 #   Note:
 #   This core module returns the reconstructed samples. Writing to disk is kept
 #   in level_x demos.
 # ------------------------------------------------------------
 from __future__ import annotations
@ -29,11 +22,24 @@ import soundfile as sf
 from core.aac_filterbank import aac_i_filter_bank
 from core.aac_tns import aac_i_tns
 from core.aac_quantizer import aac_i_quantizer
 from core.aac_huffman import aac_decode_huff
 from core.aac_utils import get_table, band_limits
 from material.huff_utils import load_LUT
 from core.aac_types import *
 # -----------------------------------------------------------------------------
-# Public helpers (useful for level_x demo wrappers)
+# Helper for NB
 # -----------------------------------------------------------------------------
 def _nbands(frame_type: FrameType) -> int:
    table, _ = get_table(frame_type)
    wlow, _whigh, _bval, _qthr_db = band_limits(table)
    return int(len(wlow))
 # -----------------------------------------------------------------------------
 # Public helpers
 # -----------------------------------------------------------------------------
 def aac_unpack_seq_channels_to_frame_f(frame_type: FrameType, chl_f: FrameChannelF, chr_f: FrameChannelF) -> FrameF:
@ -109,7 +115,7 @@ def aac_remove_padding(y_pad: StereoSignal, hop: int = 1024) -> StereoSignal:
 # -----------------------------------------------------------------------------
-# Level 1 decoder (core)
+# Level 1 decoder
 # -----------------------------------------------------------------------------
 def aac_decoder_1(aac_seq_1: AACSeq1, filename_out: Union[str, Path]) -> StereoSignal:
@ -167,6 +173,10 @@ def aac_decoder_1(aac_seq_1: AACSeq1, filename_out: Union[str, Path]) -> StereoS
    return y
 # -----------------------------------------------------------------------------
 # Level 2 decoder
 # -----------------------------------------------------------------------------
 def aac_decoder_2(aac_seq_2: AACSeq2, filename_out: Union[str, Path]) -> StereoSignal:
    """
    Level-2 AAC decoder (inverse of aac_coder_2).
@ -255,3 +265,144 @@ def aac_decoder_2(aac_seq_2: AACSeq2, filename_out: Union[str, Path]) -> StereoS
    sf.write(str(filename_out), y, 48000)
    return y
 def aac_decoder_3(aac_seq_3: AACSeq3, filename_out: Union[str, Path]) -> StereoSignal:
    """
    Level-3 AAC decoder (inverse of aac_coder_3).
    Steps per frame:
    - Huffman decode scalefactors (sfc) using codebook 11
    - Huffman decode MDCT symbols (stream) using stored codebook
    - iQuantizer -> MDCT coefficients after TNS
    - iTNS using stored predictor coefficients
    - IMDCT filterbank -> time domain
    - Overlap-add, remove padding, write WAV
    Parameters
    ----------
    aac_seq_3 : AACSeq3
        Encoded sequence as produced by aac_coder_3.
    filename_out : Union[str, Path]
        Output WAV filename.
    Returns
    -------
    StereoSignal
        Decoded audio samples (time-domain), stereo, shape (N, 2), dtype float64.
    """
    filename_out = Path(filename_out)
    hop = 1024
    win = 2048
    K = len(aac_seq_3)
    if K <= 0:
        raise ValueError("aac_seq_3 must contain at least one frame.")
    # Load Huffman LUTs once.
    huff_LUT_list = load_LUT()
    n_pad = (K - 1) * hop + win
    y_pad = np.zeros((n_pad, 2), dtype=np.float64)
    for i, fr in enumerate(aac_seq_3):
        frame_type: FrameType = fr["frame_type"]
        win_type: WinType = fr["win_type"]
        NB = _nbands(frame_type)
        # We store G separately, so Huffman stream contains only (NB-1) DPCM differences.
        sfc_len = (NB - 1) * (8 if frame_type == "ESH" else 1)
        # -------------------------
        # Left channel
        # -------------------------
        tns_L = np.asarray(fr["chl"]["tns_coeffs"], dtype=np.float64)
        G_L = fr["chl"]["G"]
        sfc_bits_L = fr["chl"]["sfc"]
        mdct_bits_L = fr["chl"]["stream"]
        cb_L = int(fr["chl"]["codebook"])
        sfc_dec_L = aac_decode_huff(sfc_bits_L, 11, huff_LUT_list)[:sfc_len].astype(np.int64, copy=False)
        if frame_type == "ESH":
            sfc_dpcm_L = sfc_dec_L.reshape(NB - 1, 8, order="F")
            sfc_L = np.zeros((NB, 8), dtype=np.int64)
            Gv = np.asarray(G_L, dtype=np.float64).reshape(1, 8)
            sfc_L[0, :] = Gv[0, :].astype(np.int64)
            sfc_L[1:, :] = sfc_dpcm_L
        else:
            sfc_dpcm_L = sfc_dec_L.reshape(NB - 1, 1, order="F")
            sfc_L = np.zeros((NB, 1), dtype=np.int64)
            sfc_L[0, 0] = int(float(G_L))
            sfc_L[1:, :] = sfc_dpcm_L
        # MDCT symbols: codebook 0 means "all-zero section"
        if cb_L == 0:
            S_dec_L = np.zeros((1024,), dtype=np.int64)
        else:
            S_tmp_L = aac_decode_huff(mdct_bits_L, cb_L, huff_LUT_list).astype(np.int64, copy=False)
            # Tuple coding may produce extra trailing symbols; caller knows the true length (1024).
            # Also guard against short outputs by zero-padding.
            if S_tmp_L.size < 1024:
                S_dec_L = np.zeros((1024,), dtype=np.int64)
                S_dec_L[: S_tmp_L.size] = S_tmp_L
            else:
                S_dec_L = S_tmp_L[:1024]
        S_L = S_dec_L.reshape(1024, 1)
        Xq_L = aac_i_quantizer(S_L, sfc_L, G_L, frame_type)
        X_L = aac_i_tns(Xq_L, frame_type, tns_L)
        # -------------------------
        # Right channel
        # -------------------------
        tns_R = np.asarray(fr["chr"]["tns_coeffs"], dtype=np.float64)
        G_R = fr["chr"]["G"]
        sfc_bits_R = fr["chr"]["sfc"]
        mdct_bits_R = fr["chr"]["stream"]
        cb_R = int(fr["chr"]["codebook"])
        sfc_dec_R = aac_decode_huff(sfc_bits_R, 11, huff_LUT_list)[:sfc_len].astype(np.int64, copy=False)
        if frame_type == "ESH":
            sfc_dpcm_R = sfc_dec_R.reshape(NB - 1, 8, order="F")
            sfc_R = np.zeros((NB, 8), dtype=np.int64)
            Gv = np.asarray(G_R, dtype=np.float64).reshape(1, 8)
            sfc_R[0, :] = Gv[0, :].astype(np.int64)
            sfc_R[1:, :] = sfc_dpcm_R
        else:
            sfc_dpcm_R = sfc_dec_R.reshape(NB - 1, 1, order="F")
            sfc_R = np.zeros((NB, 1), dtype=np.int64)
            sfc_R[0, 0] = int(float(G_R))
            sfc_R[1:, :] = sfc_dpcm_R
        if cb_R == 0:
            S_dec_R = np.zeros((1024,), dtype=np.int64)
        else:
            S_tmp_R = aac_decode_huff(mdct_bits_R, cb_R, huff_LUT_list).astype(np.int64, copy=False)
            if S_tmp_R.size < 1024:
                S_dec_R = np.zeros((1024,), dtype=np.int64)
                S_dec_R[: S_tmp_R.size] = S_tmp_R
            else:
                S_dec_R = S_tmp_R[:1024]
        S_R = S_dec_R.reshape(1024, 1)
        Xq_R = aac_i_quantizer(S_R, sfc_R, G_R, frame_type)
        X_R = aac_i_tns(Xq_R, frame_type, tns_R)
        # Re-pack to stereo container and inverse filterbank
        frame_f = aac_unpack_seq_channels_to_frame_f(frame_type, np.asarray(X_L), np.asarray(X_R))
        frame_t_hat: FrameT = aac_i_filter_bank(frame_f, frame_type, win_type)
        start = i * hop
        y_pad[start : start + win, :] += frame_t_hat
    y = aac_remove_padding(y_pad, hop=hop)
    sf.write(str(filename_out), y, 48000)
    return y
--- a/source/level_1/core/aac_filterbank.py
+++ b/source/level_1/core/aac_filterbank.py
@ -14,6 +14,7 @@
 # ------------------------------------------------------------
 from __future__ import annotations
 from core.aac_utils import mdct, imdct
 from core.aac_types import *
 from scipy.signal.windows import kaiser
@ -186,74 +187,6 @@ def _window_sequence(frame_type: FrameType, win_type: WinType) -> Window:
    raise ValueError(f"Invalid frame_type for long window sequence: {frame_type!r}")
 def _mdct(s: TimeSignal) -> MdctCoeffs:
    """
    MDCT (direct form) as specified in the assignment.
    Parameters
    ----------
    s : TimeSignal
        Windowed time samples, 1-D array of length N (N = 2048 or 256).
    Returns
    -------
    MdctCoeffs
        MDCT coefficients, 1-D array of length N/2.
    Definition
    ----------
    X[k] = 2 * sum_{n=0..N-1} s[n] * cos((2*pi/N) * (n + n0) * (k + 1/2)),
    where n0 = (N/2 + 1)/2.
    """
    s = np.asarray(s, dtype=np.float64).reshape(-1)
    N = int(s.shape[0])
    if N not in (2048, 256):
        raise ValueError("MDCT input length must be 2048 or 256.")
    n0 = (N / 2.0 + 1.0) / 2.0
    n = np.arange(N, dtype=np.float64) + n0
    k = np.arange(N // 2, dtype=np.float64) + 0.5
    C = np.cos((2.0 * np.pi / N) * np.outer(n, k))  # (N, N/2)
    X = 2.0 * (s @ C)  # (N/2,)
    return X
 def _imdct(X: MdctCoeffs) -> TimeSignal:
    """
    IMDCT (direct form) as specified in the assignment.
    Parameters
    ----------
    X : MdctCoeffs
        MDCT coefficients, 1-D array of length K (K = 1024 or 128).
    Returns
    -------
    TimeSignal
        Reconstructed time samples, 1-D array of length N = 2K.
    Definition
    ----------
    s[n] = (2/N) * sum_{k=0..N/2-1} X[k] * cos((2*pi/N) * (n + n0) * (k + 1/2)),
    where n0 = (N/2 + 1)/2.
    """
    X = np.asarray(X, dtype=np.float64).reshape(-1)
    K = int(X.shape[0])
    if K not in (1024, 128):
        raise ValueError("IMDCT input length must be 1024 or 128.")
    N = 2 * K
    n0 = (N / 2.0 + 1.0) / 2.0
    n = np.arange(N, dtype=np.float64) + n0
    k = np.arange(K, dtype=np.float64) + 0.5
    C = np.cos((2.0 * np.pi / N) * np.outer(n, k))  # (N, K)
    s = (2.0 / N) * (C @ X)  # (N,)
    return s
 def _filter_bank_esh_channel(x_ch: FrameChannelT, win_type: WinType) -> FrameChannelF:
    """
    ESH analysis for one channel.
@ -279,7 +212,7 @@ def _filter_bank_esh_channel(x_ch: FrameChannelT, win_type: WinType) -> FrameCha
    for j in range(8):
        start = 448 + 128 * j
        seg = x_ch[start:start + 256] * wS  # (256,)
-        X_esh[:, j] = _mdct(seg)           # (128,)
+        X_esh[:, j] = mdct(seg)           # (128,)
    return X_esh
@ -344,7 +277,7 @@ def _i_filter_bank_esh_channel(X_esh: FrameChannelF, win_type: WinType) -> Frame
    # Each short IMDCT returns 256 samples. Place them at:
    # start = 448 + 128*j, j=0..7 (50% overlap)
    for j in range(8):
-        seg = _imdct(X_esh[:, j]) * wS  # (256,)
+        seg = imdct(X_esh[:, j]) * wS  # (256,)
        start = 448 + 128 * j
        out[start:start + 256] += seg
@ -352,7 +285,7 @@ def _i_filter_bank_esh_channel(X_esh: FrameChannelF, win_type: WinType) -> Frame
 # -----------------------------------------------------------------------------
-# Public Function prototypes (Level 1)
+# Public Function prototypes
 # -----------------------------------------------------------------------------
 def aac_filter_bank(frame_T: FrameT, frame_type: FrameType, win_type: WinType) -> FrameF:
@ -385,8 +318,8 @@ def aac_filter_bank(frame_T: FrameT, frame_type: FrameType, win_type: WinType) -
    if frame_type in ("OLS", "LSS", "LPS"):
        w = _window_sequence(frame_type, win_type)  # length 2048
-        XL = _mdct(xL * w)  # length 1024
+        XL = mdct(xL * w)  # length 1024
-        XR = _mdct(xR * w)  # length 1024
+        XR = mdct(xR * w)  # length 1024
        out = np.empty((1024, 2), dtype=np.float64)
        out[:, 0] = XL
        out[:, 1] = XR
@ -430,8 +363,8 @@ def aac_i_filter_bank(frame_F: FrameF, frame_type: FrameType, win_type: WinType)
        w = _window_sequence(frame_type, win_type)
-        xL = _imdct(frame_F[:, 0]) * w
+        xL = imdct(frame_F[:, 0]) * w
-        xR = _imdct(frame_F[:, 1]) * w
+        xR = imdct(frame_F[:, 1]) * w
        out = np.empty((2048, 2), dtype=np.float64)
        out[:, 0] = xL
--- a/source/level_1/core/aac_snr_db.py
+++ b/source/level_1/core/aac_snr_db.py
@ -1,60 +0,0 @@
 # ------------------------------------------------------------
 # AAC Coder/Decoder - SNR dB calculator
 #
 # Multimedia course at Aristotle University of
 # Thessaloniki (AUTh)
 #
 # Author:
 #   Christos Choutouridis (ΑΕΜ 8997)
 #   cchoutou@ece.auth.gr
 #
 # Description:
 #   This module implements SNR calculation in dB
 # ------------------------------------------------------------
 from __future__ import annotations
 from core.aac_types import StereoSignal
 import numpy as np
 def snr_db(x_ref: StereoSignal, x_hat: StereoSignal) -> float:
    """
    Compute overall SNR (dB) over all samples and channels after aligning lengths.
    Parameters
    ----------
    x_ref : StereoSignal
        Reference stereo stream.
    x_hat : StereoSignal
        Reconstructed stereo stream.
    Returns
    -------
    float
        SNR in dB.
        - Returns +inf if noise power is zero.
        - Returns -inf if signal power is zero.
    """
    x_ref = np.asarray(x_ref, dtype=np.float64)
    x_hat = np.asarray(x_hat, dtype=np.float64)
    if x_ref.ndim == 1:
        x_ref = x_ref.reshape(-1, 1)
    if x_hat.ndim == 1:
        x_hat = x_hat.reshape(-1, 1)
    n = min(x_ref.shape[0], x_hat.shape[0])
    c = min(x_ref.shape[1], x_hat.shape[1])
    x_ref = x_ref[:n, :c]
    x_hat = x_hat[:n, :c]
    err = x_ref - x_hat
    ps = float(np.sum(x_ref * x_ref))
    pn = float(np.sum(err * err))
    if pn <= 0.0:
        return float("inf")
    if ps <= 0.0:
        return float("-inf")
    return float(10.0 * np.log10(ps / pn))
--- a/source/level_1/core/aac_ssc.py
+++ b/source/level_1/core/aac_ssc.py
@ -173,10 +173,10 @@ def _stereo_merge(ft_l: FrameType, ft_r: FrameType) -> FrameType:
 # -----------------------------------------------------------------------------
-# Public Function prototypes (Level 1)
+# Public Function prototypes
 # -----------------------------------------------------------------------------
-def aac_SSC(frame_T: FrameT, next_frame_T: FrameT, prev_frame_type: FrameType) -> FrameType:
+def aac_ssc(frame_T: FrameT, next_frame_T: FrameT, prev_frame_type: FrameType) -> FrameType:
    """
    Sequence Segmentation Control (SSC).
--- a/source/level_1/core/aac_types.py
+++ b/source/level_1/core/aac_types.py
@ -193,6 +193,61 @@ Bark-band index ranges [start, end] (inclusive) for MDCT lines.
 Used by TNS to map MDCT indices k to Bark bands.
 """
 BarkTable: TypeAlias = FloatArray
 """
 Psychoacoustic Bark band table loaded from TableB219.mat.
 Typical shapes:
 - Long: (69, 6)
 - Short: (42, 6)
 """
 BandIndexArray: TypeAlias = NDArray[np.int_]
 """
 Array of FFT bin indices per psychoacoustic band.
 """
 BandValueArray: TypeAlias = FloatArray
 """
 Per-band psychoacoustic values (e.g. Bark position, thresholds).
 """
 # Quantizer-related semantic aliases
 QuantizedSymbols: TypeAlias = NDArray[np.generic]
 """
 Quantized MDCT symbols S(k).
 Shapes:
 - Always (1024, 1) at the quantizer output (ESH packed to 1024 symbols).
 """
 ScaleFactors: TypeAlias = NDArray[np.generic]
 """
 DPCM-coded scalefactors sfc(b) = alpha(b) - alpha(b-1).
 Shapes:
 - Long frames: (NB, 1)
 - ESH frames: (NB, 8)
 """
 GlobalGain: TypeAlias = float | NDArray[np.generic]
 """
 Global gain G = alpha(0).
 - Long frames: scalar float
 - ESH frames: array shape (1, 8)
 """
 # Huffman semantic aliases
 HuffmanBitstream: TypeAlias = str
 """Huffman-coded bitstream stored as a string of '0'/'1'."""
 HuffmanCodebook: TypeAlias = int
 """Huffman codebook id (e.g., 0..11)."""
 # -----------------------------------------------------------------------------
 # Level 1 AAC sequence payload types
 # -----------------------------------------------------------------------------
@ -280,3 +335,77 @@ Level 2 adds:
 and stores:
 - per-channel "frame_F" after applying TNS.
 """
 # -----------------------------------------------------------------------------
 # Level 3 AAC sequence payload types (Quantizer + Huffman)
 # -----------------------------------------------------------------------------
 class AACChannelFrameF3(TypedDict):
    """
    Per-channel payload for aac_seq_3[i]["chl"] or ["chr"] (Level 3).
    Keys
    ----
    tns_coeffs:
        Quantized TNS predictor coefficients for ONE channel.
        Shapes:
        - ESH: (PRED_ORDER, 8)
        - else: (PRED_ORDER, 1)
    T:
        Psychoacoustic thresholds per band.
        Shapes:
        - ESH: (NB, 8)
        - else: (NB, 1)
        Note: Stored for completeness / debugging; not entropy-coded.
    G:
        Quantized global gains.
        Shapes:
        - ESH: (1, 8)  (one per short subframe)
        - else: scalar (or compatible np scalar)
    sfc:
        Huffman-coded scalefactor differences (DPCM sequence).
    stream:
        Huffman-coded MDCT quantized symbols S(k) (packed to 1024 symbols).
    codebook:
        Huffman codebook id used for MDCT symbols (stream).
        (Scalefactors typically use fixed codebook 11 and do not need to store it.)
    """
    tns_coeffs: TnsCoeffs
    T: FloatArray
    G: FloatArray | float
    sfc: HuffmanBitstream
    stream: HuffmanBitstream
    codebook: HuffmanCodebook
 class AACSeq3Frame(TypedDict):
    """
    One frame dictionary element of aac_seq_3 (Level 3).
    """
    frame_type: FrameType
    win_type: WinType
    chl: AACChannelFrameF3
    chr: AACChannelFrameF3
 AACSeq3: TypeAlias = List[AACSeq3Frame]
 """
 AAC sequence for Level 3:
 List of length K (K = number of frames).
 Each element is a dict with keys:
 - "frame_type", "win_type", "chl", "chr"
 Level 3 adds (per channel):
 - "tns_coeffs"
 - "T" thresholds (not entropy-coded)
 - "G" global gain(s)
 - "sfc" Huffman-coded scalefactor differences
 - "stream" Huffman-coded MDCT quantized symbols
 - "codebook" Huffman codebook for MDCT symbols
 """
--- a/source/level_1/core/aac_utils.py
+++ b/source/level_1/core/aac_utils.py
@ -0,0 +1,270 @@
 # ------------------------------------------------------------
 # AAC Coder/Decoder - AAC Utilities
 #
 # Multimedia course at Aristotle University of
 # Thessaloniki (AUTh)
 #
 # Author:
 #   Christos Choutouridis (ΑΕΜ 8997)
 #   cchoutou@ece.auth.gr
 #
 # Description:
 #   Shared utility functions used across AAC encoder/decoder levels.
 #
 #   This module currently provides:
 #   - MDCT / IMDCT conversions
 #   - Signal-to-Noise Ratio (SNR) computation in dB
 #   - Loading and access helpers for psychoacoustic band tables
 #     (TableB219.mat, Tables B.2.1.9a / B.2.1.9b of the AAC specification)
 # ------------------------------------------------------------
 from __future__ import annotations
 import numpy as np
 from pathlib import Path
 from scipy.io import loadmat
 from core.aac_types import *
 # -----------------------------------------------------------------------------
 # Global cached data
 # -----------------------------------------------------------------------------
 # Cached contents of TableB219.mat to avoid repeated disk I/O.
 # Keys:
 #   - "B219a": long-window psychoacoustic bands (69 bands, FFT size 2048)
 #   - "B219b": short-window psychoacoustic bands (42 bands, FFT size 256)
 B219_CACHE: dict[str, BarkTable] | None = None
 # -----------------------------------------------------------------------------
 # MDCT / IMDCT
 # -----------------------------------------------------------------------------
 def mdct(s: TimeSignal) -> MdctCoeffs:
    """
    MDCT (direct form) as specified in the assignment.
    Parameters
    ----------
    s : TimeSignal
        Windowed time samples, 1-D array of length N (N = 2048 or 256).
    Returns
    -------
    MdctCoeffs
        MDCT coefficients, 1-D array of length N/2.
    Definition
    ----------
    X[k] = 2 * sum_{n=0..N-1} s[n] * cos((2*pi/N) * (n + n0) * (k + 1/2)),
    where n0 = (N/2 + 1)/2.
    """
    s = np.asarray(s, dtype=np.float64).reshape(-1)
    N = int(s.shape[0])
    if N not in (2048, 256):
        raise ValueError("MDCT input length must be 2048 or 256.")
    n0 = (N / 2.0 + 1.0) / 2.0
    n = np.arange(N, dtype=np.float64) + n0
    k = np.arange(N // 2, dtype=np.float64) + 0.5
    C = np.cos((2.0 * np.pi / N) * np.outer(n, k))  # (N, N/2)
    X = 2.0 * (s @ C)  # (N/2,)
    return X
 def imdct(X: MdctCoeffs) -> TimeSignal:
    """
    IMDCT (direct form) as specified in the assignment.
    Parameters
    ----------
    X : MdctCoeffs
        MDCT coefficients, 1-D array of length K (K = 1024 or 128).
    Returns
    -------
    TimeSignal
        Reconstructed time samples, 1-D array of length N = 2K.
    Definition
    ----------
    s[n] = (2/N) * sum_{k=0..N/2-1} X[k] * cos((2*pi/N) * (n + n0) * (k + 1/2)),
    where n0 = (N/2 + 1)/2.
    """
    X = np.asarray(X, dtype=np.float64).reshape(-1)
    K = int(X.shape[0])
    if K not in (1024, 128):
        raise ValueError("IMDCT input length must be 1024 or 128.")
    N = 2 * K
    n0 = (N / 2.0 + 1.0) / 2.0
    n = np.arange(N, dtype=np.float64) + n0
    k = np.arange(K, dtype=np.float64) + 0.5
    C = np.cos((2.0 * np.pi / N) * np.outer(n, k))  # (N, K)
    s = (2.0 / N) * (C @ X)  # (N,)
    return s
 # -----------------------------------------------------------------------------
 # Signal quality metrics
 # -----------------------------------------------------------------------------
 def snr_db(x_ref: StereoSignal, x_hat: StereoSignal) -> float:
    """
    Compute the overall Signal-to-Noise Ratio (SNR) in dB.
    The SNR is computed over all available samples and channels,
    after conservatively aligning the two signals to their common
    length and channel count.
    Parameters
    ----------
    x_ref : StereoSignal
        Reference (original) signal.
        Typical shape: (N, 2) for stereo.
    x_hat : StereoSignal
        Reconstructed or processed signal.
        Typical shape: (M, 2) for stereo.
    Returns
    -------
    float
        SNR in dB.
        - +inf if the noise power is zero (perfect reconstruction).
        - -inf if the reference signal power is zero.
    """
    x_ref = np.asarray(x_ref, dtype=np.float64)
    x_hat = np.asarray(x_hat, dtype=np.float64)
    # Ensure 2-D shape: (samples, channels)
    if x_ref.ndim == 1:
        x_ref = x_ref.reshape(-1, 1)
    if x_hat.ndim == 1:
        x_hat = x_hat.reshape(-1, 1)
    # Align lengths and channel count conservatively
    n = min(x_ref.shape[0], x_hat.shape[0])
    c = min(x_ref.shape[1], x_hat.shape[1])
    x_ref = x_ref[:n, :c]
    x_hat = x_hat[:n, :c]
    err = x_ref - x_hat
    ps = float(np.sum(x_ref * x_ref))     # signal power
    pn = float(np.sum(err * err))          # noise power
    if pn <= 0.0:
        return float("inf")
    if ps <= 0.0:
        return float("-inf")
    return float(10.0 * np.log10(ps / pn))
 # -----------------------------------------------------------------------------
 # Psychoacoustic band tables (TableB219.mat)
 # -----------------------------------------------------------------------------
 def load_b219_tables() -> dict[str, BarkTable]:
    """
    Load and cache psychoacoustic band tables from TableB219.mat.
    The assignment/project layout assumes that a 'material' directory
    is available in the current working directory when running:
    - tests
    - level_1 / level_2 / level_3 entrypoints
    This function loads the tables once and caches them for subsequent calls.
    Returns
    -------
    dict[str, BarkTable]
        Dictionary with the following entries:
        - "B219a": long-window psychoacoustic table
                   (69 bands, FFT size 2048 / 1024 spectral lines)
        - "B219b": short-window psychoacoustic table
                   (42 bands, FFT size 256 / 128 spectral lines)
    """
    global B219_CACHE
    if B219_CACHE is not None:
        return B219_CACHE
    mat_path = Path("material") / "TableB219.mat"
    if not mat_path.exists():
        raise FileNotFoundError(
            "Could not locate material/TableB219.mat in the current working directory."
        )
    data = loadmat(str(mat_path))
    if "B219a" not in data or "B219b" not in data:
        raise ValueError(
            "TableB219.mat missing required variables 'B219a' and/or 'B219b'."
        )
    B219_CACHE = {
        "B219a": np.asarray(data["B219a"], dtype=np.float64),
        "B219b": np.asarray(data["B219b"], dtype=np.float64),
    }
    return B219_CACHE
 def get_table(frame_type: FrameType) -> tuple[BarkTable, int]:
    """
    Select the appropriate psychoacoustic band table and FFT size
    based on the AAC frame type.
    Parameters
    ----------
    frame_type : FrameType
        AAC frame type ("OLS", "LSS", "ESH", "LPS").
    Returns
    -------
    table : BarkTable
        Psychoacoustic band table:
        - B219a for long frames
        - B219b for ESH short subframes
    N : int
        FFT size corresponding to the table:
        - 2048 for long frames
        - 256 for short frames (ESH)
    """
    tables = load_b219_tables()
    if frame_type == "ESH":
        return tables["B219b"], 256
    return tables["B219a"], 2048
 def band_limits(
    table: BarkTable,
 ) -> tuple[BandIndexArray, BandIndexArray, BandValueArray, BandValueArray]:
    """
    Extract per-band metadata from a TableB2.1.9 psychoacoustic table.
    The column layout follows the provided TableB219.mat file and the
    AAC specification tables B.2.1.9a / B.2.1.9b.
    Parameters
    ----------
    table : BarkTable
        Psychoacoustic band table (B219a or B219b).
    Returns
    -------
    wlow : BandIndexArray
        Lower FFT bin index (inclusive) for each band.
    whigh : BandIndexArray
        Upper FFT bin index (inclusive) for each band.
    bval : BandValueArray
        Bark-scale (or equivalent) band position values.
        Used in the spreading function.
    qthr_db : BandValueArray
        Threshold in quiet for each band, in dB.
    """
    wlow = table[:, 1].astype(int)
    whigh = table[:, 2].astype(int)
    bval = table[:, 4].astype(np.float64)
    qthr_db = table[:, 5].astype(np.float64)
    return wlow, whigh, bval, qthr_db
--- a/source/level_1/level_1.py
+++ b/source/level_1/level_1.py
@ -28,7 +28,7 @@ from core.aac_types   import AACSeq1, StereoSignal
 from core.aac_coder   import aac_coder_1 as core_aac_coder_1
 from core.aac_coder   import aac_read_wav_stereo_48k
 from core.aac_decoder import aac_decoder_1 as core_aac_decoder_1
-from core.aac_snr_db  import snr_db
+from core.aac_utils  import snr_db
 # -----------------------------------------------------------------------------
--- a/source/level_1/material/TableB219.mat
+++ b/source/level_1/material/TableB219.mat
--- a/source/level_1/material/huffCodebooks.mat
+++ b/source/level_1/material/huffCodebooks.mat
--- a/source/level_1/material/huff_utils.py
+++ b/source/level_1/material/huff_utils.py
@ -1,400 +0,0 @@
 import numpy as np
 import scipy.io as sio
 import os
 # ------------------ LOAD LUT ------------------
 def load_LUT(mat_filename=None):
    """
    Loads the list of Huffman Codebooks (LUTs)
    Returns:
        huffLUT : list (index 1..11 used, index 0 unused)
    """
    if mat_filename is None:
        current_dir = os.path.dirname(os.path.abspath(__file__))
        mat_filename = os.path.join(current_dir, "huffCodebooks.mat")
    mat = sio.loadmat(mat_filename)
    huffCodebooks_raw = mat['huffCodebooks'].squeeze()
    huffCodebooks = []
    for i in range(11):
        huffCodebooks.append(np.array(huffCodebooks_raw[i]))
    # Build inverse VLC tables
    invTable = [None] * 11
    for i in range(11):
        h = huffCodebooks[i][:, 2].astype(int)       # column 3
        hlength = huffCodebooks[i][:, 1].astype(int) # column 2
        hbin = []
        for j in range(len(h)):
            hbin.append(format(h[j], f'0{hlength[j]}b'))
        invTable[i] = vlc_table(hbin)
    # Build Huffman LUT dicts
    huffLUT = [None] * 12  # index 0 unused
    params = [
        (4, 1, True),
        (4, 1, True),
        (4, 2, False),
        (4, 2, False),
        (2, 4, True),
        (2, 4, True),
        (2, 7, False),
        (2, 7, False),
        (2, 12, False),
        (2, 12, False),
        (2, 16, False),
    ]
    for i, (nTupleSize, maxAbs, signed) in enumerate(params, start=1):
        huffLUT[i] = {
            'LUT': huffCodebooks[i-1],
            'invTable': invTable[i-1],
            'codebook': i,
            'nTupleSize': nTupleSize,
            'maxAbsCodeVal': maxAbs,
            'signedValues': signed
        }
    return huffLUT
 def vlc_table(code_array):
    """
    codeArray: list of strings, each string is a Huffman codeword (e.g. '0101')
    returns:
        h : NumPy array of shape (num_nodes, 3)
            columns:
              [ next_if_0 , next_if_1 , symbol_index ]
    """
    h = np.zeros((1, 3), dtype=int)
    for code_index, code in enumerate(code_array, start=1):
        word = [int(bit) for bit in code]
        h_index = 0
        for bit in word:
            k = bit
            next_node = h[h_index, k]
            if next_node == 0:
                h = np.vstack([h, [0, 0, 0]])
                new_index = h.shape[0] - 1
                h[h_index, k] = new_index
                h_index = new_index
            else:
                h_index = next_node
        h[h_index, 2] = code_index
    return h
 # ------------------ ENCODE ------------------
 def encode_huff(coeff_sec, huff_LUT_list, force_codebook = None):
    """
    Huffman-encode a sequence of quantized coefficients.
    This function selects the appropriate Huffman codebook based on the
    maximum absolute value of the input coefficients, encodes the coefficients
    into a binary Huffman bitstream, and returns both the bitstream and the
    selected codebook index.
    This is the Python equivalent of the MATLAB `encodeHuff.m` function used
    in audio/image coding (e.g., scale factor band encoding). The input
    coefficient sequence is grouped into fixed-size tuples as defined by
    the chosen Huffman LUT. Zero-padding may be applied internally.
    Parameters
    ----------
    coeff_sec : array_like of int
        1-D array of quantized integer coefficients to encode.
        Typically corresponds to a "section" or scale-factor band.
    huff_LUT_list : list
        List of Huffman lookup-table dictionaries as returned by `loadLUT()`.
        Index 1..11 correspond to valid Huffman codebooks.
        Index 0 is unused.
    Returns
    -------
    huffSec : str
        Huffman-encoded bitstream represented as a string of '0' and '1'
        characters.
    huffCodebook : int
        Index (1..11) of the Huffman codebook used for encoding.
        A value of 0 indicates a special all-zero section.
    """
    if force_codebook is not None:
            return huff_LUT_code_1(huff_LUT_list[force_codebook], coeff_sec)
    maxAbsVal = np.max(np.abs(coeff_sec))
    if maxAbsVal == 0:
        huffCodebook = 0
        huffSec = huff_LUT_code_0()
    elif maxAbsVal == 1:
        candidates = [1, 2]
        huffSec1 = huff_LUT_code_1(huff_LUT_list[candidates[0]], coeff_sec)
        huffSec2 = huff_LUT_code_1(huff_LUT_list[candidates[1]], coeff_sec)
        if len(huffSec1) <= len(huffSec2):
            huffSec = huffSec1
            huffCodebook = candidates[0]
        else:
            huffSec = huffSec2
            huffCodebook = candidates[1]
    elif maxAbsVal == 2:
        candidates = [3, 4]
        huffSec1 = huff_LUT_code_1(huff_LUT_list[candidates[0]], coeff_sec)
        huffSec2 = huff_LUT_code_1(huff_LUT_list[candidates[1]], coeff_sec)
        if len(huffSec1) <= len(huffSec2):
            huffSec = huffSec1
            huffCodebook = candidates[0]
        else:
            huffSec = huffSec2
            huffCodebook = candidates[1]
    elif maxAbsVal in (3, 4):
        candidates = [5, 6]
        huffSec1 = huff_LUT_code_1(huff_LUT_list[candidates[0]], coeff_sec)
        huffSec2 = huff_LUT_code_1(huff_LUT_list[candidates[1]], coeff_sec)
        if len(huffSec1) <= len(huffSec2):
            huffSec = huffSec1
            huffCodebook = candidates[0]
        else:
            huffSec = huffSec2
            huffCodebook = candidates[1]
    elif maxAbsVal in (5, 6, 7):
        candidates = [7, 8]
        huffSec1 = huff_LUT_code_1(huff_LUT_list[candidates[0]], coeff_sec)
        huffSec2 = huff_LUT_code_1(huff_LUT_list[candidates[1]], coeff_sec)
        if len(huffSec1) <= len(huffSec2):
            huffSec = huffSec1
            huffCodebook = candidates[0]
        else:
            huffSec = huffSec2
            huffCodebook = candidates[1]
    elif maxAbsVal in (8, 9, 10, 11, 12):
        candidates = [9, 10]
        huffSec1 = huff_LUT_code_1(huff_LUT_list[candidates[0]], coeff_sec)
        huffSec2 = huff_LUT_code_1(huff_LUT_list[candidates[1]], coeff_sec)
        if len(huffSec1) <= len(huffSec2):
            huffSec = huffSec1
            huffCodebook = candidates[0]
        else:
            huffSec = huffSec2
            huffCodebook = candidates[1]
    elif maxAbsVal in (13, 14, 15):
        huffCodebook = 11
        huffSec = huff_LUT_code_1(huff_LUT_list[huffCodebook], coeff_sec)
    else:
        huffCodebook = 11
        huffSec = huff_LUT_code_ESC(huff_LUT_list[huffCodebook], coeff_sec)
    return huffSec, huffCodebook
 def huff_LUT_code_1(huff_LUT, coeff_sec):
    LUT = huff_LUT['LUT']
    nTupleSize = huff_LUT['nTupleSize']
    maxAbsCodeVal = huff_LUT['maxAbsCodeVal']
    signedValues = huff_LUT['signedValues']
    numTuples = int(np.ceil(len(coeff_sec) / nTupleSize))
    if signedValues:
        coeff = coeff_sec + maxAbsCodeVal
        base = 2 * maxAbsCodeVal + 1
    else:
        coeff = coeff_sec
        base = maxAbsCodeVal + 1
    coeffPad = np.zeros(numTuples * nTupleSize, dtype=int)
    coeffPad[:len(coeff)] = coeff
    huffSec = []
    powers = base ** np.arange(nTupleSize - 1, -1, -1)
    for i in range(numTuples):
        nTuple = coeffPad[i*nTupleSize:(i+1)*nTupleSize]
        huffIndex = int(np.abs(nTuple) @ powers)
        hexVal = LUT[huffIndex, 2]
        huffLen = LUT[huffIndex, 1]
        bits = format(int(hexVal), f'0{int(huffLen)}b')
        if signedValues:
            huffSec.append(bits)
        else:
            signBits = ''.join('1' if v < 0 else '0' for v in nTuple)
            huffSec.append(bits + signBits)
    return ''.join(huffSec)
 def huff_LUT_code_0():
    return ''
 def huff_LUT_code_ESC(huff_LUT, coeff_sec):
    LUT = huff_LUT['LUT']
    nTupleSize = huff_LUT['nTupleSize']
    maxAbsCodeVal = huff_LUT['maxAbsCodeVal']
    numTuples = int(np.ceil(len(coeff_sec) / nTupleSize))
    base = maxAbsCodeVal + 1
    coeffPad = np.zeros(numTuples * nTupleSize, dtype=int)
    coeffPad[:len(coeff_sec)] = coeff_sec
    huffSec = []
    powers = base ** np.arange(nTupleSize - 1, -1, -1)
    for i in range(numTuples):
        nTuple = coeffPad[i*nTupleSize:(i+1)*nTupleSize]
        lnTuple = nTuple.astype(float)
        lnTuple[lnTuple == 0] = np.finfo(float).eps
        N4 = np.maximum(0, np.floor(np.log2(np.abs(lnTuple))).astype(int))
        N = np.maximum(0, N4 - 4)
        esc = np.abs(nTuple) > 15
        nTupleESC = nTuple.copy()
        nTupleESC[esc] = np.sign(nTupleESC[esc]) * 16
        huffIndex = int(np.abs(nTupleESC) @ powers)
        hexVal = LUT[huffIndex, 2]
        huffLen = LUT[huffIndex, 1]
        bits = format(int(hexVal), f'0{int(huffLen)}b')
        escSeq = ''
        for k in range(nTupleSize):
            if esc[k]:
                escSeq += '1' * N[k]
                escSeq += '0'
                escSeq += format(abs(nTuple[k]) - (1 << N4[k]), f'0{N4[k]}b')
        signBits = ''.join('1' if v < 0 else '0' for v in nTuple)
        huffSec.append(bits + signBits + escSeq)
    return ''.join(huffSec)
 # ------------------ DECODE ------------------
 def decode_huff(huff_sec, huff_LUT):
    """
    Decode a Huffman-encoded stream.
    Parameters
    ----------
    huff_sec : array-like of int or str
        Huffman encoded stream as a sequence of 0 and 1 (string or list/array).
    huff_LUT : dict
        Huffman lookup table with keys:
            - 'invTable': inverse table (numpy array)
            - 'codebook': codebook number
            - 'nTupleSize': tuple size
            - 'maxAbsCodeVal': maximum absolute code value
            - 'signedValues': True/False
    Returns
    -------
    decCoeffs : list of int
        Decoded quantized coefficients.
    """
    h = huff_LUT['invTable']
    huffCodebook = huff_LUT['codebook']
    nTupleSize = huff_LUT['nTupleSize']
    maxAbsCodeVal = huff_LUT['maxAbsCodeVal']
    signedValues = huff_LUT['signedValues']
    # Convert string to array of ints
    if isinstance(huff_sec, str):
        huff_sec = np.array([int(b) for b in huff_sec])
    eos = False
    decCoeffs = []
    streamIndex = 0
    while not eos:
        wordbit = 0
        r = 0  # start at root
        # Decode Huffman word using inverse table
        while True:
            b = huff_sec[streamIndex + wordbit]
            wordbit += 1
            rOld = r
            r = h[rOld, b]
            if h[r, 0] == 0 and h[r, 1] == 0:
                symbolIndex = h[r, 2] - 1  # zero-based
                streamIndex += wordbit
                break
        # Decode n-tuple magnitudes
        if signedValues:
            base = 2 * maxAbsCodeVal + 1
            nTupleDec = []
            tmp = symbolIndex
            for p in reversed(range(nTupleSize)):
                val = tmp // (base ** p)
                nTupleDec.append(val - maxAbsCodeVal)
                tmp = tmp % (base ** p)
            nTupleDec = np.array(nTupleDec)
        else:
            base = maxAbsCodeVal + 1
            nTupleDec = []
            tmp = symbolIndex
            for p in reversed(range(nTupleSize)):
                val = tmp // (base ** p)
                nTupleDec.append(val)
                tmp = tmp % (base ** p)
            nTupleDec = np.array(nTupleDec)
            # Apply sign bits
            nTupleSignBits = huff_sec[streamIndex:streamIndex + nTupleSize]
            nTupleSign = -(np.sign(nTupleSignBits - 0.5))
            streamIndex += nTupleSize
            nTupleDec = nTupleDec * nTupleSign
        # Handle escape sequences
        escIndex = np.where(np.abs(nTupleDec) == 16)[0]
        if huffCodebook == 11 and escIndex.size > 0:
            for idx in escIndex:
                N = 0
                b = huff_sec[streamIndex]
                while b:
                    N += 1
                    b = huff_sec[streamIndex + N]
                streamIndex += N
                N4 = N + 4
                escape_word = huff_sec[streamIndex:streamIndex + N4]
                escape_value = 2 ** N4 + int("".join(map(str, escape_word)), 2)
                nTupleDec[idx] = escape_value
                streamIndex += N4 + 1
            # Apply signs again
            nTupleDec[escIndex] *= nTupleSign[escIndex]
        decCoeffs.extend(nTupleDec.tolist())
        if streamIndex >= len(huff_sec):
            eos = True
    return decCoeffs
--- a/source/level_2/core/aac_coder.py
+++ b/source/level_2/core/aac_coder.py
@ -26,14 +26,106 @@ from pathlib import Path
 from typing import Union
 import soundfile as sf
 from scipy.io import savemat
 from core.aac_configuration import WIN_TYPE
 from core.aac_filterbank import aac_filter_bank
-from core.aac_ssc import aac_SSC
+from core.aac_ssc import aac_ssc
 from core.aac_tns import aac_tns
 from core.aac_psycho import aac_psycho
 from core.aac_quantizer import aac_quantizer  # assumes your quantizer file is core/aac_quantizer.py
 from core.aac_huffman import aac_encode_huff
 from core.aac_utils import get_table, band_limits
 from material.huff_utils import load_LUT
 from core.aac_types import *
 # -----------------------------------------------------------------------------
 # Helpers for thresholds (T(b))
 # -----------------------------------------------------------------------------
 def _band_slices_from_table(frame_type: FrameType) -> list[tuple[int, int]]:
    """
    Return inclusive (lo, hi) band slices derived from TableB219.
    """
    table, _ = get_table(frame_type)
    wlow, whigh, _bval, _qthr_db = band_limits(table)
    return [(int(lo), int(hi)) for lo, hi in zip(wlow, whigh)]
 def _thresholds_from_smr(
    frame_F_ch: FrameChannelF,
    frame_type: FrameType,
    SMR: FloatArray,
 ) -> FloatArray:
    """
    Compute thresholds T(b) = P(b) / SMR(b), where P(b) is band energy.
    Shapes:
    - Long: returns (NB, 1)
    - ESH: returns (NB, 8)
    """
    bands = _band_slices_from_table(frame_type)
    NB = len(bands)
    X = np.asarray(frame_F_ch, dtype=np.float64)
    SMR = np.asarray(SMR, dtype=np.float64)
    if frame_type == "ESH":
        if X.shape != (128, 8):
            raise ValueError("For ESH, frame_F_ch must have shape (128, 8).")
        if SMR.shape != (NB, 8):
            raise ValueError(f"For ESH, SMR must have shape ({NB}, 8).")
        T = np.zeros((NB, 8), dtype=np.float64)
        for j in range(8):
            Xj = X[:, j]
            for b, (lo, hi) in enumerate(bands):
                P = float(np.sum(Xj[lo : hi + 1] ** 2))
                smr = float(SMR[b, j])
                T[b, j] = 0.0 if smr <= 1e-12 else (P / smr)
        return T
    # Long
    if X.shape == (1024,):
        Xv = X
    elif X.shape == (1024, 1):
        Xv = X[:, 0]
    else:
        raise ValueError("For non-ESH, frame_F_ch must be shape (1024,) or (1024, 1).")
    if SMR.shape == (NB,):
        SMRv = SMR
    elif SMR.shape == (NB, 1):
        SMRv = SMR[:, 0]
    else:
        raise ValueError(f"For non-ESH, SMR must be shape ({NB},) or ({NB}, 1).")
    T = np.zeros((NB, 1), dtype=np.float64)
    for b, (lo, hi) in enumerate(bands):
        P = float(np.sum(Xv[lo : hi + 1] ** 2))
        smr = float(SMRv[b])
        T[b, 0] = 0.0 if smr <= 1e-12 else (P / smr)
    return T
 def _normalize_global_gain(G: GlobalGain) -> float | FloatArray:
    """
    Normalize GlobalGain to match AACChannelFrameF3["G"] type:
    - long: return float
    - ESH: return float64 ndarray of shape (1, 8)
    """
    if np.isscalar(G):
        return float(G)
    G_arr = np.asarray(G)
    if G_arr.size == 1:
        return float(G_arr.reshape(-1)[0])
    return np.asarray(G_arr, dtype=np.float64)
 # -----------------------------------------------------------------------------
 # Public helpers (useful for level_x demo wrappers)
 # -----------------------------------------------------------------------------
@ -182,7 +274,7 @@ def aac_coder_1(filename_in: Union[str, Path]) -> AACSeq1:
            tail = np.zeros((win - next_t.shape[0], 2), dtype=np.float64)
            next_t = np.vstack([next_t, tail])
-        frame_type = aac_SSC(frame_t, next_t, prev_frame_type)
+        frame_type = aac_ssc(frame_t, next_t, prev_frame_type)
        frame_f = aac_filter_bank(frame_t, frame_type, win_type)
        chl_f, chr_f = aac_pack_frame_f_to_seq_channels(frame_type, frame_f)
@ -250,7 +342,7 @@ def aac_coder_2(filename_in: Union[str, Path]) -> AACSeq2:
            tail = np.zeros((win - next_t.shape[0], 2), dtype=np.float64)
            next_t = np.vstack([next_t, tail])
-        frame_type = aac_SSC(frame_t, next_t, prev_frame_type)
+        frame_type = aac_ssc(frame_t, next_t, prev_frame_type)
        # Level 1 analysis (packed stereo container)
        frame_f_stereo = aac_filter_bank(frame_t, frame_type, WIN_TYPE)
@ -282,3 +374,180 @@ def aac_coder_2(filename_in: Union[str, Path]) -> AACSeq2:
        prev_frame_type = frame_type
    return aac_seq
 def aac_coder_3(
    filename_in: Union[str, Path],
    filename_aac_coded: Union[str, Path] | None = None,
 ) -> AACSeq3:
    """
    Level-3 AAC encoder (Level 2 + Psycho + Quantizer + Huffman).
    Parameters
    ----------
    filename_in : Union[str, Path]
        Input WAV filename (stereo, 48 kHz).
    filename_aac_coded : Union[str, Path] | None
        Optional .mat filename to store aac_seq_3 (assignment convenience).
    Returns
    -------
    AACSeq3
        Encoded AAC sequence (Level 3 payload schema).
    """
    filename_in = Path(filename_in)
    x, _ = aac_read_wav_stereo_48k(filename_in)
    hop = 1024
    win = 2048
    pad_pre = np.zeros((hop, 2), dtype=np.float64)
    pad_post = np.zeros((hop, 2), dtype=np.float64)
    x_pad = np.vstack([pad_pre, x, pad_post])
    K = int((x_pad.shape[0] - win) // hop + 1)
    if K <= 0:
        raise ValueError("Input too short for framing.")
    # Load Huffman LUTs once.
    huff_LUT_list = load_LUT()
    aac_seq: AACSeq3 = []
    prev_frame_type: FrameType = "OLS"
    # Pin win_type to the WinType literal for type checkers.
    win_type: WinType = WIN_TYPE
    # Psycho model needs per-channel history (prev1, prev2) of 2048-sample frames.
    prev1_L = np.zeros((2048,), dtype=np.float64)
    prev2_L = np.zeros((2048,), dtype=np.float64)
    prev1_R = np.zeros((2048,), dtype=np.float64)
    prev2_R = np.zeros((2048,), dtype=np.float64)
    for i in range(K):
        start = i * hop
        frame_t: FrameT = x_pad[start : start + win, :]
        if frame_t.shape != (win, 2):
            raise ValueError("Internal framing error: frame_t has wrong shape.")
        next_t = x_pad[start + hop : start + hop + win, :]
        if next_t.shape[0] < win:
            tail = np.zeros((win - next_t.shape[0], 2), dtype=np.float64)
            next_t = np.vstack([next_t, tail])
        frame_type = aac_ssc(frame_t, next_t, prev_frame_type)
        # Analysis filterbank (stereo packed)
        frame_f_stereo = aac_filter_bank(frame_t, frame_type, win_type)
        chl_f, chr_f = aac_pack_frame_f_to_seq_channels(frame_type, frame_f_stereo)
        # TNS per channel
        chl_f_tns, chl_tns_coeffs = aac_tns(chl_f, frame_type)
        chr_f_tns, chr_tns_coeffs = aac_tns(chr_f, frame_type)
        # Psychoacoustic model per channel (time-domain)
        frame_L = np.asarray(frame_t[:, 0], dtype=np.float64)
        frame_R = np.asarray(frame_t[:, 1], dtype=np.float64)
        SMR_L = aac_psycho(frame_L, frame_type, prev1_L, prev2_L)
        SMR_R = aac_psycho(frame_R, frame_type, prev1_R, prev2_R)
        # Thresholds T(b) (stored, not entropy-coded)
        T_L = _thresholds_from_smr(chl_f_tns, frame_type, SMR_L)
        T_R = _thresholds_from_smr(chr_f_tns, frame_type, SMR_R)
        # Quantizer per channel
        S_L, sfc_L, G_L = aac_quantizer(chl_f_tns, frame_type, SMR_L)
        S_R, sfc_R, G_R = aac_quantizer(chr_f_tns, frame_type, SMR_R)
        # Normalize G types for AACSeq3 schema (float | float64 ndarray).
        G_Ln = _normalize_global_gain(G_L)
        G_Rn = _normalize_global_gain(G_R)
        # Huffman-code ONLY the DPCM differences for b>0.
        # sfc[0] corresponds to alpha(0)=G and is stored separately in the frame.
        sfc_L_dpcm = np.asarray(sfc_L, dtype=np.int64)[1:, ...]
        sfc_R_dpcm = np.asarray(sfc_R, dtype=np.int64)[1:, ...]
        # Codebook 11:
        # maxAbsCodeVal = 16 is RESERVED for ESCAPE.
        # We must stay strictly within [-15, +15] to avoid escape decoding.
        sf_cb = 11
        sf_max_abs = int(huff_LUT_list[sf_cb]["maxAbsCodeVal"]) - 1  # -> 15
        sfc_L_dpcm = np.clip(
            sfc_L_dpcm,
            -sf_max_abs,
            sf_max_abs,
        ).astype(np.int64, copy=False)
        sfc_R_dpcm = np.clip(
            sfc_R_dpcm,
            -sf_max_abs,
            sf_max_abs,
        ).astype(np.int64, copy=False)
        sfc_L_stream, _ = aac_encode_huff(
            sfc_L_dpcm.reshape(-1, order="F"),
            huff_LUT_list,
            force_codebook=sf_cb,
        )
        sfc_R_stream, _ = aac_encode_huff(
            sfc_R_dpcm.reshape(-1, order="F"),
            huff_LUT_list,
            force_codebook=sf_cb,
        )
        mdct_L_stream, cb_L = aac_encode_huff(
            np.asarray(S_L, dtype=np.int64).reshape(-1),
            huff_LUT_list,
        )
        mdct_R_stream, cb_R = aac_encode_huff(
            np.asarray(S_R, dtype=np.int64).reshape(-1),
            huff_LUT_list,
        )
        # Typed dict construction helps static analyzers validate the schema.
        frame_out: AACSeq3Frame = {
            "frame_type": frame_type,
            "win_type": win_type,
            "chl": {
                "tns_coeffs": np.asarray(chl_tns_coeffs, dtype=np.float64),
                "T": np.asarray(T_L, dtype=np.float64),
                "G": G_Ln,
                "sfc": sfc_L_stream,
                "stream": mdct_L_stream,
                "codebook": int(cb_L),
            },
            "chr": {
                "tns_coeffs": np.asarray(chr_tns_coeffs, dtype=np.float64),
                "T": np.asarray(T_R, dtype=np.float64),
                "G": G_Rn,
                "sfc": sfc_R_stream,
                "stream": mdct_R_stream,
                "codebook": int(cb_R),
            },
        }
        aac_seq.append(frame_out)
        # Update psycho history (shift register)
        prev2_L = prev1_L
        prev1_L = frame_L
        prev2_R = prev1_R
        prev1_R = frame_R
        prev_frame_type = frame_type
    # Optional: store to .mat for the assignment wrapper
    if filename_aac_coded is not None:
        filename_aac_coded = Path(filename_aac_coded)
        savemat(
            str(filename_aac_coded),
            {"aac_seq_3": np.array(aac_seq, dtype=object)},
            do_compression=True,
        )
    return aac_seq
--- a/source/level_2/core/aac_configuration.py
+++ b/source/level_2/core/aac_configuration.py
@ -15,6 +15,8 @@
 from __future__ import annotations
 # Imports
 from typing import Final
 from core.aac_types import WinType
 # Filterbank
@ -29,3 +31,11 @@ WIN_TYPE: WinType = "SIN"
 PRED_ORDER = 4
 QUANT_STEP = 0.1
 QUANT_MAX = 0.7  # 4-bit symmetric with step 0.1 -> clamp to [-0.7, +0.7]
 # -----------------------------------------------------------------------------
 # Psycho
 # -----------------------------------------------------------------------------
 NMT_DB: Final[float] = 6.0   # Noise Masking Tone (dB)
 TMN_DB: Final[float] = 18.0  # Tone Masking Noise (dB)
--- a/source/level_2/core/aac_decoder.py
+++ b/source/level_2/core/aac_decoder.py
@ -9,16 +9,9 @@
 #   cchoutou@ece.auth.gr
 #
 # Description:
-#   Level 1 AAC decoder orchestration (inverse of aac_coder_1()).
+#   - Level 1 AAC decoder orchestration (inverse of aac_coder_1()).
-#   Keeps the same functional behavior as the original level_1 implementation:
+#   - Level 2 AAC decoder orchestration (inverse of aac_coder_1()).
 #   - Re-pack per-channel spectra into FrameF expected by aac_i_filter_bank()
 #   - IMDCT synthesis per frame
 #   - Overlap-add with hop=1024
 #   - Remove encoder boundary padding: hop at start and hop at end
 #
 #   Note:
 #   This core module returns the reconstructed samples. Writing to disk is kept
 #   in level_x demos.
 # ------------------------------------------------------------
 from __future__ import annotations
@ -29,11 +22,24 @@ import soundfile as sf
 from core.aac_filterbank import aac_i_filter_bank
 from core.aac_tns import aac_i_tns
 from core.aac_quantizer import aac_i_quantizer
 from core.aac_huffman import aac_decode_huff
 from core.aac_utils import get_table, band_limits
 from material.huff_utils import load_LUT
 from core.aac_types import *
 # -----------------------------------------------------------------------------
-# Public helpers (useful for level_x demo wrappers)
+# Helper for NB
 # -----------------------------------------------------------------------------
 def _nbands(frame_type: FrameType) -> int:
    table, _ = get_table(frame_type)
    wlow, _whigh, _bval, _qthr_db = band_limits(table)
    return int(len(wlow))
 # -----------------------------------------------------------------------------
 # Public helpers
 # -----------------------------------------------------------------------------
 def aac_unpack_seq_channels_to_frame_f(frame_type: FrameType, chl_f: FrameChannelF, chr_f: FrameChannelF) -> FrameF:
@ -109,7 +115,7 @@ def aac_remove_padding(y_pad: StereoSignal, hop: int = 1024) -> StereoSignal:
 # -----------------------------------------------------------------------------
-# Level 1 decoder (core)
+# Level 1 decoder
 # -----------------------------------------------------------------------------
 def aac_decoder_1(aac_seq_1: AACSeq1, filename_out: Union[str, Path]) -> StereoSignal:
@ -167,6 +173,10 @@ def aac_decoder_1(aac_seq_1: AACSeq1, filename_out: Union[str, Path]) -> StereoS
    return y
 # -----------------------------------------------------------------------------
 # Level 2 decoder
 # -----------------------------------------------------------------------------
 def aac_decoder_2(aac_seq_2: AACSeq2, filename_out: Union[str, Path]) -> StereoSignal:
    """
    Level-2 AAC decoder (inverse of aac_coder_2).
@ -255,3 +265,144 @@ def aac_decoder_2(aac_seq_2: AACSeq2, filename_out: Union[str, Path]) -> StereoS
    sf.write(str(filename_out), y, 48000)
    return y
 def aac_decoder_3(aac_seq_3: AACSeq3, filename_out: Union[str, Path]) -> StereoSignal:
    """
    Level-3 AAC decoder (inverse of aac_coder_3).
    Steps per frame:
    - Huffman decode scalefactors (sfc) using codebook 11
    - Huffman decode MDCT symbols (stream) using stored codebook
    - iQuantizer -> MDCT coefficients after TNS
    - iTNS using stored predictor coefficients
    - IMDCT filterbank -> time domain
    - Overlap-add, remove padding, write WAV
    Parameters
    ----------
    aac_seq_3 : AACSeq3
        Encoded sequence as produced by aac_coder_3.
    filename_out : Union[str, Path]
        Output WAV filename.
    Returns
    -------
    StereoSignal
        Decoded audio samples (time-domain), stereo, shape (N, 2), dtype float64.
    """
    filename_out = Path(filename_out)
    hop = 1024
    win = 2048
    K = len(aac_seq_3)
    if K <= 0:
        raise ValueError("aac_seq_3 must contain at least one frame.")
    # Load Huffman LUTs once.
    huff_LUT_list = load_LUT()
    n_pad = (K - 1) * hop + win
    y_pad = np.zeros((n_pad, 2), dtype=np.float64)
    for i, fr in enumerate(aac_seq_3):
        frame_type: FrameType = fr["frame_type"]
        win_type: WinType = fr["win_type"]
        NB = _nbands(frame_type)
        # We store G separately, so Huffman stream contains only (NB-1) DPCM differences.
        sfc_len = (NB - 1) * (8 if frame_type == "ESH" else 1)
        # -------------------------
        # Left channel
        # -------------------------
        tns_L = np.asarray(fr["chl"]["tns_coeffs"], dtype=np.float64)
        G_L = fr["chl"]["G"]
        sfc_bits_L = fr["chl"]["sfc"]
        mdct_bits_L = fr["chl"]["stream"]
        cb_L = int(fr["chl"]["codebook"])
        sfc_dec_L = aac_decode_huff(sfc_bits_L, 11, huff_LUT_list)[:sfc_len].astype(np.int64, copy=False)
        if frame_type == "ESH":
            sfc_dpcm_L = sfc_dec_L.reshape(NB - 1, 8, order="F")
            sfc_L = np.zeros((NB, 8), dtype=np.int64)
            Gv = np.asarray(G_L, dtype=np.float64).reshape(1, 8)
            sfc_L[0, :] = Gv[0, :].astype(np.int64)
            sfc_L[1:, :] = sfc_dpcm_L
        else:
            sfc_dpcm_L = sfc_dec_L.reshape(NB - 1, 1, order="F")
            sfc_L = np.zeros((NB, 1), dtype=np.int64)
            sfc_L[0, 0] = int(float(G_L))
            sfc_L[1:, :] = sfc_dpcm_L
        # MDCT symbols: codebook 0 means "all-zero section"
        if cb_L == 0:
            S_dec_L = np.zeros((1024,), dtype=np.int64)
        else:
            S_tmp_L = aac_decode_huff(mdct_bits_L, cb_L, huff_LUT_list).astype(np.int64, copy=False)
            # Tuple coding may produce extra trailing symbols; caller knows the true length (1024).
            # Also guard against short outputs by zero-padding.
            if S_tmp_L.size < 1024:
                S_dec_L = np.zeros((1024,), dtype=np.int64)
                S_dec_L[: S_tmp_L.size] = S_tmp_L
            else:
                S_dec_L = S_tmp_L[:1024]
        S_L = S_dec_L.reshape(1024, 1)
        Xq_L = aac_i_quantizer(S_L, sfc_L, G_L, frame_type)
        X_L = aac_i_tns(Xq_L, frame_type, tns_L)
        # -------------------------
        # Right channel
        # -------------------------
        tns_R = np.asarray(fr["chr"]["tns_coeffs"], dtype=np.float64)
        G_R = fr["chr"]["G"]
        sfc_bits_R = fr["chr"]["sfc"]
        mdct_bits_R = fr["chr"]["stream"]
        cb_R = int(fr["chr"]["codebook"])
        sfc_dec_R = aac_decode_huff(sfc_bits_R, 11, huff_LUT_list)[:sfc_len].astype(np.int64, copy=False)
        if frame_type == "ESH":
            sfc_dpcm_R = sfc_dec_R.reshape(NB - 1, 8, order="F")
            sfc_R = np.zeros((NB, 8), dtype=np.int64)
            Gv = np.asarray(G_R, dtype=np.float64).reshape(1, 8)
            sfc_R[0, :] = Gv[0, :].astype(np.int64)
            sfc_R[1:, :] = sfc_dpcm_R
        else:
            sfc_dpcm_R = sfc_dec_R.reshape(NB - 1, 1, order="F")
            sfc_R = np.zeros((NB, 1), dtype=np.int64)
            sfc_R[0, 0] = int(float(G_R))
            sfc_R[1:, :] = sfc_dpcm_R
        if cb_R == 0:
            S_dec_R = np.zeros((1024,), dtype=np.int64)
        else:
            S_tmp_R = aac_decode_huff(mdct_bits_R, cb_R, huff_LUT_list).astype(np.int64, copy=False)
            if S_tmp_R.size < 1024:
                S_dec_R = np.zeros((1024,), dtype=np.int64)
                S_dec_R[: S_tmp_R.size] = S_tmp_R
            else:
                S_dec_R = S_tmp_R[:1024]
        S_R = S_dec_R.reshape(1024, 1)
        Xq_R = aac_i_quantizer(S_R, sfc_R, G_R, frame_type)
        X_R = aac_i_tns(Xq_R, frame_type, tns_R)
        # Re-pack to stereo container and inverse filterbank
        frame_f = aac_unpack_seq_channels_to_frame_f(frame_type, np.asarray(X_L), np.asarray(X_R))
        frame_t_hat: FrameT = aac_i_filter_bank(frame_f, frame_type, win_type)
        start = i * hop
        y_pad[start : start + win, :] += frame_t_hat
    y = aac_remove_padding(y_pad, hop=hop)
    sf.write(str(filename_out), y, 48000)
    return y
--- a/source/level_2/core/aac_filterbank.py
+++ b/source/level_2/core/aac_filterbank.py
@ -14,6 +14,7 @@
 # ------------------------------------------------------------
 from __future__ import annotations
 from core.aac_utils import mdct, imdct
 from core.aac_types import *
 from scipy.signal.windows import kaiser
@ -186,74 +187,6 @@ def _window_sequence(frame_type: FrameType, win_type: WinType) -> Window:
    raise ValueError(f"Invalid frame_type for long window sequence: {frame_type!r}")
 def _mdct(s: TimeSignal) -> MdctCoeffs:
    """
    MDCT (direct form) as specified in the assignment.
    Parameters
    ----------
    s : TimeSignal
        Windowed time samples, 1-D array of length N (N = 2048 or 256).
    Returns
    -------
    MdctCoeffs
        MDCT coefficients, 1-D array of length N/2.
    Definition
    ----------
    X[k] = 2 * sum_{n=0..N-1} s[n] * cos((2*pi/N) * (n + n0) * (k + 1/2)),
    where n0 = (N/2 + 1)/2.
    """
    s = np.asarray(s, dtype=np.float64).reshape(-1)
    N = int(s.shape[0])
    if N not in (2048, 256):
        raise ValueError("MDCT input length must be 2048 or 256.")
    n0 = (N / 2.0 + 1.0) / 2.0
    n = np.arange(N, dtype=np.float64) + n0
    k = np.arange(N // 2, dtype=np.float64) + 0.5
    C = np.cos((2.0 * np.pi / N) * np.outer(n, k))  # (N, N/2)
    X = 2.0 * (s @ C)  # (N/2,)
    return X
 def _imdct(X: MdctCoeffs) -> TimeSignal:
    """
    IMDCT (direct form) as specified in the assignment.
    Parameters
    ----------
    X : MdctCoeffs
        MDCT coefficients, 1-D array of length K (K = 1024 or 128).
    Returns
    -------
    TimeSignal
        Reconstructed time samples, 1-D array of length N = 2K.
    Definition
    ----------
    s[n] = (2/N) * sum_{k=0..N/2-1} X[k] * cos((2*pi/N) * (n + n0) * (k + 1/2)),
    where n0 = (N/2 + 1)/2.
    """
    X = np.asarray(X, dtype=np.float64).reshape(-1)
    K = int(X.shape[0])
    if K not in (1024, 128):
        raise ValueError("IMDCT input length must be 1024 or 128.")
    N = 2 * K
    n0 = (N / 2.0 + 1.0) / 2.0
    n = np.arange(N, dtype=np.float64) + n0
    k = np.arange(K, dtype=np.float64) + 0.5
    C = np.cos((2.0 * np.pi / N) * np.outer(n, k))  # (N, K)
    s = (2.0 / N) * (C @ X)  # (N,)
    return s
 def _filter_bank_esh_channel(x_ch: FrameChannelT, win_type: WinType) -> FrameChannelF:
    """
    ESH analysis for one channel.
@ -279,7 +212,7 @@ def _filter_bank_esh_channel(x_ch: FrameChannelT, win_type: WinType) -> FrameCha
    for j in range(8):
        start = 448 + 128 * j
        seg = x_ch[start:start + 256] * wS  # (256,)
-        X_esh[:, j] = _mdct(seg)           # (128,)
+        X_esh[:, j] = mdct(seg)           # (128,)
    return X_esh
@ -344,7 +277,7 @@ def _i_filter_bank_esh_channel(X_esh: FrameChannelF, win_type: WinType) -> Frame
    # Each short IMDCT returns 256 samples. Place them at:
    # start = 448 + 128*j, j=0..7 (50% overlap)
    for j in range(8):
-        seg = _imdct(X_esh[:, j]) * wS  # (256,)
+        seg = imdct(X_esh[:, j]) * wS  # (256,)
        start = 448 + 128 * j
        out[start:start + 256] += seg
@ -352,7 +285,7 @@ def _i_filter_bank_esh_channel(X_esh: FrameChannelF, win_type: WinType) -> Frame
 # -----------------------------------------------------------------------------
-# Public Function prototypes (Level 1)
+# Public Function prototypes
 # -----------------------------------------------------------------------------
 def aac_filter_bank(frame_T: FrameT, frame_type: FrameType, win_type: WinType) -> FrameF:
@ -385,8 +318,8 @@ def aac_filter_bank(frame_T: FrameT, frame_type: FrameType, win_type: WinType) -
    if frame_type in ("OLS", "LSS", "LPS"):
        w = _window_sequence(frame_type, win_type)  # length 2048
-        XL = _mdct(xL * w)  # length 1024
+        XL = mdct(xL * w)  # length 1024
-        XR = _mdct(xR * w)  # length 1024
+        XR = mdct(xR * w)  # length 1024
        out = np.empty((1024, 2), dtype=np.float64)
        out[:, 0] = XL
        out[:, 1] = XR
@ -430,8 +363,8 @@ def aac_i_filter_bank(frame_F: FrameF, frame_type: FrameType, win_type: WinType)
        w = _window_sequence(frame_type, win_type)
-        xL = _imdct(frame_F[:, 0]) * w
+        xL = imdct(frame_F[:, 0]) * w
-        xR = _imdct(frame_F[:, 1]) * w
+        xR = imdct(frame_F[:, 1]) * w
        out = np.empty((2048, 2), dtype=np.float64)
        out[:, 0] = xL
--- a/source/level_2/core/aac_snr_db.py
+++ b/source/level_2/core/aac_snr_db.py
@ -1,60 +0,0 @@
 # ------------------------------------------------------------
 # AAC Coder/Decoder - SNR dB calculator
 #
 # Multimedia course at Aristotle University of
 # Thessaloniki (AUTh)
 #
 # Author:
 #   Christos Choutouridis (ΑΕΜ 8997)
 #   cchoutou@ece.auth.gr
 #
 # Description:
 #   This module implements SNR calculation in dB
 # ------------------------------------------------------------
 from __future__ import annotations
 from core.aac_types import StereoSignal
 import numpy as np
 def snr_db(x_ref: StereoSignal, x_hat: StereoSignal) -> float:
    """
    Compute overall SNR (dB) over all samples and channels after aligning lengths.
    Parameters
    ----------
    x_ref : StereoSignal
        Reference stereo stream.
    x_hat : StereoSignal
        Reconstructed stereo stream.
    Returns
    -------
    float
        SNR in dB.
        - Returns +inf if noise power is zero.
        - Returns -inf if signal power is zero.
    """
    x_ref = np.asarray(x_ref, dtype=np.float64)
    x_hat = np.asarray(x_hat, dtype=np.float64)
    if x_ref.ndim == 1:
        x_ref = x_ref.reshape(-1, 1)
    if x_hat.ndim == 1:
        x_hat = x_hat.reshape(-1, 1)
    n = min(x_ref.shape[0], x_hat.shape[0])
    c = min(x_ref.shape[1], x_hat.shape[1])
    x_ref = x_ref[:n, :c]
    x_hat = x_hat[:n, :c]
    err = x_ref - x_hat
    ps = float(np.sum(x_ref * x_ref))
    pn = float(np.sum(err * err))
    if pn <= 0.0:
        return float("inf")
    if ps <= 0.0:
        return float("-inf")
    return float(10.0 * np.log10(ps / pn))
--- a/source/level_2/core/aac_ssc.py
+++ b/source/level_2/core/aac_ssc.py
@ -173,10 +173,10 @@ def _stereo_merge(ft_l: FrameType, ft_r: FrameType) -> FrameType:
 # -----------------------------------------------------------------------------
-# Public Function prototypes (Level 1)
+# Public Function prototypes
 # -----------------------------------------------------------------------------
-def aac_SSC(frame_T: FrameT, next_frame_T: FrameT, prev_frame_type: FrameType) -> FrameType:
+def aac_ssc(frame_T: FrameT, next_frame_T: FrameT, prev_frame_type: FrameType) -> FrameType:
    """
    Sequence Segmentation Control (SSC).
--- a/source/level_2/core/aac_tns.py
+++ b/source/level_2/core/aac_tns.py
@ -30,9 +30,7 @@ from __future__ import annotations
 from pathlib import Path
 from typing import Tuple
-import numpy as np
+from core.aac_utils import load_b219_tables
 from scipy.io import loadmat
 from core.aac_configuration import PRED_ORDER, QUANT_STEP, QUANT_MAX
 from core.aac_types import *
@ -40,41 +38,6 @@ from core.aac_types import *
 # Private helpers
 # -----------------------------------------------------------------------------
 _B219_CACHE: dict[str, FloatArray] | None = None
 def _load_b219_tables() -> dict[str, FloatArray]:
    """
    Load TableB219.mat and cache the contents.
    The project layout guarantees that a 'material' directory is discoverable
    from the current working directory (tests and level_123 entrypoints).
    Returns
    -------
    dict[str, FloatArray]
        Keys:
        - "B219a": long bands table (for K=1024 MDCT lines)
        - "B219b": short bands table (for K=128 MDCT lines)
    """
    global _B219_CACHE
    if _B219_CACHE is not None:
        return _B219_CACHE
    mat_path = Path("material") / "TableB219.mat"
    if not mat_path.exists():
        raise FileNotFoundError("Could not locate material/TableB219.mat in the current working directory.")
    d = loadmat(str(mat_path))
    if "B219a" not in d or "B219b" not in d:
        raise ValueError("TableB219.mat missing required variables B219a and/or B219b.")
    _B219_CACHE = {
        "B219a": np.asarray(d["B219a"], dtype=np.float64),
        "B219b": np.asarray(d["B219b"], dtype=np.float64),
    }
    return _B219_CACHE
 def _band_ranges_for_kcount(k_count: int) -> BandRanges:
    """
@ -92,7 +55,7 @@ def _band_ranges_for_kcount(k_count: int) -> BandRanges:
    BandRanges (list[tuple[int, int]])
        Each tuple is (start_k, end_k) inclusive.
    """
-    tables = _load_b219_tables()
+    tables = load_b219_tables()
    if k_count == 1024:
        tbl = tables["B219a"]
    elif k_count == 128:
@ -411,7 +374,9 @@ def _tns_one_vector(x: MdctCoeffs) -> tuple[MdctCoeffs, MdctCoeffs]:
    sw = _compute_sw(x)
    eps = 1e-12
-    xw = np.where(sw > eps, x / sw, 0.0)
+    xw = np.zeros_like(x, dtype=np.float64)
    mask = sw > eps
    np.divide(x, sw, out=xw, where=mask)
    a = _lpc_coeffs(xw, PRED_ORDER)
    a_q = _quantize_coeffs(a)
@ -425,7 +390,7 @@ def _tns_one_vector(x: MdctCoeffs) -> tuple[MdctCoeffs, MdctCoeffs]:
 # -----------------------------------------------------------------------------
-# Public Functions (Level 2)
+# Public Functions
 # -----------------------------------------------------------------------------
 def aac_tns(frame_F_in: FrameChannelF, frame_type: FrameType) -> Tuple[FrameChannelF, TnsCoeffs]:
--- a/source/level_2/core/aac_types.py
+++ b/source/level_2/core/aac_types.py
@ -193,6 +193,61 @@ Bark-band index ranges [start, end] (inclusive) for MDCT lines.
 Used by TNS to map MDCT indices k to Bark bands.
 """
 BarkTable: TypeAlias = FloatArray
 """
 Psychoacoustic Bark band table loaded from TableB219.mat.
 Typical shapes:
 - Long: (69, 6)
 - Short: (42, 6)
 """
 BandIndexArray: TypeAlias = NDArray[np.int_]
 """
 Array of FFT bin indices per psychoacoustic band.
 """
 BandValueArray: TypeAlias = FloatArray
 """
 Per-band psychoacoustic values (e.g. Bark position, thresholds).
 """
 # Quantizer-related semantic aliases
 QuantizedSymbols: TypeAlias = NDArray[np.generic]
 """
 Quantized MDCT symbols S(k).
 Shapes:
 - Always (1024, 1) at the quantizer output (ESH packed to 1024 symbols).
 """
 ScaleFactors: TypeAlias = NDArray[np.generic]
 """
 DPCM-coded scalefactors sfc(b) = alpha(b) - alpha(b-1).
 Shapes:
 - Long frames: (NB, 1)
 - ESH frames: (NB, 8)
 """
 GlobalGain: TypeAlias = float | NDArray[np.generic]
 """
 Global gain G = alpha(0).
 - Long frames: scalar float
 - ESH frames: array shape (1, 8)
 """
 # Huffman semantic aliases
 HuffmanBitstream: TypeAlias = str
 """Huffman-coded bitstream stored as a string of '0'/'1'."""
 HuffmanCodebook: TypeAlias = int
 """Huffman codebook id (e.g., 0..11)."""
 # -----------------------------------------------------------------------------
 # Level 1 AAC sequence payload types
 # -----------------------------------------------------------------------------
@ -280,3 +335,77 @@ Level 2 adds:
 and stores:
 - per-channel "frame_F" after applying TNS.
 """
 # -----------------------------------------------------------------------------
 # Level 3 AAC sequence payload types (Quantizer + Huffman)
 # -----------------------------------------------------------------------------
 class AACChannelFrameF3(TypedDict):
    """
    Per-channel payload for aac_seq_3[i]["chl"] or ["chr"] (Level 3).
    Keys
    ----
    tns_coeffs:
        Quantized TNS predictor coefficients for ONE channel.
        Shapes:
        - ESH: (PRED_ORDER, 8)
        - else: (PRED_ORDER, 1)
    T:
        Psychoacoustic thresholds per band.
        Shapes:
        - ESH: (NB, 8)
        - else: (NB, 1)
        Note: Stored for completeness / debugging; not entropy-coded.
    G:
        Quantized global gains.
        Shapes:
        - ESH: (1, 8)  (one per short subframe)
        - else: scalar (or compatible np scalar)
    sfc:
        Huffman-coded scalefactor differences (DPCM sequence).
    stream:
        Huffman-coded MDCT quantized symbols S(k) (packed to 1024 symbols).
    codebook:
        Huffman codebook id used for MDCT symbols (stream).
        (Scalefactors typically use fixed codebook 11 and do not need to store it.)
    """
    tns_coeffs: TnsCoeffs
    T: FloatArray
    G: FloatArray | float
    sfc: HuffmanBitstream
    stream: HuffmanBitstream
    codebook: HuffmanCodebook
 class AACSeq3Frame(TypedDict):
    """
    One frame dictionary element of aac_seq_3 (Level 3).
    """
    frame_type: FrameType
    win_type: WinType
    chl: AACChannelFrameF3
    chr: AACChannelFrameF3
 AACSeq3: TypeAlias = List[AACSeq3Frame]
 """
 AAC sequence for Level 3:
 List of length K (K = number of frames).
 Each element is a dict with keys:
 - "frame_type", "win_type", "chl", "chr"
 Level 3 adds (per channel):
 - "tns_coeffs"
 - "T" thresholds (not entropy-coded)
 - "G" global gain(s)
 - "sfc" Huffman-coded scalefactor differences
 - "stream" Huffman-coded MDCT quantized symbols
 - "codebook" Huffman codebook for MDCT symbols
 """
--- a/source/level_2/core/aac_utils.py
+++ b/source/level_2/core/aac_utils.py
@ -0,0 +1,270 @@
 # ------------------------------------------------------------
 # AAC Coder/Decoder - AAC Utilities
 #
 # Multimedia course at Aristotle University of
 # Thessaloniki (AUTh)
 #
 # Author:
 #   Christos Choutouridis (ΑΕΜ 8997)
 #   cchoutou@ece.auth.gr
 #
 # Description:
 #   Shared utility functions used across AAC encoder/decoder levels.
 #
 #   This module currently provides:
 #   - MDCT / IMDCT conversions
 #   - Signal-to-Noise Ratio (SNR) computation in dB
 #   - Loading and access helpers for psychoacoustic band tables
 #     (TableB219.mat, Tables B.2.1.9a / B.2.1.9b of the AAC specification)
 # ------------------------------------------------------------
 from __future__ import annotations
 import numpy as np
 from pathlib import Path
 from scipy.io import loadmat
 from core.aac_types import *
 # -----------------------------------------------------------------------------
 # Global cached data
 # -----------------------------------------------------------------------------
 # Cached contents of TableB219.mat to avoid repeated disk I/O.
 # Keys:
 #   - "B219a": long-window psychoacoustic bands (69 bands, FFT size 2048)
 #   - "B219b": short-window psychoacoustic bands (42 bands, FFT size 256)
 B219_CACHE: dict[str, BarkTable] | None = None
 # -----------------------------------------------------------------------------
 # MDCT / IMDCT
 # -----------------------------------------------------------------------------
 def mdct(s: TimeSignal) -> MdctCoeffs:
    """
    MDCT (direct form) as specified in the assignment.
    Parameters
    ----------
    s : TimeSignal
        Windowed time samples, 1-D array of length N (N = 2048 or 256).
    Returns
    -------
    MdctCoeffs
        MDCT coefficients, 1-D array of length N/2.
    Definition
    ----------
    X[k] = 2 * sum_{n=0..N-1} s[n] * cos((2*pi/N) * (n + n0) * (k + 1/2)),
    where n0 = (N/2 + 1)/2.
    """
    s = np.asarray(s, dtype=np.float64).reshape(-1)
    N = int(s.shape[0])
    if N not in (2048, 256):
        raise ValueError("MDCT input length must be 2048 or 256.")
    n0 = (N / 2.0 + 1.0) / 2.0
    n = np.arange(N, dtype=np.float64) + n0
    k = np.arange(N // 2, dtype=np.float64) + 0.5
    C = np.cos((2.0 * np.pi / N) * np.outer(n, k))  # (N, N/2)
    X = 2.0 * (s @ C)  # (N/2,)
    return X
 def imdct(X: MdctCoeffs) -> TimeSignal:
    """
    IMDCT (direct form) as specified in the assignment.
    Parameters
    ----------
    X : MdctCoeffs
        MDCT coefficients, 1-D array of length K (K = 1024 or 128).
    Returns
    -------
    TimeSignal
        Reconstructed time samples, 1-D array of length N = 2K.
    Definition
    ----------
    s[n] = (2/N) * sum_{k=0..N/2-1} X[k] * cos((2*pi/N) * (n + n0) * (k + 1/2)),
    where n0 = (N/2 + 1)/2.
    """
    X = np.asarray(X, dtype=np.float64).reshape(-1)
    K = int(X.shape[0])
    if K not in (1024, 128):
        raise ValueError("IMDCT input length must be 1024 or 128.")
    N = 2 * K
    n0 = (N / 2.0 + 1.0) / 2.0
    n = np.arange(N, dtype=np.float64) + n0
    k = np.arange(K, dtype=np.float64) + 0.5
    C = np.cos((2.0 * np.pi / N) * np.outer(n, k))  # (N, K)
    s = (2.0 / N) * (C @ X)  # (N,)
    return s
 # -----------------------------------------------------------------------------
 # Signal quality metrics
 # -----------------------------------------------------------------------------
 def snr_db(x_ref: StereoSignal, x_hat: StereoSignal) -> float:
    """
    Compute the overall Signal-to-Noise Ratio (SNR) in dB.
    The SNR is computed over all available samples and channels,
    after conservatively aligning the two signals to their common
    length and channel count.
    Parameters
    ----------
    x_ref : StereoSignal
        Reference (original) signal.
        Typical shape: (N, 2) for stereo.
    x_hat : StereoSignal
        Reconstructed or processed signal.
        Typical shape: (M, 2) for stereo.
    Returns
    -------
    float
        SNR in dB.
        - +inf if the noise power is zero (perfect reconstruction).
        - -inf if the reference signal power is zero.
    """
    x_ref = np.asarray(x_ref, dtype=np.float64)
    x_hat = np.asarray(x_hat, dtype=np.float64)
    # Ensure 2-D shape: (samples, channels)
    if x_ref.ndim == 1:
        x_ref = x_ref.reshape(-1, 1)
    if x_hat.ndim == 1:
        x_hat = x_hat.reshape(-1, 1)
    # Align lengths and channel count conservatively
    n = min(x_ref.shape[0], x_hat.shape[0])
    c = min(x_ref.shape[1], x_hat.shape[1])
    x_ref = x_ref[:n, :c]
    x_hat = x_hat[:n, :c]
    err = x_ref - x_hat
    ps = float(np.sum(x_ref * x_ref))     # signal power
    pn = float(np.sum(err * err))          # noise power
    if pn <= 0.0:
        return float("inf")
    if ps <= 0.0:
        return float("-inf")
    return float(10.0 * np.log10(ps / pn))
 # -----------------------------------------------------------------------------
 # Psychoacoustic band tables (TableB219.mat)
 # -----------------------------------------------------------------------------
 def load_b219_tables() -> dict[str, BarkTable]:
    """
    Load and cache psychoacoustic band tables from TableB219.mat.
    The assignment/project layout assumes that a 'material' directory
    is available in the current working directory when running:
    - tests
    - level_1 / level_2 / level_3 entrypoints
    This function loads the tables once and caches them for subsequent calls.
    Returns
    -------
    dict[str, BarkTable]
        Dictionary with the following entries:
        - "B219a": long-window psychoacoustic table
                   (69 bands, FFT size 2048 / 1024 spectral lines)
        - "B219b": short-window psychoacoustic table
                   (42 bands, FFT size 256 / 128 spectral lines)
    """
    global B219_CACHE
    if B219_CACHE is not None:
        return B219_CACHE
    mat_path = Path("material") / "TableB219.mat"
    if not mat_path.exists():
        raise FileNotFoundError(
            "Could not locate material/TableB219.mat in the current working directory."
        )
    data = loadmat(str(mat_path))
    if "B219a" not in data or "B219b" not in data:
        raise ValueError(
            "TableB219.mat missing required variables 'B219a' and/or 'B219b'."
        )
    B219_CACHE = {
        "B219a": np.asarray(data["B219a"], dtype=np.float64),
        "B219b": np.asarray(data["B219b"], dtype=np.float64),
    }
    return B219_CACHE
 def get_table(frame_type: FrameType) -> tuple[BarkTable, int]:
    """
    Select the appropriate psychoacoustic band table and FFT size
    based on the AAC frame type.
    Parameters
    ----------
    frame_type : FrameType
        AAC frame type ("OLS", "LSS", "ESH", "LPS").
    Returns
    -------
    table : BarkTable
        Psychoacoustic band table:
        - B219a for long frames
        - B219b for ESH short subframes
    N : int
        FFT size corresponding to the table:
        - 2048 for long frames
        - 256 for short frames (ESH)
    """
    tables = load_b219_tables()
    if frame_type == "ESH":
        return tables["B219b"], 256
    return tables["B219a"], 2048
 def band_limits(
    table: BarkTable,
 ) -> tuple[BandIndexArray, BandIndexArray, BandValueArray, BandValueArray]:
    """
    Extract per-band metadata from a TableB2.1.9 psychoacoustic table.
    The column layout follows the provided TableB219.mat file and the
    AAC specification tables B.2.1.9a / B.2.1.9b.
    Parameters
    ----------
    table : BarkTable
        Psychoacoustic band table (B219a or B219b).
    Returns
    -------
    wlow : BandIndexArray
        Lower FFT bin index (inclusive) for each band.
    whigh : BandIndexArray
        Upper FFT bin index (inclusive) for each band.
    bval : BandValueArray
        Bark-scale (or equivalent) band position values.
        Used in the spreading function.
    qthr_db : BandValueArray
        Threshold in quiet for each band, in dB.
    """
    wlow = table[:, 1].astype(int)
    whigh = table[:, 2].astype(int)
    bval = table[:, 4].astype(np.float64)
    qthr_db = table[:, 5].astype(np.float64)
    return wlow, whigh, bval, qthr_db
--- a/source/level_2/level_2.py
+++ b/source/level_2/level_2.py
@ -28,7 +28,7 @@ from core.aac_types   import AACSeq2, StereoSignal
 from core.aac_coder   import aac_coder_2 as core_aac_coder_2
 from core.aac_coder   import aac_read_wav_stereo_48k
 from core.aac_decoder import aac_decoder_2 as core_aac_decoder_2
-from core.aac_snr_db  import snr_db
+from core.aac_utils  import snr_db
 # -----------------------------------------------------------------------------
 # Public Level 2 API (wrappers)
--- a/source/level_2/material/huffCodebooks.mat
+++ b/source/level_2/material/huffCodebooks.mat
--- a/source/level_2/material/huff_utils.py
+++ b/source/level_2/material/huff_utils.py
@ -1,400 +0,0 @@
 import numpy as np
 import scipy.io as sio
 import os
 # ------------------ LOAD LUT ------------------
 def load_LUT(mat_filename=None):
    """
    Loads the list of Huffman Codebooks (LUTs)
    Returns:
        huffLUT : list (index 1..11 used, index 0 unused)
    """
    if mat_filename is None:
        current_dir = os.path.dirname(os.path.abspath(__file__))
        mat_filename = os.path.join(current_dir, "huffCodebooks.mat")
    mat = sio.loadmat(mat_filename)
    huffCodebooks_raw = mat['huffCodebooks'].squeeze()
    huffCodebooks = []
    for i in range(11):
        huffCodebooks.append(np.array(huffCodebooks_raw[i]))
    # Build inverse VLC tables
    invTable = [None] * 11
    for i in range(11):
        h = huffCodebooks[i][:, 2].astype(int)       # column 3
        hlength = huffCodebooks[i][:, 1].astype(int) # column 2
        hbin = []
        for j in range(len(h)):
            hbin.append(format(h[j], f'0{hlength[j]}b'))
        invTable[i] = vlc_table(hbin)
    # Build Huffman LUT dicts
    huffLUT = [None] * 12  # index 0 unused
    params = [
        (4, 1, True),
        (4, 1, True),
        (4, 2, False),
        (4, 2, False),
        (2, 4, True),
        (2, 4, True),
        (2, 7, False),
        (2, 7, False),
        (2, 12, False),
        (2, 12, False),
        (2, 16, False),
    ]
    for i, (nTupleSize, maxAbs, signed) in enumerate(params, start=1):
        huffLUT[i] = {
            'LUT': huffCodebooks[i-1],
            'invTable': invTable[i-1],
            'codebook': i,
            'nTupleSize': nTupleSize,
            'maxAbsCodeVal': maxAbs,
            'signedValues': signed
        }
    return huffLUT
 def vlc_table(code_array):
    """
    codeArray: list of strings, each string is a Huffman codeword (e.g. '0101')
    returns:
        h : NumPy array of shape (num_nodes, 3)
            columns:
              [ next_if_0 , next_if_1 , symbol_index ]
    """
    h = np.zeros((1, 3), dtype=int)
    for code_index, code in enumerate(code_array, start=1):
        word = [int(bit) for bit in code]
        h_index = 0
        for bit in word:
            k = bit
            next_node = h[h_index, k]
            if next_node == 0:
                h = np.vstack([h, [0, 0, 0]])
                new_index = h.shape[0] - 1
                h[h_index, k] = new_index
                h_index = new_index
            else:
                h_index = next_node
        h[h_index, 2] = code_index
    return h
 # ------------------ ENCODE ------------------
 def encode_huff(coeff_sec, huff_LUT_list, force_codebook = None):
    """
    Huffman-encode a sequence of quantized coefficients.
    This function selects the appropriate Huffman codebook based on the
    maximum absolute value of the input coefficients, encodes the coefficients
    into a binary Huffman bitstream, and returns both the bitstream and the
    selected codebook index.
    This is the Python equivalent of the MATLAB `encodeHuff.m` function used
    in audio/image coding (e.g., scale factor band encoding). The input
    coefficient sequence is grouped into fixed-size tuples as defined by
    the chosen Huffman LUT. Zero-padding may be applied internally.
    Parameters
    ----------
    coeff_sec : array_like of int
        1-D array of quantized integer coefficients to encode.
        Typically corresponds to a "section" or scale-factor band.
    huff_LUT_list : list
        List of Huffman lookup-table dictionaries as returned by `loadLUT()`.
        Index 1..11 correspond to valid Huffman codebooks.
        Index 0 is unused.
    Returns
    -------
    huffSec : str
        Huffman-encoded bitstream represented as a string of '0' and '1'
        characters.
    huffCodebook : int
        Index (1..11) of the Huffman codebook used for encoding.
        A value of 0 indicates a special all-zero section.
    """
    if force_codebook is not None:
            return huff_LUT_code_1(huff_LUT_list[force_codebook], coeff_sec)
    maxAbsVal = np.max(np.abs(coeff_sec))
    if maxAbsVal == 0:
        huffCodebook = 0
        huffSec = huff_LUT_code_0()
    elif maxAbsVal == 1:
        candidates = [1, 2]
        huffSec1 = huff_LUT_code_1(huff_LUT_list[candidates[0]], coeff_sec)
        huffSec2 = huff_LUT_code_1(huff_LUT_list[candidates[1]], coeff_sec)
        if len(huffSec1) <= len(huffSec2):
            huffSec = huffSec1
            huffCodebook = candidates[0]
        else:
            huffSec = huffSec2
            huffCodebook = candidates[1]
    elif maxAbsVal == 2:
        candidates = [3, 4]
        huffSec1 = huff_LUT_code_1(huff_LUT_list[candidates[0]], coeff_sec)
        huffSec2 = huff_LUT_code_1(huff_LUT_list[candidates[1]], coeff_sec)
        if len(huffSec1) <= len(huffSec2):
            huffSec = huffSec1
            huffCodebook = candidates[0]
        else:
            huffSec = huffSec2
            huffCodebook = candidates[1]
    elif maxAbsVal in (3, 4):
        candidates = [5, 6]
        huffSec1 = huff_LUT_code_1(huff_LUT_list[candidates[0]], coeff_sec)
        huffSec2 = huff_LUT_code_1(huff_LUT_list[candidates[1]], coeff_sec)
        if len(huffSec1) <= len(huffSec2):
            huffSec = huffSec1
            huffCodebook = candidates[0]
        else:
            huffSec = huffSec2
            huffCodebook = candidates[1]
    elif maxAbsVal in (5, 6, 7):
        candidates = [7, 8]
        huffSec1 = huff_LUT_code_1(huff_LUT_list[candidates[0]], coeff_sec)
        huffSec2 = huff_LUT_code_1(huff_LUT_list[candidates[1]], coeff_sec)
        if len(huffSec1) <= len(huffSec2):
            huffSec = huffSec1
            huffCodebook = candidates[0]
        else:
            huffSec = huffSec2
            huffCodebook = candidates[1]
    elif maxAbsVal in (8, 9, 10, 11, 12):
        candidates = [9, 10]
        huffSec1 = huff_LUT_code_1(huff_LUT_list[candidates[0]], coeff_sec)
        huffSec2 = huff_LUT_code_1(huff_LUT_list[candidates[1]], coeff_sec)
        if len(huffSec1) <= len(huffSec2):
            huffSec = huffSec1
            huffCodebook = candidates[0]
        else:
            huffSec = huffSec2
            huffCodebook = candidates[1]
    elif maxAbsVal in (13, 14, 15):
        huffCodebook = 11
        huffSec = huff_LUT_code_1(huff_LUT_list[huffCodebook], coeff_sec)
    else:
        huffCodebook = 11
        huffSec = huff_LUT_code_ESC(huff_LUT_list[huffCodebook], coeff_sec)
    return huffSec, huffCodebook
 def huff_LUT_code_1(huff_LUT, coeff_sec):
    LUT = huff_LUT['LUT']
    nTupleSize = huff_LUT['nTupleSize']
    maxAbsCodeVal = huff_LUT['maxAbsCodeVal']
    signedValues = huff_LUT['signedValues']
    numTuples = int(np.ceil(len(coeff_sec) / nTupleSize))
    if signedValues:
        coeff = coeff_sec + maxAbsCodeVal
        base = 2 * maxAbsCodeVal + 1
    else:
        coeff = coeff_sec
        base = maxAbsCodeVal + 1
    coeffPad = np.zeros(numTuples * nTupleSize, dtype=int)
    coeffPad[:len(coeff)] = coeff
    huffSec = []
    powers = base ** np.arange(nTupleSize - 1, -1, -1)
    for i in range(numTuples):
        nTuple = coeffPad[i*nTupleSize:(i+1)*nTupleSize]
        huffIndex = int(np.abs(nTuple) @ powers)
        hexVal = LUT[huffIndex, 2]
        huffLen = LUT[huffIndex, 1]
        bits = format(int(hexVal), f'0{int(huffLen)}b')
        if signedValues:
            huffSec.append(bits)
        else:
            signBits = ''.join('1' if v < 0 else '0' for v in nTuple)
            huffSec.append(bits + signBits)
    return ''.join(huffSec)
 def huff_LUT_code_0():
    return ''
 def huff_LUT_code_ESC(huff_LUT, coeff_sec):
    LUT = huff_LUT['LUT']
    nTupleSize = huff_LUT['nTupleSize']
    maxAbsCodeVal = huff_LUT['maxAbsCodeVal']
    numTuples = int(np.ceil(len(coeff_sec) / nTupleSize))
    base = maxAbsCodeVal + 1
    coeffPad = np.zeros(numTuples * nTupleSize, dtype=int)
    coeffPad[:len(coeff_sec)] = coeff_sec
    huffSec = []
    powers = base ** np.arange(nTupleSize - 1, -1, -1)
    for i in range(numTuples):
        nTuple = coeffPad[i*nTupleSize:(i+1)*nTupleSize]
        lnTuple = nTuple.astype(float)
        lnTuple[lnTuple == 0] = np.finfo(float).eps
        N4 = np.maximum(0, np.floor(np.log2(np.abs(lnTuple))).astype(int))
        N = np.maximum(0, N4 - 4)
        esc = np.abs(nTuple) > 15
        nTupleESC = nTuple.copy()
        nTupleESC[esc] = np.sign(nTupleESC[esc]) * 16
        huffIndex = int(np.abs(nTupleESC) @ powers)
        hexVal = LUT[huffIndex, 2]
        huffLen = LUT[huffIndex, 1]
        bits = format(int(hexVal), f'0{int(huffLen)}b')
        escSeq = ''
        for k in range(nTupleSize):
            if esc[k]:
                escSeq += '1' * N[k]
                escSeq += '0'
                escSeq += format(abs(nTuple[k]) - (1 << N4[k]), f'0{N4[k]}b')
        signBits = ''.join('1' if v < 0 else '0' for v in nTuple)
        huffSec.append(bits + signBits + escSeq)
    return ''.join(huffSec)
 # ------------------ DECODE ------------------
 def decode_huff(huff_sec, huff_LUT):
    """
    Decode a Huffman-encoded stream.
    Parameters
    ----------
    huff_sec : array-like of int or str
        Huffman encoded stream as a sequence of 0 and 1 (string or list/array).
    huff_LUT : dict
        Huffman lookup table with keys:
            - 'invTable': inverse table (numpy array)
            - 'codebook': codebook number
            - 'nTupleSize': tuple size
            - 'maxAbsCodeVal': maximum absolute code value
            - 'signedValues': True/False
    Returns
    -------
    decCoeffs : list of int
        Decoded quantized coefficients.
    """
    h = huff_LUT['invTable']
    huffCodebook = huff_LUT['codebook']
    nTupleSize = huff_LUT['nTupleSize']
    maxAbsCodeVal = huff_LUT['maxAbsCodeVal']
    signedValues = huff_LUT['signedValues']
    # Convert string to array of ints
    if isinstance(huff_sec, str):
        huff_sec = np.array([int(b) for b in huff_sec])
    eos = False
    decCoeffs = []
    streamIndex = 0
    while not eos:
        wordbit = 0
        r = 0  # start at root
        # Decode Huffman word using inverse table
        while True:
            b = huff_sec[streamIndex + wordbit]
            wordbit += 1
            rOld = r
            r = h[rOld, b]
            if h[r, 0] == 0 and h[r, 1] == 0:
                symbolIndex = h[r, 2] - 1  # zero-based
                streamIndex += wordbit
                break
        # Decode n-tuple magnitudes
        if signedValues:
            base = 2 * maxAbsCodeVal + 1
            nTupleDec = []
            tmp = symbolIndex
            for p in reversed(range(nTupleSize)):
                val = tmp // (base ** p)
                nTupleDec.append(val - maxAbsCodeVal)
                tmp = tmp % (base ** p)
            nTupleDec = np.array(nTupleDec)
        else:
            base = maxAbsCodeVal + 1
            nTupleDec = []
            tmp = symbolIndex
            for p in reversed(range(nTupleSize)):
                val = tmp // (base ** p)
                nTupleDec.append(val)
                tmp = tmp % (base ** p)
            nTupleDec = np.array(nTupleDec)
            # Apply sign bits
            nTupleSignBits = huff_sec[streamIndex:streamIndex + nTupleSize]
            nTupleSign = -(np.sign(nTupleSignBits - 0.5))
            streamIndex += nTupleSize
            nTupleDec = nTupleDec * nTupleSign
        # Handle escape sequences
        escIndex = np.where(np.abs(nTupleDec) == 16)[0]
        if huffCodebook == 11 and escIndex.size > 0:
            for idx in escIndex:
                N = 0
                b = huff_sec[streamIndex]
                while b:
                    N += 1
                    b = huff_sec[streamIndex + N]
                streamIndex += N
                N4 = N + 4
                escape_word = huff_sec[streamIndex:streamIndex + N4]
                escape_value = 2 ** N4 + int("".join(map(str, escape_word)), 2)
                nTupleDec[idx] = escape_value
                streamIndex += N4 + 1
            # Apply signs again
            nTupleDec[escIndex] *= nTupleSign[escIndex]
        decCoeffs.extend(nTupleDec.tolist())
        if streamIndex >= len(huff_sec):
            eos = True
    return decCoeffs
--- a/source/pytest.ini
+++ b/source/pytest.ini
@ -2,3 +2,6 @@
 pythonpath = .
 testpaths =
    core/tests
 filterwarnings =
    error::RuntimeWarning
Author	SHA1	Message	Date
Christos Choutouridis	4ebee28e4e	Level 3: A first failed attempt of encoding-decoding -> SNR=0	2026-02-09 01:58:21 +02:00
Christos Choutouridis	ae4ad82136	Level 2: Psychoacoustic first version	2026-02-08 22:53:52 +02:00