shithub: psxe

ref: 752d81359f71404b3cb410995ecbe43b0a11efa8
dir: /psx/dev/spu.c/

View raw version
#include <stdint.h>
#include <stdlib.h>
#include <string.h>

#include "spu.h"
#include "../log.h"

#define CLAMP(v, l, h) ((v <= l) ? l : ((v >= h) ? h : v))
#define MAX(a, b) (a > b ? a : b)

static const int g_spu_pos_adpcm_table[] = {
    0, +60, +115, +98, +122
};

static const int g_spu_neg_adpcm_table[] = {
    0,   0,  -52, -55,  -60
};

static const int16_t g_spu_gauss_table[] = {
    -0x001, -0x001, -0x001, -0x001, -0x001, -0x001, -0x001, -0x001,
    -0x001, -0x001, -0x001, -0x001, -0x001, -0x001, -0x001, -0x001,
    0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0000, 0x0001,
    0x0001, 0x0001, 0x0001, 0x0002, 0x0002, 0x0002, 0x0003, 0x0003,
    0x0003, 0x0004, 0x0004, 0x0005, 0x0005, 0x0006, 0x0007, 0x0007,
    0x0008, 0x0009, 0x0009, 0x000A, 0x000B, 0x000C, 0x000D, 0x000E,
    0x000F, 0x0010, 0x0011, 0x0012, 0x0013, 0x0015, 0x0016, 0x0018,
    0x0019, 0x001B, 0x001C, 0x001E, 0x0020, 0x0021, 0x0023, 0x0025,
    0x0027, 0x0029, 0x002C, 0x002E, 0x0030, 0x0033, 0x0035, 0x0038,
    0x003A, 0x003D, 0x0040, 0x0043, 0x0046, 0x0049, 0x004D, 0x0050,
    0x0054, 0x0057, 0x005B, 0x005F, 0x0063, 0x0067, 0x006B, 0x006F,
    0x0074, 0x0078, 0x007D, 0x0082, 0x0087, 0x008C, 0x0091, 0x0096,
    0x009C, 0x00A1, 0x00A7, 0x00AD, 0x00B3, 0x00BA, 0x00C0, 0x00C7,
    0x00CD, 0x00D4, 0x00DB, 0x00E3, 0x00EA, 0x00F2, 0x00FA, 0x0101,
    0x010A, 0x0112, 0x011B, 0x0123, 0x012C, 0x0135, 0x013F, 0x0148,
    0x0152, 0x015C, 0x0166, 0x0171, 0x017B, 0x0186, 0x0191, 0x019C,
    0x01A8, 0x01B4, 0x01C0, 0x01CC, 0x01D9, 0x01E5, 0x01F2, 0x0200,
    0x020D, 0x021B, 0x0229, 0x0237, 0x0246, 0x0255, 0x0264, 0x0273,
    0x0283, 0x0293, 0x02A3, 0x02B4, 0x02C4, 0x02D6, 0x02E7, 0x02F9,
    0x030B, 0x031D, 0x0330, 0x0343, 0x0356, 0x036A, 0x037E, 0x0392,
    0x03A7, 0x03BC, 0x03D1, 0x03E7, 0x03FC, 0x0413, 0x042A, 0x0441,
    0x0458, 0x0470, 0x0488, 0x04A0, 0x04B9, 0x04D2, 0x04EC, 0x0506,
    0x0520, 0x053B, 0x0556, 0x0572, 0x058E, 0x05AA, 0x05C7, 0x05E4,
    0x0601, 0x061F, 0x063E, 0x065C, 0x067C, 0x069B, 0x06BB, 0x06DC,
    0x06FD, 0x071E, 0x0740, 0x0762, 0x0784, 0x07A7, 0x07CB, 0x07EF,
    0x0813, 0x0838, 0x085D, 0x0883, 0x08A9, 0x08D0, 0x08F7, 0x091E,
    0x0946, 0x096F, 0x0998, 0x09C1, 0x09EB, 0x0A16, 0x0A40, 0x0A6C,
    0x0A98, 0x0AC4, 0x0AF1, 0x0B1E, 0x0B4C, 0x0B7A, 0x0BA9, 0x0BD8,
    0x0C07, 0x0C38, 0x0C68, 0x0C99, 0x0CCB, 0x0CFD, 0x0D30, 0x0D63,
    0x0D97, 0x0DCB, 0x0E00, 0x0E35, 0x0E6B, 0x0EA1, 0x0ED7, 0x0F0F,
    0x0F46, 0x0F7F, 0x0FB7, 0x0FF1, 0x102A, 0x1065, 0x109F, 0x10DB,
    0x1116, 0x1153, 0x118F, 0x11CD, 0x120B, 0x1249, 0x1288, 0x12C7,
    0x1307, 0x1347, 0x1388, 0x13C9, 0x140B, 0x144D, 0x1490, 0x14D4,
    0x1517, 0x155C, 0x15A0, 0x15E6, 0x162C, 0x1672, 0x16B9, 0x1700,
    0x1747, 0x1790, 0x17D8, 0x1821, 0x186B, 0x18B5, 0x1900, 0x194B,
    0x1996, 0x19E2, 0x1A2E, 0x1A7B, 0x1AC8, 0x1B16, 0x1B64, 0x1BB3,
    0x1C02, 0x1C51, 0x1CA1, 0x1CF1, 0x1D42, 0x1D93, 0x1DE5, 0x1E37,
    0x1E89, 0x1EDC, 0x1F2F, 0x1F82, 0x1FD6, 0x202A, 0x207F, 0x20D4,
    0x2129, 0x217F, 0x21D5, 0x222C, 0x2282, 0x22DA, 0x2331, 0x2389,
    0x23E1, 0x2439, 0x2492, 0x24EB, 0x2545, 0x259E, 0x25F8, 0x2653,
    0x26AD, 0x2708, 0x2763, 0x27BE, 0x281A, 0x2876, 0x28D2, 0x292E,
    0x298B, 0x29E7, 0x2A44, 0x2AA1, 0x2AFF, 0x2B5C, 0x2BBA, 0x2C18,
    0x2C76, 0x2CD4, 0x2D33, 0x2D91, 0x2DF0, 0x2E4F, 0x2EAE, 0x2F0D,
    0x2F6C, 0x2FCC, 0x302B, 0x308B, 0x30EA, 0x314A, 0x31AA, 0x3209,
    0x3269, 0x32C9, 0x3329, 0x3389, 0x33E9, 0x3449, 0x34A9, 0x3509,
    0x3569, 0x35C9, 0x3629, 0x3689, 0x36E8, 0x3748, 0x37A8, 0x3807,
    0x3867, 0x38C6, 0x3926, 0x3985, 0x39E4, 0x3A43, 0x3AA2, 0x3B00,
    0x3B5F, 0x3BBD, 0x3C1B, 0x3C79, 0x3CD7, 0x3D35, 0x3D92, 0x3DEF,
    0x3E4C, 0x3EA9, 0x3F05, 0x3F62, 0x3FBD, 0x4019, 0x4074, 0x40D0,
    0x412A, 0x4185, 0x41DF, 0x4239, 0x4292, 0x42EB, 0x4344, 0x439C,
    0x43F4, 0x444C, 0x44A3, 0x44FA, 0x4550, 0x45A6, 0x45FC, 0x4651,
    0x46A6, 0x46FA, 0x474E, 0x47A1, 0x47F4, 0x4846, 0x4898, 0x48E9,
    0x493A, 0x498A, 0x49D9, 0x4A29, 0x4A77, 0x4AC5, 0x4B13, 0x4B5F,
    0x4BAC, 0x4BF7, 0x4C42, 0x4C8D, 0x4CD7, 0x4D20, 0x4D68, 0x4DB0,
    0x4DF7, 0x4E3E, 0x4E84, 0x4EC9, 0x4F0E, 0x4F52, 0x4F95, 0x4FD7,
    0x5019, 0x505A, 0x509A, 0x50DA, 0x5118, 0x5156, 0x5194, 0x51D0,
    0x520C, 0x5247, 0x5281, 0x52BA, 0x52F3, 0x532A, 0x5361, 0x5397,
    0x53CC, 0x5401, 0x5434, 0x5467, 0x5499, 0x54CA, 0x54FA, 0x5529,
    0x5558, 0x5585, 0x55B2, 0x55DE, 0x5609, 0x5632, 0x565B, 0x5684,
    0x56AB, 0x56D1, 0x56F6, 0x571B, 0x573E, 0x5761, 0x5782, 0x57A3,
    0x57C3, 0x57E2, 0x57FF, 0x581C, 0x5838, 0x5853, 0x586D, 0x5886,
    0x589E, 0x58B5, 0x58CB, 0x58E0, 0x58F4, 0x5907, 0x5919, 0x592A,
    0x593A, 0x5949, 0x5958, 0x5965, 0x5971, 0x597C, 0x5986, 0x598F,
    0x5997, 0x599E, 0x59A4, 0x59A9, 0x59AD, 0x59B0, 0x59B2, 0x59B3
};

psx_spu_t* psx_spu_create() {
    return (psx_spu_t*)malloc(sizeof(psx_spu_t));
}

void psx_spu_init(psx_spu_t* spu) {
    memset(spu, 0, sizeof(psx_spu_t));

    spu->io_base = PSX_SPU_BEGIN;
    spu->io_size = PSX_SPU_SIZE;

    spu->ram = (uint8_t*)malloc(SPU_RAM_SIZE);

    memset(spu->ram, 0, SPU_RAM_SIZE);

    // Mute all voices
    spu->endx = 0x00ffffff;
}

uint32_t psx_spu_read32(psx_spu_t* spu, uint32_t offset) {
    const uint8_t* ptr = (uint8_t*)&spu->voice[0].volumel;

    return *((uint32_t*)(ptr + offset));
}

uint16_t psx_spu_read16(psx_spu_t* spu, uint32_t offset) {
    const uint8_t* ptr = (uint8_t*)&spu->voice[0].volumel;

    return *((uint16_t*)(ptr + offset));
}

uint8_t psx_spu_read8(psx_spu_t* spu, uint32_t offset) {
    log_fatal("Unhandled 8-bit SPU read at offset %08x", offset);

    return 0x0;
}

void spu_read_block(psx_spu_t* spu, int v) {
    uint32_t addr = spu->data[v].current_addr;
    uint8_t hdr = spu->ram[addr];

    spu->data[v].block_flags = spu->ram[addr + 1];

    unsigned shift  = 12 - (hdr & 0x0f);
    unsigned filter = (hdr >> 4) & 7;

    int32_t f0 = g_spu_pos_adpcm_table[filter];
    int32_t f1 = g_spu_neg_adpcm_table[filter];

    for (int j = 0; j < 28; j++) {
        uint16_t n = (spu->ram[addr + 2 + (j >> 1)] >> ((j & 1) * 4)) & 0xf;

        // Sign extend t
        int16_t t = (int16_t)(n << 12) >> 12; 
        int16_t s = (t << shift) + (((spu->data[v].h[0] * f0) + (spu->data[v].h[1] * f1) + 32) / 64);
        
        s = (s < INT16_MIN) ? INT16_MIN : ((s > INT16_MAX) ? INT16_MAX : s);

        spu->data[v].h[1] = spu->data[v].h[0];
        spu->data[v].h[0] = s;
        spu->data[v].buf[j] = s;
    }
}

#define PHASE spu->data[v].adsr_phase
#define CYCLES spu->data[v].adsr_cycles
#define EXPONENTIAL spu->data[v].adsr_mode
#define DECREASE spu->data[v].adsr_dir
#define SHIFT spu->data[v].adsr_shift
#define STEP spu->data[v].adsr_step
#define LEVEL_STEP spu->data[v].adsr_pending_step
#define LEVEL spu->voice[v].envcvol

/*
  ____lower 16bit (at 1F801C08h+N*10h)___________________________________
  15    Attack Mode       (0=Linear, 1=Exponential)
  -     Attack Direction  (Fixed, always Increase) (until Level 7FFFh)
  14-10 Attack Shift      (0..1Fh = Fast..Slow)
  9-8   Attack Step       (0..3 = "+7,+6,+5,+4")
  -     Decay Mode        (Fixed, always Exponential)
  -     Decay Direction   (Fixed, always Decrease) (until Sustain Level)
  7-4   Decay Shift       (0..0Fh = Fast..Slow)
  -     Decay Step        (Fixed, always "-8")
  3-0   Sustain Level     (0..0Fh)  ;Level=(N+1)*800h
  ____upper 16bit (at 1F801C0Ah+N*10h)___________________________________
  31    Sustain Mode      (0=Linear, 1=Exponential)
  30    Sustain Direction (0=Increase, 1=Decrease) (until Key OFF flag)
  29    Not used?         (should be zero)
  28-24 Sustain Shift     (0..1Fh = Fast..Slow)
  23-22 Sustain Step      (0..3 = "+7,+6,+5,+4" or "-8,-7,-6,-5") (inc/dec)
  21    Release Mode      (0=Linear, 1=Exponential)
  -     Release Direction (Fixed, always Decrease) (until Level 0000h)
  20-16 Release Shift     (0..1Fh = Fast..Slow)
  -     Release Step      (Fixed, always "-8")
*/

void spu_advance_adsr(psx_spu_t* spu, int v) {
    switch (spu->data[v].adsr_phase) {
        // KON->Attack
        case 0: {
            EXPONENTIAL = spu->voice[v].envctl1 >> 15;
            DECREASE    = 0;
            SHIFT       = (spu->voice[v].envctl1 >> 10) & 0x1f;
            STEP        = 7 - ((spu->voice[v].envctl1 >> 8) & 3);
            LEVEL       = 0;
        } break;

        // Attack->Decay
        case 1: {
            EXPONENTIAL = 1;
            DECREASE    = 1;
            SHIFT       = (spu->voice[v].envctl1 >> 4) & 0xf;
            STEP        = -8;
            LEVEL       = 0x7fff;
        } break;

        // Decay->Sustain
        case 2: {
            EXPONENTIAL = spu->voice[v].envctl2 >> 15;
            DECREASE    = (spu->voice[v].envctl2 >> 14) & 1;
            SHIFT       = (spu->voice[v].envctl2 >> 8) & 0x1f;
            STEP        = (spu->voice[v].envctl2 >> 6) & 3;
            LEVEL       = spu->data[v].adsr_sustain_level;

            STEP = DECREASE ? (-8 + STEP) : (7 - STEP);
        } break;

        // Sustain->Release
        case 3: {
            EXPONENTIAL = (spu->voice[v].envctl2 >> 5) & 1;
            DECREASE    = 1;
            SHIFT       = spu->voice[v].envctl2 & 0x1f;
            STEP        = -8;
            //LEVEL       = spu->data[v].adsr_sustain_level;
        } break;
    }

    CYCLES = 1 << MAX(0, SHIFT - 11);
    LEVEL_STEP = STEP << MAX(0, 11 - SHIFT);

    if (EXPONENTIAL && (LEVEL > 0x6000) && !DECREASE)
        CYCLES *= 4;
    
    if (EXPONENTIAL && DECREASE)
        LEVEL_STEP *= LEVEL / 0x8000;
    
    spu->data[v].adsr_cycles_reload = CYCLES;
    
    log_fatal("voice %u ADSR advance %u c=%u, s=%04x, step=%04x, level=%04x",
        v, spu->data[v].adsr_phase, CYCLES, LEVEL_STEP, STEP, LEVEL
    );
}

void spu_handle_adsr(psx_spu_t* spu, int v) {
    CYCLES = spu->data[v].adsr_cycles_reload;

    LEVEL += LEVEL_STEP;

    switch (spu->data[v].adsr_phase) {
        case 0: {
            LEVEL = CLAMP(LEVEL, 0x0000, 0x7fff);

            if (LEVEL == 0x7fff) {
                spu->data[v].adsr_phase = 1;

                spu_advance_adsr(spu, v);
            }
        } break;

        case 1: {
            LEVEL = CLAMP(LEVEL, 0x0000, 0x7fff);

            if (LEVEL >= spu->data[v].adsr_sustain_level) {
                spu->data[v].adsr_phase = 2;

                spu_advance_adsr(spu, v);
            }
        } break;

        case 3: {
            LEVEL = CLAMP(LEVEL, 0x0000, 0x7fff);

            if (!LEVEL) {
                spu->data[v].adsr_phase = 0;
                spu->data[v].playing = 0;
            }
        } break;
    }
}

#undef PHASE
#undef CYCLES
#undef MODE
#undef DIR
#undef SHIFT
#undef STEP
#undef PENDING_STEP

int spu_handle_write(psx_spu_t* spu, uint32_t offset, uint32_t value) {
    switch (offset) {
        case SPUR_KON: {
            if (!value)
                return 1;

            // log_set_quiet(0);
            log_fatal("KON %04x:", value);
            for (int i = 0; i < 24; i++) {
                if ((value & (1 << i))) {
                    spu->data[i].playing = 1;
                    spu->data[i].current_addr = spu->voice[i].adsaddr << 3;
                    spu->data[i].repeat_addr = spu->data[i].current_addr;
                    spu->data[i].lvol = (float)(spu->voice[i].volumel << 1) / (float)0x7fff;
                    spu->data[i].rvol = (float)(spu->voice[i].volumer << 1) / (float)0x7fff;
                    spu->data[i].adsr_sustain_level = ((spu->voice[i].envctl1 & 0xf) + 1) * 0x800;
                    spu->data[i].adsr_phase = 0;

                    log_fatal("    voice %2u s=%06x r=%06x p=%04x vol=%f,%f adsr=%04x,%04x cvol=%04x",
                        i,
                        spu->voice[i].adsaddr << 3,
                        spu->voice[i].adraddr << 3,
                        spu->voice[i].adsampr,
                        spu->data[i].lvol,
                        spu->data[i].rvol,
                        spu->voice[i].envctl1,
                        spu->voice[i].envctl2,
                        spu->voice[i].envcvol
                    );

                    spu_advance_adsr(spu, i);
                    spu_read_block(spu, i);
                }
            }
                    
            // log_set_quiet(1);
            spu->endx &= ~(value & 0x00ffffff);
        } return 1;

        case SPUR_KOFF: {
            // log_set_quiet(0);
            log_fatal("KOFF %04x:", value);
            for (int i = 0; i < 24; i++) {
                if ((value & (1 << i))) {
                    spu->data[i].adsr_phase = 3;
                    spu->data[i].playing = 0;

                    spu_advance_adsr(spu, i);

                    log_fatal("    voice %2u",
                        i,
                        spu->voice[i].adsaddr << 3,
                        spu->voice[i].adraddr << 3,
                        spu->voice[i].adsampr,
                        spu->data[i].lvol,
                        spu->data[i].rvol
                    );
                }
            }
            // log_set_quiet(1);

            //spu->endx |= value & 0x00ffffff;
        } return 1;

        case SPUR_TADDR: {
            spu->ramdta = value;
            spu->taddr = value << 3;

            // // log_set_quiet(0);
            // log_fatal("ramdta=%04x taddr=%08x", spu->ramdta, spu->taddr);
            // // log_set_quiet(1);
        } return 1;

        case SPUR_TFIFO: {
            // // log_set_quiet(0);
            // log_fatal("TFIFO write %04x (index=%u)", value, spu->tfifo_index);
            // // log_set_quiet(1);
            spu->ramdtf = value;
            spu->tfifo[spu->tfifo_index++] = value;

            if (spu->tfifo_index == 32) {
                if (((spu->spucnt >> 4) & 3) == 2) {
                    for (int i = 0; i < spu->tfifo_index; i++) {
                        spu->ram[spu->taddr++] = spu->tfifo[i] & 0xff;
                        spu->ram[spu->taddr++] = spu->tfifo[i] >> 8;
                    }

                    spu->tfifo_index = 0;
                }
            }
        } return 1;

        case SPUR_SPUCNT: {
            spu->spucnt = value;
            spu->spustat &= 0xffc0;
            spu->spustat |= value & 0x3f;

            if ((value >> 4) & 3) {
                for (int i = 0; i < spu->tfifo_index; i++) {
                    spu->ram[spu->taddr++] = spu->tfifo[i] & 0xff;
                    spu->ram[spu->taddr++] = spu->tfifo[i] >> 8;
                }
                    
                // // log_set_quiet(0);
                // log_fatal("Transfer start mode=%u size=%u", (value >> 4) & 3, spu->tfifo_index);
                // // log_set_quiet(1);

                spu->tfifo_index = 0;
            }
        } return 1;
    }

    return 0;
}

void psx_spu_write32(psx_spu_t* spu, uint32_t offset, uint32_t value) {
    // Handle special cases first
    if (spu_handle_write(spu, offset, value))
        return;

    const uint8_t* ptr = (uint8_t*)&spu->voice[0].volumel;

    *((uint32_t*)(ptr + offset)) = value;
}

void psx_spu_write16(psx_spu_t* spu, uint32_t offset, uint16_t value) {
    // Handle special cases first
    if (spu_handle_write(spu, offset, value))
        return;

    const uint8_t* ptr = (uint8_t*)&spu->voice[0].volumel;

    *((uint16_t*)(ptr + offset)) = value;
}

void psx_spu_write8(psx_spu_t* spu, uint32_t offset, uint8_t value) {
    log_fatal("Unhandled 8-bit SPU write at offset %08x (%02x)", offset, value);
}

void psx_spu_destroy(psx_spu_t* spu) {
    free(spu->ram);
    free(spu);
}

/*
  0-3   Shift  (0..12) (0=Loudest) (13..15=Reserved/Same as 9)
  4-5   Filter (0..3) (only four filters, unlike SPU-ADPCM which has five)
  6-7   Unused (should be 0)
*/

uint32_t psx_spu_get_sample(psx_spu_t* spu) {
    if (spu->endx == 0x00ffffff)
        return 0x0000;

    int voice_count = 0;
    int left = 0x0000;
    int right = 0x0000;

    for (int v = 0; v < 24; v++) {
        // if (spu->data[v].adsr_cycles) {
        //     --spu->data[v].adsr_cycles;

        //     if (!spu->data[v].adsr_cycles)
        //         spu_handle_adsr(spu, v);
        // }

        if (!spu->data[v].playing)
            continue;
        
        ++voice_count;

        // Shift 3 older samples around
        spu->data[v].s[3] = spu->data[v].s[2];
        spu->data[v].s[2] = spu->data[v].s[1];
        spu->data[v].s[1] = spu->data[v].s[0];

        uint32_t sample_index = spu->data[v].counter >> 12;

        if (sample_index >= 28) {
            sample_index -= 28;

            spu->data[v].counter &= 0xfff;
            spu->data[v].counter |= sample_index << 12;

            switch (spu->data[v].block_flags & 3) {
                case 0: case 2: {
                    spu->data[v].current_addr += 0x10;
                } break;

                case 1: {
                    spu->data[v].current_addr = spu->data[v].repeat_addr;
                    //spu->endx |= (1 << v);
                    spu->data[v].playing = 0;
                } break;

                case 3: {
                    spu->data[v].current_addr = spu->data[v].repeat_addr;
                } break;
            }

            if (spu->data[v].block_flags & 4)
                spu->data[v].repeat_addr = spu->data[v].current_addr;

            spu_read_block(spu, v);
        }

        // Fetch ADPCM sample
        spu->data[v].s[0] = spu->data[v].buf[sample_index];

        // Apply 4-point Gaussian interpolation
        uint8_t gauss_index = (spu->data[v].counter >> 4) & 0xff;
        int16_t g0 = g_spu_gauss_table[0x0ff - gauss_index];
        int16_t g1 = g_spu_gauss_table[0x1ff - gauss_index];
        int16_t g2 = g_spu_gauss_table[0x100 + gauss_index];
        int16_t g3 = g_spu_gauss_table[0x000 + gauss_index];
        int16_t out;

        out  = (g0 * spu->data[v].s[3]) >> 15;
        out += (g1 * spu->data[v].s[2]) >> 15;
        out += (g2 * spu->data[v].s[1]) >> 15;
        out += (g3 * spu->data[v].s[0]) >> 15;

        //float adsr_vol = (float)spu->voice[v].envcvol / 32767.0f;

        left += out * spu->data[v].lvol;
        right += out * spu->data[v].rvol;

        // left *= adsr_vol;
        // right *= adsr_vol;

        uint16_t step = spu->voice[v].adsampr;

        /* To-do: Do pitch modulation here */

        spu->data[v].counter += step;
    }

    if (!voice_count)
        return 0x00000000;

    uint16_t clampl = CLAMP(left, INT16_MIN, INT16_MAX);
    uint16_t clampr = CLAMP(right, INT16_MIN, INT16_MAX);

    return clampl | (((uint32_t)clampr) << 16);
}

#undef CLAMP
#undef MAX