/*
 * This Source Code Form is subject to the terms of the Mozilla Public
 * License, v. 2.0. If a copy of the MPL was not distributed with this file, 
 * You can obtain one at http://mozilla.org/MPL/2.0/.
 *
 * Copyright (c) 2014-2015, Normmatt
 *
 * Alternatively, the contents of this file may be used under the terms
 * of the GNU General Public License Version 2, as described below:
 *
 * This file is free software: you may copy, redistribute and/or modify
 * it under the terms of the GNU General Public License as published by the
 * Free Software Foundation, either version 2 of the License, or (at your
 * option) any later version.
 *
 * This file is distributed in the hope that it will be useful, but
 * WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General
 * Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program. If not, see http://www.gnu.org/licenses/.
 */

#include "sdmmc.h"
#include "delay.h"

static struct mmcdevice handleNAND;
static struct mmcdevice handleSD;

static inline u16 sdmmc_read16(u16 reg)
{
    return *(vu16 *)(SDMMC_BASE + reg);
}

static inline void sdmmc_write16(u16 reg, u16 val)
{
    *(vu16 *)(SDMMC_BASE + reg) = val;
}

static inline u32 sdmmc_read32(u16 reg)
{
    return *(vu32 *)(SDMMC_BASE + reg);
}

static inline void sdmmc_write32(u16 reg, u32 val)
{
    *(vu32 *)(SDMMC_BASE + reg) = val;
}

static inline void sdmmc_mask16(u16 reg, const u16 clear, const u16 set)
{
    u16 val = sdmmc_read16(reg);
    val &= ~clear;
    val |= set;
    sdmmc_write16(reg, val);
}

static inline void setckl(u32 data)
{
    sdmmc_mask16(REG_SDCLKCTL, 0x100, 0);
    sdmmc_mask16(REG_SDCLKCTL, 0x2FF, data & 0x2FF);
    sdmmc_mask16(REG_SDCLKCTL, 0x0, 0x100);
}

mmcdevice *getMMCDevice(int drive)
{
    if(drive == 0) return &handleNAND;
    return &handleSD;
}

static int geterror(struct mmcdevice *ctx)
{
    return (int)((ctx->error << 29) >> 31);
}

static void inittarget(struct mmcdevice *ctx)
{
    sdmmc_mask16(REG_SDPORTSEL, 0x3, (u16)ctx->devicenumber);
    setckl(ctx->clk);
    if(ctx->SDOPT == 0) sdmmc_mask16(REG_SDOPT, 0, 0x8000);
    else sdmmc_mask16(REG_SDOPT, 0x8000, 0);
}

static void __attribute__((noinline)) sdmmc_send_command(struct mmcdevice *ctx, u32 cmd, u32 args)
{
    u32 getSDRESP = (cmd << 15) >> 31;
    u16 flags = (cmd << 15) >> 31;
    const int readdata = cmd & 0x20000;
    const int writedata = cmd & 0x40000;

    if(readdata || writedata)
        flags |= TMIO_STAT0_DATAEND;

    ctx->error = 0;
    while((sdmmc_read16(REG_SDSTATUS1) & TMIO_STAT1_CMD_BUSY)); //mmc working?
    sdmmc_write16(REG_SDIRMASK0, 0);
    sdmmc_write16(REG_SDIRMASK1, 0);
    sdmmc_write16(REG_SDSTATUS0, 0);
    sdmmc_write16(REG_SDSTATUS1, 0);
    sdmmc_mask16(REG_DATACTL32, 0x1800, 0);
    sdmmc_write16(REG_SDCMDARG0, args & 0xFFFF);
    sdmmc_write16(REG_SDCMDARG1, args >> 16);
    sdmmc_write16(REG_SDCMD, cmd & 0xFFFF);

    u32 size = ctx->size;
    u8 *rDataPtr = ctx->rData;
    const u8 *tDataPtr = ctx->tData;

    bool rUseBuf = rDataPtr != NULL;
    bool tUseBuf = tDataPtr != NULL;

    u16 status0 = 0;
    while(true)
    {
        vu16 status1 = sdmmc_read16(REG_SDSTATUS1);
        vu16 ctl32 = sdmmc_read16(REG_DATACTL32);
        if((ctl32 & 0x100))
        {
            if(readdata)
            {
                if(rUseBuf)
                {
                    sdmmc_mask16(REG_SDSTATUS1, TMIO_STAT1_RXRDY, 0);
                    if(size > 0x1FF)
                    {
                        //Gabriel Marcano: This implementation doesn't assume alignment.
                        //I've removed the alignment check doen with former rUseBuf32 as a result
                        for(int i = 0; i < 0x200; i += 4)
                        {
                            u32 data = sdmmc_read32(REG_SDFIFO32);
                            *rDataPtr++ = data;
                            *rDataPtr++ = data >> 8;
                            *rDataPtr++ = data >> 16;
                            *rDataPtr++ = data >> 24;
                        }
                        size -= 0x200;
                    }
                }

                sdmmc_mask16(REG_DATACTL32, 0x800, 0);
            }
        }
        if(!(ctl32 & 0x200))
        {
            if(writedata)
            {
                if(tUseBuf)
                {
                    sdmmc_mask16(REG_SDSTATUS1, TMIO_STAT1_TXRQ, 0);
                    if(size > 0x1FF)
                    {
                        for(int i = 0; i < 0x200; i += 4)
                        {
                            u32 data = *tDataPtr++;
                            data |= (u32)*tDataPtr++ << 8;
                            data |= (u32)*tDataPtr++ << 16;
                            data |= (u32)*tDataPtr++ << 24;
                            sdmmc_write32(REG_SDFIFO32, data);
                        }
                        size -= 0x200;
                    }
                }

                sdmmc_mask16(REG_DATACTL32, 0x1000, 0);
            }
        }
        if(status1 & TMIO_MASK_GW)
        {
            ctx->error |= 4;
            break;
        }

        if(!(status1 & TMIO_STAT1_CMD_BUSY))
        {
            status0 = sdmmc_read16(REG_SDSTATUS0);
            if(sdmmc_read16(REG_SDSTATUS0) & TMIO_STAT0_CMDRESPEND)
            {
                ctx->error |= 0x1;
            }
            if(status0 & TMIO_STAT0_DATAEND)
            {
                ctx->error |= 0x2;
            }

            if((status0 & flags) == flags)
                break;
        }
    }
    ctx->stat0 = sdmmc_read16(REG_SDSTATUS0);
    ctx->stat1 = sdmmc_read16(REG_SDSTATUS1);
    sdmmc_write16(REG_SDSTATUS0, 0);
    sdmmc_write16(REG_SDSTATUS1, 0);

    if(getSDRESP != 0)
    {
        ctx->ret[0] = (u32)(sdmmc_read16(REG_SDRESP0) | (sdmmc_read16(REG_SDRESP1) << 16));
        ctx->ret[1] = (u32)(sdmmc_read16(REG_SDRESP2) | (sdmmc_read16(REG_SDRESP3) << 16));
        ctx->ret[2] = (u32)(sdmmc_read16(REG_SDRESP4) | (sdmmc_read16(REG_SDRESP5) << 16));
        ctx->ret[3] = (u32)(sdmmc_read16(REG_SDRESP6) | (sdmmc_read16(REG_SDRESP7) << 16));
    }
}

int __attribute__((noinline)) sdmmc_sdcard_writesectors(u32 sector_no, u32 numsectors, const u8 *in)
{
    if(handleSD.isSDHC == 0) sector_no <<= 9;
    inittarget(&handleSD);
    sdmmc_write16(REG_SDSTOP, 0x100);
    sdmmc_write16(REG_SDBLKCOUNT32, numsectors);
    sdmmc_write16(REG_SDBLKLEN32, 0x200);
    sdmmc_write16(REG_SDBLKCOUNT, numsectors);
    handleSD.tData = in;
    handleSD.size = numsectors << 9;
    sdmmc_send_command(&handleSD, 0x52C19, sector_no);
    return geterror(&handleSD);
}

int __attribute__((noinline)) sdmmc_sdcard_readsectors(u32 sector_no, u32 numsectors, u8 *out)
{
    if(handleSD.isSDHC == 0) sector_no <<= 9;
    inittarget(&handleSD);
    sdmmc_write16(REG_SDSTOP, 0x100);
    sdmmc_write16(REG_SDBLKCOUNT32, numsectors);
    sdmmc_write16(REG_SDBLKLEN32, 0x200);
    sdmmc_write16(REG_SDBLKCOUNT, numsectors);
    handleSD.rData = out;
    handleSD.size = numsectors << 9;
    sdmmc_send_command(&handleSD, 0x33C12, sector_no);
    return geterror(&handleSD);
}

int __attribute__((noinline)) sdmmc_nand_readsectors(u32 sector_no, u32 numsectors, u8 *out)
{
    if(handleNAND.isSDHC == 0) sector_no <<= 9;
    inittarget(&handleNAND);
    sdmmc_write16(REG_SDSTOP, 0x100);
    sdmmc_write16(REG_SDBLKCOUNT32, numsectors);
    sdmmc_write16(REG_SDBLKLEN32, 0x200);
    sdmmc_write16(REG_SDBLKCOUNT, numsectors);
    handleNAND.rData = out;
    handleNAND.size = numsectors << 9;
    sdmmc_send_command(&handleNAND, 0x33C12, sector_no);
    inittarget(&handleSD);
    return geterror(&handleNAND);
}

int __attribute__((noinline)) sdmmc_nand_writesectors(u32 sector_no, u32 numsectors, const u8 *in) //experimental
{
    if(handleNAND.isSDHC == 0) sector_no <<= 9;
    inittarget(&handleNAND);
    sdmmc_write16(REG_SDSTOP, 0x100);
    sdmmc_write16(REG_SDBLKCOUNT32, numsectors);
    sdmmc_write16(REG_SDBLKLEN32, 0x200);
    sdmmc_write16(REG_SDBLKCOUNT, numsectors);
    handleNAND.tData = in;
    handleNAND.size = numsectors << 9;
    sdmmc_send_command(&handleNAND, 0x52C19, sector_no);
    inittarget(&handleSD);
    return geterror(&handleNAND);
}

static u32 calcSDSize(u8 *csd, int type)
{
    u32 result = 0;
    if(type == -1) type = csd[14] >> 6;
    switch(type)
    {
        case 0:
        {
            u32 block_len = csd[9] & 0xF;
            block_len = 1u << block_len;
            u32 mult = (u32)((csd[4] >> 7) | ((csd[5] & 3) << 1));
            mult = 1u << (mult + 2);
            result = csd[8] & 3;
            result = (result << 8) | csd[7];
            result = (result << 2) | (csd[6] >> 6);
            result = (result + 1) * mult * block_len / 512;
            break;
        }
        case 1:
            result = csd[7] & 0x3F;
            result = (result << 8) | csd[6];
            result = (result << 8) | csd[5];
            result = (result + 1) * 1024;
            break;
        default:
            break; //Do nothing otherwise FIXME perhaps return some error?
    }
    return result;
}

static void InitSD()
{
    *(vu32 *)0x10000020 = 0; //InitFS stuff
    *(vu32 *)0x10000020 = 0x200; //InitFS stuff
    *(vu16 *)0x10006100 &= 0xF7FFu; //SDDATACTL32
    *(vu16 *)0x10006100 &= 0xEFFFu; //SDDATACTL32
    *(vu16 *)0x10006100 |= 0x402u; //SDDATACTL32
    *(vu16 *)0x100060D8 = (*(vu16 *)0x100060D8 & 0xFFDD) | 2;
    *(vu16 *)0x10006100 &= 0xFFFFu; //SDDATACTL32
    *(vu16 *)0x100060D8 &= 0xFFDFu; //SDDATACTL
    *(vu16 *)0x10006104 = 512; //SDBLKLEN32
    *(vu16 *)0x10006108 = 1; //SDBLKCOUNT32
    *(vu16 *)0x100060E0 &= 0xFFFEu; //SDRESET
    *(vu16 *)0x100060E0 |= 1u; //SDRESET
    *(vu16 *)0x10006020 |= TMIO_MASK_ALL; //SDIR_MASK0
    *(vu16 *)0x10006022 |= TMIO_MASK_ALL>>16; //SDIR_MASK1
    *(vu16 *)0x100060FC |= 0xDBu; //SDCTL_RESERVED7
    *(vu16 *)0x100060FE |= 0xDBu; //SDCTL_RESERVED8
    *(vu16 *)0x10006002 &= 0xFFFCu; //SDPORTSEL
    *(vu16 *)0x10006024 = 0x20;
    *(vu16 *)0x10006028 = 0x40EE;
    *(vu16 *)0x10006002 &= 0xFFFCu; ////SDPORTSEL
    *(vu16 *)0x10006026 = 512; //SDBLKLEN
    *(vu16 *)0x10006008 = 0; //SDSTOP
}

static int Nand_Init()
{
    //NAND
    handleNAND.isSDHC = 0;
    handleNAND.SDOPT = 0;
    handleNAND.res = 0;
    handleNAND.initarg = 1;
    handleNAND.clk = 0x80;
    handleNAND.devicenumber = 1;

    inittarget(&handleNAND);
    waitcycles(0xF000);

    sdmmc_send_command(&handleNAND, 0, 0);

    do
    {
        do
        {
            sdmmc_send_command(&handleNAND, 0x10701, 0x100000);
        }
        while(!(handleNAND.error & 1));
    }
    while((handleNAND.ret[0] & 0x80000000) == 0);

    sdmmc_send_command(&handleNAND, 0x10602, 0x0);
    if((handleNAND.error & 0x4)) return -1;

    sdmmc_send_command(&handleNAND, 0x10403, handleNAND.initarg << 0x10);
    if((handleNAND.error & 0x4)) return -1;

    sdmmc_send_command(&handleNAND, 0x10609, handleNAND.initarg << 0x10);
    if((handleNAND.error & 0x4)) return -1;

    handleNAND.total_size = calcSDSize((u8*)&handleNAND.ret[0], 0);
    handleNAND.clk = 1;
    setckl(1);

    sdmmc_send_command(&handleNAND, 0x10407, handleNAND.initarg << 0x10);
    if((handleNAND.error & 0x4)) return -1;

    handleNAND.SDOPT = 1;

    sdmmc_send_command(&handleNAND, 0x10506, 0x3B70100);
    if((handleNAND.error & 0x4)) return -1;

    sdmmc_send_command(&handleNAND, 0x10506, 0x3B90100);
    if((handleNAND.error & 0x4)) return -1;

    sdmmc_send_command(&handleNAND, 0x1040D, handleNAND.initarg << 0x10);
    if((handleNAND.error & 0x4)) return -1;

    sdmmc_send_command(&handleNAND, 0x10410, 0x200);
    if((handleNAND.error & 0x4)) return -1;

    handleNAND.clk |= 0x200;

    inittarget(&handleSD);

    return 0;
}

static int SD_Init()
{
    //SD
    handleSD.isSDHC = 0;
    handleSD.SDOPT = 0;
    handleSD.res = 0;
    handleSD.initarg = 0;
    handleSD.clk = 0x80;
    handleSD.devicenumber = 0;

    inittarget(&handleSD);

    waitcycles(1u << 22); //Card needs a little bit of time to be detected, it seems FIXME test again to see what a good number is for the delay

    //If not inserted
    if(!(*((vu16 *)(SDMMC_BASE + REG_SDSTATUS0)) & TMIO_STAT0_SIGSTATE)) return 5;

    sdmmc_send_command(&handleSD, 0, 0);
    sdmmc_send_command(&handleSD, 0x10408, 0x1AA);
    u32 temp = (handleSD.error & 0x1) << 0x1E;

    u32 temp2 = 0;
    do
    {
        do
        {
            sdmmc_send_command(&handleSD, 0x10437, handleSD.initarg << 0x10);
            sdmmc_send_command(&handleSD, 0x10769, 0x00FF8000 | temp);
            temp2 = 1;
        }
        while(!(handleSD.error & 1));
    }
    while((handleSD.ret[0] & 0x80000000) == 0);

    if(!((handleSD.ret[0] >> 30) & 1) || !temp)
        temp2 = 0;

    handleSD.isSDHC = temp2;

    sdmmc_send_command(&handleSD, 0x10602, 0);
    if((handleSD.error & 0x4)) return -1;

    sdmmc_send_command(&handleSD, 0x10403, 0);
    if((handleSD.error & 0x4)) return -2;
    handleSD.initarg = handleSD.ret[0] >> 0x10;

    sdmmc_send_command(&handleSD, 0x10609, handleSD.initarg << 0x10);
    if((handleSD.error & 0x4)) return -3;

    handleSD.total_size = calcSDSize((u8*)&handleSD.ret[0], -1);
    handleSD.clk = 1;
    setckl(1);

    sdmmc_send_command(&handleSD, 0x10507, handleSD.initarg << 0x10);
    if((handleSD.error & 0x4)) return -4;

    sdmmc_send_command(&handleSD, 0x10437, handleSD.initarg << 0x10);
    if((handleSD.error & 0x4)) return -5;

    handleSD.SDOPT = 1;
    sdmmc_send_command(&handleSD, 0x10446, 0x2);
    if((handleSD.error & 0x4)) return -6;

    sdmmc_send_command(&handleSD, 0x1040D, handleSD.initarg << 0x10);
    if((handleSD.error & 0x4)) return -7;

    sdmmc_send_command(&handleSD, 0x10410, 0x200);
    if((handleSD.error & 0x4)) return -8;
    handleSD.clk |= 0x200;

    return 0;
}

void sdmmc_get_cid(bool isNand, u32 *info)
{
    struct mmcdevice *device = isNand ? &handleNAND : &handleSD;

    inittarget(device);

    // use cmd7 to put sd card in standby mode
    // CMD7
    sdmmc_send_command(device, 0x10507, 0);

    // get sd card info
    // use cmd10 to read CID
    sdmmc_send_command(device, 0x1060A, device->initarg << 0x10);

    for(int i = 0; i < 4; ++i)
        info[i] = device->ret[i];

    // put sd card back to transfer mode
    // CMD7
    sdmmc_send_command(device, 0x10507, device->initarg << 0x10);
}

u32 sdmmc_sdcard_init()
{
    u32 ret = 0;
    InitSD();
    if(Nand_Init() != 0) ret |= 1;
    if(SD_Init() != 0) ret |= 2;
    return ret;
}