// This is all new to me so it's heavily commented so we can understand what is happening.
use bitflags::bitflags;

bitflags! {
    pub struct CpuFlags: u8 {
        // Represents whether the last operation caused a carry or borrow
        const CARRY = 0b00000001;
        // Set if the result of the last operation was zero
        const ZERO = 0b00000010;
        // Disables interrupts when set
        const INTERRUPT_DISABLE = 0b00000100;
        // Enables binary-coded decimal arithmetic
        const DECIMAL_MODE = 0b00001000;
        // Indicates the CPU is handling in interupt
        const BREAK = 0b00010000;
        // A duplicate "break" flag, as both bit 4 and 5 are set by the BRK instruction
        // Bit 5 is not explicitly used on NES
        const BREAK2 = 0b00100000;
        // Set if an arithmetic operation caused an overflow (adding two positive numbers results
        // in a negative value)
        const OVERFLOW = 0b01000000;
        // Indicates whether the result of the last operation was negative - determined by the MSB
        // of the result
        const NEGATIVE = 0b10000000;
    }
}

const STACK: u16 = 0x0100;
const STACK_RESET: u8 = 0xfd;

#[derive(Debug)]
#[allow(non_camel_case_types)]
// AddressingMode is a method used by a CPU to determine where the operand (data or memory
// location) for an instruction comes from. It basically defines how the CPU finds the data it
// needs to execute a given instruction.
//
// The zero page term refers to the first 256 bytes (from 0x0000 to 0x00FF). It's called zero page
// because the high page is always zero (e.g. 00XX). Instructions in this range use fewer bytes and
// cycles compared to acessing memory in other regions. This is due to the fact that only the low
// bytes need to be specified which makes the instruction shorter and faster.
pub enum AddressingMode {
    // Operand is provided directly as part of the instruction
    Immediate,
    //Operand is located in the zero page (memory address 0x00 to 0xFF)
    ZeroPage,
    // Operand is in the zero page, with an offet from the X register
    ZeroPage_X,
    // Operand is in the zero page, with an offet from the Y register
    ZeroPage_Y,
    // Operand is at the full 16-bit address (0x0000 to 0xFFFF)
    Absolute,
    // Operand is at an absolute address, with an offset from the X register
    Absolute_X,
    // Operand is at an absolute address, with an offset from the Y register
    Absolute_Y,
    // Operand is at an address stored in a zero-page address plus an X offset
    Indirect_X,
    // Operand is at an address stored in a zero-page address plus an Y offset
    Indirect_Y,
    // No addressing mode (used for instructions that don't require an operand like NOP)
    NoneAddressing,
}

pub struct CPU {
    // The accumulator register is a specific register used for arithmetic and logic operations.
    // The cpu instruction loads a value into the accumulator register and then updates certain
    // flags in the processor status register to relect the operation of the result.
    pub register_a: u8,
    // The Process Status Register is a collection of individual bits (flags) that represent the
    // current state of the CPU. Each bit has purpose such as if a calculation resulted in zero or
    // if the result is negative
    //
    // Zero flag:
    // - Bit 1 of the status register
    // - Set if register_a == 0, cleared otherwise
    //
    // Negative flag (N) - indicates whether the result of the most recent operation is negative
    // - Bit 7 of the status register (most significant bit is Bit 7 because it's zero based)
    // - Set if the most significant bit of register_a is 1, cleared otherwise
    pub status: CpuFlags,
    // track our current position in the program
    pub program_counter: u16,
    // most commonly used to hold counters or offsets for accessing memory. The value can be loaded
    // and saved in memory, compared with values held in memory or incremented and decremented.
    //
    // X register has one special function. It can be used to copy a stack pointer or change it's
    // value.
    pub register_x: u8,
    pub register_y: u8,
    // this creates an array with size of 0xFFFF and initializes all elements to 0 (see below in t
    // he new function). 0xFFFF is hexadecimal for 65535 in decimal. This defines the size of the
    // array with 65535 elements, the typical size for a 6502 CPU system.
    memory: [u8; 0xFFFF],
}

trait Mem {
    fn mem_read(&self, addr: u16) -> u8;

    fn mem_write(&mut self, addr: u16, data: u8);

    // combines two consecutives bytes in memory into a single 16 bit value
    fn mem_read_u16(&mut self, pos: u16) -> u16 {
        // read the low byte (pos)
        let lo = self.mem_read(pos) as u16;
        // read the high byte (pos + 1)
        let hi = self.mem_read(pos + 1) as u16;
        // combine the bytes. Shelf the high byte 8 bits to the left, effectively moving it into
        // the upper 8 bits of a 16-bit value. This will combine to a single 16 bit value.
        (hi << 8) | (lo as u16)
    }

    // split a 16-bit number into 2 8-bit pieces
    fn mem_write_u16(&mut self, pos: u16, data: u16) {
        // take the top half of the 16 bit number
        let hi = (data >> 8) as u8;
        // take the bottom half of the 16 bit number
        let lo = (data & 0xff) as u8;
        // store low byte in the first compartment of memory (pos)
        self.mem_write(pos, lo);
        // store the high byte in the next compartment (pos + 1)
        self.mem_write(pos + 1, hi)
    }
}

impl Mem for CPU {
    fn mem_read(&self, addr: u16) -> u8 {
        self.memory[addr as usize]
    }

    fn mem_write(&mut self, addr: u16, data: u8) {
        self.memory[addr as usize] = data;
    }
}

impl CPU {
    pub fn new() -> Self {
        CPU {
            register_a: 0,
            status: CpuFlags::from_bits_truncate(0b100100),
            program_counter: 0,
            register_x: 0,
            register_y: 0,
            memory: [0; 0xFFFF],
        }
    }

    /// Determines the memory address for the operand based on the specified addressing mode.
    ///
    /// # Arguments
    /// - `mode`: The addressing mode, which speicifies how the oeprand is accessed.
    ///
    /// # Returns
    /// - A 16 bit memory address where the operand can be found
    fn get_operand_address(&mut self, mode: &AddressingMode) -> u16 {
        match mode {
            // Immediate mode: The operand is part of the instruction itself, located at the
            // program counter
            AddressingMode::Immediate => self.program_counter,

            // ZeroPage mode: The operand is in the zero page (first 256 bytes of memory), with the
            // address specificed as a single byte at the program counter.
            AddressingMode::ZeroPage => self.mem_read(self.program_counter) as u16,

            // Absolute mode: The operand's address is a full 16-bit address, stored in two
            // consecutive bytes starting at the program counter
            AddressingMode::Absolute => self.mem_read_u16(self.program_counter),

            // ZeroPage_X mode: The operand is in the zero page, with it's address calculated by
            // adding the X register to a base address stored at the program counter
            AddressingMode::ZeroPage_X => {
                let pos = self.mem_read(self.program_counter);
                let addr = pos.wrapping_add(self.register_x) as u16;
                addr
            }

            // ZeroPage_Y mode: Similar to ZeroPage_X, but the address is calculated
            // using the Y register instead of the X register.
            AddressingMode::ZeroPage_Y => {
                let pos = self.mem_read(self.program_counter);
                let addr = pos.wrapping_add(self.register_y) as u16;
                addr
            }

            // Absolute_X mode: The operand's address is calculated by adding the X register
            // to a 16-bit base address stored at the program counter.
            AddressingMode::Absolute_X => {
                let base = self.mem_read_u16(self.program_counter);
                let addr = base.wrapping_add(self.register_x as u16);
                addr
            }

            // Absolute_Y mode: Similar to Absolute_X, but the address is calculated
            // by adding the Y register to the 16-bit base address.
            AddressingMode::Absolute_Y => {
                let base = self.mem_read_u16(self.program_counter);
                let addr = base.wrapping_add(self.register_x as u16);
                addr
            }

            // Indirect_X mode: The operand's address is calculated by first adding the X register
            // to a zero-page base address, then fetching the actual 16-bit address from
            // the zero page.
            AddressingMode::Indirect_X => {
                // read the single byte from the program counter. This is our base.
                let base = self.mem_read(self.program_counter);
                // Take the base and add the value in the X register. If the result goes passed
                // 0xFF, it wraps back around to 0x00 (like starting over in a circle). This is
                // essentially behaving like a ring buffer. Using wrapping_add ensures the
                // calculation stays within the valid range without requiring additional checks
                let ptr: u8 = (base as u8).wrapping_add(self.register_x);
                // Read the low byte of the memory address from memory at ptr. The goal here is
                // to fetch the 16 byte address from the zero page using the pointer.
                let lo = self.mem_read(ptr as u16);
                // read the high byte of the memory address from memory at ptr + 1
                let hi = self.mem_read(ptr.wrapping_add(1) as u16);
                // take the high byte and shift it left by 8 bits to place it in the upper half of
                // the 16 bit value. Then take the low byte and keep it in the lower half of the 16
                // bit value. Combine the two values using the bitwise OR (|) operator to form a
                // full 16 bit value.
                (hi as u16) << 8 | (lo as u16)
            }

            // Indirect_Y mode: The operand's address is calculated by first fetching a 16-bit address
            // from a zero-page base address, then adding the Y register to it.
            AddressingMode::Indirect_Y => {
                // read from the program counter (an 8 bit value). This pointer specifies a zero
                // page address where the actual 16 bit address is stored.
                let base = self.mem_read(self.program_counter);
                // read the low byte of the final address from the zero page address specificed by
                // `base`
                let lo = self.mem_read(base as u16);
                // read the high byte of the final address from the next consecutive zero-page
                // address (base +1). wrapping_add(1) ensures that if base = 0xFF, it wraps around
                // the 0x00
                let hi = self.mem_read((base as u8).wrapping_add(1) as u16);
                // Combine the low and high bytes into a 16 bit address
                let deref_base = (hi as u16) << 8 | (lo as u16);
                // Add the Y Registered to the dereferenced address
                let deref = deref_base.wrapping_add(self.register_y as u16);
                // Return the final address
                deref
            }

            // NoneAddressing: This mode is used for instructions that don't require an operand
            // or don't involve memory access.
            AddressingMode::NoneAddressing => {
                panic!("mode {:?} is not supported", mode);
            }
        }
    }

    /// Road the program, reset the state of the cpu and then run the program.
    pub fn load_and_run(&mut self, program: Vec<u8>) {
        self.load(program);
        self.reset();
        self.run();
    }

    /// Reset the state of the CPU
    pub fn reset(&mut self) {
        self.register_a = 0;
        self.register_x = 0;
        self.status = CpuFlags::from_bits_truncate(0b100100);

        self.program_counter = self.mem_read_u16(0xFFFC);
    }

    /// Load the program code into memroy starting at address 0x8000. 0x8000 .. 0xFFFF is reserved
    /// from program ROM and we can assume that the instructions should start somewhere here.
    pub fn load(&mut self, program: Vec<u8>) {
        self.memory[0x8000..(0x8000 + program.len())].copy_from_slice(&program[..]);
        self.mem_write_u16(0xFFFC, 0x8000);
    }

    /// LDA stands for Load Accumulator. It loads a value into the accumulator register. It affects
    /// the Zero Flag and Negative Flag.
    fn lda(&mut self, mode: &AddressingMode) {
        let addr = self.get_operand_address(mode);
        let value = self.mem_read(addr);

        self.register_a = value;
        self.update_zero_and_negative_flags(self.register_a);
    }

    /// TAX instruction copies the value from teh accumulator register (register_a) into the x
    /// register. The way this works is that the CPU takes the current value in the A register,
    /// copies it to the X register, updates the Zero Flag and Negative Flag in the status register.
    ///
    /// The Zero Flag is set if the value is copied to the X register is 0
    /// The Negative Flag is set if the most significant bit of the vlaue (Bit 7) is 1
    ///
    /// In the TAX instruction, we don't need any arguments because it always stransfers data from A
    /// to X.
    fn tax(&mut self) {
        self.register_x = self.register_a;
        self.update_zero_and_negative_flags(self.register_x);
    }

    /// STA stands for Store Accumulator. This instruction takes the value in the accumulator
    /// register (register_a) and stores it in a specified memory location.
    ///
    /// How this works is that the CPU reads the value currently in the accumulator (register_a)
    /// The CPu then writes this value to the specified memory address.
    fn sta(&mut self, mode: &AddressingMode) {
        let addr = self.get_operand_address(mode);
        self.mem_write(addr, self.register_a);
    }

    /// Perform a bitwise AND operation betwen the value in register_a and a value fetched from
    /// memory (determined by the addressing mode)
    ///
    /// The result is stored back in register_a. This is useful for isolating specific bits in the
    /// accumulator.
    fn and(&mut self, mode: &AddressingMode) {
        let addr = self.get_operand_address(mode);
        let data = self.mem_read(addr);

        self.set_register_a(data & self.register_a);
    }

    /// This is used to update the status register flags based on the operation. It updates the Zero
    /// Flag and the Negative Flag.
    ///
    /// This will ensure that the CPU's status register reflects whether the result is zerl (update
    /// the Zero Flag) and if the result is negative (update the Negative Flag)
    fn update_zero_and_negative_flags(&mut self, result: u8) {
        if result == 0 {
            self.status.insert(CpuFlags::ZERO)
        } else {
            self.status.remove(CpuFlags::ZERO);
        }

        if result & 0b1000_000 != 0 {
            self.status.insert(CpuFlags::NEGATIVE)
        } else {
            self.status.remove(CpuFlags::NEGATIVE);
        }
    }

    /// INX stands for Increment Index Register X - increase the value of the X register
    /// by one and update specific processor flags based on the result.
    fn inx(&mut self) {
        self.register_x = self.register_x.wrapping_add(1);
        self.update_zero_and_negative_flags(self.register_x);
    }

    /// Simulate the ADC (Add with Carry) instruction. It adds a value (data) to the accumulator
    /// register (register_a), optionally including the carry flag and updates the status falgs
    /// accordingly.
    fn add_to_register_a(&mut self, data: u8) {
        // Add register_a, data and carry flag togehter. All values are cast to u16 to prevent
        // overflow during the calculation (since the result might exceed 8 bits).
        let sum = self.register_a as u16
            + data as u16
            + (if self.status.contains(CpuFlags::CARRY) {
                1
            } else {
                0
            }) as u16;

        let carry = sum > 0xff;

        // the carry flag is set if the result exceeds 255 (0xFF), meaning the additon produced a
        // value that requires more than 8 bits to store.
        if carry {
            // this happens if the sum = 0x101
            self.status.insert(CpuFlags::CARRY);
        } else {
            // this happens if sum = 0xFE
            self.status.remove(CpuFlags::CARRY);
        }

        // reduce the sum down to a u8 which will discord any overflow beyond 8 bits
        let result = sum as u8;

        // update the overflow flag to be set if there is a signed arithmetic overflow.
        // A signed arithmetic overflow occurs when adding two signed numbers produces a result
        // that is outside th range of a signed 8-bit value (-128 to 127)
        //
        // `data ^ result` checks if the sign of data is different from the sign of result
        // `result ^ self.register_a` checks if the sign of result is different from the sign of
        // register_a.
        // `& 0x80` isolates the most significant bit whcih indicates the sign in signed arithmetic.
        if (data ^ result) & (result ^ self.register_a) & 0x80 != 0 {
            self.status.insert(CpuFlags::OVERFLOW)
        } else {
            self.status.remove(CpuFlags::OVERFLOW);
        }

        // store the final 8-bit result back in the accumulator
        self.set_register_a(result);
    }

    /// This will set the value of the A register (register_A)
    fn set_register_a(&mut self, value: u8) {
        self.register_a = value;
        self.update_zero_and_negative_flags(self.register_a);
    }

    /// SBC stands for Subtract with Borrow. It is the counter to ADC (Add with Carry) instruction
    /// and performs subtraction while considering the Carry Flag. This works with unsigned binary
    /// numbers or two's complement signed numbers.
    ///
    /// The Carry flag represents the absence of a borrow.
    /// The Overflow flag is set if the result goes outside the range of a signed 8-bit value
    /// The Negative flag and Zero flag are updated based on the result
    fn sbc(&mut self, mode: &AddressingMode) {
        let addr = self.get_operand_address(mode);
        let data = self.mem_read(addr);
        self.add_to_register_a(((data as i8).wrapping_neg().wrapping_sub(1)) as u8);
    }

    /// ADC stands for Add with Carry
    fn adc(&mut self, mode: &AddressingMode) {
        let addr = self.get_operand_address(mode);
        let value = self.mem_read(addr);
        self.add_to_register_a(value);
    }

    // The interpret method takes in mutalbe reference to self as we know we will need to modify
    // register_a during execution
    //
    // - Fetch next instruction from instruction memory
    // - Decode instruction
    // - Execute the instruction
    // - Repeat
    pub fn run(&mut self) {
        // We need an infinite loop to continuously fetch instructions from the program array. We
        // use the program_counter to keep track fo the current instruction.
        loop {
            // set the opscode to the current byte in the program at the address indicated by
            // program counter
            let opscode = self.mem_read(self.program_counter);
            // we increment program counterto point to the next byte
            self.program_counter += 1;

            match opscode {
                // This will implement LDA (0xA9) opcode. 0xA9 is the LDA Immediate instruction in
                // the 6502 CPU.
                //
                // 0x42 tells the CPU to execute a specific operation: LDA Immediate. An opscode is
                // a command for the CPU, instructing it what to do next. Essentially, this means
                // "Load the immediate value from the next memory location into the accumulator"
                //
                // Immediate value refers to the constant value that is directly embedded in the
                // instruction itself, rather than being fetched from memory or calculated
                // directly.
                0xA9 | 0xa5 | 0xb4 | 0xad | 0xbd | 0xb9 | 0xa1 | 0xb1 => {
                    self.lda(&AddressingMode::Immediate);
                    self.program_counter += 1;
                }
                0xA5 => {
                    self.lda(&AddressingMode::ZeroPage);
                    self.program_counter += 1;
                }
                0xAD => {
                    self.lda(&AddressingMode::Absolute);
                    self.program_counter += 2;
                }
                0x85 => {
                    self.sta(&AddressingMode::ZeroPage);
                    self.program_counter += 1;
                }
                0x95 => {
                    self.sta(&AddressingMode::ZeroPage);
                    self.program_counter += 1;
                }
                // implement the 0xAA opcode which corresponds to the TAX (transfer acculumater to
                // X register)
                0xAA => self.tax(),
                // INX stands for Increment Index Register X - increase the value of the X register
                // by one and update specific processor flags based on the result.
                0xe8 => self.inx(),
                0x00 => return,
                _ => todo!(),
            }
        }
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn test_lda_sets_register_a() {
        let mut cpu = CPU::new();
        cpu.load_and_run(vec![0xa9, 0x05, 0x00]);
        assert_eq!(cpu.register_a, 0x05);
        assert!(cpu.status & 0b0000_0010 == 0b00);
        assert!(cpu.status & 0b1000_0000 == 0);
    }

    #[test]
    fn test_0xa9_lda_zero_flag() {
        let mut cpu = CPU::new();
        cpu.load_and_run(vec![0xa9, 0x00, 0x00]);
        assert!(cpu.status & 0b0000_0010 == 0b10);
    }

    #[test]
    fn test_0xaa_tax_move_to_a_to_x() {
        let mut cpu = CPU::new();
        cpu.load_and_run(vec![0xa9, 0x0A, 0xaa, 0x00]);

        assert_eq!(cpu.register_x, 10)
    }

    #[test]
    fn test_5_ops_working_together() {
        let mut cpu = CPU::new();
        cpu.load_and_run(vec![0xa9, 0xc0, 0xaa, 0xe8, 0x00]);

        assert_eq!(cpu.register_x, 0xc1)
    }

    #[test]
    fn test_inx_overflow() {
        let mut cpu = CPU::new();
        cpu.load_and_run(vec![0xa9, 0xff, 0xaa, 0xe8, 0xe8, 0x00]);

        assert_eq!(cpu.register_x, 1)
    }
}