#![allow(dead_code)] use memory::VMem; use mos6502::CPU; use core::intrinsics::transmute; pub trait Screen { fn put(&self, x: u8, y: u8, color: u8); fn render(&self); } #[repr(C, packed)] #[derive(Copy, Clone)] struct Sprite { y: u8, /* is the (actualy y) - 1 */ tile: u8, attr: u8, x: u8 } pub struct PPU<'a> { scanline: u16, /* registers */ ppuctl: u8, ppumask: u8, ppustatus: u8, oamaddr: u8, reg: u8, x: u8, /* fine x scroll */ v: u16, /* current vram addr */ t: u16, /* temporary vram addr */ w: bool, /* first/second write toggle */ cycle: u16, /* cycle in the current scanline */ /* rendering regs & latches */ /* background registers */ bg_pixel: u64, /* background latches */ bg_nt: u8, bg_attr: u8, bg_bit_low: u8, bg_bit_high: u8, /* sprites */ oam: [Sprite; 64], oam2: [usize; 8], sp_pixel: [u32; 8], sp_idx: [usize; 8], sp_cnt: [u8; 8], rendering: bool, buffered_read: u8, early_read: bool, /* IO */ mem: &'a VMem, scr: &'a Screen, } impl<'a> PPU<'a> { #[inline] pub fn write_ctl(&mut self, data: u8) { self.reg = data; self.ppuctl = data; self.t = (self.t & 0x73ff) | ((data as u16 & 3) << 10); } #[inline] pub fn write_mask(&mut self, data: u8) { self.reg = data; self.ppumask = data; } #[inline] pub fn read_status(&mut self) -> u8 { let res = (self.ppustatus & !0x1fu8) | (self.reg & 0x1f); self.ppustatus &= !PPU::FLAG_VBLANK; self.w = false; if self.scanline == 241 && self.cycle == 0 { self.early_read = true; } res } #[inline] pub fn write_oamaddr(&mut self, data: u8) { self.reg = data; self.oamaddr = data; } #[inline] pub fn write_oamdata(&mut self, data: u8) { self.reg = data; if self.rendering { return } unsafe { let oam_raw = transmute::<&mut[Sprite; 64], &mut[u8; 256]>(&mut self.oam); oam_raw[self.oamaddr as usize] = data; self.oamaddr = self.oamaddr.wrapping_add(1); } } #[inline] pub fn read_oamdata(&self) -> u8 { unsafe { let oam_raw = transmute::<&[Sprite; 64], &[u8; 256]>(&self.oam); oam_raw[self.oamaddr as usize] } } #[inline] pub fn write_scroll(&mut self, data: u8) { self.reg = data; let data = data as u16; match self.w { false => { self.t = (self.t & 0x7fe0) | (data >> 3); self.x = (data & 0x07) as u8; //assert!(self.x == 0); self.w = true; }, true => { self.t = (self.t & 0x0c1f) | ((data & 0xf8) << 2) | ((data & 0x07) << 12); self.w = false; } } } #[inline] pub fn write_addr(&mut self, data: u8) { self.reg = data; let data = data as u16; match self.w { false => { self.t = (self.t & 0x00ff) | ((data & 0x3f) << 8); self.w = true; }, true => { self.t = (self.t & 0xff00) | data; self.v = self.t; self.w = false; } } } #[inline] pub fn read_data(&mut self) -> u8 { let data = self.mem.read(self.v); let res = if self.v & 0x3fff < 0x3f00 { let prev = self.buffered_read; self.buffered_read = data; prev } else { self.buffered_read = self.mem.read(self.v - 0x1000); data }; self.v = self.v.wrapping_add(match self.get_vram_inc() { 0 => 1, _ => 32 }); res } #[inline] pub fn write_data(&mut self, data: u8) { self.reg = data; self.mem.write(self.v, data); self.v = self.v.wrapping_add(match self.get_vram_inc() { 0 => 1, _ => 32 }); } #[inline] pub fn write_oamdma(&mut self, data: u8, cpu: &mut CPU) { self.reg = data; let mut addr = (data as u16) << 8; unsafe { let oam_raw = transmute::<&mut[Sprite; 64], &mut[u8; 256]>(&mut self.oam); for _ in 0..0x100 { oam_raw[self.oamaddr as usize] = cpu.mem.read(addr); addr = addr.wrapping_add(1); self.oamaddr = self.oamaddr.wrapping_add(1); } } cpu.cycle += 1; cpu.cycle += cpu.cycle & 1; cpu.cycle += 512; } #[inline(always)] fn get_spritesize(&self) -> u8 {(self.ppuctl >> 5) & 1} #[inline(always)] fn get_flag_nmi(&self) -> bool { (self.ppuctl >> 7) == 1 } #[inline(always)] fn get_vram_inc(&self) -> u8 { (self.ppuctl >> 2) & 1} #[inline(always)] fn get_show_leftmost_bg(&self) -> bool { (self.ppumask >> 1) & 1 == 1} #[inline(always)] fn get_show_leftmost_sp(&self) -> bool { (self.ppumask >> 2) & 1 == 1} #[inline(always)] fn get_show_bg(&self) -> bool { (self.ppumask >> 3) & 1 == 1} #[inline(always)] fn get_show_sp(&self) -> bool { (self.ppumask >> 4) & 1 == 1} #[inline(always)] pub fn get_flag_vblank(&self) -> bool { (self.ppustatus >> 7) & 1 == 1 } const FLAG_OVERFLOW: u8 = 1 << 5; const FLAG_SPRITE_ZERO: u8 = 1 << 6; const FLAG_VBLANK: u8 = 1 << 7; #[inline(always)] fn fetch_nametable_byte(&mut self) { self.bg_nt = self.mem.read(0x2000 | (self.v & 0x0fff)); } #[inline(always)] fn fetch_attrtable_byte(&mut self) { let v = self.v; /* the byte representing 4x4 tiles */ let b = self.mem.read(0x23c0 | (v & 0x0c00) | ((v >> 4) & 0x38) | ((v >> 2) & 0x07)); self.bg_attr = (b >> ((v & 2) | ((v & 0x40) >> 4))) & 3; } #[inline(always)] fn fetch_low_bgtile_byte(&mut self) { /* 0x?000 */ self.bg_bit_low = self.mem.read(((self.ppuctl as u16 & 0x10) << 8) | /* 0x-??0 */ ((self.bg_nt as u16) << 4) | /* 0x---? (0 - 7) */ ((self.v >> 12) & 7) | 0x0); } #[inline(always)] fn fetch_high_bgtile_byte(&mut self) { /* 0x?000 */ self.bg_bit_high = self.mem.read(((self.ppuctl as u16 & 0x10) << 8) | /* 0x-??0 */ ((self.bg_nt as u16) << 4) | /* 0x---? (8 - f) */ ((self.v >> 12) & 7) | 0x8); } #[inline(always)] fn load_bgtile(&mut self) { /* load the tile bitmap to high 8 bits of bitmap, * assume the high 8 bits are zeros */ assert!(self.bg_pixel >> 32 == 0); let mut t: u64 = 0; let mut bl = self.bg_bit_low; let mut bh = self.bg_bit_high; for _ in 0..8 { t = (t << 4) | ((self.bg_attr << 2) | (bl & 1) | ((bh & 1) << 1)) as u64; bl >>= 1; bh >>= 1; } self.bg_pixel |= t << 32; } #[inline(always)] fn shift_sprites(&mut self) { for (i, c) in self.sp_cnt.iter_mut().enumerate() { if self.sp_idx[i] > 0xff { break } let c0 = *c; match c0 { 0 => self.sp_pixel[i] >>= 4, _ => *c = c0 - 1 } } } #[inline(always)] fn shift_bgtile(&mut self) { self.bg_pixel >>= 4; } #[inline(always)] fn wrapping_inc_cx(&mut self) { match self.v & 0x001f { 31 => { self.v &= !0x001fu16; /* reset coarse x */ self.v ^= 0x0400; /* switch horizontal nametable */ } _ => self.v += 1 } } #[inline(always)] fn wrapping_inc_y(&mut self) { match (self.v & 0x7000) == 0x7000 { false => self.v += 0x1000, /* fine y < 7 */ true => { self.v &= !0x7000u16; /* fine y <- 0 */ let y = match (self.v & 0x03e0) >> 5 { 29 => {self.v ^= 0x0800; 0}, /* at bottom of scanline */ 31 => 0, /* do not switch nt */ y => y + 1 }; self.v = (self.v & !0x03e0u16) | (y << 5); } } } #[inline(always)] fn reset_cx(&mut self) { self.v = (self.v & !0x041fu16) | (self.t & 0x041f); } #[inline(always)] fn reset_y(&mut self) { self.v = (self.v & !0x7be0u16) | (self.t & 0x7be0); } #[inline(always)] fn clear_sprite(&mut self) { if self.scanline == 261 { return } self.oam2 = [0x100; 8]; } fn eval_sprite(&mut self) { if self.scanline == 261 { return } /* we use scanline here because s.y is the (actual y) - 1 */ let mut nidx = 0; let mut n = 0; let scanline = self.scanline; let h = match self.get_spritesize() { 0 => 8, _ => 16 }; for (i, s) in self.oam.iter().enumerate() { let y = s.y as u16; if y <= scanline && scanline < y + h { self.oam2[nidx] = i; nidx += 1; if nidx == 8 { n = i + 1; break; } } } if nidx == 8 { let mut m = 0; unsafe { let oam_raw = transmute::<&[Sprite; 64], &[[u8; 4]; 64]>(&self.oam); while n < 64 { let y = oam_raw[n][m] as u16; if y <= scanline && scanline < y + h { self.ppustatus |= PPU::FLAG_OVERFLOW; /* set overflow */ } else { m = (m + 1) & 3; /* emulates hardware bug */ } n += 1; } } } } #[inline(always)] fn reverse_byte(mut x: u8) -> u8 { x = ((x & 0xaa) >> 1) | ((x & 0x55) << 1); x = ((x & 0xcc) >> 2) | ((x & 0x33) << 2); x = ((x & 0xf0) >> 4) | ((x & 0x0f) << 4); x } fn fetch_sprite(&mut self) { if self.scanline == 261 { return } /* we use scanline here because s.y is the (actual y) - 1 */ self.sp_idx = [0x100; 8]; for (i, v) in self.oam2.iter().enumerate() { let j = *v; if j > 0xff { break } let s = &self.oam[j]; let vflip = (s.attr & 0x80) == 0x80; let y0 = self.scanline - s.y as u16; let (ptable, tidx, y) = match self.get_spritesize() { 0 => { let y = if vflip {7 - y0 as u8} else {y0 as u8}; ((self.ppuctl as u16 & 0x08) << 9, s.tile, y) }, _ => { //assert!(false); let y = if vflip {15 - y0 as u8} else {y0 as u8}; ((s.tile as u16 & 1) << 12, (s.tile & !1u8) | (y >> 3), y & 0x7) } }; self.sp_idx[i] = j; self.sp_cnt[i] = s.x; let mut low = self.mem.read(ptable | ((tidx as u16) << 4) | 0x0 | y as u16); let mut high = self.mem.read(ptable | ((tidx as u16) << 4) | 0x8 | y as u16); if (s.attr & 0x40) == 0x40 { low = PPU::reverse_byte(low); high = PPU::reverse_byte(high); } let attr = s.attr & 3; let mut t = 0u32; for _ in 0..8 { t = (t << 4) | ((attr << 2) | ((high & 1) << 1) | (low & 1)) as u32; high >>= 1; low >>= 1; } self.sp_pixel[i] = t; } } fn render_pixel(&mut self) { let x = self.cycle - 1; let bg = ((self.bg_pixel >> (self.x << 2)) & 0xf) as u16; let bg_pidx = if x >= 8 || self.get_show_leftmost_bg() { if self.get_show_bg() {bg & 3} else {0} } else {0}; let mut sp_pidx = 0x0; let mut pri = 0x1; let mut sp = 0; let show_sp = self.get_show_sp(); if x >= 8 || self.get_show_leftmost_sp() { for i in 0..8 { if self.sp_idx[i] > 0xff { break } if self.sp_cnt[i] != 0 { continue; } /* not active */ let s = &self.oam[self.sp_idx[i]]; sp = if show_sp {(self.sp_pixel[i] & 0xf) as u16} else { 0 }; match sp & 3 { 0x0 => (), pidx => { if bg_pidx != 0 && self.sp_idx[i] == 0 && x != 0xff && s.y != 0xff { self.ppustatus |= PPU::FLAG_SPRITE_ZERO; /* set sprite zero hit */ } sp_pidx = pidx; pri = (s.attr >> 5) & 1; break; } } } } assert!(0 < self.cycle && self.cycle < 257); assert!(self.scanline < 240); self.scr.put((self.cycle - 1) as u8, self.scanline as u8, self.mem.read(if (pri == 0 || bg_pidx == 0) && sp_pidx != 0 { 0x3f10 | sp } else { 0x3f00 | match bg_pidx { 0 => 0, _ => bg } })); } pub fn new(mem: &'a VMem, scr: &'a Screen) -> Self { let ppuctl = 0x00; let ppumask = 0x00; let ppustatus = 0xa0; let oamaddr = 0x00; let w = false; let buffered_read = 0x00; let cycle = 370; let scanline = 240; PPU { scanline, ppuctl, ppumask, ppustatus, oamaddr, reg: 0, x: 0, v: 0, t: 0, w, cycle, bg_pixel: 0, bg_nt: 0, bg_attr: 0, bg_bit_low: 0, bg_bit_high: 0, oam: [Sprite{y: 0, tile: 0, attr: 0, x: 0}; 64], oam2: [0x100; 8], sp_idx: [0x100; 8], sp_pixel: [0; 8], sp_cnt: [0; 8], rendering: false, buffered_read, early_read: false, mem, scr } } pub fn reset(&mut self) { self.ppuctl = 0x00; self.ppumask = 0x00; self.ppustatus = self.ppustatus & 0x80; self.w = false; self.buffered_read = 0x00; self.cycle = 370; self.scanline = 240; } pub fn tick(&mut self) -> bool { let cycle = self.cycle; if cycle == 0 { self.cycle = cycle + 1; return false; } let visible_line = self.scanline < 240; let pre_render = self.scanline == 261; self.rendering = pre_render || visible_line; if pre_render && cycle == 1 { /* clear vblank, sprite zero hit & overflow */ self.ppustatus &= !(PPU::FLAG_VBLANK | PPU::FLAG_SPRITE_ZERO | PPU::FLAG_OVERFLOW); } else if self.rendering && (self.get_show_bg() || self.get_show_sp()) { if pre_render && 279 < cycle && cycle < 305 { self.reset_y(); } else { let visible_cycle = 0 < cycle && cycle < 257; /* 1..256 */ let fetch_cycle = visible_cycle || (320 < cycle && cycle < 337); if fetch_cycle { /* 1..256 and 321..336 */ match cycle & 0x7 { 1 => { self.load_bgtile(); self.fetch_nametable_byte(); }, 3 => self.fetch_attrtable_byte(), 5 => self.fetch_low_bgtile_byte(), 7 => self.fetch_high_bgtile_byte(), 0 => self.wrapping_inc_cx(), _ => () } match cycle { 1 => self.clear_sprite(), /* clear secondary OAM */ 65 => self.eval_sprite(), /* sprite evaluation */ 256 => self.wrapping_inc_y(), _ => () } if visible_line && visible_cycle { self.render_pixel(); self.shift_sprites(); } self.shift_bgtile(); } else if cycle > 336 { /* 337..340 */ if cycle & 1 == 1 { self.fetch_nametable_byte(); } } else if cycle == 257 { /* we don't emulate fetch to per cycle precision because all data are fetched * from the secondary OAM which is not subject to any change during this * scanline */ self.reset_cx(); self.fetch_sprite(); } } } else if self.scanline == 241 && cycle == 1 { self.scr.render(); if !self.early_read { self.ppustatus |= PPU::FLAG_VBLANK; } self.cycle += 1; self.early_read = false; return !self.early_read && self.get_flag_nmi(); /* trigger cpu's NMI */ } self.cycle += 1; if self.cycle > 340 { self.cycle = 0; self.scanline += 1; if self.scanline > 261 { self.scanline = 0; } } false } }