use crate::std::*;
pub const CORE_MAX_ADDR_BITS: usize = 40;
pub const MESH_ROWS: usize = 16;
pub const MESH_COLS: usize = 16;
pub const TILE_ROWS: usize = 1;
pub const TILE_COLS: usize = 1;
pub const BLOCK_SIZE: usize = MESH_ROWS * TILE_ROWS;
pub const SP_BANKS: usize = 4;
pub const ACC_BANKS: usize = 2;
pub const RS_ENTRIES_LD: usize = 8;
pub const RS_ENTRIES_ST: usize = 4;
pub const RS_ENTRIES_EX: usize = 16;
pub const DMA_MAX_BYTES: usize = 64;
pub const SP_WIDTH: usize = MESH_COLS * TILE_COLS * 8;
pub const SP_BANK_ENTRIES: usize = 256 * 1024 * 8 / (SP_BANKS * SP_WIDTH);
pub const ACC_BANK_ENTRIES: usize = 64 * 1024 * 8 / (ACC_BANKS * MESH_COLS * TILE_COLS * 32);
pub const MVIN_SCALE_BITS: usize = 32;
pub const ACC_SCALE_BITS: usize = 32;
pub const MVIN_COLS_BITS: usize = clog2(max(DMA_MAX_BYTES, MESH_COLS * TILE_COLS) + 1);
pub const MVIN_ROWS_BITS: usize = clog2(MESH_ROWS * TILE_ROWS + 1);
pub const MVOUT_COLS_BITS: usize = clog2(max(DMA_MAX_BYTES, MESH_COLS * TILE_COLS) + 1);
pub const MVOUT_ROWS_BITS: usize = clog2(MESH_ROWS * TILE_ROWS + 1);
pub const LOAD_STATES: usize = 3;
pub const BLOCK_STRIDE_BITS: usize =
min(16, max(clog2(ACC_BANKS * ACC_BANK_ENTRIES), clog2(SP_BANKS * SP_BANK_ENTRIES)));
pub const A_STRIDE_BITS: usize = min(16, max(clog2(ACC_BANKS * ACC_BANK_ENTRIES), clog2(SP_BANKS * SP_BANK_ENTRIES)));
pub const C_STRIDE_BITS: usize = min(16, max(clog2(ACC_BANKS * ACC_BANK_ENTRIES), clog2(SP_BANKS * SP_BANK_ENTRIES)));
pub const PIXEL_REPEATS_BITS: usize = min(8, clog2(MESH_COLS * TILE_COLS + 1));
pub const RS_ENTRIES: usize = RS_MAX_PER_TYPE * 3;
pub const ROB_ENTRIES: usize = RS_ENTRIES;
pub const RS_MAX_PER_TYPE: usize = max(RS_ENTRIES_LD, max(RS_ENTRIES_EX, RS_ENTRIES_ST));
pub const CL_RS_MAX_PER_TYPE: usize = clog2(RS_MAX_PER_TYPE);
pub const INPUT_BITS: usize = 8;
pub const ACC_BITS: usize = 32;
pub const OUTPUT_BITS: usize = 20;