Firmwares/raven_spn/src/raven_spn.cpp

146 lines
4.8 KiB
C++

#include "raven_spn.h"
#include "spn_regs.h"
#include "init.h"
#include "spn_checker_regs.h"
using spn_1 = spn_regs<0x90000000>;
using spn_2 = spn_regs<0xC0000000>;
using spn_checker = spn_checker_regs<0x10040000>;
void run_xspn1(int in_addr, int out_addr, int num_samples, int in_beats, int out_beats) {
spn_1::mode_reg() = 0;
spn_1::input_length_reg() = num_samples; // each sample consists of 5 uint8 values
spn_1::input_addr_reg() = in_addr;
spn_1::output_addr_reg() = out_addr;
spn_1::num_of_in_beats_reg() = in_beats; // Number of AXI4 burst beats needed to load all input data
spn_1::num_of_out_beats_reg() = out_beats; // Number of AXI4 burst beats needed to store all result data
spn_1::start_reg() = 1;
printf("Starting first XSPN instance\n");
}
void run_xspn2(int in_addr, int out_addr, int num_samples, int in_beats, int out_beats) {
spn_2::mode_reg() = 0;
spn_2::input_length_reg() = num_samples; // each sample consists of 5 uint8 values
spn_2::input_addr_reg() = in_addr;
spn_2::output_addr_reg() = out_addr;
spn_2::num_of_in_beats_reg() = in_beats; // Number of AXI4 burst beats needed to load all input data
spn_2::num_of_out_beats_reg() = out_beats; // Number of AXI4 burst beats needed to store all result data
printf("Starting second XSPN instance\n");
spn_2::start_reg() = 1;
}
static void spn1_interrupt_handler(){
spn1_hw_interrupt = false;
spn_1::interrupt_reg() = 1;
}
static void spn2_interrupt_handler(){
spn2_hw_interrupt = false;
spn_2::interrupt_reg() = 1;
}
/*! \brief main function
*
*/
int main() {
platform_init();
configure_irq(2, spn1_interrupt_handler);
configure_irq(22, spn2_interrupt_handler);
uint32_t xspn_count = spn_checker::xspn_count_reg();
uint32_t batch_size = spn_checker::batch_size_reg();
uint32_t iterations = spn_checker::num_iterations_reg();
printf("XSPN COUNT: %d\n", xspn_count);
if (xspn_count < 1 || xspn_count > 2) {
printf("ERROR: invalid XSPN COUNT");
return 1;
}
printf("BATCH SIZE: %d\n", batch_size);
printf("ITERATIONS: %d\n", iterations);
int in_addr = 0x30000000; // place input samples in the SPI memory
int out_addr1 = 0x3C000000;
int out_addr2 = 0x3E000000;
spn_1::mode_reg() = 1;
spn_1::start_reg() = 1;
wait_for_spn1_interrupt();
uint32_t readout = spn_1::readout_reg();
printf("READOUT first HW instance:0x%x\n", readout);
if (xspn_count == 2) {
spn_2::mode_reg() = 1;
spn_2::start_reg() = 1;
wait_for_spn2_interrupt();
uint32_t readout2 = spn_2::readout_reg();
printf("READOUT second HW instance:0x%x\n", readout2);
}
uint32_t axi_bytes = readout;
axi_bytes = axi_bytes & 0xff;
axi_bytes = 1 << axi_bytes;
printf("AXI Bytes: %d\n", axi_bytes);
uint32_t sample_bytes = readout;
sample_bytes = sample_bytes >> 16;
sample_bytes = sample_bytes / 8;
printf("Sample Bytes: %d\n", sample_bytes);
uint32_t result_bytes = 8;
printf("Result Bytes: %d\n", result_bytes);
uint32_t in_bytes = batch_size * sample_bytes;
uint32_t out_bytes = batch_size * result_bytes;
uint32_t total_in = in_bytes * iterations;
if (total_in > (out_addr1 - in_addr)) {
printf("ERROR: input data requires %d bytes, only %d bytes available\n", total_in, out_addr1 - in_addr);
return 1;
}
if (out_bytes > (out_addr2 - out_addr1)) {
printf("ERROR: output data requires %d bytes, only %d bytes available\n", out_bytes, out_addr2 - out_addr1);
return 1;
}
uint32_t in_beats = in_bytes / axi_bytes;
if (in_beats * axi_bytes < batch_size * sample_bytes) in_beats++;
uint32_t out_beats = out_bytes / axi_bytes;
if (out_beats * axi_bytes < batch_size * result_bytes) out_beats++;
uint32_t current_in_addr = in_addr;
// inject SPN input data
spn_checker::input_addr_reg() = current_in_addr;
spn_checker::num_input_samples_reg() = sample_bytes * batch_size * iterations;
spn_checker::start_data_trans_reg() = 1;
spn_checker::output_addr_reg() = out_addr1;
if (xspn_count == 2) {
spn_checker::output_addr2_reg() = out_addr2;
}
for (int k = 0; k < iterations*batch_size; k+=batch_size) {
run_xspn1(current_in_addr, out_addr1, batch_size, in_beats, out_beats);
if (xspn_count == 2) {
run_xspn2(current_in_addr, out_addr2, batch_size, in_beats, out_beats);
wait_for_spn_interrupts();
} else {
wait_for_spn1_interrupt();
}
printf("XSPN finished\n");
spn_checker::offset_reg() = k;
spn_checker::length_reg() = batch_size;
spn_checker::start_result_check_reg() = 1;
current_in_addr += batch_size * sample_bytes; // 5 bytes in each sample (NIPS5)
}
return 0;
}