Compare commits
	
		
			216 Commits
		
	
	
		
			3fd51cc68c
			...
			featture/i
		
	
	| Author | SHA1 | Date | |
|---|---|---|---|
| 071cb4fdac | |||
| dd937710a7 | |||
| 047e2e12b0 | |||
| fe3ed49519 | |||
| 1afd77a942 | |||
| cdf5038e59 | |||
| 651897e1e4 | |||
| a1803c61c1 | |||
| bfa2182f8e | |||
| b01c9b27e5 | |||
| 07f394d5ff | |||
| 7e97329e78 | |||
| 8f5d666b7d | |||
| cc123939ce | |||
| a2e5405e25 | |||
| cd3ec0b79d | |||
| 0e35a2a8c9 | |||
| 8220c00a3d | |||
| ec5fb1e87e | |||
| 453407568c | |||
| 0fe9e6ebc8 | |||
| 484d9dbe08 | |||
| 7a7035f267 | |||
| d9f1e5d31b | |||
| 7b35f45a48 | |||
| ece6f7290f | |||
| 2166a6d81e | |||
| fe9f2a5455 | |||
| 42bf6ee380 | |||
| f0b582df6c | |||
| 6fcb3dbb66 | |||
| c01eb39a76 | |||
| 08280a094f | |||
| ae90adc854 | |||
| cd358198ad | |||
| 8746003d3e | |||
| 60d2b45a81 | |||
| 0264c5d66f | |||
| 528c2536af | |||
| 19e38ec898 | |||
| fd11ce18c4 | |||
| 9b7a9fa273 | |||
| e24c1874c4 | |||
| 221d2ee38c | |||
| 877cad27ba | |||
| a26505cb5c | |||
| c1277b6528 | |||
| 63889b02e7 | |||
| f049d8cbb3 | |||
| 28ac169cfe | |||
| a6f24db83a | |||
| e1911bc450 | |||
| 75d96bf18d | |||
| e59458aa0e | |||
| 77807fec01 | |||
| 6852d1d299 | |||
| ac1322d66b | |||
| 9ba9d2432c | |||
| c9b7962cd3 | |||
| ab31fd27c9 | |||
| b3f189145f | |||
| dd4416ab15 | |||
| 0027946f90 | |||
| feaff8c4a5 | |||
| af3e76cc98 | |||
| b1ceac2c2a | |||
| b5862039e7 | |||
| 51f3802394 | |||
| 6ce0d97e81 | |||
| 69c8fda5d2 | |||
| c1f9328528 | |||
| 2b85748279 | |||
| f7aa51b12e | |||
| 3428745a00 | |||
| 512b79a3e7 | |||
| 7a048f8b93 | |||
| 6f4daf91ed | |||
| 947d353bbf | |||
| b95f518c91 | |||
| 4cef0f57c1 | |||
| 28af695592 | |||
| f6cdd9d07c | |||
| 9e390971d4 | |||
| 2bb2e56310 | |||
| a0eeae7dd6 | |||
| 8f491ef36b | |||
| cbe4c2d62f | |||
| 31c6bb55f4 | |||
| 63d0162119 | |||
| 3b294d9da0 | |||
| 54233b448d | |||
| e238369e18 | |||
| cfc980a069 | |||
| 502f3e8df9 | |||
| 88475bfa55 | |||
| 71260a3ef4 | |||
| 23842742a6 | |||
| a13b7ac6d3 | |||
| aaebeaf023 | |||
| fb0f6255e9 | |||
| 57d5ea92be | |||
| 383d762abc | |||
| 03cbd305c6 | |||
| 9f5326c110 | |||
| f4718c6de3 | |||
| 53de21eef9 | |||
| d443c89c87 | |||
| 9a2df32d57 | |||
| be0f783af8 | |||
| 1089800682 | |||
| a6a6f51f0b | |||
| 21e1f791ad | |||
| be6f5791fa | |||
| d907dc7f54 | |||
| 75e81ce236 | |||
| 82a70efdb8 | |||
| 978c3db06e | |||
| 0e88664ff7 | |||
| ac818f304d | |||
| ad60449073 | |||
| b45b3589fa | |||
| 1fb7e8fcea | |||
| 5f9d0beafb | |||
| 4c0d1c75aa | |||
| 2f3abf2f76 | |||
| 62768bf81e | |||
| f6be8ec006 | |||
| a8f56b6e27 | |||
| 76ea0db25d | |||
| ec1b820c18 | |||
| 64329cf0f6 | |||
| 9de0aed84d | |||
| bb4e2766d1 | |||
| 0996d15bd4 | |||
| 6305efa7c2 | |||
| de79adc50d | |||
| 0473aa5344 | |||
| a45fcd28db | |||
| 0f15032210 | |||
| efc11d87a5 | |||
| 4a19e27926 | |||
| c15cdb0955 | |||
| 6609d12582 | |||
| b5341700aa | |||
| 0b5062d21c | |||
| fbca690b3b | |||
| 235a7e6e24 | |||
| 62d21e1156 | |||
| 9c51d6eade | |||
| 2878dca6b5 | |||
| c28e8fd00c | |||
| b3cc9d2346 | |||
| 933f08494c | |||
| 21f8eab432 | |||
| 6ddb8da07f | |||
| edf456c59f | |||
| 42efced1eb | |||
| c376e34b2b | |||
| f579ec6e48 | |||
| fd20e66f1f | |||
| 5d69b79232 | |||
| 2edd68d1bd | |||
| 7ffa7667b6 | |||
| 93d89e07ca | |||
| 17dcba4b90 | |||
| 39d2518fdd | |||
| a365110054 | |||
| d2efb23ff7 | |||
| 04b7a09b19 | |||
| 72b11beac5 | |||
| e87b7d5fd0 | |||
| 5a2b96ef3e | |||
| c6b99cd155 | |||
| b1306c3a47 | |||
| 0d6bf924ed | |||
| 86de536c8f | |||
| 051dd5e2d3 | |||
| e3942be776 | |||
| 6ee484a771 | |||
| 60808c8649 | |||
| 0432803d82 | |||
| 4f5d9214ed | |||
| d42d2ce533 | |||
| 236d12d7f5 | |||
| e1b6cab890 | |||
| 8361f88718 | |||
| 2ec7ea4b41 | |||
| b24965d321 | |||
| 244bf6d2f2 | |||
| 1a4465a371 | |||
| fa82a50824 | |||
| 6dc17857da | |||
| 11a30caae8 | |||
| ac1a26a10c | |||
| 7a199e122d | |||
| d8c3d2e19c | |||
| 375755999a | |||
| 9996fd4833 | |||
| 149b3136d2 | |||
| ac8f8b0539 | |||
| b2cbf90d0b | |||
| 373145478e | |||
| 55b0cea94f | |||
| 5b17599aa2 | |||
| 4cfb15c7cd | |||
| 63da7f8d57 | |||
| fb4012fbd1 | |||
| 24449f1c0f | |||
| fd303c8343 | |||
| 346b177a87 | |||
| d4ec131fa7 | |||
| 48370a4555 | |||
| 36b076774e | |||
| 482a4ec253 | |||
| 2fb28364c5 | |||
| 8460f4ab7f | 
| @@ -12,14 +12,18 @@ include(flink) | |||||||
| find_package(elfio QUIET) | find_package(elfio QUIET) | ||||||
| find_package(jsoncpp) | find_package(jsoncpp) | ||||||
| find_package(Boost COMPONENTS coroutine REQUIRED) | find_package(Boost COMPONENTS coroutine REQUIRED) | ||||||
|  | find_package(absl REQUIRED) | ||||||
|  |  | ||||||
| add_subdirectory(softfloat) | add_subdirectory(softfloat) | ||||||
|  |  | ||||||
| set(LIB_SOURCES | set(LIB_SOURCES | ||||||
|     src/iss/plugin/instruction_count.cpp |     src/iss/plugin/instruction_count.cpp | ||||||
|     src/iss/arch/tgc5c.cpp |     src/iss/arch/tgc5c.cpp | ||||||
|  |     src/iss/mem/memory_if.cpp | ||||||
|     src/vm/interp/vm_tgc5c.cpp |     src/vm/interp/vm_tgc5c.cpp | ||||||
|     src/vm/fp_functions.cpp |     src/vm/fp_functions.cpp | ||||||
|  |     src/vm/vector_functions.cpp | ||||||
|  |     src/iss/debugger/csr_names.cpp | ||||||
|     src/iss/semihosting/semihosting.cpp |     src/iss/semihosting/semihosting.cpp | ||||||
| ) | ) | ||||||
|  |  | ||||||
| @@ -101,23 +105,13 @@ if(NOT(DBT_CORE_DEFS STREQUAL DBT_CORE_DEFS-NOTFOUND)) | |||||||
|     target_compile_definitions(${PROJECT_NAME} INTERFACE ${DBT_CORE_DEFS}) |     target_compile_definitions(${PROJECT_NAME} INTERFACE ${DBT_CORE_DEFS}) | ||||||
| endif() | endif() | ||||||
|  |  | ||||||
| target_link_libraries(${PROJECT_NAME} PUBLIC elfio::elfio softfloat scc-util Boost::coroutine) | target_link_libraries(${PROJECT_NAME} PUBLIC elfio::elfio softfloat scc-util Boost::coroutine abseil::abseil) | ||||||
|  |  | ||||||
| if(TARGET yaml-cpp::yaml-cpp) | if(TARGET yaml-cpp::yaml-cpp) | ||||||
|     target_compile_definitions(${PROJECT_NAME} PUBLIC WITH_PLUGINS) |     target_compile_definitions(${PROJECT_NAME} PUBLIC WITH_PLUGINS) | ||||||
|     target_link_libraries(${PROJECT_NAME} PUBLIC yaml-cpp::yaml-cpp) |     target_link_libraries(${PROJECT_NAME} PUBLIC yaml-cpp::yaml-cpp) | ||||||
| endif() | endif() | ||||||
|  |  | ||||||
| if(WITH_LLVM) |  | ||||||
|     find_package(LLVM) |  | ||||||
|     target_compile_definitions(${PROJECT_NAME} PUBLIC ${LLVM_DEFINITIONS}) |  | ||||||
|     target_include_directories(${PROJECT_NAME} PUBLIC ${LLVM_INCLUDE_DIRS}) |  | ||||||
|  |  | ||||||
|     if(BUILD_SHARED_LIBS) |  | ||||||
|         target_link_libraries(${PROJECT_NAME} PUBLIC ${LLVM_LIBRARIES}) |  | ||||||
|     endif() |  | ||||||
| endif() |  | ||||||
|  |  | ||||||
| set_target_properties(${PROJECT_NAME} PROPERTIES | set_target_properties(${PROJECT_NAME} PROPERTIES | ||||||
|     VERSION ${PROJECT_VERSION} |     VERSION ${PROJECT_VERSION} | ||||||
|     FRAMEWORK FALSE |     FRAMEWORK FALSE | ||||||
| @@ -261,3 +255,9 @@ if(TARGET scc-sysc) | |||||||
|         INCLUDES DESTINATION ${CMAKE_INSTALL_INCLUDEDIR} # headers |         INCLUDES DESTINATION ${CMAKE_INSTALL_INCLUDEDIR} # headers | ||||||
|     ) |     ) | ||||||
| endif() | endif() | ||||||
|  |  | ||||||
|  | project(elfio-test) | ||||||
|  | find_package(Boost COMPONENTS program_options thread REQUIRED) | ||||||
|  |  | ||||||
|  | add_executable(${PROJECT_NAME} src/elfio.cpp) | ||||||
|  | target_link_libraries(${PROJECT_NAME} PUBLIC elfio::elfio) | ||||||
|   | |||||||
| @@ -20,7 +20,7 @@ RVI: | |||||||
|     mask: 0b00000000000000000000000001111111 |     mask: 0b00000000000000000000000001111111 | ||||||
|     size:   32 |     size:   32 | ||||||
|     branch:   true |     branch:   true | ||||||
|     delay:   1 |     delay:   [1,1] | ||||||
|   JALR: |   JALR: | ||||||
|     index: 3 |     index: 3 | ||||||
|     encoding: 0b00000000000000000000000001100111 |     encoding: 0b00000000000000000000000001100111 | ||||||
|   | |||||||
| @@ -1,5 +1,5 @@ | |||||||
| /******************************************************************************* | /******************************************************************************* | ||||||
|  * Copyright (C) 2017 - 2020 MINRES Technologies GmbH |  * Copyright (C) 2024 MINRES Technologies GmbH | ||||||
|  * All rights reserved. |  * All rights reserved. | ||||||
|  * |  * | ||||||
|  * Redistribution and use in source and binary forms, with or without |  * Redistribution and use in source and binary forms, with or without | ||||||
| @@ -47,10 +47,10 @@ def getRegisterSizes(){ | |||||||
|  |  | ||||||
| using namespace iss::arch; | using namespace iss::arch; | ||||||
|  |  | ||||||
| constexpr std::array<const char*, ${registers.size}>    iss::arch::traits<iss::arch::${coreDef.name.toLowerCase()}>::reg_names; | constexpr std::array<const char*, ${registers.size()}>    iss::arch::traits<iss::arch::${coreDef.name.toLowerCase()}>::reg_names; | ||||||
| constexpr std::array<const char*, ${registers.size}>    iss::arch::traits<iss::arch::${coreDef.name.toLowerCase()}>::reg_aliases; | constexpr std::array<const char*, ${registers.size()}>    iss::arch::traits<iss::arch::${coreDef.name.toLowerCase()}>::reg_aliases; | ||||||
| constexpr std::array<const uint32_t, ${getRegisterSizes().size}> iss::arch::traits<iss::arch::${coreDef.name.toLowerCase()}>::reg_bit_widths; | constexpr std::array<const uint32_t, ${getRegisterSizes().size()}> iss::arch::traits<iss::arch::${coreDef.name.toLowerCase()}>::reg_bit_widths; | ||||||
| constexpr std::array<const uint32_t, ${getRegisterSizes().size}> iss::arch::traits<iss::arch::${coreDef.name.toLowerCase()}>::reg_byte_offsets; | constexpr std::array<const uint32_t, ${getRegisterSizes().size()}> iss::arch::traits<iss::arch::${coreDef.name.toLowerCase()}>::reg_byte_offsets; | ||||||
|  |  | ||||||
| ${coreDef.name.toLowerCase()}::${coreDef.name.toLowerCase()}()  = default; | ${coreDef.name.toLowerCase()}::${coreDef.name.toLowerCase()}()  = default; | ||||||
|  |  | ||||||
|   | |||||||
| @@ -1,5 +1,5 @@ | |||||||
| /******************************************************************************* | /******************************************************************************* | ||||||
|  * Copyright (C) 2017 - 2021 MINRES Technologies GmbH |  * Copyright (C) 2024 MINRES Technologies GmbH | ||||||
|  * All rights reserved. |  * All rights reserved. | ||||||
|  * |  * | ||||||
|  * Redistribution and use in source and binary forms, with or without |  * Redistribution and use in source and binary forms, with or without | ||||||
| @@ -30,11 +30,21 @@ | |||||||
|  * |  * | ||||||
|  *******************************************************************************/ |  *******************************************************************************/ | ||||||
| <% | <% | ||||||
| def nativeTypeSize(int size){ | def nativeSize(int size){ | ||||||
|     if(size<=8) return 8; else if(size<=16) return 16; else if(size<=32) return 32; else return 64; |     if(size<=8) return 8; | ||||||
|  |     if(size<=16) return 16; | ||||||
|  |     if(size<=32) return 32; | ||||||
|  |     if(size<=64) return 64; | ||||||
|  |     if(size<=128) return 128; | ||||||
|  |     if(size<=256) return 256; | ||||||
|  |     if(size<=512) return 512; | ||||||
|  |     if(size<=1024) return 1024; | ||||||
|  |     if(size<=2048) return 2048; | ||||||
|  |     if(size<=4096) return 4096; | ||||||
|  |     throw new IllegalArgumentException("Unsupported size in nativeSize in CORENAME.h.gtl"); | ||||||
| } | } | ||||||
| def getRegisterSizes(){ | def getRegisterSizes(){ | ||||||
|     def regs = registers.collect{nativeTypeSize(it.size)} |     def regs = registers.collect{nativeSize(it.size)} | ||||||
|     regs+=[32,32, 64, 64, 64, 32, 32] // append TRAP_STATE, PENDING_TRAP, ICOUNT, CYCLE, INSTRET, INSTRUCTION, LAST_BRANCH |     regs+=[32,32, 64, 64, 64, 32, 32] // append TRAP_STATE, PENDING_TRAP, ICOUNT, CYCLE, INSTRET, INSTRUCTION, LAST_BRANCH | ||||||
|     return regs |     return regs | ||||||
| } | } | ||||||
| @@ -47,13 +57,7 @@ def getRegisterOffsets(){ | |||||||
|     } |     } | ||||||
|     return offsets |     return offsets | ||||||
| } | } | ||||||
| def byteSize(int size){ |  | ||||||
|     if(size<=8) return 8; |  | ||||||
|     if(size<=16) return 16; |  | ||||||
|     if(size<=32) return 32; |  | ||||||
|     if(size<=64) return 64; |  | ||||||
|     return 128; |  | ||||||
| } |  | ||||||
| def getCString(def val){ | def getCString(def val){ | ||||||
|     return val.toString()+'ULL' |     return val.toString()+'ULL' | ||||||
| } | } | ||||||
| @@ -75,15 +79,17 @@ template <> struct traits<${coreDef.name.toLowerCase()}> { | |||||||
|  |  | ||||||
|     constexpr static char const* const core_type = "${coreDef.name}"; |     constexpr static char const* const core_type = "${coreDef.name}"; | ||||||
|      |      | ||||||
|     static constexpr std::array<const char*, ${registers.size}> reg_names{ |     static constexpr std::array<const char*, ${registers.size()}> reg_names{ | ||||||
|         {"${registers.collect{it.name.toLowerCase()}.join('", "')}"}}; |         {"${registers.collect{it.name.toLowerCase()}.join('", "')}"}}; | ||||||
|   |   | ||||||
|     static constexpr std::array<const char*, ${registers.size}> reg_aliases{ |     static constexpr std::array<const char*, ${registers.size()}> reg_aliases{ | ||||||
|         {"${registers.collect{it.alias.toLowerCase()}.join('", "')}"}}; |         {"${registers.collect{it.alias.toLowerCase()}.join('", "')}"}}; | ||||||
|  |  | ||||||
|     enum constants {${constants.collect{c -> c.name+"="+getCString(c.value)}.join(', ')}}; |     enum constants {${constants.collect{c -> c.name+"="+getCString(c.value)}.join(', ')}}; | ||||||
|  |  | ||||||
|     constexpr static unsigned FP_REGS_SIZE = ${constants.find {it.name=='FLEN'}?.value?:0}; |     constexpr static unsigned FP_REGS_SIZE = ${constants.find {it.name=='FLEN'}?.value?:0}; | ||||||
|  |     constexpr static unsigned V_REGS_SIZE = ${constants.find {it.name=='VLEN'}?.value?:0}; | ||||||
|  |  | ||||||
|  |  | ||||||
|     enum reg_e { |     enum reg_e { | ||||||
|         ${registers.collect{it.name}.join(', ')}, NUM_REGS, TRAP_STATE=NUM_REGS, PENDING_TRAP, ICOUNT, CYCLE, INSTRET, INSTRUCTION, LAST_BRANCH |         ${registers.collect{it.name}.join(', ')}, NUM_REGS, TRAP_STATE=NUM_REGS, PENDING_TRAP, ICOUNT, CYCLE, INSTRET, INSTRUCTION, LAST_BRANCH | ||||||
| @@ -99,10 +105,10 @@ template <> struct traits<${coreDef.name.toLowerCase()}> { | |||||||
|  |  | ||||||
|     using phys_addr_t = iss::typed_addr_t<iss::address_type::PHYSICAL>; |     using phys_addr_t = iss::typed_addr_t<iss::address_type::PHYSICAL>; | ||||||
|  |  | ||||||
|     static constexpr std::array<const uint32_t, ${getRegisterSizes().size}> reg_bit_widths{ |     static constexpr std::array<const uint32_t, ${getRegisterSizes().size()}> reg_bit_widths{ | ||||||
|         {${getRegisterSizes().join(',')}}}; |         {${getRegisterSizes().join(',')}}}; | ||||||
|  |  | ||||||
|     static constexpr std::array<const uint32_t, ${getRegisterOffsets().size}> reg_byte_offsets{ |     static constexpr std::array<const uint32_t, ${getRegisterOffsets().size()}> reg_byte_offsets{ | ||||||
|         {${getRegisterOffsets().join(',')}}}; |         {${getRegisterOffsets().join(',')}}}; | ||||||
|  |  | ||||||
|     static const uint64_t addr_mask = (reg_t(1) << (XLEN - 1)) | ((reg_t(1) << (XLEN - 1)) - 1); |     static const uint64_t addr_mask = (reg_t(1) << (XLEN - 1)) | ((reg_t(1) << (XLEN - 1)) - 1); | ||||||
| @@ -131,8 +137,6 @@ struct ${coreDef.name.toLowerCase()}: public arch_if { | |||||||
|  |  | ||||||
|     uint8_t* get_regs_base_ptr() override; |     uint8_t* get_regs_base_ptr() override; | ||||||
|  |  | ||||||
|     inline uint64_t get_icount() { return reg.icount; } |  | ||||||
|  |  | ||||||
|     inline bool should_stop() { return interrupt_sim; } |     inline bool should_stop() { return interrupt_sim; } | ||||||
|  |  | ||||||
|     inline uint64_t stop_code() { return interrupt_sim; } |     inline uint64_t stop_code() { return interrupt_sim; } | ||||||
| @@ -141,20 +145,20 @@ struct ${coreDef.name.toLowerCase()}: public arch_if { | |||||||
|  |  | ||||||
|     virtual iss::sync_type needed_sync() const { return iss::NO_SYNC; } |     virtual iss::sync_type needed_sync() const { return iss::NO_SYNC; } | ||||||
|  |  | ||||||
|     inline uint32_t get_last_branch() { return reg.last_branch; } |  | ||||||
|  |  | ||||||
|  |  | ||||||
| #pragma pack(push, 1) | #pragma pack(push, 1) | ||||||
|     struct ${coreDef.name}_regs {<% |     struct ${coreDef.name}_regs {<% | ||||||
|         registers.each { reg -> if(reg.size>0) {%>  |         registers.each { reg -> if(reg.size>64) {%> | ||||||
|         uint${byteSize(reg.size)}_t ${reg.name} = 0;<% |         uint8_t ${reg.name}[${reg.size/8}] = {0};<% | ||||||
|  |         }else if(reg.size>0) {%> | ||||||
|  |         uint${nativeSize(reg.size)}_t ${reg.name} = 0;<% | ||||||
|         }}%> |         }}%> | ||||||
|         uint32_t trap_state = 0, pending_trap = 0; |         uint32_t trap_state = 0, pending_trap = 0; | ||||||
|         uint64_t icount = 0; |         uint64_t icount = 0;      // counts number of instructions undisturbed | ||||||
|         uint64_t cycle = 0; |         uint64_t cycle = 0;       // counts number of cycles, in functional mode equals icount | ||||||
|         uint64_t instret = 0; |         uint64_t instret = 0;     // counts number of instructions, can be reset via CSR write | ||||||
|         uint32_t instruction = 0; |         uint32_t instruction = 0; // holds op code of currently executed instruction | ||||||
|         uint32_t last_branch = 0; |         uint32_t last_branch = 0; // indicates if last branch was taken | ||||||
|     } reg; |     } reg; | ||||||
| #pragma pack(pop) | #pragma pack(pop) | ||||||
|     std::array<address_type, 4> addr_mode; |     std::array<address_type, 4> addr_mode; | ||||||
| @@ -168,6 +172,31 @@ if(fcsr != null) {%> | |||||||
| <%} else { %> | <%} else { %> | ||||||
|     uint32_t get_fcsr(){return 0;} |     uint32_t get_fcsr(){return 0;} | ||||||
|     void set_fcsr(uint32_t val){} |     void set_fcsr(uint32_t val){} | ||||||
|  | <%} | ||||||
|  | def vstart = registers.find {it.name=='vstart'} | ||||||
|  | def vl = registers.find {it.name=='vl'} | ||||||
|  | def vtype = registers.find {it.name=='vtype'} | ||||||
|  | def vxsat = registers.find {it.name=='vxsat'} | ||||||
|  | def vxrm = registers.find {it.name=='vxrm'} | ||||||
|  |  | ||||||
|  | if(vtype != null) {%> | ||||||
|  |     uint${vstart.size}_t get_vstart(){return reg.vstart;} | ||||||
|  |     void set_vstart(uint${vstart.size}_t val){reg.vstart = val;} | ||||||
|  |     uint${vl.size}_t get_vl(){return reg.vl;} | ||||||
|  |     uint${vtype.size}_t get_vtype(){return reg.vtype;} | ||||||
|  |     uint${vxsat.size}_t get_vxsat(){return reg.vxsat;} | ||||||
|  |     void set_vxsat(uint${vxsat.size}_t val){reg.vxsat = val;} | ||||||
|  |     uint${vxrm.size}_t get_vxrm(){return reg.vxrm;} | ||||||
|  |     void set_vxrm(uint${vxrm.size}_t val){reg.vxrm = val;} | ||||||
|  | <%} else { %> | ||||||
|  |     uint32_t get_vstart(){return 0;} | ||||||
|  |     void set_vstart(uint32_t val){} | ||||||
|  |     uint32_t get_vl(){return 0;} | ||||||
|  |     uint32_t get_vtype(){return 0;} | ||||||
|  |     uint32_t get_vxsat(){return 0;} | ||||||
|  |     void set_vxsat(uint32_t val){} | ||||||
|  |     uint32_t get_vxrm(){return 0;} | ||||||
|  |     void set_vxrm(uint32_t val){} | ||||||
| <%}%> | <%}%> | ||||||
| }; | }; | ||||||
|  |  | ||||||
|   | |||||||
| @@ -1,5 +1,5 @@ | |||||||
| /******************************************************************************* | /******************************************************************************* | ||||||
|  * Copyright (C) 2023 MINRES Technologies GmbH |  * Copyright (C) 2024 MINRES Technologies GmbH | ||||||
|  * All rights reserved. |  * All rights reserved. | ||||||
|  * |  * | ||||||
|  * Redistribution and use in source and binary forms, with or without |  * Redistribution and use in source and binary forms, with or without | ||||||
| @@ -45,17 +45,17 @@ namespace interp { | |||||||
| using namespace sysc; | using namespace sysc; | ||||||
| volatile std::array<bool, ${array_count}> ${coreDef.name.toLowerCase()}_init = { | volatile std::array<bool, ${array_count}> ${coreDef.name.toLowerCase()}_init = { | ||||||
|         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|m_p|interp", [](unsigned gdb_port, void* data) -> iss_factory::base_t { |         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|m_p|interp", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||||
|             auto* cc = reinterpret_cast<sysc::tgfs::core_complex*>(data); |             auto* cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||||
|             auto* cpu = new sc_core_adapter<arch::riscv_hart_m_p<arch::${coreDef.name.toLowerCase()}>>(cc); |             auto* cpu = new sc_core_adapter<arch::riscv_hart_m_p<arch::${coreDef.name.toLowerCase()}>>(cc); | ||||||
|             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; |             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; | ||||||
|         }), |         }), | ||||||
|         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p|interp", [](unsigned gdb_port, void* data) -> iss_factory::base_t { |         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p|interp", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||||
|             auto* cc = reinterpret_cast<sysc::tgfs::core_complex*>(data); |             auto* cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||||
|             auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::${coreDef.name.toLowerCase()}>>(cc); |             auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::${coreDef.name.toLowerCase()}>>(cc); | ||||||
|             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; |             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; | ||||||
|         })<%if(coreDef.name.toLowerCase()=="tgc5d" || coreDef.name.toLowerCase()=="tgc5e") {%>, |         })<%if(coreDef.name.toLowerCase()=="tgc5d" || coreDef.name.toLowerCase()=="tgc5e") {%>, | ||||||
|         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p_clic_pmp|interp", [](unsigned gdb_port, void* data) -> iss_factory::base_t { |         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p_clic_pmp|interp", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||||
|             auto* cc = reinterpret_cast<sysc::tgfs::core_complex*>(data); |             auto* cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||||
|             auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::${coreDef.name.toLowerCase()}, (iss::arch::features_e)(iss::arch::FEAT_PMP | iss::arch::FEAT_EXT_N | iss::arch::FEAT_CLIC)>>(cc); |             auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::${coreDef.name.toLowerCase()}, (iss::arch::features_e)(iss::arch::FEAT_PMP | iss::arch::FEAT_EXT_N | iss::arch::FEAT_CLIC)>>(cc); | ||||||
|             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; |             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; | ||||||
|         })<%}%> |         })<%}%> | ||||||
| @@ -66,17 +66,17 @@ namespace llvm { | |||||||
| using namespace sysc; | using namespace sysc; | ||||||
| volatile std::array<bool, ${array_count}> ${coreDef.name.toLowerCase()}_init = { | volatile std::array<bool, ${array_count}> ${coreDef.name.toLowerCase()}_init = { | ||||||
|         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|m_p|llvm", [](unsigned gdb_port, void* data) -> iss_factory::base_t { |         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|m_p|llvm", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||||
|             auto* cc = reinterpret_cast<sysc::tgfs::core_complex*>(data); |             auto* cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||||
|             auto* cpu = new sc_core_adapter<arch::riscv_hart_m_p<arch::${coreDef.name.toLowerCase()}>>(cc); |             auto* cpu = new sc_core_adapter<arch::riscv_hart_m_p<arch::${coreDef.name.toLowerCase()}>>(cc); | ||||||
|             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; |             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; | ||||||
|         }), |         }), | ||||||
|         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p|llvm", [](unsigned gdb_port, void* data) -> iss_factory::base_t { |         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p|llvm", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||||
|             auto* cc = reinterpret_cast<sysc::tgfs::core_complex*>(data); |             auto* cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||||
|             auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::${coreDef.name.toLowerCase()}>>(cc); |             auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::${coreDef.name.toLowerCase()}>>(cc); | ||||||
|             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; |             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; | ||||||
|         })<%if(coreDef.name.toLowerCase()=="tgc5d" || coreDef.name.toLowerCase()=="tgc5e") {%>, |         })<%if(coreDef.name.toLowerCase()=="tgc5d" || coreDef.name.toLowerCase()=="tgc5e") {%>, | ||||||
|         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p_clic_pmp|llvm", [](unsigned gdb_port, void* data) -> iss_factory::base_t { |         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p_clic_pmp|llvm", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||||
|             auto* cc = reinterpret_cast<sysc::tgfs::core_complex*>(data); |             auto* cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||||
|             auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::${coreDef.name.toLowerCase()}, (iss::arch::features_e)(iss::arch::FEAT_PMP | iss::arch::FEAT_EXT_N | iss::arch::FEAT_CLIC)>>(cc); |             auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::${coreDef.name.toLowerCase()}, (iss::arch::features_e)(iss::arch::FEAT_PMP | iss::arch::FEAT_EXT_N | iss::arch::FEAT_CLIC)>>(cc); | ||||||
|             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; |             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; | ||||||
|         })<%}%> |         })<%}%> | ||||||
| @@ -88,17 +88,17 @@ namespace tcc { | |||||||
| using namespace sysc; | using namespace sysc; | ||||||
| volatile std::array<bool, ${array_count}> ${coreDef.name.toLowerCase()}_init = { | volatile std::array<bool, ${array_count}> ${coreDef.name.toLowerCase()}_init = { | ||||||
|         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|m_p|tcc", [](unsigned gdb_port, void* data) -> iss_factory::base_t { |         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|m_p|tcc", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||||
|             auto* cc = reinterpret_cast<sysc::tgfs::core_complex*>(data); |             auto* cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||||
|             auto* cpu = new sc_core_adapter<arch::riscv_hart_m_p<arch::${coreDef.name.toLowerCase()}>>(cc); |             auto* cpu = new sc_core_adapter<arch::riscv_hart_m_p<arch::${coreDef.name.toLowerCase()}>>(cc); | ||||||
|             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; |             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; | ||||||
|         }), |         }), | ||||||
|         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p|tcc", [](unsigned gdb_port, void* data) -> iss_factory::base_t { |         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p|tcc", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||||
|             auto* cc = reinterpret_cast<sysc::tgfs::core_complex*>(data); |             auto* cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||||
|             auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::${coreDef.name.toLowerCase()}>>(cc); |             auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::${coreDef.name.toLowerCase()}>>(cc); | ||||||
|             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; |             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; | ||||||
|         })<%if(coreDef.name.toLowerCase()=="tgc5d" || coreDef.name.toLowerCase()=="tgc5e") {%>, |         })<%if(coreDef.name.toLowerCase()=="tgc5d" || coreDef.name.toLowerCase()=="tgc5e") {%>, | ||||||
|         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p_clic_pmp|tcc", [](unsigned gdb_port, void* data) -> iss_factory::base_t { |         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p_clic_pmp|tcc", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||||
|             auto* cc = reinterpret_cast<sysc::tgfs::core_complex*>(data); |             auto* cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||||
|             auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::${coreDef.name.toLowerCase()}, (iss::arch::features_e)(iss::arch::FEAT_PMP | iss::arch::FEAT_EXT_N | iss::arch::FEAT_CLIC)>>(cc); |             auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::${coreDef.name.toLowerCase()}, (iss::arch::features_e)(iss::arch::FEAT_PMP | iss::arch::FEAT_EXT_N | iss::arch::FEAT_CLIC)>>(cc); | ||||||
|             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; |             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; | ||||||
|         })<%}%> |         })<%}%> | ||||||
| @@ -110,17 +110,17 @@ namespace asmjit { | |||||||
| using namespace sysc; | using namespace sysc; | ||||||
| volatile std::array<bool, ${array_count}> ${coreDef.name.toLowerCase()}_init = { | volatile std::array<bool, ${array_count}> ${coreDef.name.toLowerCase()}_init = { | ||||||
|         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|m_p|asmjit", [](unsigned gdb_port, void* data) -> iss_factory::base_t { |         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|m_p|asmjit", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||||
|             auto* cc = reinterpret_cast<sysc::tgfs::core_complex*>(data); |             auto* cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||||
|             auto* cpu = new sc_core_adapter<arch::riscv_hart_m_p<arch::${coreDef.name.toLowerCase()}>>(cc); |             auto* cpu = new sc_core_adapter<arch::riscv_hart_m_p<arch::${coreDef.name.toLowerCase()}>>(cc); | ||||||
|             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; |             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; | ||||||
|         }), |         }), | ||||||
|         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p|asmjit", [](unsigned gdb_port, void* data) -> iss_factory::base_t { |         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p|asmjit", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||||
|             auto* cc = reinterpret_cast<sysc::tgfs::core_complex*>(data); |             auto* cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||||
|             auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::${coreDef.name.toLowerCase()}>>(cc); |             auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::${coreDef.name.toLowerCase()}>>(cc); | ||||||
|             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; |             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; | ||||||
|         })<%if(coreDef.name.toLowerCase()=="tgc5d" || coreDef.name.toLowerCase()=="tgc5e") {%>, |         })<%if(coreDef.name.toLowerCase()=="tgc5d" || coreDef.name.toLowerCase()=="tgc5e") {%>, | ||||||
|         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p_clic_pmp|asmjit", [](unsigned gdb_port, void* data) -> iss_factory::base_t { |         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p_clic_pmp|asmjit", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||||
|             auto* cc = reinterpret_cast<sysc::tgfs::core_complex*>(data); |             auto* cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||||
|             auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::${coreDef.name.toLowerCase()}, (iss::arch::features_e)(iss::arch::FEAT_PMP | iss::arch::FEAT_EXT_N | iss::arch::FEAT_CLIC)>>(cc); |             auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::${coreDef.name.toLowerCase()}, (iss::arch::features_e)(iss::arch::FEAT_PMP | iss::arch::FEAT_EXT_N | iss::arch::FEAT_CLIC)>>(cc); | ||||||
|             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; |             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; | ||||||
|         })<%}%> |         })<%}%> | ||||||
|   | |||||||
| @@ -1,5 +1,5 @@ | |||||||
| /******************************************************************************* | /******************************************************************************* | ||||||
|  * Copyright (C) 2017, 2023 MINRES Technologies GmbH |  * Copyright (C) 2017-2024 MINRES Technologies GmbH | ||||||
|  * All rights reserved. |  * All rights reserved. | ||||||
|  * |  * | ||||||
|  * Redistribution and use in source and binary forms, with or without |  * Redistribution and use in source and binary forms, with or without | ||||||
| @@ -37,7 +37,14 @@ | |||||||
| #include <iss/asmjit/vm_base.h> | #include <iss/asmjit/vm_base.h> | ||||||
| #include <asmjit/asmjit.h> | #include <asmjit/asmjit.h> | ||||||
| #include <util/logging.h> | #include <util/logging.h> | ||||||
|  | #include <iss/instruction_decoder.h> | ||||||
|  | <%def fcsr = registers.find {it.name=='FCSR'} | ||||||
|  | if(fcsr != null) {%> | ||||||
|  | #include <vm/fp_functions.h><%} | ||||||
|  | def aes = functions.find { it.contains('aes') } | ||||||
|  | if(aes != null) {%> | ||||||
|  | #include <vm/aes_sbox.h> | ||||||
|  | <%}%> | ||||||
| #ifndef FMT_HEADER_ONLY | #ifndef FMT_HEADER_ONLY | ||||||
| #define FMT_HEADER_ONLY | #define FMT_HEADER_ONLY | ||||||
| #endif | #endif | ||||||
| @@ -46,6 +53,22 @@ | |||||||
| #include <array> | #include <array> | ||||||
| #include <iss/debugger/riscv_target_adapter.h> | #include <iss/debugger/riscv_target_adapter.h> | ||||||
|  |  | ||||||
|  | #ifndef _MSC_VER | ||||||
|  | using int128_t = __int128; | ||||||
|  | using uint128_t = unsigned __int128; | ||||||
|  | namespace std { | ||||||
|  | template <> struct make_unsigned<__int128> { typedef unsigned __int128 type; }; | ||||||
|  | template <> class __make_unsigned_selector<__int128 unsigned, false, false> { | ||||||
|  | public: | ||||||
|  |     typedef unsigned __int128 __type; | ||||||
|  | }; | ||||||
|  | template <> struct is_signed<int128_t> { static constexpr bool value = true; }; | ||||||
|  | template <> struct is_signed<uint128_t> { static constexpr bool value = false; }; | ||||||
|  | template <> struct is_unsigned<int128_t> { static constexpr bool value = false; }; | ||||||
|  | template <> struct is_unsigned<uint128_t> { static constexpr bool value = true; }; | ||||||
|  | } // namespace std | ||||||
|  | #endif | ||||||
|  |  | ||||||
| namespace iss { | namespace iss { | ||||||
| namespace asmjit { | namespace asmjit { | ||||||
|  |  | ||||||
| @@ -80,28 +103,32 @@ public: | |||||||
|  |  | ||||||
| protected: | protected: | ||||||
|     using super::get_ptr_for; |     using super::get_ptr_for; | ||||||
| using super::get_reg; |  | ||||||
|     using super::get_reg_for; |     using super::get_reg_for; | ||||||
|  |     using super::get_reg_for_Gp; | ||||||
|     using super::load_reg_from_mem; |     using super::load_reg_from_mem; | ||||||
|  |     using super::load_reg_from_mem_Gp; | ||||||
|     using super::write_reg_to_mem; |     using super::write_reg_to_mem; | ||||||
|     using super::gen_ext; |  | ||||||
|     using super::gen_read_mem; |     using super::gen_read_mem; | ||||||
|     using super::gen_write_mem; |     using super::gen_write_mem; | ||||||
|     using super::gen_wait; |  | ||||||
|     using super::gen_leave; |     using super::gen_leave; | ||||||
|     using super::gen_operation; |     using super::gen_sync; | ||||||
|     |     | ||||||
|     using this_class = vm_impl<ARCH>; |     using this_class = vm_impl<ARCH>; | ||||||
|     using compile_func = continuation_e (this_class::*)(virt_addr_t&, code_word_t, jit_holder&); |     using compile_func = continuation_e (this_class::*)(virt_addr_t&, code_word_t, jit_holder&); | ||||||
|  |  | ||||||
|     continuation_e gen_single_inst_behavior(virt_addr_t&, unsigned int &, jit_holder&) override; |     continuation_e gen_single_inst_behavior(virt_addr_t&, jit_holder&) override; | ||||||
|  |     enum globals_e {TVAL = 0, GLOBALS_SIZE}; | ||||||
|     void gen_block_prologue(jit_holder& jh) override; |     void gen_block_prologue(jit_holder& jh) override; | ||||||
|     void gen_block_epilogue(jit_holder& jh) override; |     void gen_block_epilogue(jit_holder& jh) override; | ||||||
|     inline const char *name(size_t index){return traits::reg_aliases.at(index);} |     inline const char *name(size_t index){return traits::reg_aliases.at(index);} | ||||||
|  | <%if(fcsr != null) {%> | ||||||
|  |     inline const char *fname(size_t index){return index < 32?name(index+traits::F0):"illegal";}    | ||||||
|  | <%}%> | ||||||
|     void gen_instr_prologue(jit_holder& jh); |     void gen_instr_prologue(jit_holder& jh); | ||||||
|     void gen_instr_epilogue(jit_holder& jh); |     void gen_instr_epilogue(jit_holder& jh); | ||||||
|     inline void gen_raise(jit_holder& jh, uint16_t trap_id, uint16_t cause); |     inline void gen_raise(jit_holder& jh, uint16_t trap_id, uint16_t cause); | ||||||
|  |     template <typename T, typename = typename std::enable_if<std::is_integral<T>::value>::type> void gen_set_tval(jit_holder& jh, T new_tval) ; | ||||||
|  |     void gen_set_tval(jit_holder& jh, x86_reg_t _new_tval) ; | ||||||
|  |  | ||||||
|     template<unsigned W, typename U, typename S = typename std::make_signed<U>::type> |     template<unsigned W, typename U, typename S = typename std::make_signed<U>::type> | ||||||
|     inline S sext(U from) { |     inline S sext(U from) { | ||||||
| @@ -109,32 +136,34 @@ using super::get_reg; | |||||||
|         auto sign_mask = 1ULL<<(W-1); |         auto sign_mask = 1ULL<<(W-1); | ||||||
|         return (from & mask) | ((from & sign_mask) ? ~mask : 0); |         return (from & mask) | ((from & sign_mask) ? ~mask : 0); | ||||||
|     } |     } | ||||||
|  |     inline void raise(uint16_t trap_id, uint16_t cause){ | ||||||
|  |         auto trap_val =  0x80ULL << 24 | (cause << 16) | trap_id; | ||||||
|  |         this->core.reg.trap_state = trap_val; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  | <%functions.each{ it.eachLine { %> | ||||||
|  |     ${it}<%} | ||||||
|  | }%> | ||||||
| private: | private: | ||||||
|     /**************************************************************************** |     /**************************************************************************** | ||||||
|      * start opcode definitions |      * start opcode definitions | ||||||
|      ****************************************************************************/ |      ****************************************************************************/ | ||||||
|     struct instruction_descriptor { |     struct instruction_descriptor { | ||||||
|         size_t length; |         uint32_t length; | ||||||
|         uint32_t value; |         uint32_t value; | ||||||
|         uint32_t mask; |         uint32_t mask; | ||||||
|         compile_func op; |         compile_func op; | ||||||
|     }; |     }; | ||||||
|     struct decoding_tree_node{ |  | ||||||
|         std::vector<instruction_descriptor> instrs; |  | ||||||
|         std::vector<decoding_tree_node*> children; |  | ||||||
|         uint32_t submask = std::numeric_limits<uint32_t>::max(); |  | ||||||
|         uint32_t value; |  | ||||||
|         decoding_tree_node(uint32_t value) : value(value){} |  | ||||||
|     }; |  | ||||||
|  |  | ||||||
|     decoding_tree_node* root {nullptr}; |     const std::array<instruction_descriptor, ${instructions.size()}> instr_descr = {{ | ||||||
|  |  | ||||||
|     const std::array<instruction_descriptor, ${instructions.size}> instr_descr = {{ |  | ||||||
|          /* entries are: size, valid value, valid mask, function ptr */<%instructions.each{instr -> %> |          /* entries are: size, valid value, valid mask, function ptr */<%instructions.each{instr -> %> | ||||||
|         /* instruction ${instr.instruction.name}, encoding '${instr.encoding}' */ |         /* instruction ${instr.instruction.name}, encoding '${instr.encoding}' */ | ||||||
|         {${instr.length}, ${instr.encoding}, ${instr.mask}, &this_class::__${generator.functionName(instr.name)}},<%}%> |         {${instr.length}, ${instr.encoding}, ${instr.mask}, &this_class::__${generator.functionName(instr.name)}},<%}%> | ||||||
|     }}; |     }}; | ||||||
|  |  | ||||||
|  |     //needs to be declared after instr_descr | ||||||
|  |     decoder instr_decoder; | ||||||
|  |  | ||||||
|     /* instruction definitions */<%instructions.eachWithIndex{instr, idx -> %> |     /* instruction definitions */<%instructions.eachWithIndex{instr, idx -> %> | ||||||
|     /* instruction ${idx}: ${instr.name} */ |     /* instruction ${idx}: ${instr.name} */ | ||||||
|     continuation_e __${generator.functionName(instr.name)}(virt_addr_t& pc, code_word_t instr, jit_holder& jh){ |     continuation_e __${generator.functionName(instr.name)}(virt_addr_t& pc, code_word_t instr, jit_holder& jh){ | ||||||
| @@ -147,7 +176,7 @@ private: | |||||||
|             InvokeNode* call_print_disass; |             InvokeNode* call_print_disass; | ||||||
|             char* mnemonic_ptr = strdup(mnemonic.c_str()); |             char* mnemonic_ptr = strdup(mnemonic.c_str()); | ||||||
|             jh.disass_collection.push_back(mnemonic_ptr); |             jh.disass_collection.push_back(mnemonic_ptr); | ||||||
|             jh.cc.invoke(&call_print_disass, &print_disass, FuncSignatureT<void, void *, uint64_t, char *>()); |             jh.cc.invoke(&call_print_disass, &print_disass, FuncSignature::build<void, void *, uint64_t, char *>()); | ||||||
|             call_print_disass->setArg(0, jh.arch_if_ptr); |             call_print_disass->setArg(0, jh.arch_if_ptr); | ||||||
|             call_print_disass->setArg(1, pc.val); |             call_print_disass->setArg(1, pc.val); | ||||||
|             call_print_disass->setArg(2, mnemonic_ptr); |             call_print_disass->setArg(2, mnemonic_ptr); | ||||||
| @@ -155,87 +184,47 @@ private: | |||||||
|         } |         } | ||||||
|         x86::Compiler& cc = jh.cc; |         x86::Compiler& cc = jh.cc; | ||||||
|         cc.comment(fmt::format("${instr.name}_{:#x}:",pc.val).c_str()); |         cc.comment(fmt::format("${instr.name}_{:#x}:",pc.val).c_str()); | ||||||
|         this->gen_sync(jh, PRE_SYNC, ${idx}); |         gen_sync(jh, PRE_SYNC, ${idx}); | ||||||
|         cc.mov(jh.pc, pc.val); |         mov(cc, jh.pc, pc.val); | ||||||
|  |         gen_set_tval(jh, instr); | ||||||
|         pc = pc+${instr.length/8}; |         pc = pc+${instr.length/8}; | ||||||
|         cc.mov(jh.next_pc, pc.val); |         mov(cc, jh.next_pc, pc.val); | ||||||
|  |  | ||||||
|         gen_instr_prologue(jh); |         gen_instr_prologue(jh); | ||||||
|         cc.comment("//behavior:"); |  | ||||||
|         /*generate behavior*/ |         /*generate behavior*/ | ||||||
|         <%instr.behavior.eachLine{%>${it} |         <%instr.behavior.eachLine{%>${it} | ||||||
|         <%}%> |         <%}%> | ||||||
|  |         gen_sync(jh, POST_SYNC, ${idx}); | ||||||
|         gen_instr_epilogue(jh); |         gen_instr_epilogue(jh); | ||||||
|         this->gen_sync(jh, POST_SYNC, ${idx}); |  | ||||||
|     	return returnValue;         |     	return returnValue;         | ||||||
|     } |     } | ||||||
|     <%}%> |     <%}%> | ||||||
|     /**************************************************************************** |     /**************************************************************************** | ||||||
|      * end opcode definitions |      * end opcode definitions | ||||||
|      ****************************************************************************/ |      ****************************************************************************/ | ||||||
|     continuation_e illegal_intruction(virt_addr_t &pc, code_word_t instr, jit_holder& jh ) { |     continuation_e illegal_instruction(virt_addr_t &pc, code_word_t instr, jit_holder& jh ) { | ||||||
|         x86::Compiler& cc = jh.cc; |         x86::Compiler& cc = jh.cc; | ||||||
|         cc.comment(fmt::format("illegal_intruction{:#x}:",pc.val).c_str()); |         if(this->disass_enabled){           | ||||||
|         this->gen_sync(jh, PRE_SYNC, instr_descr.size()); |             auto mnemonic = std::string("illegal_instruction"); | ||||||
|  |             InvokeNode* call_print_disass; | ||||||
|  |             char* mnemonic_ptr = strdup(mnemonic.c_str()); | ||||||
|  |             jh.disass_collection.push_back(mnemonic_ptr); | ||||||
|  |             jh.cc.invoke(&call_print_disass, &print_disass, FuncSignature::build<void, void *, uint64_t, char *>()); | ||||||
|  |             call_print_disass->setArg(0, jh.arch_if_ptr); | ||||||
|  |             call_print_disass->setArg(1, pc.val); | ||||||
|  |             call_print_disass->setArg(2, mnemonic_ptr); | ||||||
|  |         } | ||||||
|  |         cc.comment(fmt::format("illegal_instruction{:#x}:",pc.val).c_str()); | ||||||
|  |         gen_sync(jh, PRE_SYNC, instr_descr.size()); | ||||||
|  |         mov(cc, jh.pc, pc.val); | ||||||
|  |         gen_set_tval(jh, instr); | ||||||
|         pc = pc + ((instr & 3) == 3 ? 4 : 2); |         pc = pc + ((instr & 3) == 3 ? 4 : 2); | ||||||
|  |         mov(cc, jh.next_pc, pc.val); | ||||||
|         gen_instr_prologue(jh); |         gen_instr_prologue(jh); | ||||||
|         cc.comment("//behavior:"); |         gen_raise(jh, 0, 2); | ||||||
|  |         gen_sync(jh, POST_SYNC, instr_descr.size()); | ||||||
|         gen_instr_epilogue(jh); |         gen_instr_epilogue(jh); | ||||||
|         this->gen_sync(jh, POST_SYNC, instr_descr.size()); |         return ILLEGAL_INSTR; | ||||||
|         return BRANCH; |  | ||||||
|     } |  | ||||||
|       |  | ||||||
|     //decoding functionality |  | ||||||
|  |  | ||||||
|     void populate_decoding_tree(decoding_tree_node* root){ |  | ||||||
|         //create submask |  | ||||||
|         for(auto instr: root->instrs){ |  | ||||||
|             root->submask &= instr.mask; |  | ||||||
|         } |  | ||||||
|         //put each instr according to submask&encoding into children |  | ||||||
|         for(auto instr: root->instrs){ |  | ||||||
|             bool foundMatch = false; |  | ||||||
|             for(auto child: root->children){ |  | ||||||
|                 //use value as identifying trait |  | ||||||
|                 if(child->value == (instr.value&root->submask)){ |  | ||||||
|                     child->instrs.push_back(instr); |  | ||||||
|                     foundMatch = true; |  | ||||||
|                 } |  | ||||||
|             } |  | ||||||
|             if(!foundMatch){ |  | ||||||
|                 decoding_tree_node* child = new decoding_tree_node(instr.value&root->submask); |  | ||||||
|                 child->instrs.push_back(instr); |  | ||||||
|                 root->children.push_back(child); |  | ||||||
|             } |  | ||||||
|         } |  | ||||||
|         root->instrs.clear(); |  | ||||||
|         //call populate_decoding_tree for all children |  | ||||||
|         if(root->children.size() >1) |  | ||||||
|             for(auto child: root->children){ |  | ||||||
|                 populate_decoding_tree(child);       |  | ||||||
|             } |  | ||||||
|         else{ |  | ||||||
|             //sort instrs by value of the mask, this works bc we want to have the least restrictive one last |  | ||||||
|             std::sort(root->children[0]->instrs.begin(), root->children[0]->instrs.end(), [](const instruction_descriptor& instr1, const instruction_descriptor& instr2) { |  | ||||||
|             return instr1.mask > instr2.mask; |  | ||||||
|             });  |  | ||||||
|         } |  | ||||||
|     } |  | ||||||
|     compile_func decode_instr(decoding_tree_node* node, code_word_t word){ |  | ||||||
|         if(!node->children.size()){ |  | ||||||
|             if(node->instrs.size() == 1) return node->instrs[0].op; |  | ||||||
|             for(auto instr : node->instrs){ |  | ||||||
|                 if((instr.mask&word) == instr.value) return instr.op; |  | ||||||
|             } |  | ||||||
|         } |  | ||||||
|         else{ |  | ||||||
|             for(auto child : node->children){ |  | ||||||
|                 if (child->value == (node->submask&word)){ |  | ||||||
|                     return decode_instr(child, word); |  | ||||||
|                 }   |  | ||||||
|             }   |  | ||||||
|         } |  | ||||||
|         return nullptr; |  | ||||||
|     } |     } | ||||||
| }; | }; | ||||||
|  |  | ||||||
| @@ -243,102 +232,119 @@ template <typename ARCH> vm_impl<ARCH>::vm_impl() { this(new ARCH()); } | |||||||
|  |  | ||||||
| template <typename ARCH> | template <typename ARCH> | ||||||
| vm_impl<ARCH>::vm_impl(ARCH &core, unsigned core_id, unsigned cluster_id) | vm_impl<ARCH>::vm_impl(ARCH &core, unsigned core_id, unsigned cluster_id) | ||||||
| : vm_base<ARCH>(core, core_id, cluster_id) { | : vm_base<ARCH>(core, core_id, cluster_id) | ||||||
|     root = new decoding_tree_node(std::numeric_limits<uint32_t>::max()); | , instr_decoder([this]() { | ||||||
|     for(auto instr: instr_descr){ |         std::vector<generic_instruction_descriptor> g_instr_descr; | ||||||
|         root->instrs.push_back(instr); |         g_instr_descr.reserve(instr_descr.size()); | ||||||
|     } |         for (uint32_t i = 0; i < instr_descr.size(); ++i) { | ||||||
|     populate_decoding_tree(root); |             generic_instruction_descriptor new_instr_descr {instr_descr[i].value, instr_descr[i].mask, i}; | ||||||
|  |             g_instr_descr.push_back(new_instr_descr); | ||||||
|         } |         } | ||||||
|  |         return std::move(g_instr_descr); | ||||||
|  |     }()) {} | ||||||
|  |  | ||||||
| template <typename ARCH> | template <typename ARCH> | ||||||
| continuation_e vm_impl<ARCH>::gen_single_inst_behavior(virt_addr_t &pc, unsigned int &inst_cnt, jit_holder& jh) { | continuation_e vm_impl<ARCH>::gen_single_inst_behavior(virt_addr_t &pc, jit_holder& jh) { | ||||||
|     enum {TRAP_ID=1<<16}; |     enum {TRAP_ID=1<<16}; | ||||||
|     code_word_t instr = 0; |     code_word_t instr = 0; | ||||||
|     phys_addr_t paddr(pc); |     phys_addr_t paddr(pc); | ||||||
|     auto *const data = (uint8_t *)&instr; |     auto *const data = (uint8_t *)&instr; | ||||||
|     if(this->core.has_mmu()) |  | ||||||
|         paddr = this->core.virt2phys(pc); |  | ||||||
|     auto res = this->core.read(paddr, 4, data); |     auto res = this->core.read(paddr, 4, data); | ||||||
|     if (res != iss::Ok) |     if (res != iss::Ok) | ||||||
|         throw trap_access(TRAP_ID, pc.val); |         return ILLEGAL_FETCH; | ||||||
|     if (instr == 0x0000006f || (instr&0xffff)==0xa001) |     if (instr == 0x0000006f || (instr&0xffff)==0xa001) | ||||||
|         throw simulation_stopped(0); // 'J 0' or 'C.J 0' |         return JUMP_TO_SELF; | ||||||
|     ++inst_cnt; |     uint32_t inst_index = instr_decoder.decode_instr(instr); | ||||||
|     auto f = decode_instr(root, instr); |     compile_func f = nullptr; | ||||||
|  |     if(inst_index < instr_descr.size()) | ||||||
|  |         f = instr_descr[inst_index].op; | ||||||
|     if (f == nullptr)  |     if (f == nullptr)  | ||||||
|         f = &this_class::illegal_intruction; |         f = &this_class::illegal_instruction; | ||||||
|     return (this->*f)(pc, instr, jh); |     return (this->*f)(pc, instr, jh); | ||||||
| } | } | ||||||
| template <typename ARCH> | template <typename ARCH> | ||||||
| void vm_impl<ARCH>::gen_instr_prologue(jit_holder& jh) { | void vm_impl<ARCH>::gen_instr_prologue(jit_holder& jh) { | ||||||
|     auto& cc = jh.cc; |     auto& cc = jh.cc; | ||||||
|  |  | ||||||
|     cc.comment("//gen_instr_prologue"); |     x86_reg_t current_trap_state = get_reg_for(cc, traits::TRAP_STATE); | ||||||
|     cc.inc(get_ptr_for(jh, traits::ICOUNT)); |     mov(cc, current_trap_state, get_ptr_for(jh, traits::TRAP_STATE)); | ||||||
|  |     mov(cc, get_ptr_for(jh, traits::PENDING_TRAP), current_trap_state); | ||||||
|     x86::Gp current_trap_state = get_reg_for(jh, traits::TRAP_STATE); |     cc.comment("//Instruction prologue end"); | ||||||
|     cc.mov(current_trap_state, get_ptr_for(jh, traits::TRAP_STATE)); |  | ||||||
|     cc.mov(get_ptr_for(jh, traits::PENDING_TRAP), current_trap_state); |  | ||||||
|  |  | ||||||
| } | } | ||||||
| template <typename ARCH> | template <typename ARCH> | ||||||
| void vm_impl<ARCH>::gen_instr_epilogue(jit_holder& jh) { | void vm_impl<ARCH>::gen_instr_epilogue(jit_holder& jh) { | ||||||
|     auto& cc = jh.cc; |     auto& cc = jh.cc; | ||||||
|  |  | ||||||
|     cc.comment("//gen_instr_epilogue"); |     cc.comment("//Instruction epilogue begin"); | ||||||
|     x86::Gp current_trap_state = get_reg_for(jh, traits::TRAP_STATE); |     x86_reg_t current_trap_state = get_reg_for(cc, traits::TRAP_STATE); | ||||||
|     cc.mov(current_trap_state, get_ptr_for(jh, traits::TRAP_STATE)); |     mov(cc, current_trap_state, get_ptr_for(jh, traits::TRAP_STATE)); | ||||||
|     cc.cmp(current_trap_state, 0); |     cmp(cc, current_trap_state, 0); | ||||||
|     cc.jne(jh.trap_entry); |     cc.jne(jh.trap_entry); | ||||||
|  |     cc.inc(get_ptr_for(jh, traits::ICOUNT)); | ||||||
|  |     cc.inc(get_ptr_for(jh, traits::CYCLE)); | ||||||
|  |     cc.comment("//Instruction epilogue end"); | ||||||
|  |  | ||||||
| } | } | ||||||
| template <typename ARCH> | template <typename ARCH> | ||||||
| void vm_impl<ARCH>::gen_block_prologue(jit_holder& jh){ | void vm_impl<ARCH>::gen_block_prologue(jit_holder& jh){ | ||||||
|  |     jh.pc = load_reg_from_mem_Gp(jh, traits::PC); | ||||||
|     jh.pc = load_reg_from_mem(jh, traits::PC); |     jh.next_pc = load_reg_from_mem_Gp(jh, traits::NEXT_PC); | ||||||
|     jh.next_pc = load_reg_from_mem(jh, traits::NEXT_PC); |     jh.globals.resize(GLOBALS_SIZE); | ||||||
|  |     jh.globals[TVAL] = get_reg_Gp(jh.cc, 64, false); | ||||||
| } | } | ||||||
| template <typename ARCH> | template <typename ARCH> | ||||||
| void vm_impl<ARCH>::gen_block_epilogue(jit_holder& jh){ | void vm_impl<ARCH>::gen_block_epilogue(jit_holder& jh){ | ||||||
|     x86::Compiler& cc = jh.cc; |     x86::Compiler& cc = jh.cc; | ||||||
|     cc.comment("//gen_block_epilogue"); |     cc.comment("//block epilogue begin"); | ||||||
|     cc.ret(jh.next_pc); |     cc.ret(jh.next_pc); | ||||||
|  |  | ||||||
|     cc.bind(jh.trap_entry); |     cc.bind(jh.trap_entry); | ||||||
|     this->write_back(jh); |     this->write_back(jh); | ||||||
|     this->gen_sync(jh, POST_SYNC, -1); |  | ||||||
|  |  | ||||||
|     x86::Gp current_trap_state = get_reg_for(jh, traits::TRAP_STATE); |     x86::Gp current_trap_state = get_reg_for_Gp(cc, traits::TRAP_STATE); | ||||||
|     cc.mov(current_trap_state, get_ptr_for(jh, traits::TRAP_STATE)); |     mov(cc, current_trap_state, get_ptr_for(jh, traits::TRAP_STATE)); | ||||||
|  |  | ||||||
|     x86::Gp current_pc = get_reg_for(jh, traits::PC); |     x86::Gp current_pc = get_reg_for_Gp(cc, traits::PC); | ||||||
|     cc.mov(current_pc, get_ptr_for(jh, traits::PC)); |     mov(cc, current_pc, get_ptr_for(jh, traits::PC)); | ||||||
|  |  | ||||||
|     x86::Gp instr = cc.newInt32("instr"); |  | ||||||
|     cc.mov(instr, 0); // FIXME:this is not correct |  | ||||||
|     cc.comment("//enter trap call;"); |  | ||||||
|     InvokeNode* call_enter_trap; |     InvokeNode* call_enter_trap; | ||||||
|     cc.invoke(&call_enter_trap, &enter_trap, FuncSignatureT<uint64_t, void*, uint64_t, uint64_t, uint64_t>()); |     cc.invoke(&call_enter_trap, &enter_trap, FuncSignature::build<uint64_t, void*, uint64_t, uint64_t, uint64_t>()); | ||||||
|     call_enter_trap->setArg(0, jh.arch_if_ptr); |     call_enter_trap->setArg(0, jh.arch_if_ptr); | ||||||
|     call_enter_trap->setArg(1, current_trap_state); |     call_enter_trap->setArg(1, current_trap_state); | ||||||
|     call_enter_trap->setArg(2, current_pc); |     call_enter_trap->setArg(2, current_pc); | ||||||
|     call_enter_trap->setArg(3, instr); |     call_enter_trap->setArg(3, jh.globals[TVAL]); | ||||||
|  |  | ||||||
|     x86::Gp current_next_pc = get_reg_for(jh, traits::NEXT_PC); |     x86_reg_t current_next_pc = get_reg_for(cc, traits::NEXT_PC); | ||||||
|     cc.mov(current_next_pc, get_ptr_for(jh, traits::NEXT_PC)); |     mov(cc, current_next_pc, get_ptr_for(jh, traits::NEXT_PC)); | ||||||
|     cc.mov(jh.next_pc, current_next_pc); |     mov(cc, jh.next_pc, current_next_pc); | ||||||
|  |  | ||||||
|     cc.mov(get_ptr_for(jh, traits::LAST_BRANCH), std::numeric_limits<uint32_t>::max()); |     mov(cc, get_ptr_for(jh, traits::LAST_BRANCH), static_cast<int>(UNKNOWN_JUMP)); | ||||||
|     cc.ret(jh.next_pc); |     cc.ret(jh.next_pc); | ||||||
| } | } | ||||||
| template <typename ARCH> | template <typename ARCH> | ||||||
| inline void vm_impl<ARCH>::gen_raise(jit_holder& jh, uint16_t trap_id, uint16_t cause) { | inline void vm_impl<ARCH>::gen_raise(jit_holder& jh, uint16_t trap_id, uint16_t cause) { | ||||||
|     auto& cc = jh.cc; |     auto& cc = jh.cc; | ||||||
|     cc.comment("//gen_raise"); |     auto tmp1 = get_reg_for(cc, traits::TRAP_STATE); | ||||||
|     auto tmp1 = get_reg_for(jh, traits::TRAP_STATE); |     mov(cc, tmp1, 0x80ULL << 24 | (cause << 16) | trap_id); | ||||||
|     cc.mov(tmp1, 0x80ULL << 24 | (cause << 16) | trap_id); |     mov(cc, get_ptr_for(jh, traits::TRAP_STATE), tmp1); | ||||||
|     cc.mov(get_ptr_for(jh, traits::TRAP_STATE), tmp1); |     cc.jmp(jh.trap_entry); | ||||||
|     cc.mov(jh.next_pc, std::numeric_limits<uint32_t>::max()); | } | ||||||
|  | template <typename ARCH> | ||||||
|  | template <typename T, typename> | ||||||
|  | void vm_impl<ARCH>::gen_set_tval(jit_holder& jh, T new_tval) { | ||||||
|  |         mov(jh.cc, jh.globals[TVAL], new_tval); | ||||||
|  |     } | ||||||
|  | template <typename ARCH> | ||||||
|  | void vm_impl<ARCH>::gen_set_tval(jit_holder& jh, x86_reg_t _new_tval) { | ||||||
|  |     if(nonstd::holds_alternative<x86::Gp>(_new_tval)) { | ||||||
|  |         x86::Gp new_tval = nonstd::get<x86::Gp>(_new_tval); | ||||||
|  |         if(new_tval.size() < 8) | ||||||
|  |             new_tval = gen_ext_Gp(jh.cc, new_tval, 64, false); | ||||||
|  |         mov(jh.cc, jh.globals[TVAL], new_tval); | ||||||
|  |     } else { | ||||||
|  |         throw std::runtime_error("Variant not supported in gen_set_tval"); | ||||||
|  |     } | ||||||
| } | } | ||||||
|  |  | ||||||
| } // namespace tgc5c | } // namespace tgc5c | ||||||
| @@ -363,7 +369,7 @@ volatile std::array<bool, 2> dummy = { | |||||||
| 		    auto vm = new asmjit::${coreDef.name.toLowerCase()}::vm_impl<arch::${coreDef.name.toLowerCase()}>(*cpu, false); | 		    auto vm = new asmjit::${coreDef.name.toLowerCase()}::vm_impl<arch::${coreDef.name.toLowerCase()}>(*cpu, false); | ||||||
| 		    if (port != 0) debugger::server<debugger::gdb_session>::run_server(vm, port); | 		    if (port != 0) debugger::server<debugger::gdb_session>::run_server(vm, port); | ||||||
|             if(init_data){ |             if(init_data){ | ||||||
|                 auto* cb = reinterpret_cast<std::function<void(arch_if*, arch::traits<arch::${coreDef.name.toLowerCase()}>::reg_t, arch::traits<arch::${coreDef.name.toLowerCase()}>::reg_t)>*>(init_data); |                 auto* cb = reinterpret_cast<semihosting_cb_t<arch::traits<arch::${coreDef.name.toLowerCase()}>::reg_t>*>(init_data); | ||||||
|                 cpu->set_semihosting_callback(*cb); |                 cpu->set_semihosting_callback(*cb); | ||||||
|             } |             } | ||||||
|             return {cpu_ptr{cpu}, vm_ptr{vm}}; |             return {cpu_ptr{cpu}, vm_ptr{vm}}; | ||||||
| @@ -373,7 +379,7 @@ volatile std::array<bool, 2> dummy = { | |||||||
| 		    auto vm = new asmjit::${coreDef.name.toLowerCase()}::vm_impl<arch::${coreDef.name.toLowerCase()}>(*cpu, false); | 		    auto vm = new asmjit::${coreDef.name.toLowerCase()}::vm_impl<arch::${coreDef.name.toLowerCase()}>(*cpu, false); | ||||||
| 		    if (port != 0) debugger::server<debugger::gdb_session>::run_server(vm, port); | 		    if (port != 0) debugger::server<debugger::gdb_session>::run_server(vm, port); | ||||||
|             if(init_data){ |             if(init_data){ | ||||||
|                 auto* cb = reinterpret_cast<std::function<void(arch_if*, arch::traits<arch::${coreDef.name.toLowerCase()}>::reg_t, arch::traits<arch::${coreDef.name.toLowerCase()}>::reg_t)>*>(init_data); |                 auto* cb = reinterpret_cast<semihosting_cb_t<arch::traits<arch::${coreDef.name.toLowerCase()}>::reg_t>*>(init_data); | ||||||
|                 cpu->set_semihosting_callback(*cb); |                 cpu->set_semihosting_callback(*cb); | ||||||
|             } |             } | ||||||
|             return {cpu_ptr{cpu}, vm_ptr{vm}}; |             return {cpu_ptr{cpu}, vm_ptr{vm}}; | ||||||
|   | |||||||
										
											
												File diff suppressed because it is too large
												Load Diff
											
										
									
								
							| @@ -1,5 +1,5 @@ | |||||||
| /******************************************************************************* | /******************************************************************************* | ||||||
|  * Copyright (C) 2017, 2018 MINRES Technologies GmbH |  * Copyright (C) 2017-2024 MINRES Technologies GmbH | ||||||
|  * All rights reserved. |  * All rights reserved. | ||||||
|  * |  * | ||||||
|  * Redistribution and use in source and binary forms, with or without |  * Redistribution and use in source and binary forms, with or without | ||||||
| @@ -31,12 +31,17 @@ | |||||||
|  *******************************************************************************/ |  *******************************************************************************/ | ||||||
| // clang-format off | // clang-format off | ||||||
| #include <iss/arch/${coreDef.name.toLowerCase()}.h> | #include <iss/arch/${coreDef.name.toLowerCase()}.h> | ||||||
|  | // vm_base needs to be included before gdb_session as termios.h (via boost and gdb_server) has a define which clashes with a variable | ||||||
|  | // name in ConstantRange.h | ||||||
|  | #include <iss/llvm/vm_base.h> | ||||||
|  | #include <iss/iss.h> | ||||||
| #include <iss/debugger/gdb_session.h> | #include <iss/debugger/gdb_session.h> | ||||||
| #include <iss/debugger/server.h> | #include <iss/debugger/server.h> | ||||||
| #include <iss/iss.h> | #include <iss/instruction_decoder.h> | ||||||
| #include <iss/llvm/vm_base.h> |  | ||||||
| #include <util/logging.h> | #include <util/logging.h> | ||||||
|  | <%def fcsr = registers.find {it.name=='FCSR'} | ||||||
|  | if(fcsr != null) {%> | ||||||
|  | #include <vm/fp_functions.h><%}%> | ||||||
| #ifndef FMT_HEADER_ONLY | #ifndef FMT_HEADER_ONLY | ||||||
| #define FMT_HEADER_ONLY | #define FMT_HEADER_ONLY | ||||||
| #endif | #endif | ||||||
| @@ -82,7 +87,9 @@ protected: | |||||||
|     using vm_base<ARCH>::get_reg_ptr; |     using vm_base<ARCH>::get_reg_ptr; | ||||||
|  |  | ||||||
|     inline const char *name(size_t index){return traits::reg_aliases.at(index);} |     inline const char *name(size_t index){return traits::reg_aliases.at(index);} | ||||||
|  | <%if(fcsr != null) {%> | ||||||
|  |     inline const char *fname(size_t index){return index < 32?name(index+traits::F0):"illegal";}    | ||||||
|  | <%}%> | ||||||
|     template <typename T> inline ConstantInt *size(T type) { |     template <typename T> inline ConstantInt *size(T type) { | ||||||
|         return ConstantInt::get(getContext(), APInt(32, type->getType()->getScalarSizeInBits())); |         return ConstantInt::get(getContext(), APInt(32, type->getType()->getScalarSizeInBits())); | ||||||
|     } |     } | ||||||
| @@ -96,13 +103,16 @@ protected: | |||||||
|         return super::gen_cond_assign(cond, this->gen_ext(trueVal, size), this->gen_ext(falseVal, size)); |         return super::gen_cond_assign(cond, this->gen_ext(trueVal, size), this->gen_ext(falseVal, size)); | ||||||
|     } |     } | ||||||
|  |  | ||||||
|     std::tuple<continuation_e, BasicBlock *> gen_single_inst_behavior(virt_addr_t &, unsigned int &, BasicBlock *) override; |     std::tuple<continuation_e, BasicBlock *> gen_single_inst_behavior(virt_addr_t &, BasicBlock *) override; | ||||||
|  |  | ||||||
|     void gen_leave_behavior(BasicBlock *leave_blk) override; |     void gen_leave_behavior(BasicBlock *leave_blk) override; | ||||||
|     void gen_raise_trap(uint16_t trap_id, uint16_t cause); |     void gen_raise_trap(uint16_t trap_id, uint16_t cause); | ||||||
|     void gen_leave_trap(unsigned lvl); |     void gen_leave_trap(unsigned lvl); | ||||||
|     void gen_wait(unsigned type); |     void gen_wait(unsigned type); | ||||||
|  |     void set_tval(uint64_t new_tval); | ||||||
|  |     void set_tval(Value* new_tval); | ||||||
|     void gen_trap_behavior(BasicBlock *) override; |     void gen_trap_behavior(BasicBlock *) override; | ||||||
|  |     void gen_instr_prologue(); | ||||||
|     void gen_instr_epilogue(BasicBlock *bb); |     void gen_instr_epilogue(BasicBlock *bb); | ||||||
|  |  | ||||||
|     inline Value *gen_reg_load(unsigned i, unsigned level = 0) { |     inline Value *gen_reg_load(unsigned i, unsigned level = 0) { | ||||||
| @@ -127,33 +137,50 @@ protected: | |||||||
|         auto sign_mask = 1ULL<<(W-1); |         auto sign_mask = 1ULL<<(W-1); | ||||||
|         return (from & mask) | ((from & sign_mask) ? ~mask : 0); |         return (from & mask) | ((from & sign_mask) ? ~mask : 0); | ||||||
|     } |     } | ||||||
|  | <%functions.each{ it.eachLine { %> | ||||||
|  |     ${it}<%} | ||||||
|  | } | ||||||
|  | if(fcsr != null) {%> | ||||||
|  |     Value* NaNBox16(BasicBlock* bb, Value* NaNBox16_val){ | ||||||
|  |         if(static_cast<uint32_t>(traits::FLEN) == 16) | ||||||
|  |             return this->gen_ext(NaNBox16_val, traits::FLEN, false); | ||||||
|  |         auto box = this->builder.CreateNot((this->gen_ext(0, 32, false))); | ||||||
|  |         return this->gen_ext((this->builder.CreateOr(this->builder.CreateShl(this->gen_ext(box, traits::FLEN), 16), this->gen_ext(NaNBox16_val, traits::FLEN))), traits::FLEN, false); | ||||||
|  |     } | ||||||
|  |     Value* NaNBox32(BasicBlock* bb, Value* NaNBox32_val){ | ||||||
|  |         if(static_cast<uint32_t>(traits::FLEN) == 32) | ||||||
|  |             return this->gen_ext(NaNBox32_val, traits::FLEN, false); | ||||||
|  |         auto box = this->builder.CreateNot((this->gen_ext(0, 64, false))); | ||||||
|  |         return this->gen_ext((this->builder.CreateOr(this->builder.CreateShl(this->gen_ext(box, traits::FLEN), 32), this->gen_ext(NaNBox32_val, traits::FLEN))), traits::FLEN, false); | ||||||
|  |     } | ||||||
|  |     Value* NaNBox64(BasicBlock* bb, Value* NaNBox64_val){ | ||||||
|  |         if(static_cast<uint32_t>(traits::FLEN) == 64) | ||||||
|  |             return this->gen_ext(NaNBox64_val, traits::FLEN, false); | ||||||
|  |         auto box = this->builder.CreateNot((this->gen_ext(0, 128, false))); | ||||||
|  |         return this->gen_ext((this->builder.CreateOr(this->builder.CreateShl(this->gen_ext(box, traits::FLEN), 64), this->gen_ext(NaNBox64_val, traits::FLEN))), traits::FLEN, false); | ||||||
|  |     } | ||||||
|  |  | ||||||
|  | <%}%> | ||||||
| private: | private: | ||||||
|     /**************************************************************************** |     /**************************************************************************** | ||||||
|      * start opcode definitions |      * start opcode definitions | ||||||
|      ****************************************************************************/ |      ****************************************************************************/ | ||||||
|     struct instruction_descriptor { |     struct instruction_descriptor { | ||||||
|         size_t length; |         uint32_t length; | ||||||
|         uint32_t value; |         uint32_t value; | ||||||
|         uint32_t mask; |         uint32_t mask; | ||||||
|         compile_func op; |         compile_func op; | ||||||
|     }; |     }; | ||||||
|     struct decoding_tree_node{ |  | ||||||
|         std::vector<instruction_descriptor> instrs; |  | ||||||
|         std::vector<decoding_tree_node*> children; |  | ||||||
|         uint32_t submask = std::numeric_limits<uint32_t>::max(); |  | ||||||
|         uint32_t value; |  | ||||||
|         decoding_tree_node(uint32_t value) : value(value){} |  | ||||||
|     }; |  | ||||||
|  |  | ||||||
|     decoding_tree_node* root {nullptr}; |     const std::array<instruction_descriptor, ${instructions.size()}> instr_descr = {{ | ||||||
|  |  | ||||||
|     const std::array<instruction_descriptor, ${instructions.size}> instr_descr = {{ |  | ||||||
|          /* entries are: size, valid value, valid mask, function ptr */<%instructions.each{instr -> %> |          /* entries are: size, valid value, valid mask, function ptr */<%instructions.each{instr -> %> | ||||||
|         /* instruction ${instr.instruction.name}, encoding '${instr.encoding}' */ |         /* instruction ${instr.instruction.name}, encoding '${instr.encoding}' */ | ||||||
|         {${instr.length}, ${instr.encoding}, ${instr.mask}, &this_class::__${generator.functionName(instr.name)}},<%}%> |         {${instr.length}, ${instr.encoding}, ${instr.mask}, &this_class::__${generator.functionName(instr.name)}},<%}%> | ||||||
|     }}; |     }}; | ||||||
|  |  | ||||||
|  |     //needs to be declared after instr_descr | ||||||
|  |     decoder instr_decoder; | ||||||
|  |  | ||||||
|     /* instruction definitions */<%instructions.eachWithIndex{instr, idx -> %> |     /* instruction definitions */<%instructions.eachWithIndex{instr, idx -> %> | ||||||
|     /* instruction ${idx}: ${instr.name} */ |     /* instruction ${idx}: ${instr.name} */ | ||||||
|     std::tuple<continuation_e, BasicBlock*> __${generator.functionName(instr.name)}(virt_addr_t& pc, code_word_t instr, BasicBlock* bb){ |     std::tuple<continuation_e, BasicBlock*> __${generator.functionName(instr.name)}(virt_addr_t& pc, code_word_t instr, BasicBlock* bb){ | ||||||
| @@ -162,18 +189,27 @@ private: | |||||||
|         <%}%>if(this->disass_enabled){ |         <%}%>if(this->disass_enabled){ | ||||||
|             /* generate console output when executing the command */<%instr.disass.eachLine{%> |             /* generate console output when executing the command */<%instr.disass.eachLine{%> | ||||||
|             ${it}<%}%> |             ${it}<%}%> | ||||||
|  |             std::vector<Value*> args { | ||||||
|  |                 this->core_ptr, | ||||||
|  |                 this->gen_const(64, pc.val), | ||||||
|  |                 this->builder.CreateGlobalStringPtr(mnemonic), | ||||||
|  |             }; | ||||||
|  |             this->builder.CreateCall(this->mod->getFunction("print_disass"), args); | ||||||
|         } |         } | ||||||
|         bb->setName(fmt::format("${instr.name}_0x{:X}",pc.val)); |         bb->setName(fmt::format("${instr.name}_0x{:X}",pc.val)); | ||||||
|         this->gen_sync(PRE_SYNC,${idx}); |         this->gen_sync(PRE_SYNC,${idx}); | ||||||
|         auto cur_pc_val = this->gen_const(32,pc.val); |          | ||||||
|  |         this->gen_set_pc(pc, traits::PC); | ||||||
|  |         this->set_tval(instr); | ||||||
|         pc=pc+ ${instr.length/8}; |         pc=pc+ ${instr.length/8}; | ||||||
|         this->gen_set_pc(pc, traits::NEXT_PC); |         this->gen_set_pc(pc, traits::NEXT_PC); | ||||||
|          |          | ||||||
|  |         this->gen_instr_prologue(); | ||||||
|         /*generate behavior*/ |         /*generate behavior*/ | ||||||
|         <%instr.behavior.eachLine{%>${it} |         <%instr.behavior.eachLine{%>${it} | ||||||
|         <%}%> |         <%}%> | ||||||
|         this->gen_instr_epilogue(bb); |  | ||||||
|         this->gen_sync(POST_SYNC, ${idx}); |         this->gen_sync(POST_SYNC, ${idx}); | ||||||
|  |         this->gen_instr_epilogue(bb); | ||||||
|         this->builder.CreateBr(bb); |         this->builder.CreateBr(bb); | ||||||
|     	return returnValue;         |     	return returnValue;         | ||||||
|     } |     } | ||||||
| @@ -181,7 +217,16 @@ private: | |||||||
|     /**************************************************************************** |     /**************************************************************************** | ||||||
|      * end opcode definitions |      * end opcode definitions | ||||||
|      ****************************************************************************/ |      ****************************************************************************/ | ||||||
|     std::tuple<continuation_e, BasicBlock *> illegal_intruction(virt_addr_t &pc, code_word_t instr, BasicBlock *bb) { |     std::tuple<continuation_e, BasicBlock *> illegal_instruction(virt_addr_t &pc, code_word_t instr, BasicBlock *bb) { | ||||||
|  |         if(this->disass_enabled){ | ||||||
|  |             auto mnemonic = std::string("illegal_instruction"); | ||||||
|  |             std::vector<Value*> args { | ||||||
|  |                 this->core_ptr, | ||||||
|  |                 this->gen_const(64, pc.val), | ||||||
|  |                 this->builder.CreateGlobalStringPtr(mnemonic), | ||||||
|  |             }; | ||||||
|  |             this->builder.CreateCall(this->mod->getFunction("print_disass"), args); | ||||||
|  |         } | ||||||
|         this->gen_sync(iss::PRE_SYNC, instr_descr.size()); |         this->gen_sync(iss::PRE_SYNC, instr_descr.size()); | ||||||
|         this->builder.CreateStore(this->builder.CreateLoad(this->get_typeptr(traits::NEXT_PC), get_reg_ptr(traits::NEXT_PC), true), |         this->builder.CreateStore(this->builder.CreateLoad(this->get_typeptr(traits::NEXT_PC), get_reg_ptr(traits::NEXT_PC), true), | ||||||
|                                    get_reg_ptr(traits::PC), true); |                                    get_reg_ptr(traits::PC), true); | ||||||
| @@ -190,62 +235,13 @@ private: | |||||||
|                                      this->gen_const(64U, 1)), |                                      this->gen_const(64U, 1)), | ||||||
|             get_reg_ptr(traits::ICOUNT), true); |             get_reg_ptr(traits::ICOUNT), true); | ||||||
|         pc = pc + ((instr & 3) == 3 ? 4 : 2); |         pc = pc + ((instr & 3) == 3 ? 4 : 2); | ||||||
|  |         this->set_tval(instr); | ||||||
|         this->gen_raise_trap(0, 2);     // illegal instruction trap |         this->gen_raise_trap(0, 2);     // illegal instruction trap | ||||||
| 		this->gen_sync(iss::POST_SYNC, instr_descr.size()); | 		this->gen_sync(iss::POST_SYNC, instr_descr.size()); | ||||||
|         this->gen_instr_epilogue(this->leave_blk); |         bb = this->leave_blk; | ||||||
|         return std::make_tuple(BRANCH, nullptr); |         this->gen_instr_epilogue(bb); | ||||||
|     }     |         this->builder.CreateBr(bb); | ||||||
|     //decoding functionality |         return std::make_tuple(ILLEGAL_INSTR, nullptr); | ||||||
|  |  | ||||||
|     void populate_decoding_tree(decoding_tree_node* root){ |  | ||||||
|         //create submask |  | ||||||
|         for(auto instr: root->instrs){ |  | ||||||
|             root->submask &= instr.mask; |  | ||||||
|         } |  | ||||||
|         //put each instr according to submask&encoding into children |  | ||||||
|         for(auto instr: root->instrs){ |  | ||||||
|             bool foundMatch = false; |  | ||||||
|             for(auto child: root->children){ |  | ||||||
|                 //use value as identifying trait |  | ||||||
|                 if(child->value == (instr.value&root->submask)){ |  | ||||||
|                     child->instrs.push_back(instr); |  | ||||||
|                     foundMatch = true; |  | ||||||
|                 } |  | ||||||
|             } |  | ||||||
|             if(!foundMatch){ |  | ||||||
|                 decoding_tree_node* child = new decoding_tree_node(instr.value&root->submask); |  | ||||||
|                 child->instrs.push_back(instr); |  | ||||||
|                 root->children.push_back(child); |  | ||||||
|             } |  | ||||||
|         } |  | ||||||
|         root->instrs.clear(); |  | ||||||
|         //call populate_decoding_tree for all children |  | ||||||
|         if(root->children.size() >1) |  | ||||||
|             for(auto child: root->children){ |  | ||||||
|                 populate_decoding_tree(child);       |  | ||||||
|             } |  | ||||||
|         else{ |  | ||||||
|             //sort instrs by value of the mask, this works bc we want to have the least restrictive one last |  | ||||||
|             std::sort(root->children[0]->instrs.begin(), root->children[0]->instrs.end(), [](const instruction_descriptor& instr1, const instruction_descriptor& instr2) { |  | ||||||
|             return instr1.mask > instr2.mask; |  | ||||||
|             });  |  | ||||||
|         } |  | ||||||
|     } |  | ||||||
|     compile_func decode_instr(decoding_tree_node* node, code_word_t word){ |  | ||||||
|         if(!node->children.size()){ |  | ||||||
|             if(node->instrs.size() == 1) return node->instrs[0].op; |  | ||||||
|             for(auto instr : node->instrs){ |  | ||||||
|                 if((instr.mask&word) == instr.value) return instr.op; |  | ||||||
|             } |  | ||||||
|         } |  | ||||||
|         else{ |  | ||||||
|             for(auto child : node->children){ |  | ||||||
|                 if (child->value == (node->submask&word)){ |  | ||||||
|                     return decode_instr(child, word); |  | ||||||
|                 }   |  | ||||||
|             }   |  | ||||||
|         } |  | ||||||
|         return nullptr; |  | ||||||
|     }     |     }     | ||||||
| }; | }; | ||||||
|  |  | ||||||
| @@ -258,42 +254,39 @@ template <typename ARCH> vm_impl<ARCH>::vm_impl() { this(new ARCH()); } | |||||||
|  |  | ||||||
| template <typename ARCH> | template <typename ARCH> | ||||||
| vm_impl<ARCH>::vm_impl(ARCH &core, unsigned core_id, unsigned cluster_id) | vm_impl<ARCH>::vm_impl(ARCH &core, unsigned core_id, unsigned cluster_id) | ||||||
| : vm_base<ARCH>(core, core_id, cluster_id) { | : vm_base<ARCH>(core, core_id, cluster_id) | ||||||
|     root = new decoding_tree_node(std::numeric_limits<uint32_t>::max()); | , instr_decoder([this]() { | ||||||
|     for(auto instr:instr_descr){ |         std::vector<generic_instruction_descriptor> g_instr_descr; | ||||||
|         root->instrs.push_back(instr); |         g_instr_descr.reserve(instr_descr.size()); | ||||||
|     } |         for (uint32_t i = 0; i < instr_descr.size(); ++i) { | ||||||
|     populate_decoding_tree(root); |             generic_instruction_descriptor new_instr_descr {instr_descr[i].value, instr_descr[i].mask, i}; | ||||||
|  |             g_instr_descr.push_back(new_instr_descr); | ||||||
|         } |         } | ||||||
|  |         return std::move(g_instr_descr); | ||||||
|  |     }()) {} | ||||||
|  |  | ||||||
| template <typename ARCH> | template <typename ARCH> | ||||||
| std::tuple<continuation_e, BasicBlock *> | std::tuple<continuation_e, BasicBlock *> | ||||||
| vm_impl<ARCH>::gen_single_inst_behavior(virt_addr_t &pc, unsigned int &inst_cnt, BasicBlock *this_block) { | vm_impl<ARCH>::gen_single_inst_behavior(virt_addr_t &pc, BasicBlock *this_block) { | ||||||
|     // we fetch at max 4 byte, alignment is 2 |     // we fetch at max 4 byte, alignment is 2 | ||||||
|     enum {TRAP_ID=1<<16}; |     enum {TRAP_ID=1<<16}; | ||||||
|     code_word_t instr = 0; |     code_word_t instr = 0; | ||||||
|     // const typename traits::addr_t upper_bits = ~traits::PGMASK; |     // const typename traits::addr_t upper_bits = ~traits::PGMASK; | ||||||
|     phys_addr_t paddr(pc); |     phys_addr_t paddr(pc); | ||||||
|     auto *const data = (uint8_t *)&instr; |     auto *const data = (uint8_t *)&instr; | ||||||
|     if(this->core.has_mmu()) |  | ||||||
|         paddr = this->core.virt2phys(pc); |  | ||||||
|     //TODO: re-add page handling |  | ||||||
| //    if ((pc.val & upper_bits) != ((pc.val + 2) & upper_bits)) { // we may cross a page boundary |  | ||||||
| //        auto res = this->core.read(paddr, 2, data); |  | ||||||
| //        if (res != iss::Ok) throw trap_access(TRAP_ID, pc.val); |  | ||||||
| //        if ((instr & 0x3) == 0x3) { // this is a 32bit instruction |  | ||||||
| //            res = this->core.read(this->core.v2p(pc + 2), 2, data + 2); |  | ||||||
| //        } |  | ||||||
| //    } else { |  | ||||||
|     auto res = this->core.read(paddr, 4, data); |     auto res = this->core.read(paddr, 4, data); | ||||||
|         if (res != iss::Ok) throw trap_access(TRAP_ID, pc.val); |     if (res != iss::Ok)  | ||||||
| //    } |         return std::make_tuple(ILLEGAL_FETCH, nullptr); | ||||||
|     if (instr == 0x0000006f || (instr&0xffff)==0xa001) throw simulation_stopped(0); // 'J 0' or 'C.J 0' |     if (instr == 0x0000006f || (instr&0xffff)==0xa001){ | ||||||
|     // curr pc on stack |         this->builder.CreateBr(this->leave_blk); | ||||||
|     ++inst_cnt; |         return std::make_tuple(JUMP_TO_SELF, nullptr); | ||||||
|     auto f = decode_instr(root, instr); |         } | ||||||
|  |     uint32_t inst_index = instr_decoder.decode_instr(instr); | ||||||
|  |     compile_func f = nullptr; | ||||||
|  |     if(inst_index < instr_descr.size()) | ||||||
|  |         f = instr_descr[inst_index].op; | ||||||
|     if (f == nullptr) { |     if (f == nullptr) { | ||||||
|         f = &this_class::illegal_intruction; |         f = &this_class::illegal_instruction; | ||||||
|     } |     } | ||||||
|     return (this->*f)(pc, instr, this_block); |     return (this->*f)(pc, instr, this_block); | ||||||
| } | } | ||||||
| @@ -308,16 +301,14 @@ template <typename ARCH> | |||||||
| void vm_impl<ARCH>::gen_raise_trap(uint16_t trap_id, uint16_t cause) { | void vm_impl<ARCH>::gen_raise_trap(uint16_t trap_id, uint16_t cause) { | ||||||
|     auto *TRAP_val = this->gen_const(32, 0x80 << 24 | (cause << 16) | trap_id); |     auto *TRAP_val = this->gen_const(32, 0x80 << 24 | (cause << 16) | trap_id); | ||||||
|     this->builder.CreateStore(TRAP_val, get_reg_ptr(traits::TRAP_STATE), true); |     this->builder.CreateStore(TRAP_val, get_reg_ptr(traits::TRAP_STATE), true); | ||||||
|     this->builder.CreateStore(this->gen_const(32U, std::numeric_limits<uint32_t>::max()), get_reg_ptr(traits::LAST_BRANCH), false); |     this->builder.CreateBr(this->trap_blk); | ||||||
| } | } | ||||||
|  |  | ||||||
| template <typename ARCH> | template <typename ARCH> | ||||||
| void vm_impl<ARCH>::gen_leave_trap(unsigned lvl) { | void vm_impl<ARCH>::gen_leave_trap(unsigned lvl) { | ||||||
|     std::vector<Value *> args{ this->core_ptr, ConstantInt::get(getContext(), APInt(64, lvl)) }; |     std::vector<Value *> args{ this->core_ptr, ConstantInt::get(getContext(), APInt(64, lvl)) }; | ||||||
|     this->builder.CreateCall(this->mod->getFunction("leave_trap"), args); |     this->builder.CreateCall(this->mod->getFunction("leave_trap"), args); | ||||||
|     auto *PC_val = this->gen_read_mem(traits::CSR, (lvl << 8) + 0x41, traits::XLEN / 8); |     this->builder.CreateStore(this->gen_const(32U, static_cast<int>(UNKNOWN_JUMP)), get_reg_ptr(traits::LAST_BRANCH), false); | ||||||
|     this->builder.CreateStore(PC_val, get_reg_ptr(traits::NEXT_PC), false); |  | ||||||
|     this->builder.CreateStore(this->gen_const(32U, std::numeric_limits<uint32_t>::max()), get_reg_ptr(traits::LAST_BRANCH), false); |  | ||||||
| } | } | ||||||
|  |  | ||||||
| template <typename ARCH> | template <typename ARCH> | ||||||
| @@ -326,19 +317,37 @@ void vm_impl<ARCH>::gen_wait(unsigned type) { | |||||||
|     this->builder.CreateCall(this->mod->getFunction("wait"), args); |     this->builder.CreateCall(this->mod->getFunction("wait"), args); | ||||||
| } | } | ||||||
|  |  | ||||||
|  | template <typename ARCH> | ||||||
|  | inline void vm_impl<ARCH>::set_tval(uint64_t tval) { | ||||||
|  |     auto tmp_tval = this->gen_const(64, tval); | ||||||
|  |     this->set_tval(tmp_tval); | ||||||
|  | } | ||||||
|  | template <typename ARCH> | ||||||
|  | inline void vm_impl<ARCH>::set_tval(Value* new_tval) { | ||||||
|  |     this->builder.CreateStore(this->gen_ext(new_tval, 64, false), this->tval); | ||||||
|  | } | ||||||
| template <typename ARCH>  | template <typename ARCH>  | ||||||
| void vm_impl<ARCH>::gen_trap_behavior(BasicBlock *trap_blk) { | void vm_impl<ARCH>::gen_trap_behavior(BasicBlock *trap_blk) { | ||||||
|     this->builder.SetInsertPoint(trap_blk); |     this->builder.SetInsertPoint(trap_blk); | ||||||
|     this->gen_sync(POST_SYNC, -1); //TODO get right InstrId |  | ||||||
|     auto *trap_state_val = this->builder.CreateLoad(this->get_typeptr(traits::TRAP_STATE), get_reg_ptr(traits::TRAP_STATE), true); |     auto *trap_state_val = this->builder.CreateLoad(this->get_typeptr(traits::TRAP_STATE), get_reg_ptr(traits::TRAP_STATE), true); | ||||||
|     this->builder.CreateStore(this->gen_const(32U, std::numeric_limits<uint32_t>::max()), |     auto *cur_pc_val = this->builder.CreateLoad(this->get_typeptr(traits::PC), get_reg_ptr(traits::PC), true); | ||||||
|                               get_reg_ptr(traits::LAST_BRANCH), false); |     std::vector<Value *> args{this->core_ptr, | ||||||
|     std::vector<Value *> args{this->core_ptr, this->adj_to64(trap_state_val), |                                 this->adj_to64(trap_state_val), | ||||||
|                               this->adj_to64(this->builder.CreateLoad(this->get_typeptr(traits::PC), get_reg_ptr(traits::PC), false))}; |                                 this->adj_to64(cur_pc_val), | ||||||
|  |                               this->adj_to64(this->builder.CreateLoad(this->get_type(64),this->tval))}; | ||||||
|     this->builder.CreateCall(this->mod->getFunction("enter_trap"), args); |     this->builder.CreateCall(this->mod->getFunction("enter_trap"), args); | ||||||
|  |     this->builder.CreateStore(this->gen_const(32U, static_cast<int>(UNKNOWN_JUMP)), get_reg_ptr(traits::LAST_BRANCH), false); | ||||||
|  |  | ||||||
|     auto *trap_addr_val = this->builder.CreateLoad(this->get_typeptr(traits::NEXT_PC), get_reg_ptr(traits::NEXT_PC), false); |     auto *trap_addr_val = this->builder.CreateLoad(this->get_typeptr(traits::NEXT_PC), get_reg_ptr(traits::NEXT_PC), false); | ||||||
|     this->builder.CreateRet(trap_addr_val); |     this->builder.CreateRet(trap_addr_val); | ||||||
| } | } | ||||||
|  | template <typename ARCH> | ||||||
|  | void vm_impl<ARCH>::gen_instr_prologue() { | ||||||
|  |     auto* trap_val = | ||||||
|  |         this->builder.CreateLoad(this->get_typeptr(arch::traits<ARCH>::PENDING_TRAP), get_reg_ptr(arch::traits<ARCH>::PENDING_TRAP)); | ||||||
|  |     this->builder.CreateStore(trap_val, get_reg_ptr(arch::traits<ARCH>::TRAP_STATE), false); | ||||||
|  | } | ||||||
|  |              | ||||||
|  |  | ||||||
| template <typename ARCH> | template <typename ARCH> | ||||||
| void vm_impl<ARCH>::gen_instr_epilogue(BasicBlock *bb) { | void vm_impl<ARCH>::gen_instr_epilogue(BasicBlock *bb) { | ||||||
| @@ -349,6 +358,14 @@ void vm_impl<ARCH>::gen_instr_epilogue(BasicBlock *bb) { | |||||||
|                               ConstantInt::get(getContext(), APInt(v->getType()->getIntegerBitWidth(), 0))), |                               ConstantInt::get(getContext(), APInt(v->getType()->getIntegerBitWidth(), 0))), | ||||||
|                           target_bb, this->trap_blk, 1); |                           target_bb, this->trap_blk, 1); | ||||||
|     this->builder.SetInsertPoint(target_bb); |     this->builder.SetInsertPoint(target_bb); | ||||||
|  |     // update icount | ||||||
|  |     auto* icount_val = this->builder.CreateAdd( | ||||||
|  |         this->builder.CreateLoad(this->get_typeptr(arch::traits<ARCH>::ICOUNT), get_reg_ptr(arch::traits<ARCH>::ICOUNT)), this->gen_const(64U, 1)); | ||||||
|  |     this->builder.CreateStore(icount_val, get_reg_ptr(arch::traits<ARCH>::ICOUNT), false); | ||||||
|  |     //increment cyclecount | ||||||
|  |     auto* cycle_val = this->builder.CreateAdd( | ||||||
|  |         this->builder.CreateLoad(this->get_typeptr(arch::traits<ARCH>::CYCLE), get_reg_ptr(arch::traits<ARCH>::CYCLE)), this->gen_const(64U, 1)); | ||||||
|  |     this->builder.CreateStore(cycle_val, get_reg_ptr(arch::traits<ARCH>::CYCLE), false); | ||||||
| } | } | ||||||
|  |  | ||||||
| } // namespace ${coreDef.name.toLowerCase()} | } // namespace ${coreDef.name.toLowerCase()} | ||||||
|   | |||||||
| @@ -1,5 +1,5 @@ | |||||||
| /******************************************************************************* | /******************************************************************************* | ||||||
|  * Copyright (C) 2020 MINRES Technologies GmbH |  * Copyright (C) 2020-2024 MINRES Technologies GmbH | ||||||
|  * All rights reserved. |  * All rights reserved. | ||||||
|  * |  * | ||||||
|  * Redistribution and use in source and binary forms, with or without |  * Redistribution and use in source and binary forms, with or without | ||||||
| @@ -37,7 +37,10 @@ | |||||||
| #include <iss/tcc/vm_base.h> | #include <iss/tcc/vm_base.h> | ||||||
| #include <util/logging.h> | #include <util/logging.h> | ||||||
| #include <sstream> | #include <sstream> | ||||||
|  | #include <iss/instruction_decoder.h> | ||||||
|  | <%def fcsr = registers.find {it.name=='FCSR'} | ||||||
|  | if(fcsr != null) {%> | ||||||
|  | #include <vm/fp_functions.h><%}%> | ||||||
| #ifndef FMT_HEADER_ONLY | #ifndef FMT_HEADER_ONLY | ||||||
| #define FMT_HEADER_ONLY | #define FMT_HEADER_ONLY | ||||||
| #endif | #endif | ||||||
| @@ -80,16 +83,21 @@ protected: | |||||||
|     using vm_base<ARCH>::get_reg_ptr; |     using vm_base<ARCH>::get_reg_ptr; | ||||||
|  |  | ||||||
|     using this_class = vm_impl<ARCH>; |     using this_class = vm_impl<ARCH>; | ||||||
|     using compile_ret_t = std::tuple<continuation_e>; |     using compile_ret_t = continuation_e; | ||||||
|     using compile_func = compile_ret_t (this_class::*)(virt_addr_t &pc, code_word_t instr, tu_builder&); |     using compile_func = compile_ret_t (this_class::*)(virt_addr_t &pc, code_word_t instr, tu_builder&); | ||||||
|  |  | ||||||
|     inline const char *name(size_t index){return traits::reg_aliases.at(index);} |     inline const char *name(size_t index){return traits::reg_aliases.at(index);} | ||||||
|  | <% | ||||||
|  | if(fcsr != null) {%> | ||||||
|  |     inline const char *fname(size_t index){return index < 32?name(index+traits::F0):"illegal";}    | ||||||
|  | <%}%> | ||||||
|  |     void add_prologue(tu_builder& tu) override; | ||||||
|  |  | ||||||
|     void setup_module(std::string m) override { |     void setup_module(std::string m) override { | ||||||
|         super::setup_module(m); |         super::setup_module(m); | ||||||
|     } |     } | ||||||
|  |  | ||||||
|     compile_ret_t gen_single_inst_behavior(virt_addr_t &, unsigned int &, tu_builder&) override; |     compile_ret_t gen_single_inst_behavior(virt_addr_t &, tu_builder&) override; | ||||||
|  |  | ||||||
|     void gen_trap_behavior(tu_builder& tu) override; |     void gen_trap_behavior(tu_builder& tu) override; | ||||||
|  |  | ||||||
| @@ -97,7 +105,9 @@ protected: | |||||||
|  |  | ||||||
|     void gen_leave_trap(tu_builder& tu, unsigned lvl); |     void gen_leave_trap(tu_builder& tu, unsigned lvl); | ||||||
|  |  | ||||||
|     void gen_wait(tu_builder& tu, unsigned type); |     inline void gen_set_tval(tu_builder& tu, uint64_t new_tval); | ||||||
|  |  | ||||||
|  |     inline void gen_set_tval(tu_builder& tu, value new_tval); | ||||||
|  |  | ||||||
|     inline void gen_trap_check(tu_builder& tu) { |     inline void gen_trap_check(tu_builder& tu) { | ||||||
|         tu("if(*trap_state!=0) goto trap_entry;"); |         tu("if(*trap_state!=0) goto trap_entry;"); | ||||||
| @@ -128,32 +138,56 @@ protected: | |||||||
|         return (from & mask) | ((from & sign_mask) ? ~mask : 0); |         return (from & mask) | ((from & sign_mask) ? ~mask : 0); | ||||||
|     } |     } | ||||||
|  |  | ||||||
|  | <%functions.each{ it.eachLine { %> | ||||||
|  |     ${it}<%} | ||||||
|  | } | ||||||
|  | if(fcsr != null) {%> | ||||||
|  |     value NaNBox16(tu_builder& tu, value NaNBox16_val){ | ||||||
|  |         if(static_cast<uint32_t>(traits::FLEN) == 16) | ||||||
|  |             return tu.ext(NaNBox16_val, traits::FLEN, false); | ||||||
|  |         else {          | ||||||
|  |             auto box = tu.assignment(tu.logical_neg((tu.ext(0, 32, false))), traits::FLEN) ; | ||||||
|  |             return tu.ext((tu.bitwise_or(tu.shl(box, 16), NaNBox16_val)), traits::FLEN, false); | ||||||
|  |         }  | ||||||
|  |     } | ||||||
|  |     value NaNBox32(tu_builder& tu, value NaNBox32_val){ | ||||||
|  |         if(static_cast<uint32_t>(traits::FLEN) == 32) | ||||||
|  |             return tu.ext(NaNBox32_val, traits::FLEN, false); | ||||||
|  |         else {          | ||||||
|  |             auto box = tu.assignment(tu.logical_neg((tu.ext(0, 64, false))), traits::FLEN) ; | ||||||
|  |             return tu.ext((tu.bitwise_or(tu.shl(box, 32), NaNBox32_val)), traits::FLEN, false); | ||||||
|  |         }  | ||||||
|  |     } | ||||||
|  |     value NaNBox64(tu_builder& tu, value NaNBox64_val){ | ||||||
|  |         if(static_cast<uint32_t>(traits::FLEN) == 64) | ||||||
|  |             return tu.ext(NaNBox64_val, traits::FLEN, false); | ||||||
|  |         else { | ||||||
|  |             throw new std::runtime_error("tcc does not support Registers wider than 64 bits");      | ||||||
|  |             auto box = tu.assignment(tu.logical_neg((tu.ext(0, 128, false))), traits::FLEN) ; | ||||||
|  |             return tu.ext((tu.bitwise_or(tu.shl(box, 64), NaNBox64_val)), traits::FLEN, false); | ||||||
|  |         } | ||||||
|  |     } | ||||||
|  | <%}%> | ||||||
| private: | private: | ||||||
|     /**************************************************************************** |     /**************************************************************************** | ||||||
|      * start opcode definitions |      * start opcode definitions | ||||||
|      ****************************************************************************/ |      ****************************************************************************/ | ||||||
|     struct instruction_descriptor { |     struct instruction_descriptor { | ||||||
|         size_t length; |         uint32_t length; | ||||||
|         uint32_t value; |         uint32_t value; | ||||||
|         uint32_t mask; |         uint32_t mask; | ||||||
|         compile_func op; |         compile_func op; | ||||||
|     }; |     }; | ||||||
|     struct decoding_tree_node{ |  | ||||||
|         std::vector<instruction_descriptor> instrs; |  | ||||||
|         std::vector<decoding_tree_node*> children; |  | ||||||
|         uint32_t submask = std::numeric_limits<uint32_t>::max(); |  | ||||||
|         uint32_t value; |  | ||||||
|         decoding_tree_node(uint32_t value) : value(value){} |  | ||||||
|     }; |  | ||||||
|  |  | ||||||
|     decoding_tree_node* root {nullptr}; |     const std::array<instruction_descriptor, ${instructions.size()}> instr_descr = {{ | ||||||
|  |  | ||||||
|     const std::array<instruction_descriptor, ${instructions.size}> instr_descr = {{ |  | ||||||
|          /* entries are: size, valid value, valid mask, function ptr */<%instructions.each{instr -> %> |          /* entries are: size, valid value, valid mask, function ptr */<%instructions.each{instr -> %> | ||||||
|         /* instruction ${instr.instruction.name}, encoding '${instr.encoding}' */ |         /* instruction ${instr.instruction.name}, encoding '${instr.encoding}' */ | ||||||
|         {${instr.length}, ${instr.encoding}, ${instr.mask}, &this_class::__${generator.functionName(instr.name)}},<%}%> |         {${instr.length}, ${instr.encoding}, ${instr.mask}, &this_class::__${generator.functionName(instr.name)}},<%}%> | ||||||
|     }}; |     }}; | ||||||
|  |  | ||||||
|  |     //needs to be declared after instr_descr | ||||||
|  |     decoder instr_decoder; | ||||||
|  |  | ||||||
|     /* instruction definitions */<%instructions.eachWithIndex{instr, idx -> %> |     /* instruction definitions */<%instructions.eachWithIndex{instr, idx -> %> | ||||||
|     /* instruction ${idx}: ${instr.name} */ |     /* instruction ${idx}: ${instr.name} */ | ||||||
|     compile_ret_t __${generator.functionName(instr.name)}(virt_addr_t& pc, code_word_t instr, tu_builder& tu){ |     compile_ret_t __${generator.functionName(instr.name)}(virt_addr_t& pc, code_word_t instr, tu_builder& tu){ | ||||||
| @@ -164,82 +198,39 @@ private: | |||||||
|         <%}%>if(this->disass_enabled){ |         <%}%>if(this->disass_enabled){ | ||||||
|             /* generate console output when executing the command */<%instr.disass.eachLine{%> |             /* generate console output when executing the command */<%instr.disass.eachLine{%> | ||||||
|             ${it}<%}%> |             ${it}<%}%> | ||||||
|  |             tu("print_disass(core_ptr, {:#x}, \"{}\");", pc.val, mnemonic); | ||||||
|         } |         } | ||||||
|         auto cur_pc_val = tu.constant(pc.val, traits::reg_bit_widths[traits::PC]); |         auto cur_pc_val = tu.constant(pc.val, traits::reg_bit_widths[traits::PC]); | ||||||
|         pc=pc+ ${instr.length/8}; |         pc=pc+ ${instr.length/8}; | ||||||
|         gen_set_pc(tu, pc, traits::NEXT_PC); |         gen_set_pc(tu, pc, traits::NEXT_PC); | ||||||
|  |         tu("(*cycle)++;"); | ||||||
|         tu.open_scope(); |         tu.open_scope(); | ||||||
|  |         this->gen_set_tval(tu, instr); | ||||||
|         <%instr.behavior.eachLine{%>${it} |         <%instr.behavior.eachLine{%>${it} | ||||||
|         <%}%> |         <%}%> | ||||||
|  |         tu("(*icount)++;"); | ||||||
|  |         tu("(*instret)++;"); | ||||||
|         tu.close_scope(); |         tu.close_scope(); | ||||||
|         gen_trap_check(tu);         |  | ||||||
|         vm_base<ARCH>::gen_sync(tu, POST_SYNC,${idx}); |         vm_base<ARCH>::gen_sync(tu, POST_SYNC,${idx}); | ||||||
|  |         gen_trap_check(tu);         | ||||||
|         return returnValue; |         return returnValue; | ||||||
|     } |     } | ||||||
|     <%}%> |     <%}%> | ||||||
|     /**************************************************************************** |     /**************************************************************************** | ||||||
|      * end opcode definitions |      * end opcode definitions | ||||||
|      ****************************************************************************/ |      ****************************************************************************/ | ||||||
|     compile_ret_t illegal_intruction(virt_addr_t &pc, code_word_t instr, tu_builder& tu) { |     compile_ret_t illegal_instruction(virt_addr_t &pc, code_word_t instr, tu_builder& tu) { | ||||||
|         vm_impl::gen_sync(tu, iss::PRE_SYNC, instr_descr.size()); |         vm_impl::gen_sync(tu, iss::PRE_SYNC, instr_descr.size()); | ||||||
|  |         if(this->disass_enabled){ | ||||||
|  |             /* generate console output when executing the command */ | ||||||
|  |             tu("print_disass(core_ptr, {:#x}, \"{}\");", pc.val, std::string("illegal_instruction")); | ||||||
|  |         } | ||||||
|         pc = pc + ((instr & 3) == 3 ? 4 : 2); |         pc = pc + ((instr & 3) == 3 ? 4 : 2); | ||||||
|         gen_raise_trap(tu, 0, 2);     // illegal instruction trap |         gen_raise_trap(tu, 0, static_cast<int32_t>(traits:: RV_CAUSE_ILLEGAL_INSTRUCTION)); | ||||||
|  |         this->gen_set_tval(tu, instr); | ||||||
|         vm_impl::gen_sync(tu, iss::POST_SYNC, instr_descr.size()); |         vm_impl::gen_sync(tu, iss::POST_SYNC, instr_descr.size()); | ||||||
|         vm_impl::gen_trap_check(tu); |         vm_impl::gen_trap_check(tu); | ||||||
|         return BRANCH; |         return ILLEGAL_INSTR; | ||||||
|     } |  | ||||||
|      |  | ||||||
|     //decoding functionality |  | ||||||
|  |  | ||||||
|     void populate_decoding_tree(decoding_tree_node* root){ |  | ||||||
|         //create submask |  | ||||||
|         for(auto instr: root->instrs){ |  | ||||||
|             root->submask &= instr.mask; |  | ||||||
|         } |  | ||||||
|         //put each instr according to submask&encoding into children |  | ||||||
|         for(auto instr: root->instrs){ |  | ||||||
|             bool foundMatch = false; |  | ||||||
|             for(auto child: root->children){ |  | ||||||
|                 //use value as identifying trait |  | ||||||
|                 if(child->value == (instr.value&root->submask)){ |  | ||||||
|                     child->instrs.push_back(instr); |  | ||||||
|                     foundMatch = true; |  | ||||||
|                 } |  | ||||||
|             } |  | ||||||
|             if(!foundMatch){ |  | ||||||
|                 decoding_tree_node* child = new decoding_tree_node(instr.value&root->submask); |  | ||||||
|                 child->instrs.push_back(instr); |  | ||||||
|                 root->children.push_back(child); |  | ||||||
|             } |  | ||||||
|         } |  | ||||||
|         root->instrs.clear(); |  | ||||||
|         //call populate_decoding_tree for all children |  | ||||||
|         if(root->children.size() >1) |  | ||||||
|             for(auto child: root->children){ |  | ||||||
|                 populate_decoding_tree(child);       |  | ||||||
|             } |  | ||||||
|         else{ |  | ||||||
|             //sort instrs by value of the mask, this works bc we want to have the least restrictive one last |  | ||||||
|             std::sort(root->children[0]->instrs.begin(), root->children[0]->instrs.end(), [](const instruction_descriptor& instr1, const instruction_descriptor& instr2) { |  | ||||||
|             return instr1.mask > instr2.mask; |  | ||||||
|             });  |  | ||||||
|         } |  | ||||||
|     } |  | ||||||
|     compile_func decode_instr(decoding_tree_node* node, code_word_t word){ |  | ||||||
|         if(!node->children.size()){ |  | ||||||
|             if(node->instrs.size() == 1) return node->instrs[0].op; |  | ||||||
|             for(auto instr : node->instrs){ |  | ||||||
|                 if((instr.mask&word) == instr.value) return instr.op; |  | ||||||
|             } |  | ||||||
|         } |  | ||||||
|         else{ |  | ||||||
|             for(auto child : node->children){ |  | ||||||
|                 if (child->value == (node->submask&word)){ |  | ||||||
|                     return decode_instr(child, word); |  | ||||||
|                 }   |  | ||||||
|             }   |  | ||||||
|         } |  | ||||||
|         return nullptr; |  | ||||||
|     } |     } | ||||||
| }; | }; | ||||||
|  |  | ||||||
| @@ -252,65 +243,139 @@ template <typename ARCH> vm_impl<ARCH>::vm_impl() { this(new ARCH()); } | |||||||
|  |  | ||||||
| template <typename ARCH> | template <typename ARCH> | ||||||
| vm_impl<ARCH>::vm_impl(ARCH &core, unsigned core_id, unsigned cluster_id) | vm_impl<ARCH>::vm_impl(ARCH &core, unsigned core_id, unsigned cluster_id) | ||||||
| : vm_base<ARCH>(core, core_id, cluster_id) { | : vm_base<ARCH>(core, core_id, cluster_id) | ||||||
|     root = new decoding_tree_node(std::numeric_limits<uint32_t>::max()); | , instr_decoder([this]() { | ||||||
|     for(auto instr:instr_descr){ |         std::vector<generic_instruction_descriptor> g_instr_descr; | ||||||
|         root->instrs.push_back(instr); |         g_instr_descr.reserve(instr_descr.size()); | ||||||
|     } |         for (uint32_t i = 0; i < instr_descr.size(); ++i) { | ||||||
|     populate_decoding_tree(root); |             generic_instruction_descriptor new_instr_descr {instr_descr[i].value, instr_descr[i].mask, i}; | ||||||
|  |             g_instr_descr.push_back(new_instr_descr); | ||||||
|         } |         } | ||||||
|  |         return std::move(g_instr_descr); | ||||||
|  |     }()) {} | ||||||
|  |  | ||||||
| template <typename ARCH> | template <typename ARCH> | ||||||
| std::tuple<continuation_e> | continuation_e | ||||||
| vm_impl<ARCH>::gen_single_inst_behavior(virt_addr_t &pc, unsigned int &inst_cnt, tu_builder& tu) { | vm_impl<ARCH>::gen_single_inst_behavior(virt_addr_t &pc, tu_builder& tu) { | ||||||
|     // we fetch at max 4 byte, alignment is 2 |     // we fetch at max 4 byte, alignment is 2 | ||||||
|     enum {TRAP_ID=1<<16}; |     enum {TRAP_ID=1<<16}; | ||||||
|     code_word_t instr = 0; |     code_word_t instr = 0; | ||||||
|     phys_addr_t paddr(pc); |     phys_addr_t paddr(pc); | ||||||
|     if(this->core.has_mmu()) |  | ||||||
|         paddr = this->core.virt2phys(pc); |  | ||||||
|     //TODO: re-add page handling |  | ||||||
| //    if ((pc.val & upper_bits) != ((pc.val + 2) & upper_bits)) { // we may cross a page boundary |  | ||||||
| //        auto res = this->core.read(paddr, 2, data); |  | ||||||
| //        if (res != iss::Ok) throw trap_access(TRAP_ID, pc.val); |  | ||||||
| //        if ((insn & 0x3) == 0x3) { // this is a 32bit instruction |  | ||||||
| //            res = this->core.read(this->core.v2p(pc + 2), 2, data + 2); |  | ||||||
| //        } |  | ||||||
| //    } else { |  | ||||||
|     auto res = this->core.read(paddr, 4, reinterpret_cast<uint8_t*>(&instr)); |     auto res = this->core.read(paddr, 4, reinterpret_cast<uint8_t*>(&instr)); | ||||||
|         if (res != iss::Ok) throw trap_access(TRAP_ID, pc.val); |     if (res != iss::Ok) | ||||||
| //    } |         return ILLEGAL_FETCH; | ||||||
|     if (instr == 0x0000006f || (instr&0xffff)==0xa001) throw simulation_stopped(0); // 'J 0' or 'C.J 0' |     if (instr == 0x0000006f || (instr&0xffff)==0xa001)  | ||||||
|     // curr pc on stack |         return JUMP_TO_SELF; | ||||||
|     ++inst_cnt; |     uint32_t inst_index = instr_decoder.decode_instr(instr); | ||||||
|     auto f = decode_instr(root, instr); |     compile_func f = nullptr; | ||||||
|  |     if(inst_index < instr_descr.size()) | ||||||
|  |         f = instr_descr[inst_index].op; | ||||||
|     if (f == nullptr) { |     if (f == nullptr) { | ||||||
|         f = &this_class::illegal_intruction; |         f = &this_class::illegal_instruction; | ||||||
|     } |     } | ||||||
|     return (this->*f)(pc, instr, tu); |     return (this->*f)(pc, instr, tu); | ||||||
| } | } | ||||||
|  |  | ||||||
| template <typename ARCH> void vm_impl<ARCH>::gen_raise_trap(tu_builder& tu, uint16_t trap_id, uint16_t cause) { | template <typename ARCH> void vm_impl<ARCH>::gen_raise_trap(tu_builder& tu, uint16_t trap_id, uint16_t cause) { | ||||||
|     tu("  *trap_state = {:#x};", 0x80 << 24 | (cause << 16) | trap_id); |     tu("  *trap_state = {:#x};", 0x80 << 24 | (cause << 16) | trap_id); | ||||||
|     tu.store(traits::NEXT_PC, tu.constant(std::numeric_limits<uint32_t>::max(), 32)); |  | ||||||
| } | } | ||||||
|  |  | ||||||
| template <typename ARCH> void vm_impl<ARCH>::gen_leave_trap(tu_builder& tu, unsigned lvl) { | template <typename ARCH> void vm_impl<ARCH>::gen_leave_trap(tu_builder& tu, unsigned lvl) { | ||||||
|     tu("leave_trap(core_ptr, {});", lvl); |     tu("leave_trap(core_ptr, {});", lvl); | ||||||
|     tu.store(traits::NEXT_PC, tu.read_mem(traits::CSR, (lvl << 8) + 0x41, traits::XLEN)); |     tu.store(traits::NEXT_PC, tu.read_mem(traits::CSR, (lvl << 8) + 0x41, traits::XLEN)); | ||||||
|     tu.store(traits::LAST_BRANCH, tu.constant(std::numeric_limits<uint32_t>::max(), 32)); |     tu.store(traits::LAST_BRANCH, tu.constant(static_cast<int>(UNKNOWN_JUMP), 32)); | ||||||
| } | } | ||||||
|  |  | ||||||
| template <typename ARCH> void vm_impl<ARCH>::gen_wait(tu_builder& tu, unsigned type) { | template <typename ARCH> void vm_impl<ARCH>::gen_set_tval(tu_builder& tu, uint64_t new_tval) { | ||||||
|  |     tu(fmt::format("tval = {};", new_tval)); | ||||||
|  | } | ||||||
|  | template <typename ARCH> void vm_impl<ARCH>::gen_set_tval(tu_builder& tu, value new_tval) { | ||||||
|  |     tu(fmt::format("tval = {};", new_tval.str)); | ||||||
| } | } | ||||||
|  |  | ||||||
| template <typename ARCH> void vm_impl<ARCH>::gen_trap_behavior(tu_builder& tu) { | template <typename ARCH> void vm_impl<ARCH>::gen_trap_behavior(tu_builder& tu) { | ||||||
|     tu("trap_entry:"); |     tu("trap_entry:"); | ||||||
|     this->gen_sync(tu, POST_SYNC, -1);     |     this->gen_sync(tu, POST_SYNC, -1);     | ||||||
|     tu("enter_trap(core_ptr, *trap_state, *pc, 0);"); |     tu("enter_trap(core_ptr, *trap_state, *pc, tval);"); | ||||||
|     tu.store(traits::LAST_BRANCH, tu.constant(std::numeric_limits<uint32_t>::max(),32)); |     tu.store(traits::LAST_BRANCH, tu.constant(static_cast<int>(UNKNOWN_JUMP),32)); | ||||||
|     tu("return *next_pc;"); |     tu("return *next_pc;"); | ||||||
| } | } | ||||||
|  | template <typename ARCH> void vm_impl<ARCH>::add_prologue(tu_builder& tu){ | ||||||
|  |     std::ostringstream os; | ||||||
|  |     os << tu.add_reg_ptr("trap_state", arch::traits<ARCH>::TRAP_STATE, this->regs_base_ptr); | ||||||
|  |     os << tu.add_reg_ptr("pending_trap", arch::traits<ARCH>::PENDING_TRAP, this->regs_base_ptr); | ||||||
|  |     os << tu.add_reg_ptr("cycle", arch::traits<ARCH>::CYCLE, this->regs_base_ptr); | ||||||
|  | <%if(fcsr != null) { | ||||||
|  |     def flen = constants.find { it.name == 'FLEN' }?.value ?: 0 | ||||||
|  |     %> | ||||||
|  |     os << "uint32_t (*fget_flags)()=" << (uintptr_t)&fget_flags << ";\\n"; | ||||||
|  |  | ||||||
|  |     os << "uint16_t (*fadd_h)(uint16_t v1, uint16_t v2, uint8_t mode)=" << (uintptr_t)&fadd_h << ";\\n"; | ||||||
|  |     os << "uint16_t (*fsub_h)(uint16_t v1, uint16_t v2, uint8_t mode)=" << (uintptr_t)&fsub_h << ";\\n"; | ||||||
|  |     os << "uint16_t (*fmul_h)(uint16_t v1, uint16_t v2, uint8_t mode)=" << (uintptr_t)&fmul_h << ";\\n"; | ||||||
|  |     os << "uint16_t (*fdiv_h)(uint16_t v1, uint16_t v2, uint8_t mode)=" << (uintptr_t)&fdiv_h << ";\\n"; | ||||||
|  |     os << "uint16_t (*fsqrt_h)(uint16_t v1, uint8_t mode)=" << (uintptr_t)&fsqrt_h << ";\\n"; | ||||||
|  |     os << "uint16_t (*fcmp_h)(uint16_t v1, uint16_t v2, uint16_t op)=" << (uintptr_t)&fcmp_h << ";\\n"; | ||||||
|  |     os << "uint16_t (*fmadd_h)(uint16_t v1, uint16_t v2, uint16_t v3, uint16_t op, uint8_t mode)=" << (uintptr_t)&fmadd_h << ";\\n"; | ||||||
|  |     os << "uint16_t (*fsel_h)(uint16_t v1, uint16_t v2, uint16_t op)=" << (uintptr_t)&fsel_h << ";\\n"; | ||||||
|  |     os << "uint16_t (*fclass_h)(uint16_t v1)=" << (uintptr_t)&fclass_h << ";\\n"; | ||||||
|  |     os << "uint16_t (*unbox_h)(uint8_t FLEN, uint64_t v)=" << (uintptr_t)&unbox_h << ";\\n"; | ||||||
|  |  | ||||||
|  |     os << "uint32_t (*f16toi32)(uint32_t v1, uint8_t mode)=" << (uintptr_t)&f16toi32 << ";\\n"; | ||||||
|  |     os << "uint32_t (*f16toui32)(uint32_t v1, uint8_t mode)=" << (uintptr_t)&f16toui32 << ";\\n"; | ||||||
|  |     os << "uint16_t (*i32tof16)(uint32_t v1, uint8_t mode)=" << (uintptr_t)&i32tof16 << ";\\n"; | ||||||
|  |     os << "uint16_t (*ui32tof16)(uint32_t v1, uint8_t mode)=" << (uintptr_t)&ui32tof16 << ";\\n"; | ||||||
|  |     os << "uint64_t (*f16toi64)(uint32_t v1, uint8_t mode)=" << (uintptr_t)&f16toi64 <<";\\n"; | ||||||
|  |     os << "uint64_t (*f16toui64)(uint32_t v1, uint8_t mode)=" << (uintptr_t)&f16toui64 <<";\\n"; | ||||||
|  |     os << "uint16_t (*i64tof16)(uint64_t v1, uint8_t mode)=" << (uintptr_t)&i64tof16 <<";\\n"; | ||||||
|  |     os << "uint16_t (*ui64tof16)(uint64_t v1, uint8_t mode)=" << (uintptr_t)&ui64tof16 <<";\\n"; | ||||||
|  |  | ||||||
|  |     os << "uint32_t (*fadd_s)(uint32_t v1, uint32_t v2, uint8_t mode)=" << (uintptr_t)&fadd_s << ";\\n"; | ||||||
|  |     os << "uint32_t (*fsub_s)(uint32_t v1, uint32_t v2, uint8_t mode)=" << (uintptr_t)&fsub_s << ";\\n"; | ||||||
|  |     os << "uint32_t (*fmul_s)(uint32_t v1, uint32_t v2, uint8_t mode)=" << (uintptr_t)&fmul_s << ";\\n"; | ||||||
|  |     os << "uint32_t (*fdiv_s)(uint32_t v1, uint32_t v2, uint8_t mode)=" << (uintptr_t)&fdiv_s << ";\\n"; | ||||||
|  |     os << "uint32_t (*fsqrt_s)(uint32_t v1, uint8_t mode)=" << (uintptr_t)&fsqrt_s << ";\\n"; | ||||||
|  |     os << "uint32_t (*fcmp_s)(uint32_t v1, uint32_t v2, uint32_t op)=" << (uintptr_t)&fcmp_s << ";\\n"; | ||||||
|  |     os << "uint32_t (*fmadd_s)(uint32_t v1, uint32_t v2, uint32_t v3, uint32_t op, uint8_t mode)=" << (uintptr_t)&fmadd_s << ";\\n"; | ||||||
|  |     os << "uint32_t (*fsel_s)(uint32_t v1, uint32_t v2, uint32_t op)=" << (uintptr_t)&fsel_s << ";\\n"; | ||||||
|  |     os << "uint32_t (*fclass_s)( uint32_t v1 )=" << (uintptr_t)&fclass_s << ";\\n"; | ||||||
|  |     os << "uint32_t (*unbox_s)(uint8_t FLEN, uint64_t v)=" << (uintptr_t)&unbox_s << ";\\n"; | ||||||
|  |  | ||||||
|  |     os << "uint32_t (*f32toi32)(uint32_t v1, uint8_t mode)=" << (uintptr_t)&f32toi32 << ";\\n"; | ||||||
|  |     os << "uint32_t (*f32toui32)(uint32_t v1, uint8_t mode)=" << (uintptr_t)&f32toui32 << ";\\n"; | ||||||
|  |     os << "uint32_t (*i32tof32)(uint32_t v1, uint8_t mode)=" << (uintptr_t)&i32tof32 << ";\\n"; | ||||||
|  |     os << "uint32_t (*ui32tof32)(uint32_t v1, uint8_t mode)=" << (uintptr_t)&ui32tof32 << ";\\n"; | ||||||
|  |     os << "uint64_t (*f32toi64)(uint32_t v1, uint8_t mode)=" << (uintptr_t)&f32toi64 <<";\\n"; | ||||||
|  |     os << "uint64_t (*f32toui64)(uint32_t v1, uint8_t mode)=" << (uintptr_t)&f32toui64 <<";\\n"; | ||||||
|  |     os << "uint32_t (*i64tof32)(uint64_t v1, uint8_t mode)=" << (uintptr_t)&i64tof32 <<";\\n"; | ||||||
|  |     os << "uint32_t (*ui64tof32)(uint64_t v1, uint8_t mode)=" << (uintptr_t)&ui64tof32 <<";\\n"; | ||||||
|  |     <%if(flen > 32) {%> | ||||||
|  |  | ||||||
|  |     os << "uint64_t (*fadd_d)(uint64_t v1, uint64_t v2, uint8_t mode)=" << (uintptr_t)&fadd_d << ";\\n"; | ||||||
|  |     os << "uint64_t (*fsub_d)(uint64_t v1, uint64_t v2, uint8_t mode)=" << (uintptr_t)&fsub_d << ";\\n"; | ||||||
|  |     os << "uint64_t (*fmul_d)(uint64_t v1, uint64_t v2, uint8_t mode)=" << (uintptr_t)&fmul_d << ";\\n"; | ||||||
|  |     os << "uint64_t (*fdiv_d)(uint64_t v1, uint64_t v2, uint8_t mode)=" << (uintptr_t)&fdiv_d << ";\\n"; | ||||||
|  |     os << "uint64_t (*fsqrt_d)(uint64_t v1, uint8_t mode)=" << (uintptr_t)&fsqrt_d << ";\\n"; | ||||||
|  |     os << "uint64_t (*fcmp_d)(uint64_t v1, uint64_t v2, uint32_t op)=" << (uintptr_t)&fcmp_d << ";\\n"; | ||||||
|  |     os << "uint64_t (*fmadd_d)(uint64_t v1, uint64_t v2, uint64_t v3, uint32_t op, uint8_t mode)=" << (uintptr_t)&fmadd_d << ";\\n"; | ||||||
|  |     os << "uint64_t (*fsel_d)(uint64_t v1, uint64_t v2, uint32_t op)=" << (uintptr_t)&fsel_d << ";\\n"; | ||||||
|  |     os << "uint64_t (*fclass_d)(uint64_t v1  )=" << (uintptr_t)&fclass_d << ";\\n"; | ||||||
|  |     os << "uint64_t (*unbox_d)(uint8_t FLEN, uint64_t v)=" << (uintptr_t)&unbox_d << ";\\n"; | ||||||
|  |  | ||||||
|  |     os << "uint32_t (*f64tof32)(uint64_t v1, uint8_t mode)=" << (uintptr_t)&f64tof32 << ";\\n"; | ||||||
|  |     os << "uint64_t (*f32tof64)(uint32_t v1, uint8_t mode)=" << (uintptr_t)&f32tof64 << ";\\n"; | ||||||
|  |     os << "uint64_t (*f64toi64)(uint64_t v1, uint8_t mode)=" << (uintptr_t)&f64toi64 <<";\\n"; | ||||||
|  |     os << "uint64_t (*f64toui64)(uint64_t v1, uint8_t mode)=" << (uintptr_t)&f64toui64 <<";\\n"; | ||||||
|  |     os << "uint64_t (*i64tof64)(uint64_t v1, uint8_t mode)=" << (uintptr_t)&i64tof64 <<";\\n"; | ||||||
|  |     os << "uint64_t (*ui64tof64)(uint64_t v1, uint8_t mode)=" << (uintptr_t)&ui64tof64 <<";\\n"; | ||||||
|  |     os << "uint64_t (*i32tof64)(uint32_t v1, uint8_t mode)=" << (uintptr_t)&i32tof64 <<";\\n"; | ||||||
|  |     os << "uint64_t (*ui32tof64)(uint32_t v1, uint8_t mode)=" << (uintptr_t)&ui32tof64 <<";\\n"; | ||||||
|  |     os << "uint32_t (*f64toi32)(uint64_t v1, uint8_t mode)=" << (uintptr_t)&f64toi32 <<";\\n"; | ||||||
|  |     os << "uint32_t (*f64toui32)(uint64_t v1, uint8_t mode)=" << (uintptr_t)&f64toui32 <<";\\n"; | ||||||
|  |     <%} | ||||||
|  |     }%> | ||||||
|  |     tu.add_prologue(os.str()); | ||||||
|  | } | ||||||
|  |  | ||||||
| } // namespace ${coreDef.name.toLowerCase()} | } // namespace ${coreDef.name.toLowerCase()} | ||||||
|  |  | ||||||
| @@ -334,7 +399,7 @@ volatile std::array<bool, 2> dummy = { | |||||||
| 		    auto vm = new tcc::${coreDef.name.toLowerCase()}::vm_impl<arch::${coreDef.name.toLowerCase()}>(*cpu, false); | 		    auto vm = new tcc::${coreDef.name.toLowerCase()}::vm_impl<arch::${coreDef.name.toLowerCase()}>(*cpu, false); | ||||||
| 		    if (port != 0) debugger::server<debugger::gdb_session>::run_server(vm, port); | 		    if (port != 0) debugger::server<debugger::gdb_session>::run_server(vm, port); | ||||||
|             if(init_data){ |             if(init_data){ | ||||||
|                 auto* cb = reinterpret_cast<std::function<void(arch_if*, arch::traits<arch::${coreDef.name.toLowerCase()}>::reg_t, arch::traits<arch::${coreDef.name.toLowerCase()}>::reg_t)>*>(init_data); |                 auto* cb = reinterpret_cast<semihosting_cb_t<arch::traits<arch::${coreDef.name.toLowerCase()}>::reg_t>*>(init_data); | ||||||
|                 cpu->set_semihosting_callback(*cb); |                 cpu->set_semihosting_callback(*cb); | ||||||
|             } |             } | ||||||
|             return {cpu_ptr{cpu}, vm_ptr{vm}}; |             return {cpu_ptr{cpu}, vm_ptr{vm}}; | ||||||
| @@ -344,7 +409,7 @@ volatile std::array<bool, 2> dummy = { | |||||||
| 		    auto vm = new tcc::${coreDef.name.toLowerCase()}::vm_impl<arch::${coreDef.name.toLowerCase()}>(*cpu, false); | 		    auto vm = new tcc::${coreDef.name.toLowerCase()}::vm_impl<arch::${coreDef.name.toLowerCase()}>(*cpu, false); | ||||||
| 		    if (port != 0) debugger::server<debugger::gdb_session>::run_server(vm, port); | 		    if (port != 0) debugger::server<debugger::gdb_session>::run_server(vm, port); | ||||||
|             if(init_data){ |             if(init_data){ | ||||||
|                 auto* cb = reinterpret_cast<std::function<void(arch_if*, arch::traits<arch::${coreDef.name.toLowerCase()}>::reg_t, arch::traits<arch::${coreDef.name.toLowerCase()}>::reg_t)>*>(init_data); |                 auto* cb = reinterpret_cast<semihosting_cb_t<arch::traits<arch::${coreDef.name.toLowerCase()}>::reg_t>*>(init_data); | ||||||
|                 cpu->set_semihosting_callback(*cb); |                 cpu->set_semihosting_callback(*cb); | ||||||
|             } |             } | ||||||
|             return {cpu_ptr{cpu}, vm_ptr{vm}}; |             return {cpu_ptr{cpu}, vm_ptr{vm}}; | ||||||
|   | |||||||
							
								
								
									
										2
									
								
								softfloat/.gitignore
									
									
									
									
										vendored
									
									
										Normal file
									
								
							
							
						
						
									
										2
									
								
								softfloat/.gitignore
									
									
									
									
										vendored
									
									
										Normal file
									
								
							| @@ -0,0 +1,2 @@ | |||||||
|  | build/*/*.o | ||||||
|  | build/*/*.a | ||||||
							
								
								
									
										24
									
								
								softfloat/README.md
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										24
									
								
								softfloat/README.md
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,24 @@ | |||||||
|  |  | ||||||
|  | Package Overview for Berkeley SoftFloat Release 3e | ||||||
|  | ================================================== | ||||||
|  |  | ||||||
|  | John R. Hauser<br> | ||||||
|  | 2018 January 20 | ||||||
|  |  | ||||||
|  |  | ||||||
|  | Berkeley SoftFloat is a software implementation of binary floating-point | ||||||
|  | that conforms to the IEEE Standard for Floating-Point Arithmetic.  SoftFloat | ||||||
|  | is distributed in the form of C source code.  Building the SoftFloat sources | ||||||
|  | generates a library file (typically `softfloat.a` or `libsoftfloat.a`) | ||||||
|  | containing the floating-point subroutines. | ||||||
|  |  | ||||||
|  |  | ||||||
|  | The SoftFloat package is documented in the following files in the `doc` | ||||||
|  | subdirectory: | ||||||
|  |  | ||||||
|  | * [SoftFloat.html](http://www.jhauser.us/arithmetic/SoftFloat-3/doc/SoftFloat.html) Documentation for using the SoftFloat functions. | ||||||
|  | * [SoftFloat-source.html](http://www.jhauser.us/arithmetic/SoftFloat-3/doc/SoftFloat-source.html) Documentation for building SoftFloat. | ||||||
|  | * [SoftFloat-history.html](http://www.jhauser.us/arithmetic/SoftFloat-3/doc/SoftFloat-history.html) History of the major changes to SoftFloat. | ||||||
|  |  | ||||||
|  | Other files in the package comprise the source code for SoftFloat. | ||||||
|  |  | ||||||
| @@ -50,3 +50,4 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| #define SOFTFLOAT_BUILTIN_CLZ 1 | #define SOFTFLOAT_BUILTIN_CLZ 1 | ||||||
| #include "opts-GCC.h" | #include "opts-GCC.h" | ||||||
|  |  | ||||||
|   | |||||||
| @@ -50,3 +50,4 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| #define SOFTFLOAT_BUILTIN_CLZ 1 | #define SOFTFLOAT_BUILTIN_CLZ 1 | ||||||
| #include "opts-GCC.h" | #include "opts-GCC.h" | ||||||
|  |  | ||||||
|   | |||||||
| @@ -50,3 +50,4 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| #define SOFTFLOAT_BUILTIN_CLZ 1 | #define SOFTFLOAT_BUILTIN_CLZ 1 | ||||||
| #include "opts-GCC.h" | #include "opts-GCC.h" | ||||||
|  |  | ||||||
|   | |||||||
							
								
								
									
										399
									
								
								softfloat/build/Linux-RISCV64-GCC/Makefile
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										399
									
								
								softfloat/build/Linux-RISCV64-GCC/Makefile
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,399 @@ | |||||||
|  |  | ||||||
|  | #============================================================================= | ||||||
|  | # | ||||||
|  | # This Makefile is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||||
|  | # Package, Release 3e, by John R. Hauser. | ||||||
|  | # | ||||||
|  | # Copyright 2011, 2012, 2013, 2014, 2015, 2016, 2017 The Regents of the | ||||||
|  | # University of California.  All rights reserved. | ||||||
|  | # | ||||||
|  | # Redistribution and use in source and binary forms, with or without | ||||||
|  | # modification, are permitted provided that the following conditions are met: | ||||||
|  | # | ||||||
|  | #  1. Redistributions of source code must retain the above copyright notice, | ||||||
|  | #     this list of conditions, and the following disclaimer. | ||||||
|  | # | ||||||
|  | #  2. Redistributions in binary form must reproduce the above copyright | ||||||
|  | #     notice, this list of conditions, and the following disclaimer in the | ||||||
|  | #     documentation and/or other materials provided with the distribution. | ||||||
|  | # | ||||||
|  | #  3. Neither the name of the University nor the names of its contributors | ||||||
|  | #     may be used to endorse or promote products derived from this software | ||||||
|  | #     without specific prior written permission. | ||||||
|  | # | ||||||
|  | # THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY | ||||||
|  | # EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | ||||||
|  | # WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE | ||||||
|  | # DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY | ||||||
|  | # DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | ||||||
|  | # (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | ||||||
|  | # LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND | ||||||
|  | # ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | ||||||
|  | # (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF | ||||||
|  | # THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||||
|  | # | ||||||
|  | #============================================================================= | ||||||
|  |  | ||||||
|  | SOURCE_DIR ?= ../../source | ||||||
|  | SPECIALIZE_TYPE ?= RISCV | ||||||
|  | MARCH ?= rv64gcv_zfh_zfhmin | ||||||
|  | MABI ?= lp64d | ||||||
|  |  | ||||||
|  | SOFTFLOAT_OPTS ?= \ | ||||||
|  |   -DSOFTFLOAT_ROUND_ODD -DINLINE_LEVEL=5 -DSOFTFLOAT_FAST_DIV32TO16 \ | ||||||
|  |   -DSOFTFLOAT_FAST_DIV64TO32 | ||||||
|  |  | ||||||
|  | DELETE = rm -f | ||||||
|  | C_INCLUDES = -I. -I$(SOURCE_DIR)/$(SPECIALIZE_TYPE) -I$(SOURCE_DIR)/include | ||||||
|  | COMPILE_C = \ | ||||||
|  |   riscv64-unknown-linux-gnu-gcc -c -march=$(MARCH) -mabi=$(MABI) -Werror-implicit-function-declaration -DSOFTFLOAT_FAST_INT64 \ | ||||||
|  |     $(SOFTFLOAT_OPTS) $(C_INCLUDES) -O2 -o $@ | ||||||
|  | MAKELIB = ar crs $@ | ||||||
|  |  | ||||||
|  | OBJ = .o | ||||||
|  | LIB = .a | ||||||
|  |  | ||||||
|  | OTHER_HEADERS = $(SOURCE_DIR)/include/opts-GCC.h | ||||||
|  |  | ||||||
|  | .PHONY: all | ||||||
|  | all: softfloat$(LIB) | ||||||
|  |  | ||||||
|  | OBJS_PRIMITIVES = \ | ||||||
|  |   s_eq128$(OBJ) \ | ||||||
|  |   s_le128$(OBJ) \ | ||||||
|  |   s_lt128$(OBJ) \ | ||||||
|  |   s_shortShiftLeft128$(OBJ) \ | ||||||
|  |   s_shortShiftRight128$(OBJ) \ | ||||||
|  |   s_shortShiftRightJam64$(OBJ) \ | ||||||
|  |   s_shortShiftRightJam64Extra$(OBJ) \ | ||||||
|  |   s_shortShiftRightJam128$(OBJ) \ | ||||||
|  |   s_shortShiftRightJam128Extra$(OBJ) \ | ||||||
|  |   s_shiftRightJam32$(OBJ) \ | ||||||
|  |   s_shiftRightJam64$(OBJ) \ | ||||||
|  |   s_shiftRightJam64Extra$(OBJ) \ | ||||||
|  |   s_shiftRightJam128$(OBJ) \ | ||||||
|  |   s_shiftRightJam128Extra$(OBJ) \ | ||||||
|  |   s_shiftRightJam256M$(OBJ) \ | ||||||
|  |   s_countLeadingZeros8$(OBJ) \ | ||||||
|  |   s_countLeadingZeros16$(OBJ) \ | ||||||
|  |   s_countLeadingZeros32$(OBJ) \ | ||||||
|  |   s_countLeadingZeros64$(OBJ) \ | ||||||
|  |   s_add128$(OBJ) \ | ||||||
|  |   s_add256M$(OBJ) \ | ||||||
|  |   s_sub128$(OBJ) \ | ||||||
|  |   s_sub256M$(OBJ) \ | ||||||
|  |   s_mul64ByShifted32To128$(OBJ) \ | ||||||
|  |   s_mul64To128$(OBJ) \ | ||||||
|  |   s_mul128By32$(OBJ) \ | ||||||
|  |   s_mul128To256M$(OBJ) \ | ||||||
|  |   s_approxRecip_1Ks$(OBJ) \ | ||||||
|  |   s_approxRecip32_1$(OBJ) \ | ||||||
|  |   s_approxRecipSqrt_1Ks$(OBJ) \ | ||||||
|  |   s_approxRecipSqrt32_1$(OBJ) \ | ||||||
|  |  | ||||||
|  | OBJS_SPECIALIZE = \ | ||||||
|  |   softfloat_raiseFlags$(OBJ) \ | ||||||
|  |   s_f16UIToCommonNaN$(OBJ) \ | ||||||
|  |   s_commonNaNToF16UI$(OBJ) \ | ||||||
|  |   s_propagateNaNF16UI$(OBJ) \ | ||||||
|  |   s_bf16UIToCommonNaN$(OBJ) \ | ||||||
|  |   s_commonNaNToBF16UI$(OBJ) \ | ||||||
|  |   s_f32UIToCommonNaN$(OBJ) \ | ||||||
|  |   s_commonNaNToF32UI$(OBJ) \ | ||||||
|  |   s_propagateNaNF32UI$(OBJ) \ | ||||||
|  |   s_f64UIToCommonNaN$(OBJ) \ | ||||||
|  |   s_commonNaNToF64UI$(OBJ) \ | ||||||
|  |   s_propagateNaNF64UI$(OBJ) \ | ||||||
|  |   extF80M_isSignalingNaN$(OBJ) \ | ||||||
|  |   s_extF80UIToCommonNaN$(OBJ) \ | ||||||
|  |   s_commonNaNToExtF80UI$(OBJ) \ | ||||||
|  |   s_propagateNaNExtF80UI$(OBJ) \ | ||||||
|  |   f128M_isSignalingNaN$(OBJ) \ | ||||||
|  |   s_f128UIToCommonNaN$(OBJ) \ | ||||||
|  |   s_commonNaNToF128UI$(OBJ) \ | ||||||
|  |   s_propagateNaNF128UI$(OBJ) \ | ||||||
|  |  | ||||||
|  | OBJS_OTHERS = \ | ||||||
|  |   s_roundToUI32$(OBJ) \ | ||||||
|  |   s_roundToUI64$(OBJ) \ | ||||||
|  |   s_roundToI32$(OBJ) \ | ||||||
|  |   s_roundToI64$(OBJ) \ | ||||||
|  |   s_normSubnormalBF16Sig$(OBJ) \ | ||||||
|  |   s_roundPackToBF16$(OBJ) \ | ||||||
|  |   s_normSubnormalF16Sig$(OBJ) \ | ||||||
|  |   s_roundPackToF16$(OBJ) \ | ||||||
|  |   s_normRoundPackToF16$(OBJ) \ | ||||||
|  |   s_addMagsF16$(OBJ) \ | ||||||
|  |   s_subMagsF16$(OBJ) \ | ||||||
|  |   s_mulAddF16$(OBJ) \ | ||||||
|  |   s_normSubnormalF32Sig$(OBJ) \ | ||||||
|  |   s_roundPackToF32$(OBJ) \ | ||||||
|  |   s_normRoundPackToF32$(OBJ) \ | ||||||
|  |   s_addMagsF32$(OBJ) \ | ||||||
|  |   s_subMagsF32$(OBJ) \ | ||||||
|  |   s_mulAddF32$(OBJ) \ | ||||||
|  |   s_normSubnormalF64Sig$(OBJ) \ | ||||||
|  |   s_roundPackToF64$(OBJ) \ | ||||||
|  |   s_normRoundPackToF64$(OBJ) \ | ||||||
|  |   s_addMagsF64$(OBJ) \ | ||||||
|  |   s_subMagsF64$(OBJ) \ | ||||||
|  |   s_mulAddF64$(OBJ) \ | ||||||
|  |   s_normSubnormalExtF80Sig$(OBJ) \ | ||||||
|  |   s_roundPackToExtF80$(OBJ) \ | ||||||
|  |   s_normRoundPackToExtF80$(OBJ) \ | ||||||
|  |   s_addMagsExtF80$(OBJ) \ | ||||||
|  |   s_subMagsExtF80$(OBJ) \ | ||||||
|  |   s_normSubnormalF128Sig$(OBJ) \ | ||||||
|  |   s_roundPackToF128$(OBJ) \ | ||||||
|  |   s_normRoundPackToF128$(OBJ) \ | ||||||
|  |   s_addMagsF128$(OBJ) \ | ||||||
|  |   s_subMagsF128$(OBJ) \ | ||||||
|  |   s_mulAddF128$(OBJ) \ | ||||||
|  |   softfloat_state$(OBJ) \ | ||||||
|  |   ui32_to_f16$(OBJ) \ | ||||||
|  |   ui32_to_f32$(OBJ) \ | ||||||
|  |   ui32_to_f64$(OBJ) \ | ||||||
|  |   ui32_to_extF80$(OBJ) \ | ||||||
|  |   ui32_to_extF80M$(OBJ) \ | ||||||
|  |   ui32_to_f128$(OBJ) \ | ||||||
|  |   ui32_to_f128M$(OBJ) \ | ||||||
|  |   ui64_to_f16$(OBJ) \ | ||||||
|  |   ui64_to_f32$(OBJ) \ | ||||||
|  |   ui64_to_f64$(OBJ) \ | ||||||
|  |   ui64_to_extF80$(OBJ) \ | ||||||
|  |   ui64_to_extF80M$(OBJ) \ | ||||||
|  |   ui64_to_f128$(OBJ) \ | ||||||
|  |   ui64_to_f128M$(OBJ) \ | ||||||
|  |   i32_to_f16$(OBJ) \ | ||||||
|  |   i32_to_f32$(OBJ) \ | ||||||
|  |   i32_to_f64$(OBJ) \ | ||||||
|  |   i32_to_extF80$(OBJ) \ | ||||||
|  |   i32_to_extF80M$(OBJ) \ | ||||||
|  |   i32_to_f128$(OBJ) \ | ||||||
|  |   i32_to_f128M$(OBJ) \ | ||||||
|  |   i64_to_f16$(OBJ) \ | ||||||
|  |   i64_to_f32$(OBJ) \ | ||||||
|  |   i64_to_f64$(OBJ) \ | ||||||
|  |   i64_to_extF80$(OBJ) \ | ||||||
|  |   i64_to_extF80M$(OBJ) \ | ||||||
|  |   i64_to_f128$(OBJ) \ | ||||||
|  |   i64_to_f128M$(OBJ) \ | ||||||
|  |   bf16_isSignalingNaN$(OBJ) \ | ||||||
|  |   bf16_to_f32$(OBJ) \ | ||||||
|  |   f16_to_ui32$(OBJ) \ | ||||||
|  |   f16_to_ui64$(OBJ) \ | ||||||
|  |   f16_to_i32$(OBJ) \ | ||||||
|  |   f16_to_i64$(OBJ) \ | ||||||
|  |   f16_to_ui32_r_minMag$(OBJ) \ | ||||||
|  |   f16_to_ui64_r_minMag$(OBJ) \ | ||||||
|  |   f16_to_i32_r_minMag$(OBJ) \ | ||||||
|  |   f16_to_i64_r_minMag$(OBJ) \ | ||||||
|  |   f16_to_f32$(OBJ) \ | ||||||
|  |   f16_to_f64$(OBJ) \ | ||||||
|  |   f16_to_extF80$(OBJ) \ | ||||||
|  |   f16_to_extF80M$(OBJ) \ | ||||||
|  |   f16_to_f128$(OBJ) \ | ||||||
|  |   f16_to_f128M$(OBJ) \ | ||||||
|  |   f16_roundToInt$(OBJ) \ | ||||||
|  |   f16_add$(OBJ) \ | ||||||
|  |   f16_sub$(OBJ) \ | ||||||
|  |   f16_mul$(OBJ) \ | ||||||
|  |   f16_mulAdd$(OBJ) \ | ||||||
|  |   f16_div$(OBJ) \ | ||||||
|  |   f16_rem$(OBJ) \ | ||||||
|  |   f16_sqrt$(OBJ) \ | ||||||
|  |   f16_eq$(OBJ) \ | ||||||
|  |   f16_le$(OBJ) \ | ||||||
|  |   f16_lt$(OBJ) \ | ||||||
|  |   f16_eq_signaling$(OBJ) \ | ||||||
|  |   f16_le_quiet$(OBJ) \ | ||||||
|  |   f16_lt_quiet$(OBJ) \ | ||||||
|  |   f16_isSignalingNaN$(OBJ) \ | ||||||
|  |   f32_to_ui32$(OBJ) \ | ||||||
|  |   f32_to_ui64$(OBJ) \ | ||||||
|  |   f32_to_i32$(OBJ) \ | ||||||
|  |   f32_to_i64$(OBJ) \ | ||||||
|  |   f32_to_ui32_r_minMag$(OBJ) \ | ||||||
|  |   f32_to_ui64_r_minMag$(OBJ) \ | ||||||
|  |   f32_to_i32_r_minMag$(OBJ) \ | ||||||
|  |   f32_to_i64_r_minMag$(OBJ) \ | ||||||
|  |   f32_to_bf16$(OBJ) \ | ||||||
|  |   f32_to_f16$(OBJ) \ | ||||||
|  |   f32_to_f64$(OBJ) \ | ||||||
|  |   f32_to_extF80$(OBJ) \ | ||||||
|  |   f32_to_extF80M$(OBJ) \ | ||||||
|  |   f32_to_f128$(OBJ) \ | ||||||
|  |   f32_to_f128M$(OBJ) \ | ||||||
|  |   f32_roundToInt$(OBJ) \ | ||||||
|  |   f32_add$(OBJ) \ | ||||||
|  |   f32_sub$(OBJ) \ | ||||||
|  |   f32_mul$(OBJ) \ | ||||||
|  |   f32_mulAdd$(OBJ) \ | ||||||
|  |   f32_div$(OBJ) \ | ||||||
|  |   f32_rem$(OBJ) \ | ||||||
|  |   f32_sqrt$(OBJ) \ | ||||||
|  |   f32_eq$(OBJ) \ | ||||||
|  |   f32_le$(OBJ) \ | ||||||
|  |   f32_lt$(OBJ) \ | ||||||
|  |   f32_eq_signaling$(OBJ) \ | ||||||
|  |   f32_le_quiet$(OBJ) \ | ||||||
|  |   f32_lt_quiet$(OBJ) \ | ||||||
|  |   f32_isSignalingNaN$(OBJ) \ | ||||||
|  |   f64_to_ui32$(OBJ) \ | ||||||
|  |   f64_to_ui64$(OBJ) \ | ||||||
|  |   f64_to_i32$(OBJ) \ | ||||||
|  |   f64_to_i64$(OBJ) \ | ||||||
|  |   f64_to_ui32_r_minMag$(OBJ) \ | ||||||
|  |   f64_to_ui64_r_minMag$(OBJ) \ | ||||||
|  |   f64_to_i32_r_minMag$(OBJ) \ | ||||||
|  |   f64_to_i64_r_minMag$(OBJ) \ | ||||||
|  |   f64_to_f16$(OBJ) \ | ||||||
|  |   f64_to_f32$(OBJ) \ | ||||||
|  |   f64_to_extF80$(OBJ) \ | ||||||
|  |   f64_to_extF80M$(OBJ) \ | ||||||
|  |   f64_to_f128$(OBJ) \ | ||||||
|  |   f64_to_f128M$(OBJ) \ | ||||||
|  |   f64_roundToInt$(OBJ) \ | ||||||
|  |   f64_add$(OBJ) \ | ||||||
|  |   f64_sub$(OBJ) \ | ||||||
|  |   f64_mul$(OBJ) \ | ||||||
|  |   f64_mulAdd$(OBJ) \ | ||||||
|  |   f64_div$(OBJ) \ | ||||||
|  |   f64_rem$(OBJ) \ | ||||||
|  |   f64_sqrt$(OBJ) \ | ||||||
|  |   f64_eq$(OBJ) \ | ||||||
|  |   f64_le$(OBJ) \ | ||||||
|  |   f64_lt$(OBJ) \ | ||||||
|  |   f64_eq_signaling$(OBJ) \ | ||||||
|  |   f64_le_quiet$(OBJ) \ | ||||||
|  |   f64_lt_quiet$(OBJ) \ | ||||||
|  |   f64_isSignalingNaN$(OBJ) \ | ||||||
|  |   extF80_to_ui32$(OBJ) \ | ||||||
|  |   extF80_to_ui64$(OBJ) \ | ||||||
|  |   extF80_to_i32$(OBJ) \ | ||||||
|  |   extF80_to_i64$(OBJ) \ | ||||||
|  |   extF80_to_ui32_r_minMag$(OBJ) \ | ||||||
|  |   extF80_to_ui64_r_minMag$(OBJ) \ | ||||||
|  |   extF80_to_i32_r_minMag$(OBJ) \ | ||||||
|  |   extF80_to_i64_r_minMag$(OBJ) \ | ||||||
|  |   extF80_to_f16$(OBJ) \ | ||||||
|  |   extF80_to_f32$(OBJ) \ | ||||||
|  |   extF80_to_f64$(OBJ) \ | ||||||
|  |   extF80_to_f128$(OBJ) \ | ||||||
|  |   extF80_roundToInt$(OBJ) \ | ||||||
|  |   extF80_add$(OBJ) \ | ||||||
|  |   extF80_sub$(OBJ) \ | ||||||
|  |   extF80_mul$(OBJ) \ | ||||||
|  |   extF80_div$(OBJ) \ | ||||||
|  |   extF80_rem$(OBJ) \ | ||||||
|  |   extF80_sqrt$(OBJ) \ | ||||||
|  |   extF80_eq$(OBJ) \ | ||||||
|  |   extF80_le$(OBJ) \ | ||||||
|  |   extF80_lt$(OBJ) \ | ||||||
|  |   extF80_eq_signaling$(OBJ) \ | ||||||
|  |   extF80_le_quiet$(OBJ) \ | ||||||
|  |   extF80_lt_quiet$(OBJ) \ | ||||||
|  |   extF80_isSignalingNaN$(OBJ) \ | ||||||
|  |   extF80M_to_ui32$(OBJ) \ | ||||||
|  |   extF80M_to_ui64$(OBJ) \ | ||||||
|  |   extF80M_to_i32$(OBJ) \ | ||||||
|  |   extF80M_to_i64$(OBJ) \ | ||||||
|  |   extF80M_to_ui32_r_minMag$(OBJ) \ | ||||||
|  |   extF80M_to_ui64_r_minMag$(OBJ) \ | ||||||
|  |   extF80M_to_i32_r_minMag$(OBJ) \ | ||||||
|  |   extF80M_to_i64_r_minMag$(OBJ) \ | ||||||
|  |   extF80M_to_f16$(OBJ) \ | ||||||
|  |   extF80M_to_f32$(OBJ) \ | ||||||
|  |   extF80M_to_f64$(OBJ) \ | ||||||
|  |   extF80M_to_f128M$(OBJ) \ | ||||||
|  |   extF80M_roundToInt$(OBJ) \ | ||||||
|  |   extF80M_add$(OBJ) \ | ||||||
|  |   extF80M_sub$(OBJ) \ | ||||||
|  |   extF80M_mul$(OBJ) \ | ||||||
|  |   extF80M_div$(OBJ) \ | ||||||
|  |   extF80M_rem$(OBJ) \ | ||||||
|  |   extF80M_sqrt$(OBJ) \ | ||||||
|  |   extF80M_eq$(OBJ) \ | ||||||
|  |   extF80M_le$(OBJ) \ | ||||||
|  |   extF80M_lt$(OBJ) \ | ||||||
|  |   extF80M_eq_signaling$(OBJ) \ | ||||||
|  |   extF80M_le_quiet$(OBJ) \ | ||||||
|  |   extF80M_lt_quiet$(OBJ) \ | ||||||
|  |   f128_to_ui32$(OBJ) \ | ||||||
|  |   f128_to_ui64$(OBJ) \ | ||||||
|  |   f128_to_i32$(OBJ) \ | ||||||
|  |   f128_to_i64$(OBJ) \ | ||||||
|  |   f128_to_ui32_r_minMag$(OBJ) \ | ||||||
|  |   f128_to_ui64_r_minMag$(OBJ) \ | ||||||
|  |   f128_to_i32_r_minMag$(OBJ) \ | ||||||
|  |   f128_to_i64_r_minMag$(OBJ) \ | ||||||
|  |   f128_to_f16$(OBJ) \ | ||||||
|  |   f128_to_f32$(OBJ) \ | ||||||
|  |   f128_to_extF80$(OBJ) \ | ||||||
|  |   f128_to_f64$(OBJ) \ | ||||||
|  |   f128_roundToInt$(OBJ) \ | ||||||
|  |   f128_add$(OBJ) \ | ||||||
|  |   f128_sub$(OBJ) \ | ||||||
|  |   f128_mul$(OBJ) \ | ||||||
|  |   f128_mulAdd$(OBJ) \ | ||||||
|  |   f128_div$(OBJ) \ | ||||||
|  |   f128_rem$(OBJ) \ | ||||||
|  |   f128_sqrt$(OBJ) \ | ||||||
|  |   f128_eq$(OBJ) \ | ||||||
|  |   f128_le$(OBJ) \ | ||||||
|  |   f128_lt$(OBJ) \ | ||||||
|  |   f128_eq_signaling$(OBJ) \ | ||||||
|  |   f128_le_quiet$(OBJ) \ | ||||||
|  |   f128_lt_quiet$(OBJ) \ | ||||||
|  |   f128_isSignalingNaN$(OBJ) \ | ||||||
|  |   f128M_to_ui32$(OBJ) \ | ||||||
|  |   f128M_to_ui64$(OBJ) \ | ||||||
|  |   f128M_to_i32$(OBJ) \ | ||||||
|  |   f128M_to_i64$(OBJ) \ | ||||||
|  |   f128M_to_ui32_r_minMag$(OBJ) \ | ||||||
|  |   f128M_to_ui64_r_minMag$(OBJ) \ | ||||||
|  |   f128M_to_i32_r_minMag$(OBJ) \ | ||||||
|  |   f128M_to_i64_r_minMag$(OBJ) \ | ||||||
|  |   f128M_to_f16$(OBJ) \ | ||||||
|  |   f128M_to_f32$(OBJ) \ | ||||||
|  |   f128M_to_extF80M$(OBJ) \ | ||||||
|  |   f128M_to_f64$(OBJ) \ | ||||||
|  |   f128M_roundToInt$(OBJ) \ | ||||||
|  |   f128M_add$(OBJ) \ | ||||||
|  |   f128M_sub$(OBJ) \ | ||||||
|  |   f128M_mul$(OBJ) \ | ||||||
|  |   f128M_mulAdd$(OBJ) \ | ||||||
|  |   f128M_div$(OBJ) \ | ||||||
|  |   f128M_rem$(OBJ) \ | ||||||
|  |   f128M_sqrt$(OBJ) \ | ||||||
|  |   f128M_eq$(OBJ) \ | ||||||
|  |   f128M_le$(OBJ) \ | ||||||
|  |   f128M_lt$(OBJ) \ | ||||||
|  |   f128M_eq_signaling$(OBJ) \ | ||||||
|  |   f128M_le_quiet$(OBJ) \ | ||||||
|  |   f128M_lt_quiet$(OBJ) \ | ||||||
|  |  | ||||||
|  | OBJS_ALL = $(OBJS_PRIMITIVES) $(OBJS_SPECIALIZE) $(OBJS_OTHERS) | ||||||
|  |  | ||||||
|  | $(OBJS_ALL): \ | ||||||
|  |   $(OTHER_HEADERS) platform.h $(SOURCE_DIR)/include/primitiveTypes.h \ | ||||||
|  |   $(SOURCE_DIR)/include/primitives.h | ||||||
|  | $(OBJS_SPECIALIZE) $(OBJS_OTHERS): \ | ||||||
|  |   $(SOURCE_DIR)/include/softfloat_types.h $(SOURCE_DIR)/include/internals.h \ | ||||||
|  |   $(SOURCE_DIR)/$(SPECIALIZE_TYPE)/specialize.h \ | ||||||
|  |   $(SOURCE_DIR)/include/softfloat.h | ||||||
|  |  | ||||||
|  | $(OBJS_PRIMITIVES) $(OBJS_OTHERS): %$(OBJ): $(SOURCE_DIR)/%.c | ||||||
|  | 	$(COMPILE_C) $(SOURCE_DIR)/$*.c | ||||||
|  |  | ||||||
|  | $(OBJS_SPECIALIZE): %$(OBJ): $(SOURCE_DIR)/$(SPECIALIZE_TYPE)/%.c | ||||||
|  | 	$(COMPILE_C) $(SOURCE_DIR)/$(SPECIALIZE_TYPE)/$*.c | ||||||
|  |  | ||||||
|  | softfloat$(LIB): $(OBJS_ALL) | ||||||
|  | 	$(DELETE) $@ | ||||||
|  | 	$(MAKELIB) $^ | ||||||
|  |  | ||||||
|  | .PHONY: clean | ||||||
|  | clean: | ||||||
|  | 	$(DELETE) $(OBJS_ALL) softfloat$(LIB) | ||||||
|  |  | ||||||
							
								
								
									
										54
									
								
								softfloat/build/Linux-RISCV64-GCC/platform.h
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										54
									
								
								softfloat/build/Linux-RISCV64-GCC/platform.h
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,54 @@ | |||||||
|  |  | ||||||
|  | /*============================================================================ | ||||||
|  |  | ||||||
|  | This C header file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||||
|  | Package, Release 3e, by John R. Hauser. | ||||||
|  |  | ||||||
|  | Copyright 2011, 2012, 2013, 2014, 2015, 2016, 2017 The Regents of the | ||||||
|  | University of California.  All rights reserved. | ||||||
|  |  | ||||||
|  | Redistribution and use in source and binary forms, with or without | ||||||
|  | modification, are permitted provided that the following conditions are met: | ||||||
|  |  | ||||||
|  |  1. Redistributions of source code must retain the above copyright notice, | ||||||
|  |     this list of conditions, and the following disclaimer. | ||||||
|  |  | ||||||
|  |  2. Redistributions in binary form must reproduce the above copyright notice, | ||||||
|  |     this list of conditions, and the following disclaimer in the documentation | ||||||
|  |     and/or other materials provided with the distribution. | ||||||
|  |  | ||||||
|  |  3. Neither the name of the University nor the names of its contributors may | ||||||
|  |     be used to endorse or promote products derived from this software without | ||||||
|  |     specific prior written permission. | ||||||
|  |  | ||||||
|  | THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY | ||||||
|  | EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | ||||||
|  | WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE | ||||||
|  | DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY | ||||||
|  | DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | ||||||
|  | (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | ||||||
|  | LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND | ||||||
|  | ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | ||||||
|  | (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||||
|  | SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||||
|  |  | ||||||
|  | =============================================================================*/ | ||||||
|  |  | ||||||
|  | /*---------------------------------------------------------------------------- | ||||||
|  | *----------------------------------------------------------------------------*/ | ||||||
|  | #define LITTLEENDIAN 1 | ||||||
|  |  | ||||||
|  | /*---------------------------------------------------------------------------- | ||||||
|  | *----------------------------------------------------------------------------*/ | ||||||
|  | #ifdef __GNUC_STDC_INLINE__ | ||||||
|  | #define INLINE inline | ||||||
|  | #else | ||||||
|  | #define INLINE extern inline | ||||||
|  | #endif | ||||||
|  |  | ||||||
|  | /*---------------------------------------------------------------------------- | ||||||
|  | *----------------------------------------------------------------------------*/ | ||||||
|  | #define SOFTFLOAT_BUILTIN_CLZ 1 | ||||||
|  | #define SOFTFLOAT_INTRINSIC_INT128 1 | ||||||
|  | #include "opts-GCC.h" | ||||||
|  |  | ||||||
| @@ -94,6 +94,8 @@ OBJS_SPECIALIZE = \ | |||||||
|   s_f16UIToCommonNaN$(OBJ) \ |   s_f16UIToCommonNaN$(OBJ) \ | ||||||
|   s_commonNaNToF16UI$(OBJ) \ |   s_commonNaNToF16UI$(OBJ) \ | ||||||
|   s_propagateNaNF16UI$(OBJ) \ |   s_propagateNaNF16UI$(OBJ) \ | ||||||
|  |   s_bf16UIToCommonNaN$(OBJ) \ | ||||||
|  |   s_commonNaNToBF16UI$(OBJ) \ | ||||||
|   s_f32UIToCommonNaN$(OBJ) \ |   s_f32UIToCommonNaN$(OBJ) \ | ||||||
|   s_commonNaNToF32UI$(OBJ) \ |   s_commonNaNToF32UI$(OBJ) \ | ||||||
|   s_propagateNaNF32UI$(OBJ) \ |   s_propagateNaNF32UI$(OBJ) \ | ||||||
| @@ -114,6 +116,8 @@ OBJS_OTHERS = \ | |||||||
|   s_roundToUI64$(OBJ) \ |   s_roundToUI64$(OBJ) \ | ||||||
|   s_roundToI32$(OBJ) \ |   s_roundToI32$(OBJ) \ | ||||||
|   s_roundToI64$(OBJ) \ |   s_roundToI64$(OBJ) \ | ||||||
|  |   s_normSubnormalBF16Sig$(OBJ) \ | ||||||
|  |   s_roundPackToBF16$(OBJ) \ | ||||||
|   s_normSubnormalF16Sig$(OBJ) \ |   s_normSubnormalF16Sig$(OBJ) \ | ||||||
|   s_roundPackToF16$(OBJ) \ |   s_roundPackToF16$(OBJ) \ | ||||||
|   s_normRoundPackToF16$(OBJ) \ |   s_normRoundPackToF16$(OBJ) \ | ||||||
| @@ -172,6 +176,8 @@ OBJS_OTHERS = \ | |||||||
|   i64_to_extF80M$(OBJ) \ |   i64_to_extF80M$(OBJ) \ | ||||||
|   i64_to_f128$(OBJ) \ |   i64_to_f128$(OBJ) \ | ||||||
|   i64_to_f128M$(OBJ) \ |   i64_to_f128M$(OBJ) \ | ||||||
|  |   bf16_isSignalingNaN$(OBJ) \ | ||||||
|  |   bf16_to_f32$(OBJ) \ | ||||||
|   f16_to_ui32$(OBJ) \ |   f16_to_ui32$(OBJ) \ | ||||||
|   f16_to_ui64$(OBJ) \ |   f16_to_ui64$(OBJ) \ | ||||||
|   f16_to_i32$(OBJ) \ |   f16_to_i32$(OBJ) \ | ||||||
| @@ -209,6 +215,7 @@ OBJS_OTHERS = \ | |||||||
|   f32_to_ui64_r_minMag$(OBJ) \ |   f32_to_ui64_r_minMag$(OBJ) \ | ||||||
|   f32_to_i32_r_minMag$(OBJ) \ |   f32_to_i32_r_minMag$(OBJ) \ | ||||||
|   f32_to_i64_r_minMag$(OBJ) \ |   f32_to_i64_r_minMag$(OBJ) \ | ||||||
|  |   f32_to_bf16$(OBJ) \ | ||||||
|   f32_to_f16$(OBJ) \ |   f32_to_f16$(OBJ) \ | ||||||
|   f32_to_f64$(OBJ) \ |   f32_to_f64$(OBJ) \ | ||||||
|   f32_to_extF80$(OBJ) \ |   f32_to_extF80$(OBJ) \ | ||||||
|   | |||||||
| @@ -50,3 +50,4 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| #define SOFTFLOAT_BUILTIN_CLZ 1 | #define SOFTFLOAT_BUILTIN_CLZ 1 | ||||||
| #include "opts-GCC.h" | #include "opts-GCC.h" | ||||||
|  |  | ||||||
|   | |||||||
| @@ -50,3 +50,4 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| #define SOFTFLOAT_BUILTIN_CLZ 1 | #define SOFTFLOAT_BUILTIN_CLZ 1 | ||||||
| #include "opts-GCC.h" | #include "opts-GCC.h" | ||||||
|  |  | ||||||
|   | |||||||
| @@ -51,3 +51,4 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |||||||
| #define SOFTFLOAT_BUILTIN_CLZ 1 | #define SOFTFLOAT_BUILTIN_CLZ 1 | ||||||
| #define SOFTFLOAT_INTRINSIC_INT128 1 | #define SOFTFLOAT_INTRINSIC_INT128 1 | ||||||
| #include "opts-GCC.h" | #include "opts-GCC.h" | ||||||
|  |  | ||||||
|   | |||||||
| @@ -115,6 +115,8 @@ OBJS_OTHERS = \ | |||||||
|   s_roundToUI64$(OBJ) \ |   s_roundToUI64$(OBJ) \ | ||||||
|   s_roundToI32$(OBJ) \ |   s_roundToI32$(OBJ) \ | ||||||
|   s_roundToI64$(OBJ) \ |   s_roundToI64$(OBJ) \ | ||||||
|  |   s_normSubnormalBF16Sig$(OBJ) \ | ||||||
|  |   s_roundPackToBF16$(OBJ) \ | ||||||
|   s_normSubnormalF16Sig$(OBJ) \ |   s_normSubnormalF16Sig$(OBJ) \ | ||||||
|   s_roundPackToF16$(OBJ) \ |   s_roundPackToF16$(OBJ) \ | ||||||
|   s_normRoundPackToF16$(OBJ) \ |   s_normRoundPackToF16$(OBJ) \ | ||||||
| @@ -173,6 +175,8 @@ OBJS_OTHERS = \ | |||||||
|   i64_to_extF80M$(OBJ) \ |   i64_to_extF80M$(OBJ) \ | ||||||
|   i64_to_f128$(OBJ) \ |   i64_to_f128$(OBJ) \ | ||||||
|   i64_to_f128M$(OBJ) \ |   i64_to_f128M$(OBJ) \ | ||||||
|  |   bf16_isSignalingNaN$(OBJ) \ | ||||||
|  |   bf16_to_f32$(OBJ) \ | ||||||
|   f16_to_ui32$(OBJ) \ |   f16_to_ui32$(OBJ) \ | ||||||
|   f16_to_ui64$(OBJ) \ |   f16_to_ui64$(OBJ) \ | ||||||
|   f16_to_i32$(OBJ) \ |   f16_to_i32$(OBJ) \ | ||||||
| @@ -210,6 +214,7 @@ OBJS_OTHERS = \ | |||||||
|   f32_to_ui64_r_minMag$(OBJ) \ |   f32_to_ui64_r_minMag$(OBJ) \ | ||||||
|   f32_to_i32_r_minMag$(OBJ) \ |   f32_to_i32_r_minMag$(OBJ) \ | ||||||
|   f32_to_i64_r_minMag$(OBJ) \ |   f32_to_i64_r_minMag$(OBJ) \ | ||||||
|  |   f32_to_bf16$(OBJ) \ | ||||||
|   f32_to_f16$(OBJ) \ |   f32_to_f16$(OBJ) \ | ||||||
|   f32_to_f64$(OBJ) \ |   f32_to_f64$(OBJ) \ | ||||||
|   f32_to_extF80$(OBJ) \ |   f32_to_extF80$(OBJ) \ | ||||||
|   | |||||||
| @@ -47,3 +47,4 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| ==> #define THREAD_LOCAL _Thread_local | ==> #define THREAD_LOCAL _Thread_local | ||||||
|  |  | ||||||
|   | |||||||
| @@ -47,3 +47,4 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| ==> #define THREAD_LOCAL _Thread_local | ==> #define THREAD_LOCAL _Thread_local | ||||||
|  |  | ||||||
|   | |||||||
| @@ -508,7 +508,7 @@ significant extra cost. | |||||||
| On computers where the word size is <NOBR>64 bits</NOBR> or larger, both | On computers where the word size is <NOBR>64 bits</NOBR> or larger, both | ||||||
| function versions (<CODE>f128M_add</CODE> and <CODE>f128_add</CODE>) are | function versions (<CODE>f128M_add</CODE> and <CODE>f128_add</CODE>) are | ||||||
| provided, because the cost of passing by value is then more reasonable. | provided, because the cost of passing by value is then more reasonable. | ||||||
| Applications that must be portable accross both classes of computers must use | Applications that must be portable across both classes of computers must use | ||||||
| the pointer-based functions, as these are always implemented. | the pointer-based functions, as these are always implemented. | ||||||
| However, if it is known that SoftFloat includes the by-value functions for all | However, if it is known that SoftFloat includes the by-value functions for all | ||||||
| platforms of interest, programmers can use whichever version they prefer. | platforms of interest, programmers can use whichever version they prefer. | ||||||
|   | |||||||
							
								
								
									
										59
									
								
								softfloat/source/8086-SSE/s_bf16UIToCommonNaN.c
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										59
									
								
								softfloat/source/8086-SSE/s_bf16UIToCommonNaN.c
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,59 @@ | |||||||
|  |  | ||||||
|  | /*============================================================================ | ||||||
|  |  | ||||||
|  | This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||||
|  | Package, Release 3e, by John R. Hauser. | ||||||
|  |  | ||||||
|  | Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | ||||||
|  | All rights reserved. | ||||||
|  |  | ||||||
|  | Redistribution and use in source and binary forms, with or without | ||||||
|  | modification, are permitted provided that the following conditions are met: | ||||||
|  |  | ||||||
|  |  1. Redistributions of source code must retain the above copyright notice, | ||||||
|  |     this list of conditions, and the following disclaimer. | ||||||
|  |  | ||||||
|  |  2. Redistributions in binary form must reproduce the above copyright notice, | ||||||
|  |     this list of conditions, and the following disclaimer in the documentation | ||||||
|  |     and/or other materials provided with the distribution. | ||||||
|  |  | ||||||
|  |  3. Neither the name of the University nor the names of its contributors may | ||||||
|  |     be used to endorse or promote products derived from this software without | ||||||
|  |     specific prior written permission. | ||||||
|  |  | ||||||
|  | THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY | ||||||
|  | EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | ||||||
|  | WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE | ||||||
|  | DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY | ||||||
|  | DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | ||||||
|  | (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | ||||||
|  | LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND | ||||||
|  | ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | ||||||
|  | (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||||
|  | SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||||
|  |  | ||||||
|  | =============================================================================*/ | ||||||
|  |  | ||||||
|  | #include <stdint.h> | ||||||
|  | #include "platform.h" | ||||||
|  | #include "specialize.h" | ||||||
|  | #include "softfloat.h" | ||||||
|  |  | ||||||
|  | /*---------------------------------------------------------------------------- | ||||||
|  | | Assuming `uiA' has the bit pattern of a BF16 NaN, converts | ||||||
|  | | this NaN to the common NaN form, and stores the resulting common NaN at the | ||||||
|  | | location pointed to by `zPtr'.  If the NaN is a signaling NaN, the invalid | ||||||
|  | | exception is raised. | ||||||
|  | *----------------------------------------------------------------------------*/ | ||||||
|  | void softfloat_bf16UIToCommonNaN( uint_fast16_t uiA, struct commonNaN *zPtr ) | ||||||
|  | { | ||||||
|  |  | ||||||
|  |     if ( softfloat_isSigNaNBF16UI( uiA ) ) { | ||||||
|  |         softfloat_raiseFlags( softfloat_flag_invalid ); | ||||||
|  |     } | ||||||
|  |     zPtr->sign = uiA>>15; | ||||||
|  |     zPtr->v64  = (uint_fast64_t) uiA<<56; | ||||||
|  |     zPtr->v0   = 0; | ||||||
|  |  | ||||||
|  | } | ||||||
|  |  | ||||||
							
								
								
									
										51
									
								
								softfloat/source/8086-SSE/s_commonNaNToBF16UI.c
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										51
									
								
								softfloat/source/8086-SSE/s_commonNaNToBF16UI.c
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,51 @@ | |||||||
|  |  | ||||||
|  | /*============================================================================ | ||||||
|  |  | ||||||
|  | This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||||
|  | Package, Release 3e, by John R. Hauser. | ||||||
|  |  | ||||||
|  | Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | ||||||
|  | All rights reserved. | ||||||
|  |  | ||||||
|  | Redistribution and use in source and binary forms, with or without | ||||||
|  | modification, are permitted provided that the following conditions are met: | ||||||
|  |  | ||||||
|  |  1. Redistributions of source code must retain the above copyright notice, | ||||||
|  |     this list of conditions, and the following disclaimer. | ||||||
|  |  | ||||||
|  |  2. Redistributions in binary form must reproduce the above copyright notice, | ||||||
|  |     this list of conditions, and the following disclaimer in the documentation | ||||||
|  |     and/or other materials provided with the distribution. | ||||||
|  |  | ||||||
|  |  3. Neither the name of the University nor the names of its contributors may | ||||||
|  |     be used to endorse or promote products derived from this software without | ||||||
|  |     specific prior written permission. | ||||||
|  |  | ||||||
|  | THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY | ||||||
|  | EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | ||||||
|  | WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE | ||||||
|  | DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY | ||||||
|  | DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | ||||||
|  | (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | ||||||
|  | LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND | ||||||
|  | ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | ||||||
|  | (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||||
|  | SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||||
|  |  | ||||||
|  | =============================================================================*/ | ||||||
|  |  | ||||||
|  | #include <stdint.h> | ||||||
|  | #include "platform.h" | ||||||
|  | #include "specialize.h" | ||||||
|  |  | ||||||
|  | /*---------------------------------------------------------------------------- | ||||||
|  | | Converts the common NaN pointed to by `aPtr' into a BF16 NaN, and  | ||||||
|  | | returns the bit pattern of this value as an unsigned integer. | ||||||
|  | *----------------------------------------------------------------------------*/ | ||||||
|  | uint_fast16_t softfloat_commonNaNToBF16UI( const struct commonNaN *aPtr ) | ||||||
|  | { | ||||||
|  |  | ||||||
|  |     return (uint_fast16_t) aPtr->sign<<15 | 0x7FC0 | aPtr->v64>>56; | ||||||
|  |  | ||||||
|  | } | ||||||
|  |  | ||||||
| @@ -116,6 +116,27 @@ uint_fast16_t softfloat_commonNaNToF16UI(const struct commonNaN* aPtr); | |||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| uint_fast16_t softfloat_propagateNaNF16UI(uint_fast16_t uiA, uint_fast16_t uiB); | uint_fast16_t softfloat_propagateNaNF16UI(uint_fast16_t uiA, uint_fast16_t uiB); | ||||||
|  |  | ||||||
|  | /*---------------------------------------------------------------------------- | ||||||
|  | | Returns true when 16-bit unsigned integer 'uiA' has the bit pattern of a | ||||||
|  | | 16-bit brain floating-point (BF16) signaling NaN. | ||||||
|  | | Note:  This macro evaluates its argument more than once. | ||||||
|  | *----------------------------------------------------------------------------*/ | ||||||
|  | #define softfloat_isSigNaNBF16UI(uiA) ((((uiA)&0x7FC0) == 0x7F80) && ((uiA)&0x003F)) | ||||||
|  |  | ||||||
|  | /*---------------------------------------------------------------------------- | ||||||
|  | | Assuming 'uiA' has the bit pattern of a 16-bit BF16 floating-point NaN, converts | ||||||
|  | | this NaN to the common NaN form, and stores the resulting common NaN at the | ||||||
|  | | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | ||||||
|  | | exception is raised. | ||||||
|  | *----------------------------------------------------------------------------*/ | ||||||
|  | void softfloat_bf16UIToCommonNaN(uint_fast16_t uiA, struct commonNaN* zPtr); | ||||||
|  |  | ||||||
|  | /*---------------------------------------------------------------------------- | ||||||
|  | | Converts the common NaN pointed to by 'aPtr' into a 16-bit floating-point | ||||||
|  | | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||||
|  | *----------------------------------------------------------------------------*/ | ||||||
|  | uint_fast16_t softfloat_commonNaNToBF16UI(const struct commonNaN* aPtr); | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | The bit pattern for a default generated 32-bit floating-point NaN. | | The bit pattern for a default generated 32-bit floating-point NaN. | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
|   | |||||||
							
								
								
									
										5
									
								
								softfloat/source/RISCV/s_bf16UIToCommonNaN.c
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										5
									
								
								softfloat/source/RISCV/s_bf16UIToCommonNaN.c
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,5 @@ | |||||||
|  |  | ||||||
|  | /*---------------------------------------------------------------------------- | ||||||
|  | | This file intentionally contains no code. | ||||||
|  | *----------------------------------------------------------------------------*/ | ||||||
|  |  | ||||||
							
								
								
									
										5
									
								
								softfloat/source/RISCV/s_commonNaNToBF16UI.c
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										5
									
								
								softfloat/source/RISCV/s_commonNaNToBF16UI.c
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,5 @@ | |||||||
|  |  | ||||||
|  | /*---------------------------------------------------------------------------- | ||||||
|  | | This file intentionally contains no code. | ||||||
|  | *----------------------------------------------------------------------------*/ | ||||||
|  |  | ||||||
| @@ -4,8 +4,8 @@ | |||||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||||
| Package, Release 3e, by John R. Hauser. | Package, Release 3e, by John R. Hauser. | ||||||
|  |  | ||||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of | ||||||
| All rights reserved. | California.  All rights reserved. | ||||||
|  |  | ||||||
| Redistribution and use in source and binary forms, with or without | Redistribution and use in source and binary forms, with or without | ||||||
| modification, are permitted provided that the following conditions are met: | modification, are permitted provided that the following conditions are met: | ||||||
| @@ -34,9 +34,10 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |||||||
|  |  | ||||||
| =============================================================================*/ | =============================================================================*/ | ||||||
|  |  | ||||||
| #include <stdint.h> |  | ||||||
| #include "platform.h" | #include "platform.h" | ||||||
| #include "internals.h" | #include "softfloat_types.h" | ||||||
|  |  | ||||||
|  | #define softfloat_commonNaNToExtF80M softfloat_commonNaNToExtF80M | ||||||
| #include "specialize.h" | #include "specialize.h" | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| @@ -49,8 +50,8 @@ void | |||||||
|      const struct commonNaN *aPtr, struct extFloat80M *zSPtr ) |      const struct commonNaN *aPtr, struct extFloat80M *zSPtr ) | ||||||
| { | { | ||||||
|  |  | ||||||
|     zSPtr->signExp = packToExtF80UI64( aPtr->sign, 0x7FFF ); |     zSPtr->signExp = defaultNaNExtF80UI64; | ||||||
|     zSPtr->signif = UINT64_C( 0xC000000000000000 ) | aPtr->v64>>1; |     zSPtr->signif  = defaultNaNExtF80UI0; | ||||||
|  |  | ||||||
| } | } | ||||||
|  |  | ||||||
|   | |||||||
| @@ -4,8 +4,8 @@ | |||||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||||
| Package, Release 3e, by John R. Hauser. | Package, Release 3e, by John R. Hauser. | ||||||
|  |  | ||||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of | ||||||
| All rights reserved. | California.  All rights reserved. | ||||||
|  |  | ||||||
| Redistribution and use in source and binary forms, with or without | Redistribution and use in source and binary forms, with or without | ||||||
| modification, are permitted provided that the following conditions are met: | modification, are permitted provided that the following conditions are met: | ||||||
| @@ -34,9 +34,10 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |||||||
|  |  | ||||||
| =============================================================================*/ | =============================================================================*/ | ||||||
|  |  | ||||||
| #include <stdint.h> |  | ||||||
| #include "platform.h" | #include "platform.h" | ||||||
| #include "primitives.h" | #include "primitiveTypes.h" | ||||||
|  |  | ||||||
|  | #define softfloat_commonNaNToExtF80UI softfloat_commonNaNToExtF80UI | ||||||
| #include "specialize.h" | #include "specialize.h" | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| @@ -48,8 +49,8 @@ struct uint128 softfloat_commonNaNToExtF80UI( const struct commonNaN *aPtr ) | |||||||
| { | { | ||||||
|     struct uint128 uiZ; |     struct uint128 uiZ; | ||||||
|  |  | ||||||
|     uiZ.v64 = (uint_fast16_t) aPtr->sign<<15 | 0x7FFF; |     uiZ.v64 = defaultNaNExtF80UI64; | ||||||
|     uiZ.v0 = UINT64_C( 0xC000000000000000 ) | aPtr->v64>>1; |     uiZ.v0  = defaultNaNExtF80UI0; | ||||||
|     return uiZ; |     return uiZ; | ||||||
|  |  | ||||||
| } | } | ||||||
|   | |||||||
| @@ -4,8 +4,8 @@ | |||||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||||
| Package, Release 3e, by John R. Hauser. | Package, Release 3e, by John R. Hauser. | ||||||
|  |  | ||||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of | ||||||
| All rights reserved. | California.  All rights reserved. | ||||||
|  |  | ||||||
| Redistribution and use in source and binary forms, with or without | Redistribution and use in source and binary forms, with or without | ||||||
| modification, are permitted provided that the following conditions are met: | modification, are permitted provided that the following conditions are met: | ||||||
| @@ -36,7 +36,9 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |||||||
|  |  | ||||||
| #include <stdint.h> | #include <stdint.h> | ||||||
| #include "platform.h" | #include "platform.h" | ||||||
| #include "primitives.h" | #include "primitiveTypes.h" | ||||||
|  |  | ||||||
|  | #define softfloat_commonNaNToF128M softfloat_commonNaNToF128M | ||||||
| #include "specialize.h" | #include "specialize.h" | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| @@ -49,8 +51,10 @@ void | |||||||
|  softfloat_commonNaNToF128M( const struct commonNaN *aPtr, uint32_t *zWPtr ) |  softfloat_commonNaNToF128M( const struct commonNaN *aPtr, uint32_t *zWPtr ) | ||||||
| { | { | ||||||
|  |  | ||||||
|     softfloat_shortShiftRight128M( (const uint32_t *) &aPtr->v0, 16, zWPtr ); |     zWPtr[indexWord( 4, 3 )] = defaultNaNF128UI96; | ||||||
|     zWPtr[indexWordHi( 4 )] |= (uint32_t) aPtr->sign<<31 | 0x7FFF8000; |     zWPtr[indexWord( 4, 2 )] = defaultNaNF128UI64; | ||||||
|  |     zWPtr[indexWord( 4, 1 )] = defaultNaNF128UI32; | ||||||
|  |     zWPtr[indexWord( 4, 0 )] = defaultNaNF128UI0; | ||||||
|  |  | ||||||
| } | } | ||||||
|  |  | ||||||
|   | |||||||
| @@ -4,8 +4,8 @@ | |||||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||||
| Package, Release 3e, by John R. Hauser. | Package, Release 3e, by John R. Hauser. | ||||||
|  |  | ||||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of | ||||||
| All rights reserved. | California.  All rights reserved. | ||||||
|  |  | ||||||
| Redistribution and use in source and binary forms, with or without | Redistribution and use in source and binary forms, with or without | ||||||
| modification, are permitted provided that the following conditions are met: | modification, are permitted provided that the following conditions are met: | ||||||
| @@ -34,9 +34,10 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |||||||
|  |  | ||||||
| =============================================================================*/ | =============================================================================*/ | ||||||
|  |  | ||||||
| #include <stdint.h> |  | ||||||
| #include "platform.h" | #include "platform.h" | ||||||
| #include "primitives.h" | #include "primitiveTypes.h" | ||||||
|  |  | ||||||
|  | #define softfloat_commonNaNToF128UI softfloat_commonNaNToF128UI | ||||||
| #include "specialize.h" | #include "specialize.h" | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| @@ -47,8 +48,8 @@ struct uint128 softfloat_commonNaNToF128UI( const struct commonNaN *aPtr ) | |||||||
| { | { | ||||||
|     struct uint128 uiZ; |     struct uint128 uiZ; | ||||||
|  |  | ||||||
|     uiZ = softfloat_shortShiftRight128( aPtr->v64, aPtr->v0, 16 ); |     uiZ.v64 = defaultNaNF128UI64; | ||||||
|     uiZ.v64 |= (uint_fast64_t) aPtr->sign<<63 | UINT64_C( 0x7FFF800000000000 ); |     uiZ.v0  = defaultNaNF128UI0; | ||||||
|     return uiZ; |     return uiZ; | ||||||
|  |  | ||||||
| } | } | ||||||
|   | |||||||
| @@ -1,51 +1,5 @@ | |||||||
|  |  | ||||||
| /*============================================================================ |  | ||||||
|  |  | ||||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic |  | ||||||
| Package, Release 3e, by John R. Hauser. |  | ||||||
|  |  | ||||||
| Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of |  | ||||||
| California.  All rights reserved. |  | ||||||
|  |  | ||||||
| Redistribution and use in source and binary forms, with or without |  | ||||||
| modification, are permitted provided that the following conditions are met: |  | ||||||
|  |  | ||||||
|  1. Redistributions of source code must retain the above copyright notice, |  | ||||||
|     this list of conditions, and the following disclaimer. |  | ||||||
|  |  | ||||||
|  2. Redistributions in binary form must reproduce the above copyright notice, |  | ||||||
|     this list of conditions, and the following disclaimer in the documentation |  | ||||||
|     and/or other materials provided with the distribution. |  | ||||||
|  |  | ||||||
|  3. Neither the name of the University nor the names of its contributors may |  | ||||||
|     be used to endorse or promote products derived from this software without |  | ||||||
|     specific prior written permission. |  | ||||||
|  |  | ||||||
| THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY |  | ||||||
| EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED |  | ||||||
| WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE |  | ||||||
| DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY |  | ||||||
| DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES |  | ||||||
| (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; |  | ||||||
| LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND |  | ||||||
| ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |  | ||||||
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS |  | ||||||
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |  | ||||||
|  |  | ||||||
| =============================================================================*/ |  | ||||||
|  |  | ||||||
| #include <stdint.h> |  | ||||||
| #include "platform.h" |  | ||||||
| #include "specialize.h" |  | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | Converts the common NaN pointed to by `aPtr' into a 16-bit floating-point | | This file intentionally contains no code. | ||||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. |  | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| uint_fast16_t softfloat_commonNaNToF16UI( const struct commonNaN *aPtr ) |  | ||||||
| { |  | ||||||
|  |  | ||||||
|     return (uint_fast16_t) aPtr->sign<<15 | 0x7E00 | aPtr->v64>>54; |  | ||||||
|  |  | ||||||
| } |  | ||||||
|  |  | ||||||
|   | |||||||
| @@ -1,51 +1,5 @@ | |||||||
|  |  | ||||||
| /*============================================================================ |  | ||||||
|  |  | ||||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic |  | ||||||
| Package, Release 3e, by John R. Hauser. |  | ||||||
|  |  | ||||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. |  | ||||||
| All rights reserved. |  | ||||||
|  |  | ||||||
| Redistribution and use in source and binary forms, with or without |  | ||||||
| modification, are permitted provided that the following conditions are met: |  | ||||||
|  |  | ||||||
|  1. Redistributions of source code must retain the above copyright notice, |  | ||||||
|     this list of conditions, and the following disclaimer. |  | ||||||
|  |  | ||||||
|  2. Redistributions in binary form must reproduce the above copyright notice, |  | ||||||
|     this list of conditions, and the following disclaimer in the documentation |  | ||||||
|     and/or other materials provided with the distribution. |  | ||||||
|  |  | ||||||
|  3. Neither the name of the University nor the names of its contributors may |  | ||||||
|     be used to endorse or promote products derived from this software without |  | ||||||
|     specific prior written permission. |  | ||||||
|  |  | ||||||
| THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY |  | ||||||
| EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED |  | ||||||
| WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE |  | ||||||
| DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY |  | ||||||
| DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES |  | ||||||
| (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; |  | ||||||
| LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND |  | ||||||
| ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |  | ||||||
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS |  | ||||||
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |  | ||||||
|  |  | ||||||
| =============================================================================*/ |  | ||||||
|  |  | ||||||
| #include <stdint.h> |  | ||||||
| #include "platform.h" |  | ||||||
| #include "specialize.h" |  | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | Converts the common NaN pointed to by `aPtr' into a 32-bit floating-point | | This file intentionally contains no code. | ||||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. |  | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| uint_fast32_t softfloat_commonNaNToF32UI( const struct commonNaN *aPtr ) |  | ||||||
| { |  | ||||||
|  |  | ||||||
|     return (uint_fast32_t) aPtr->sign<<31 | 0x7FC00000 | aPtr->v64>>41; |  | ||||||
|  |  | ||||||
| } |  | ||||||
|  |  | ||||||
|   | |||||||
| @@ -1,53 +1,5 @@ | |||||||
|  |  | ||||||
| /*============================================================================ |  | ||||||
|  |  | ||||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic |  | ||||||
| Package, Release 3e, by John R. Hauser. |  | ||||||
|  |  | ||||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. |  | ||||||
| All rights reserved. |  | ||||||
|  |  | ||||||
| Redistribution and use in source and binary forms, with or without |  | ||||||
| modification, are permitted provided that the following conditions are met: |  | ||||||
|  |  | ||||||
|  1. Redistributions of source code must retain the above copyright notice, |  | ||||||
|     this list of conditions, and the following disclaimer. |  | ||||||
|  |  | ||||||
|  2. Redistributions in binary form must reproduce the above copyright notice, |  | ||||||
|     this list of conditions, and the following disclaimer in the documentation |  | ||||||
|     and/or other materials provided with the distribution. |  | ||||||
|  |  | ||||||
|  3. Neither the name of the University nor the names of its contributors may |  | ||||||
|     be used to endorse or promote products derived from this software without |  | ||||||
|     specific prior written permission. |  | ||||||
|  |  | ||||||
| THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY |  | ||||||
| EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED |  | ||||||
| WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE |  | ||||||
| DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY |  | ||||||
| DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES |  | ||||||
| (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; |  | ||||||
| LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND |  | ||||||
| ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |  | ||||||
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS |  | ||||||
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |  | ||||||
|  |  | ||||||
| =============================================================================*/ |  | ||||||
|  |  | ||||||
| #include <stdint.h> |  | ||||||
| #include "platform.h" |  | ||||||
| #include "specialize.h" |  | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | Converts the common NaN pointed to by `aPtr' into a 64-bit floating-point | | This file intentionally contains no code. | ||||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. |  | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| uint_fast64_t softfloat_commonNaNToF64UI( const struct commonNaN *aPtr ) |  | ||||||
| { |  | ||||||
|  |  | ||||||
|     return |  | ||||||
|         (uint_fast64_t) aPtr->sign<<63 | UINT64_C( 0x7FF8000000000000 ) |  | ||||||
|             | aPtr->v64>>12; |  | ||||||
|  |  | ||||||
| } |  | ||||||
|  |  | ||||||
|   | |||||||
| @@ -1,62 +1,5 @@ | |||||||
|  |  | ||||||
| /*============================================================================ |  | ||||||
|  |  | ||||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic |  | ||||||
| Package, Release 3e, by John R. Hauser. |  | ||||||
|  |  | ||||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. |  | ||||||
| All rights reserved. |  | ||||||
|  |  | ||||||
| Redistribution and use in source and binary forms, with or without |  | ||||||
| modification, are permitted provided that the following conditions are met: |  | ||||||
|  |  | ||||||
|  1. Redistributions of source code must retain the above copyright notice, |  | ||||||
|     this list of conditions, and the following disclaimer. |  | ||||||
|  |  | ||||||
|  2. Redistributions in binary form must reproduce the above copyright notice, |  | ||||||
|     this list of conditions, and the following disclaimer in the documentation |  | ||||||
|     and/or other materials provided with the distribution. |  | ||||||
|  |  | ||||||
|  3. Neither the name of the University nor the names of its contributors may |  | ||||||
|     be used to endorse or promote products derived from this software without |  | ||||||
|     specific prior written permission. |  | ||||||
|  |  | ||||||
| THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY |  | ||||||
| EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED |  | ||||||
| WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE |  | ||||||
| DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY |  | ||||||
| DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES |  | ||||||
| (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; |  | ||||||
| LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND |  | ||||||
| ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |  | ||||||
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS |  | ||||||
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |  | ||||||
|  |  | ||||||
| =============================================================================*/ |  | ||||||
|  |  | ||||||
| #include <stdint.h> |  | ||||||
| #include "platform.h" |  | ||||||
| #include "internals.h" |  | ||||||
| #include "specialize.h" |  | ||||||
| #include "softfloat.h" |  | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | Assuming the 80-bit extended floating-point value pointed to by `aSPtr' is | | This file intentionally contains no code. | ||||||
| | a NaN, converts this NaN to the common NaN form, and stores the resulting |  | ||||||
| | common NaN at the location pointed to by `zPtr'.  If the NaN is a signaling |  | ||||||
| | NaN, the invalid exception is raised. |  | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| void |  | ||||||
|  softfloat_extF80MToCommonNaN( |  | ||||||
|      const struct extFloat80M *aSPtr, struct commonNaN *zPtr ) |  | ||||||
| { |  | ||||||
|  |  | ||||||
|     if ( extF80M_isSignalingNaN( (const extFloat80_t *) aSPtr ) ) { |  | ||||||
|         softfloat_raiseFlags( softfloat_flag_invalid ); |  | ||||||
|     } |  | ||||||
|     zPtr->sign = signExtF80UI64( aSPtr->signExp ); |  | ||||||
|     zPtr->v64 = aSPtr->signif<<1; |  | ||||||
|     zPtr->v0  = 0; |  | ||||||
|  |  | ||||||
| } |  | ||||||
|  |  | ||||||
|   | |||||||
| @@ -1,62 +1,5 @@ | |||||||
|  |  | ||||||
| /*============================================================================ |  | ||||||
|  |  | ||||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic |  | ||||||
| Package, Release 3e, by John R. Hauser. |  | ||||||
|  |  | ||||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. |  | ||||||
| All rights reserved. |  | ||||||
|  |  | ||||||
| Redistribution and use in source and binary forms, with or without |  | ||||||
| modification, are permitted provided that the following conditions are met: |  | ||||||
|  |  | ||||||
|  1. Redistributions of source code must retain the above copyright notice, |  | ||||||
|     this list of conditions, and the following disclaimer. |  | ||||||
|  |  | ||||||
|  2. Redistributions in binary form must reproduce the above copyright notice, |  | ||||||
|     this list of conditions, and the following disclaimer in the documentation |  | ||||||
|     and/or other materials provided with the distribution. |  | ||||||
|  |  | ||||||
|  3. Neither the name of the University nor the names of its contributors may |  | ||||||
|     be used to endorse or promote products derived from this software without |  | ||||||
|     specific prior written permission. |  | ||||||
|  |  | ||||||
| THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY |  | ||||||
| EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED |  | ||||||
| WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE |  | ||||||
| DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY |  | ||||||
| DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES |  | ||||||
| (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; |  | ||||||
| LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND |  | ||||||
| ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |  | ||||||
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS |  | ||||||
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |  | ||||||
|  |  | ||||||
| =============================================================================*/ |  | ||||||
|  |  | ||||||
| #include <stdint.h> |  | ||||||
| #include "platform.h" |  | ||||||
| #include "specialize.h" |  | ||||||
| #include "softfloat.h" |  | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | Assuming the unsigned integer formed from concatenating `uiA64' and `uiA0' | | This file intentionally contains no code. | ||||||
| | has the bit pattern of an 80-bit extended floating-point NaN, converts |  | ||||||
| | this NaN to the common NaN form, and stores the resulting common NaN at the |  | ||||||
| | location pointed to by `zPtr'.  If the NaN is a signaling NaN, the invalid |  | ||||||
| | exception is raised. |  | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| void |  | ||||||
|  softfloat_extF80UIToCommonNaN( |  | ||||||
|      uint_fast16_t uiA64, uint_fast64_t uiA0, struct commonNaN *zPtr ) |  | ||||||
| { |  | ||||||
|  |  | ||||||
|     if ( softfloat_isSigNaNExtF80UI( uiA64, uiA0 ) ) { |  | ||||||
|         softfloat_raiseFlags( softfloat_flag_invalid ); |  | ||||||
|     } |  | ||||||
|     zPtr->sign = uiA64>>15; |  | ||||||
|     zPtr->v64  = uiA0<<1; |  | ||||||
|     zPtr->v0   = 0; |  | ||||||
|  |  | ||||||
| } |  | ||||||
|  |  | ||||||
|   | |||||||
| @@ -1,62 +1,5 @@ | |||||||
|  |  | ||||||
| /*============================================================================ |  | ||||||
|  |  | ||||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic |  | ||||||
| Package, Release 3e, by John R. Hauser. |  | ||||||
|  |  | ||||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. |  | ||||||
| All rights reserved. |  | ||||||
|  |  | ||||||
| Redistribution and use in source and binary forms, with or without |  | ||||||
| modification, are permitted provided that the following conditions are met: |  | ||||||
|  |  | ||||||
|  1. Redistributions of source code must retain the above copyright notice, |  | ||||||
|     this list of conditions, and the following disclaimer. |  | ||||||
|  |  | ||||||
|  2. Redistributions in binary form must reproduce the above copyright notice, |  | ||||||
|     this list of conditions, and the following disclaimer in the documentation |  | ||||||
|     and/or other materials provided with the distribution. |  | ||||||
|  |  | ||||||
|  3. Neither the name of the University nor the names of its contributors may |  | ||||||
|     be used to endorse or promote products derived from this software without |  | ||||||
|     specific prior written permission. |  | ||||||
|  |  | ||||||
| THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY |  | ||||||
| EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED |  | ||||||
| WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE |  | ||||||
| DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY |  | ||||||
| DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES |  | ||||||
| (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; |  | ||||||
| LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND |  | ||||||
| ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |  | ||||||
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS |  | ||||||
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |  | ||||||
|  |  | ||||||
| =============================================================================*/ |  | ||||||
|  |  | ||||||
| #include <stdint.h> |  | ||||||
| #include "platform.h" |  | ||||||
| #include "primitives.h" |  | ||||||
| #include "specialize.h" |  | ||||||
| #include "softfloat.h" |  | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | Assuming the 128-bit floating-point value pointed to by `aWPtr' is a NaN, | | This file intentionally contains no code. | ||||||
| | converts this NaN to the common NaN form, and stores the resulting common |  | ||||||
| | NaN at the location pointed to by `zPtr'.  If the NaN is a signaling NaN, |  | ||||||
| | the invalid exception is raised.  Argument `aWPtr' points to an array of |  | ||||||
| | four 32-bit elements that concatenate in the platform's normal endian order |  | ||||||
| | to form a 128-bit floating-point value. |  | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| void |  | ||||||
|  softfloat_f128MToCommonNaN( const uint32_t *aWPtr, struct commonNaN *zPtr ) |  | ||||||
| { |  | ||||||
|  |  | ||||||
|     if ( f128M_isSignalingNaN( (const float128_t *) aWPtr ) ) { |  | ||||||
|         softfloat_raiseFlags( softfloat_flag_invalid ); |  | ||||||
|     } |  | ||||||
|     zPtr->sign = aWPtr[indexWordHi( 4 )]>>31; |  | ||||||
|     softfloat_shortShiftLeft128M( aWPtr, 16, (uint32_t *) &zPtr->v0 ); |  | ||||||
|  |  | ||||||
| } |  | ||||||
|  |  | ||||||
|   | |||||||
| @@ -1,65 +1,5 @@ | |||||||
|  |  | ||||||
| /*============================================================================ |  | ||||||
|  |  | ||||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic |  | ||||||
| Package, Release 3e, by John R. Hauser. |  | ||||||
|  |  | ||||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. |  | ||||||
| All rights reserved. |  | ||||||
|  |  | ||||||
| Redistribution and use in source and binary forms, with or without |  | ||||||
| modification, are permitted provided that the following conditions are met: |  | ||||||
|  |  | ||||||
|  1. Redistributions of source code must retain the above copyright notice, |  | ||||||
|     this list of conditions, and the following disclaimer. |  | ||||||
|  |  | ||||||
|  2. Redistributions in binary form must reproduce the above copyright notice, |  | ||||||
|     this list of conditions, and the following disclaimer in the documentation |  | ||||||
|     and/or other materials provided with the distribution. |  | ||||||
|  |  | ||||||
|  3. Neither the name of the University nor the names of its contributors may |  | ||||||
|     be used to endorse or promote products derived from this software without |  | ||||||
|     specific prior written permission. |  | ||||||
|  |  | ||||||
| THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY |  | ||||||
| EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED |  | ||||||
| WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE |  | ||||||
| DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY |  | ||||||
| DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES |  | ||||||
| (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; |  | ||||||
| LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND |  | ||||||
| ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |  | ||||||
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS |  | ||||||
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |  | ||||||
|  |  | ||||||
| =============================================================================*/ |  | ||||||
|  |  | ||||||
| #include <stdint.h> |  | ||||||
| #include "platform.h" |  | ||||||
| #include "primitives.h" |  | ||||||
| #include "specialize.h" |  | ||||||
| #include "softfloat.h" |  | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | Assuming the unsigned integer formed from concatenating `uiA64' and `uiA0' | | This file intentionally contains no code. | ||||||
| | has the bit pattern of a 128-bit floating-point NaN, converts this NaN to |  | ||||||
| | the common NaN form, and stores the resulting common NaN at the location |  | ||||||
| | pointed to by `zPtr'.  If the NaN is a signaling NaN, the invalid exception |  | ||||||
| | is raised. |  | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| void |  | ||||||
|  softfloat_f128UIToCommonNaN( |  | ||||||
|      uint_fast64_t uiA64, uint_fast64_t uiA0, struct commonNaN *zPtr ) |  | ||||||
| { |  | ||||||
|     struct uint128 NaNSig; |  | ||||||
|  |  | ||||||
|     if ( softfloat_isSigNaNF128UI( uiA64, uiA0 ) ) { |  | ||||||
|         softfloat_raiseFlags( softfloat_flag_invalid ); |  | ||||||
|     } |  | ||||||
|     NaNSig = softfloat_shortShiftLeft128( uiA64, uiA0, 16 ); |  | ||||||
|     zPtr->sign = uiA64>>63; |  | ||||||
|     zPtr->v64  = NaNSig.v64; |  | ||||||
|     zPtr->v0   = NaNSig.v0; |  | ||||||
|  |  | ||||||
| } |  | ||||||
|  |  | ||||||
|   | |||||||
| @@ -1,59 +1,5 @@ | |||||||
|  |  | ||||||
| /*============================================================================ |  | ||||||
|  |  | ||||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic |  | ||||||
| Package, Release 3e, by John R. Hauser. |  | ||||||
|  |  | ||||||
| Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of |  | ||||||
| California.  All rights reserved. |  | ||||||
|  |  | ||||||
| Redistribution and use in source and binary forms, with or without |  | ||||||
| modification, are permitted provided that the following conditions are met: |  | ||||||
|  |  | ||||||
|  1. Redistributions of source code must retain the above copyright notice, |  | ||||||
|     this list of conditions, and the following disclaimer. |  | ||||||
|  |  | ||||||
|  2. Redistributions in binary form must reproduce the above copyright notice, |  | ||||||
|     this list of conditions, and the following disclaimer in the documentation |  | ||||||
|     and/or other materials provided with the distribution. |  | ||||||
|  |  | ||||||
|  3. Neither the name of the University nor the names of its contributors may |  | ||||||
|     be used to endorse or promote products derived from this software without |  | ||||||
|     specific prior written permission. |  | ||||||
|  |  | ||||||
| THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY |  | ||||||
| EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED |  | ||||||
| WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE |  | ||||||
| DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY |  | ||||||
| DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES |  | ||||||
| (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; |  | ||||||
| LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND |  | ||||||
| ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |  | ||||||
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS |  | ||||||
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |  | ||||||
|  |  | ||||||
| =============================================================================*/ |  | ||||||
|  |  | ||||||
| #include <stdint.h> |  | ||||||
| #include "platform.h" |  | ||||||
| #include "specialize.h" |  | ||||||
| #include "softfloat.h" |  | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | Assuming `uiA' has the bit pattern of a 16-bit floating-point NaN, converts | | This file intentionally contains no code. | ||||||
| | this NaN to the common NaN form, and stores the resulting common NaN at the |  | ||||||
| | location pointed to by `zPtr'.  If the NaN is a signaling NaN, the invalid |  | ||||||
| | exception is raised. |  | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| void softfloat_f16UIToCommonNaN( uint_fast16_t uiA, struct commonNaN *zPtr ) |  | ||||||
| { |  | ||||||
|  |  | ||||||
|     if ( softfloat_isSigNaNF16UI( uiA ) ) { |  | ||||||
|         softfloat_raiseFlags( softfloat_flag_invalid ); |  | ||||||
|     } |  | ||||||
|     zPtr->sign = uiA>>15; |  | ||||||
|     zPtr->v64  = (uint_fast64_t) uiA<<54; |  | ||||||
|     zPtr->v0   = 0; |  | ||||||
|  |  | ||||||
| } |  | ||||||
|  |  | ||||||
|   | |||||||
| @@ -1,59 +1,5 @@ | |||||||
|  |  | ||||||
| /*============================================================================ |  | ||||||
|  |  | ||||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic |  | ||||||
| Package, Release 3e, by John R. Hauser. |  | ||||||
|  |  | ||||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. |  | ||||||
| All rights reserved. |  | ||||||
|  |  | ||||||
| Redistribution and use in source and binary forms, with or without |  | ||||||
| modification, are permitted provided that the following conditions are met: |  | ||||||
|  |  | ||||||
|  1. Redistributions of source code must retain the above copyright notice, |  | ||||||
|     this list of conditions, and the following disclaimer. |  | ||||||
|  |  | ||||||
|  2. Redistributions in binary form must reproduce the above copyright notice, |  | ||||||
|     this list of conditions, and the following disclaimer in the documentation |  | ||||||
|     and/or other materials provided with the distribution. |  | ||||||
|  |  | ||||||
|  3. Neither the name of the University nor the names of its contributors may |  | ||||||
|     be used to endorse or promote products derived from this software without |  | ||||||
|     specific prior written permission. |  | ||||||
|  |  | ||||||
| THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY |  | ||||||
| EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED |  | ||||||
| WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE |  | ||||||
| DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY |  | ||||||
| DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES |  | ||||||
| (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; |  | ||||||
| LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND |  | ||||||
| ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |  | ||||||
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS |  | ||||||
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |  | ||||||
|  |  | ||||||
| =============================================================================*/ |  | ||||||
|  |  | ||||||
| #include <stdint.h> |  | ||||||
| #include "platform.h" |  | ||||||
| #include "specialize.h" |  | ||||||
| #include "softfloat.h" |  | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | Assuming `uiA' has the bit pattern of a 32-bit floating-point NaN, converts | | This file intentionally contains no code. | ||||||
| | this NaN to the common NaN form, and stores the resulting common NaN at the |  | ||||||
| | location pointed to by `zPtr'.  If the NaN is a signaling NaN, the invalid |  | ||||||
| | exception is raised. |  | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| void softfloat_f32UIToCommonNaN( uint_fast32_t uiA, struct commonNaN *zPtr ) |  | ||||||
| { |  | ||||||
|  |  | ||||||
|     if ( softfloat_isSigNaNF32UI( uiA ) ) { |  | ||||||
|         softfloat_raiseFlags( softfloat_flag_invalid ); |  | ||||||
|     } |  | ||||||
|     zPtr->sign = uiA>>31; |  | ||||||
|     zPtr->v64  = (uint_fast64_t) uiA<<41; |  | ||||||
|     zPtr->v0   = 0; |  | ||||||
|  |  | ||||||
| } |  | ||||||
|  |  | ||||||
|   | |||||||
| @@ -1,59 +1,5 @@ | |||||||
|  |  | ||||||
| /*============================================================================ |  | ||||||
|  |  | ||||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic |  | ||||||
| Package, Release 3e, by John R. Hauser. |  | ||||||
|  |  | ||||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. |  | ||||||
| All rights reserved. |  | ||||||
|  |  | ||||||
| Redistribution and use in source and binary forms, with or without |  | ||||||
| modification, are permitted provided that the following conditions are met: |  | ||||||
|  |  | ||||||
|  1. Redistributions of source code must retain the above copyright notice, |  | ||||||
|     this list of conditions, and the following disclaimer. |  | ||||||
|  |  | ||||||
|  2. Redistributions in binary form must reproduce the above copyright notice, |  | ||||||
|     this list of conditions, and the following disclaimer in the documentation |  | ||||||
|     and/or other materials provided with the distribution. |  | ||||||
|  |  | ||||||
|  3. Neither the name of the University nor the names of its contributors may |  | ||||||
|     be used to endorse or promote products derived from this software without |  | ||||||
|     specific prior written permission. |  | ||||||
|  |  | ||||||
| THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY |  | ||||||
| EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED |  | ||||||
| WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE |  | ||||||
| DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY |  | ||||||
| DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES |  | ||||||
| (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; |  | ||||||
| LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND |  | ||||||
| ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |  | ||||||
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS |  | ||||||
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |  | ||||||
|  |  | ||||||
| =============================================================================*/ |  | ||||||
|  |  | ||||||
| #include <stdint.h> |  | ||||||
| #include "platform.h" |  | ||||||
| #include "specialize.h" |  | ||||||
| #include "softfloat.h" |  | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | Assuming `uiA' has the bit pattern of a 64-bit floating-point NaN, converts | | This file intentionally contains no code. | ||||||
| | this NaN to the common NaN form, and stores the resulting common NaN at the |  | ||||||
| | location pointed to by `zPtr'.  If the NaN is a signaling NaN, the invalid |  | ||||||
| | exception is raised. |  | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| void softfloat_f64UIToCommonNaN( uint_fast64_t uiA, struct commonNaN *zPtr ) |  | ||||||
| { |  | ||||||
|  |  | ||||||
|     if ( softfloat_isSigNaNF64UI( uiA ) ) { |  | ||||||
|         softfloat_raiseFlags( softfloat_flag_invalid ); |  | ||||||
|     } |  | ||||||
|     zPtr->sign = uiA>>63; |  | ||||||
|     zPtr->v64  = uiA<<12; |  | ||||||
|     zPtr->v0   = 0; |  | ||||||
|  |  | ||||||
| } |  | ||||||
|  |  | ||||||
|   | |||||||
| @@ -4,8 +4,8 @@ | |||||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||||
| Package, Release 3e, by John R. Hauser. | Package, Release 3e, by John R. Hauser. | ||||||
|  |  | ||||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of | ||||||
| All rights reserved. | California.  All rights reserved. | ||||||
|  |  | ||||||
| Redistribution and use in source and binary forms, with or without | Redistribution and use in source and binary forms, with or without | ||||||
| modification, are permitted provided that the following conditions are met: | modification, are permitted provided that the following conditions are met: | ||||||
| @@ -34,10 +34,9 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |||||||
|  |  | ||||||
| =============================================================================*/ | =============================================================================*/ | ||||||
|  |  | ||||||
| #include <stdbool.h> |  | ||||||
| #include <stdint.h> | #include <stdint.h> | ||||||
| #include "platform.h" | #include "platform.h" | ||||||
| #include "internals.h" | #include "primitiveTypes.h" | ||||||
| #include "specialize.h" | #include "specialize.h" | ||||||
| #include "softfloat.h" | #include "softfloat.h" | ||||||
|  |  | ||||||
| @@ -54,54 +53,22 @@ void | |||||||
|      struct extFloat80M *zSPtr |      struct extFloat80M *zSPtr | ||||||
|  ) |  ) | ||||||
| { | { | ||||||
|     bool isSigNaNA; |     uint_fast16_t ui64; | ||||||
|     const struct extFloat80M *sPtr; |     uint_fast64_t ui0; | ||||||
|     bool isSigNaNB; |  | ||||||
|     uint_fast16_t uiB64; |  | ||||||
|     uint64_t uiB0; |  | ||||||
|     uint_fast16_t uiA64; |  | ||||||
|     uint64_t uiA0; |  | ||||||
|     uint_fast16_t uiMagA64, uiMagB64; |  | ||||||
|  |  | ||||||
|     isSigNaNA = extF80M_isSignalingNaN( (const extFloat80_t *) aSPtr ); |     ui64 = aSPtr->signExp; | ||||||
|     sPtr = aSPtr; |     ui0  = aSPtr->signif; | ||||||
|     if ( ! bSPtr ) { |     if ( | ||||||
|         if ( isSigNaNA ) softfloat_raiseFlags( softfloat_flag_invalid ); |         softfloat_isSigNaNExtF80UI( ui64, ui0 ) | ||||||
|         goto copy; |             || (bSPtr | ||||||
|     } |                     && (ui64 = bSPtr->signExp, | ||||||
|     isSigNaNB = extF80M_isSignalingNaN( (const extFloat80_t *) bSPtr ); |                         ui0  = bSPtr->signif, | ||||||
|     if ( isSigNaNA | isSigNaNB ) { |                         softfloat_isSigNaNExtF80UI( ui64, ui0 ))) | ||||||
|  |     ) { | ||||||
|         softfloat_raiseFlags( softfloat_flag_invalid ); |         softfloat_raiseFlags( softfloat_flag_invalid ); | ||||||
|         if ( isSigNaNA ) { |  | ||||||
|             uiB64 = bSPtr->signExp; |  | ||||||
|             if ( isSigNaNB ) goto returnLargerUIMag; |  | ||||||
|             uiB0 = bSPtr->signif; |  | ||||||
|             if ( isNaNExtF80UI( uiB64, uiB0 ) ) goto copyB; |  | ||||||
|             goto copy; |  | ||||||
|         } else { |  | ||||||
|             uiA64 = aSPtr->signExp; |  | ||||||
|             uiA0 = aSPtr->signif; |  | ||||||
|             if ( isNaNExtF80UI( uiA64, uiA0 ) ) goto copy; |  | ||||||
|             goto copyB; |  | ||||||
|     } |     } | ||||||
|     } |     zSPtr->signExp = defaultNaNExtF80UI64; | ||||||
|     uiB64 = bSPtr->signExp; |     zSPtr->signif  = defaultNaNExtF80UI0; | ||||||
|  returnLargerUIMag: |  | ||||||
|     uiA64 = aSPtr->signExp; |  | ||||||
|     uiMagA64 = uiA64 & 0x7FFF; |  | ||||||
|     uiMagB64 = uiB64 & 0x7FFF; |  | ||||||
|     if ( uiMagA64 < uiMagB64 ) goto copyB; |  | ||||||
|     if ( uiMagB64 < uiMagA64 ) goto copy; |  | ||||||
|     uiA0 = aSPtr->signif; |  | ||||||
|     uiB0 = bSPtr->signif; |  | ||||||
|     if ( uiA0 < uiB0 ) goto copyB; |  | ||||||
|     if ( uiB0 < uiA0 ) goto copy; |  | ||||||
|     if ( uiA64 < uiB64 ) goto copy; |  | ||||||
|  copyB: |  | ||||||
|     sPtr = bSPtr; |  | ||||||
|  copy: |  | ||||||
|     zSPtr->signExp = sPtr->signExp; |  | ||||||
|     zSPtr->signif = sPtr->signif | UINT64_C( 0xC000000000000000 ); |  | ||||||
|  |  | ||||||
| } | } | ||||||
|  |  | ||||||
|   | |||||||
| @@ -4,7 +4,7 @@ | |||||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||||
| Package, Release 3e, by John R. Hauser. | Package, Release 3e, by John R. Hauser. | ||||||
|  |  | ||||||
| Copyright 2011, 2012, 2013, 2014, 2018 The Regents of the University of | Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of | ||||||
| California.  All rights reserved. | California.  All rights reserved. | ||||||
|  |  | ||||||
| Redistribution and use in source and binary forms, with or without | Redistribution and use in source and binary forms, with or without | ||||||
| @@ -34,17 +34,16 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |||||||
|  |  | ||||||
| =============================================================================*/ | =============================================================================*/ | ||||||
|  |  | ||||||
| #include <stdbool.h> |  | ||||||
| #include <stdint.h> | #include <stdint.h> | ||||||
| #include "platform.h" | #include "platform.h" | ||||||
| #include "internals.h" | #include "primitiveTypes.h" | ||||||
| #include "specialize.h" | #include "specialize.h" | ||||||
| #include "softfloat.h" | #include "softfloat.h" | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | Interpreting the unsigned integer formed from concatenating 'uiA64' and | | Interpreting the unsigned integer formed from concatenating `uiA64' and | ||||||
| | 'uiA0' as an 80-bit extended floating-point value, and likewise interpreting | | `uiA0' as an 80-bit extended floating-point value, and likewise interpreting | ||||||
| | the unsigned integer formed from concatenating 'uiB64' and 'uiB0' as another | | the unsigned integer formed from concatenating `uiB64' and `uiB0' as another | ||||||
| | 80-bit extended floating-point value, and assuming at least on of these | | 80-bit extended floating-point value, and assuming at least on of these | ||||||
| | floating-point values is a NaN, returns the bit pattern of the combined NaN | | floating-point values is a NaN, returns the bit pattern of the combined NaN | ||||||
| | result.  If either original floating-point value is a signaling NaN, the | | result.  If either original floating-point value is a signaling NaN, the | ||||||
| @@ -58,48 +57,16 @@ struct uint128 | |||||||
|      uint_fast64_t uiB0 |      uint_fast64_t uiB0 | ||||||
|  ) |  ) | ||||||
| { | { | ||||||
|     bool isSigNaNA, isSigNaNB; |  | ||||||
|     uint_fast64_t uiNonsigA0, uiNonsigB0; |  | ||||||
|     uint_fast16_t uiMagA64, uiMagB64; |  | ||||||
|     struct uint128 uiZ; |     struct uint128 uiZ; | ||||||
|  |  | ||||||
|     /*------------------------------------------------------------------------ |     if ( | ||||||
|     *------------------------------------------------------------------------*/ |            softfloat_isSigNaNExtF80UI( uiA64, uiA0 ) | ||||||
|     isSigNaNA = softfloat_isSigNaNExtF80UI( uiA64, uiA0 ); |         || softfloat_isSigNaNExtF80UI( uiB64, uiB0 ) | ||||||
|     isSigNaNB = softfloat_isSigNaNExtF80UI( uiB64, uiB0 ); |     ) { | ||||||
|     /*------------------------------------------------------------------------ |  | ||||||
|     | Make NaNs non-signaling. |  | ||||||
|     *------------------------------------------------------------------------*/ |  | ||||||
|     uiNonsigA0 = uiA0 | UINT64_C( 0xC000000000000000 ); |  | ||||||
|     uiNonsigB0 = uiB0 | UINT64_C( 0xC000000000000000 ); |  | ||||||
|     /*------------------------------------------------------------------------ |  | ||||||
|     *------------------------------------------------------------------------*/ |  | ||||||
|     if ( isSigNaNA | isSigNaNB ) { |  | ||||||
|         softfloat_raiseFlags( softfloat_flag_invalid ); |         softfloat_raiseFlags( softfloat_flag_invalid ); | ||||||
|         if ( isSigNaNA ) { |  | ||||||
|             if ( isSigNaNB ) goto returnLargerMag; |  | ||||||
|             if ( isNaNExtF80UI( uiB64, uiB0 ) ) goto returnB; |  | ||||||
|             goto returnA; |  | ||||||
|         } else { |  | ||||||
|             if ( isNaNExtF80UI( uiA64, uiA0 ) ) goto returnA; |  | ||||||
|             goto returnB; |  | ||||||
|     } |     } | ||||||
|     } |     uiZ.v64 = defaultNaNExtF80UI64; | ||||||
|  returnLargerMag: |     uiZ.v0  = defaultNaNExtF80UI0; | ||||||
|     uiMagA64 = uiA64 & 0x7FFF; |  | ||||||
|     uiMagB64 = uiB64 & 0x7FFF; |  | ||||||
|     if ( uiMagA64 < uiMagB64 ) goto returnB; |  | ||||||
|     if ( uiMagB64 < uiMagA64 ) goto returnA; |  | ||||||
|     if ( uiA0 < uiB0 ) goto returnB; |  | ||||||
|     if ( uiB0 < uiA0 ) goto returnA; |  | ||||||
|     if ( uiA64 < uiB64 ) goto returnA; |  | ||||||
|  returnB: |  | ||||||
|     uiZ.v64 = uiB64; |  | ||||||
|     uiZ.v0  = uiNonsigB0; |  | ||||||
|     return uiZ; |  | ||||||
|  returnA: |  | ||||||
|     uiZ.v64 = uiA64; |  | ||||||
|     uiZ.v0  = uiNonsigA0; |  | ||||||
|     return uiZ; |     return uiZ; | ||||||
|  |  | ||||||
| } | } | ||||||
|   | |||||||
| @@ -4,8 +4,8 @@ | |||||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||||
| Package, Release 3e, by John R. Hauser. | Package, Release 3e, by John R. Hauser. | ||||||
|  |  | ||||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | Copyright 2011, 2012, 2013, 2014, 2015, 2018 The Regents of the University of | ||||||
| All rights reserved. | California.  All rights reserved. | ||||||
|  |  | ||||||
| Redistribution and use in source and binary forms, with or without | Redistribution and use in source and binary forms, with or without | ||||||
| modification, are permitted provided that the following conditions are met: | modification, are permitted provided that the following conditions are met: | ||||||
| @@ -34,43 +34,35 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |||||||
|  |  | ||||||
| =============================================================================*/ | =============================================================================*/ | ||||||
|  |  | ||||||
| #include <stdbool.h> |  | ||||||
| #include <stdint.h> | #include <stdint.h> | ||||||
| #include "platform.h" | #include "platform.h" | ||||||
| #include "internals.h" | #include "primitiveTypes.h" | ||||||
| #include "specialize.h" | #include "specialize.h" | ||||||
| #include "softfloat.h" | #include "softfloat.h" | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | Assuming at least one of the two 128-bit floating-point values pointed to by | | Assuming at least one of the two 128-bit floating-point values pointed to by | ||||||
| | `aWPtr' and `bWPtr' is a NaN, stores the combined NaN result at the location | | 'aWPtr' and 'bWPtr' is a NaN, stores the combined NaN result at the location | ||||||
| | pointed to by `zWPtr'.  If either original floating-point value is a | | pointed to by 'zWPtr'.  If either original floating-point value is a | ||||||
| | signaling NaN, the invalid exception is raised.  Each of `aWPtr', `bWPtr', | | signaling NaN, the invalid exception is raised.  Each of 'aWPtr', 'bWPtr', | ||||||
| | and `zWPtr' points to an array of four 32-bit elements that concatenate in | | and 'zWPtr' points to an array of four 32-bit elements that concatenate in | ||||||
| | the platform's normal endian order to form a 128-bit floating-point value. | | the platform's normal endian order to form a 128-bit floating-point value. | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| void | void | ||||||
|  softfloat_propagateNaNF128M( |  softfloat_propagateNaNF128M( | ||||||
|      const uint32_t *aWPtr, const uint32_t *bWPtr, uint32_t *zWPtr ) |      const uint32_t *aWPtr, const uint32_t *bWPtr, uint32_t *zWPtr ) | ||||||
| { | { | ||||||
|     bool isSigNaNA; |  | ||||||
|     const uint32_t *ptr; |  | ||||||
|  |  | ||||||
|     ptr = aWPtr; |  | ||||||
|     isSigNaNA = f128M_isSignalingNaN( (const float128_t *) aWPtr ); |  | ||||||
|     if ( |     if ( | ||||||
|         isSigNaNA |         f128M_isSignalingNaN( (const float128_t *) aWPtr ) | ||||||
|             || (bWPtr && f128M_isSignalingNaN( (const float128_t *) bWPtr )) |             || (bWPtr && f128M_isSignalingNaN( (const float128_t *) bWPtr )) | ||||||
|     ) { |     ) { | ||||||
|         softfloat_raiseFlags( softfloat_flag_invalid ); |         softfloat_raiseFlags( softfloat_flag_invalid ); | ||||||
|         if ( isSigNaNA ) goto copy; |  | ||||||
|     } |     } | ||||||
|     if ( ! softfloat_isNaNF128M( aWPtr ) ) ptr = bWPtr; |     zWPtr[indexWord( 4, 3 )] = defaultNaNF128UI96; | ||||||
|  copy: |     zWPtr[indexWord( 4, 2 )] = defaultNaNF128UI64; | ||||||
|     zWPtr[indexWordHi( 4 )] = ptr[indexWordHi( 4 )] | 0x00008000; |     zWPtr[indexWord( 4, 1 )] = defaultNaNF128UI32; | ||||||
|     zWPtr[indexWord( 4, 2 )] = ptr[indexWord( 4, 2 )]; |     zWPtr[indexWord( 4, 0 )] = defaultNaNF128UI0; | ||||||
|     zWPtr[indexWord( 4, 1 )] = ptr[indexWord( 4, 1 )]; |  | ||||||
|     zWPtr[indexWord( 4, 0 )] = ptr[indexWord( 4, 0 )]; |  | ||||||
|  |  | ||||||
| } | } | ||||||
|  |  | ||||||
|   | |||||||
| @@ -4,8 +4,8 @@ | |||||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||||
| Package, Release 3e, by John R. Hauser. | Package, Release 3e, by John R. Hauser. | ||||||
|  |  | ||||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of | ||||||
| All rights reserved. | California.  All rights reserved. | ||||||
|  |  | ||||||
| Redistribution and use in source and binary forms, with or without | Redistribution and use in source and binary forms, with or without | ||||||
| modification, are permitted provided that the following conditions are met: | modification, are permitted provided that the following conditions are met: | ||||||
| @@ -34,10 +34,9 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |||||||
|  |  | ||||||
| =============================================================================*/ | =============================================================================*/ | ||||||
|  |  | ||||||
| #include <stdbool.h> |  | ||||||
| #include <stdint.h> | #include <stdint.h> | ||||||
| #include "platform.h" | #include "platform.h" | ||||||
| #include "internals.h" | #include "primitiveTypes.h" | ||||||
| #include "specialize.h" | #include "specialize.h" | ||||||
| #include "softfloat.h" | #include "softfloat.h" | ||||||
|  |  | ||||||
| @@ -58,23 +57,16 @@ struct uint128 | |||||||
|      uint_fast64_t uiB0 |      uint_fast64_t uiB0 | ||||||
|  ) |  ) | ||||||
| { | { | ||||||
|     bool isSigNaNA; |  | ||||||
|     struct uint128 uiZ; |     struct uint128 uiZ; | ||||||
|  |  | ||||||
|     isSigNaNA = softfloat_isSigNaNF128UI( uiA64, uiA0 ); |     if ( | ||||||
|     if ( isSigNaNA || softfloat_isSigNaNF128UI( uiB64, uiB0 ) ) { |            softfloat_isSigNaNF128UI( uiA64, uiA0 ) | ||||||
|  |         || softfloat_isSigNaNF128UI( uiB64, uiB0 ) | ||||||
|  |     ) { | ||||||
|         softfloat_raiseFlags( softfloat_flag_invalid ); |         softfloat_raiseFlags( softfloat_flag_invalid ); | ||||||
|         if ( isSigNaNA ) goto returnNonsigA; |  | ||||||
|     } |     } | ||||||
|     if ( isNaNF128UI( uiA64, uiA0 ) ) { |     uiZ.v64 = defaultNaNF128UI64; | ||||||
|  returnNonsigA: |     uiZ.v0  = defaultNaNF128UI0; | ||||||
|         uiZ.v64 = uiA64; |  | ||||||
|         uiZ.v0  = uiA0; |  | ||||||
|     } else { |  | ||||||
|         uiZ.v64 = uiB64; |  | ||||||
|         uiZ.v0  = uiB0; |  | ||||||
|     } |  | ||||||
|     uiZ.v64 |= UINT64_C( 0x0000800000000000 ); |  | ||||||
|     return uiZ; |     return uiZ; | ||||||
|  |  | ||||||
| } | } | ||||||
|   | |||||||
| @@ -4,7 +4,7 @@ | |||||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||||
| Package, Release 3e, by John R. Hauser. | Package, Release 3e, by John R. Hauser. | ||||||
|  |  | ||||||
| Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of | Copyright 2011, 2012, 2013, 2014, 2015, 2016 The Regents of the University of | ||||||
| California.  All rights reserved. | California.  All rights reserved. | ||||||
|  |  | ||||||
| Redistribution and use in source and binary forms, with or without | Redistribution and use in source and binary forms, with or without | ||||||
| @@ -34,10 +34,8 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |||||||
|  |  | ||||||
| =============================================================================*/ | =============================================================================*/ | ||||||
|  |  | ||||||
| #include <stdbool.h> |  | ||||||
| #include <stdint.h> | #include <stdint.h> | ||||||
| #include "platform.h" | #include "platform.h" | ||||||
| #include "internals.h" |  | ||||||
| #include "specialize.h" | #include "specialize.h" | ||||||
| #include "softfloat.h" | #include "softfloat.h" | ||||||
|  |  | ||||||
| @@ -50,14 +48,11 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |||||||
| uint_fast16_t | uint_fast16_t | ||||||
|  softfloat_propagateNaNF16UI( uint_fast16_t uiA, uint_fast16_t uiB ) |  softfloat_propagateNaNF16UI( uint_fast16_t uiA, uint_fast16_t uiB ) | ||||||
| { | { | ||||||
|     bool isSigNaNA; |  | ||||||
|  |  | ||||||
|     isSigNaNA = softfloat_isSigNaNF16UI( uiA ); |     if ( softfloat_isSigNaNF16UI( uiA ) || softfloat_isSigNaNF16UI( uiB ) ) { | ||||||
|     if ( isSigNaNA || softfloat_isSigNaNF16UI( uiB ) ) { |  | ||||||
|         softfloat_raiseFlags( softfloat_flag_invalid ); |         softfloat_raiseFlags( softfloat_flag_invalid ); | ||||||
|         if ( isSigNaNA ) return uiA | 0x0200; |  | ||||||
|     } |     } | ||||||
|     return (isNaNF16UI( uiA ) ? uiA : uiB) | 0x0200; |     return defaultNaNF16UI; | ||||||
|  |  | ||||||
| } | } | ||||||
|  |  | ||||||
|   | |||||||
| @@ -4,8 +4,8 @@ | |||||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||||
| Package, Release 3e, by John R. Hauser. | Package, Release 3e, by John R. Hauser. | ||||||
|  |  | ||||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of | ||||||
| All rights reserved. | California.  All rights reserved. | ||||||
|  |  | ||||||
| Redistribution and use in source and binary forms, with or without | Redistribution and use in source and binary forms, with or without | ||||||
| modification, are permitted provided that the following conditions are met: | modification, are permitted provided that the following conditions are met: | ||||||
| @@ -34,10 +34,8 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |||||||
|  |  | ||||||
| =============================================================================*/ | =============================================================================*/ | ||||||
|  |  | ||||||
| #include <stdbool.h> |  | ||||||
| #include <stdint.h> | #include <stdint.h> | ||||||
| #include "platform.h" | #include "platform.h" | ||||||
| #include "internals.h" |  | ||||||
| #include "specialize.h" | #include "specialize.h" | ||||||
| #include "softfloat.h" | #include "softfloat.h" | ||||||
|  |  | ||||||
| @@ -50,14 +48,11 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |||||||
| uint_fast32_t | uint_fast32_t | ||||||
|  softfloat_propagateNaNF32UI( uint_fast32_t uiA, uint_fast32_t uiB ) |  softfloat_propagateNaNF32UI( uint_fast32_t uiA, uint_fast32_t uiB ) | ||||||
| { | { | ||||||
|     bool isSigNaNA; |  | ||||||
|  |  | ||||||
|     isSigNaNA = softfloat_isSigNaNF32UI( uiA ); |     if ( softfloat_isSigNaNF32UI( uiA ) || softfloat_isSigNaNF32UI( uiB ) ) { | ||||||
|     if ( isSigNaNA || softfloat_isSigNaNF32UI( uiB ) ) { |  | ||||||
|         softfloat_raiseFlags( softfloat_flag_invalid ); |         softfloat_raiseFlags( softfloat_flag_invalid ); | ||||||
|         if ( isSigNaNA ) return uiA | 0x00400000; |  | ||||||
|     } |     } | ||||||
|     return (isNaNF32UI( uiA ) ? uiA : uiB) | 0x00400000; |     return defaultNaNF32UI; | ||||||
|  |  | ||||||
| } | } | ||||||
|  |  | ||||||
|   | |||||||
| @@ -4,8 +4,8 @@ | |||||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||||
| Package, Release 3e, by John R. Hauser. | Package, Release 3e, by John R. Hauser. | ||||||
|  |  | ||||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of | ||||||
| All rights reserved. | California.  All rights reserved. | ||||||
|  |  | ||||||
| Redistribution and use in source and binary forms, with or without | Redistribution and use in source and binary forms, with or without | ||||||
| modification, are permitted provided that the following conditions are met: | modification, are permitted provided that the following conditions are met: | ||||||
| @@ -34,10 +34,8 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |||||||
|  |  | ||||||
| =============================================================================*/ | =============================================================================*/ | ||||||
|  |  | ||||||
| #include <stdbool.h> |  | ||||||
| #include <stdint.h> | #include <stdint.h> | ||||||
| #include "platform.h" | #include "platform.h" | ||||||
| #include "internals.h" |  | ||||||
| #include "specialize.h" | #include "specialize.h" | ||||||
| #include "softfloat.h" | #include "softfloat.h" | ||||||
|  |  | ||||||
| @@ -50,14 +48,11 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |||||||
| uint_fast64_t | uint_fast64_t | ||||||
|  softfloat_propagateNaNF64UI( uint_fast64_t uiA, uint_fast64_t uiB ) |  softfloat_propagateNaNF64UI( uint_fast64_t uiA, uint_fast64_t uiB ) | ||||||
| { | { | ||||||
|     bool isSigNaNA; |  | ||||||
|  |  | ||||||
|     isSigNaNA = softfloat_isSigNaNF64UI( uiA ); |     if ( softfloat_isSigNaNF64UI( uiA ) || softfloat_isSigNaNF64UI( uiB ) ) { | ||||||
|     if ( isSigNaNA || softfloat_isSigNaNF64UI( uiB ) ) { |  | ||||||
|         softfloat_raiseFlags( softfloat_flag_invalid ); |         softfloat_raiseFlags( softfloat_flag_invalid ); | ||||||
|         if ( isSigNaNA ) return uiA | UINT64_C( 0x0008000000000000 ); |  | ||||||
|     } |     } | ||||||
|     return (isNaNF64UI( uiA ) ? uiA : uiB) | UINT64_C( 0x0008000000000000 ); |     return defaultNaNF64UI; | ||||||
|  |  | ||||||
| } | } | ||||||
|  |  | ||||||
|   | |||||||
| @@ -51,19 +51,19 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |||||||
| | The values to return on conversions to 32-bit integer formats that raise an | | The values to return on conversions to 32-bit integer formats that raise an | ||||||
| | invalid exception. | | invalid exception. | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| #define ui32_fromPosOverflow UINT32_C(0xFFFFFFFF) | #define ui32_fromPosOverflow 0xFFFFFFFF | ||||||
| #define ui32_fromNegOverflow UINT32_C(0x0) | #define ui32_fromNegOverflow 0 | ||||||
| #define ui32_fromNaN UINT32_C(0xFFFFFFFF) | #define ui32_fromNaN 0xFFFFFFFF | ||||||
| #define i32_fromPosOverflow INT64_C(0x7FFFFFFF) | #define i32_fromPosOverflow 0x7FFFFFFF | ||||||
| #define i32_fromNegOverflow (-INT64_C(0x7FFFFFFF) - 1) | #define i32_fromNegOverflow (-0x7FFFFFFF - 1) | ||||||
| #define i32_fromNaN INT64_C(0x7FFFFFFF) | #define i32_fromNaN 0x7FFFFFFF | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | The values to return on conversions to 64-bit integer formats that raise an | | The values to return on conversions to 64-bit integer formats that raise an | ||||||
| | invalid exception. | | invalid exception. | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| #define ui64_fromPosOverflow UINT64_C(0xFFFFFFFFFFFFFFFF) | #define ui64_fromPosOverflow UINT64_C(0xFFFFFFFFFFFFFFFF) | ||||||
| #define ui64_fromNegOverflow UINT64_C(0x0) | #define ui64_fromNegOverflow 0 | ||||||
| #define ui64_fromNaN UINT64_C(0xFFFFFFFFFFFFFFFF) | #define ui64_fromNaN UINT64_C(0xFFFFFFFFFFFFFFFF) | ||||||
| #define i64_fromPosOverflow INT64_C(0x7FFFFFFFFFFFFFFF) | #define i64_fromPosOverflow INT64_C(0x7FFFFFFFFFFFFFFF) | ||||||
| #define i64_fromNegOverflow (-INT64_C(0x7FFFFFFFFFFFFFFF) - 1) | #define i64_fromNegOverflow (-INT64_C(0x7FFFFFFFFFFFFFFF) - 1) | ||||||
| @@ -74,18 +74,13 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |||||||
| | to another. | | to another. | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| struct commonNaN { | struct commonNaN { | ||||||
|     bool sign; |     char _unused; | ||||||
| #ifdef LITTLEENDIAN |  | ||||||
|     uint64_t v0, v64; |  | ||||||
| #else |  | ||||||
|     uint64_t v64, v0; |  | ||||||
| #endif |  | ||||||
| }; | }; | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | The bit pattern for a default generated 16-bit floating-point NaN. | | The bit pattern for a default generated 16-bit floating-point NaN. | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| #define defaultNaNF16UI 0xFE00 | #define defaultNaNF16UI 0x7E00 | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | Returns true when 16-bit unsigned integer 'uiA' has the bit pattern of a | | Returns true when 16-bit unsigned integer 'uiA' has the bit pattern of a | ||||||
| @@ -94,19 +89,38 @@ struct commonNaN { | |||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| #define softfloat_isSigNaNF16UI(uiA) ((((uiA)&0x7E00) == 0x7C00) && ((uiA)&0x01FF)) | #define softfloat_isSigNaNF16UI(uiA) ((((uiA)&0x7E00) == 0x7C00) && ((uiA)&0x01FF)) | ||||||
|  |  | ||||||
|  | /*---------------------------------------------------------------------------- | ||||||
|  | | Returns true when 16-bit unsigned integer 'uiA' has the bit pattern of a | ||||||
|  | | 16-bit brain floating-point (BF16) signaling NaN. | ||||||
|  | | Note:  This macro evaluates its argument more than once. | ||||||
|  | *----------------------------------------------------------------------------*/ | ||||||
|  | #define softfloat_isSigNaNBF16UI(uiA) ((((uiA)&0x7FC0) == 0x7F80) && ((uiA)&0x003F)) | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | Assuming 'uiA' has the bit pattern of a 16-bit floating-point NaN, converts | | Assuming 'uiA' has the bit pattern of a 16-bit floating-point NaN, converts | ||||||
| | this NaN to the common NaN form, and stores the resulting common NaN at the | | this NaN to the common NaN form, and stores the resulting common NaN at the | ||||||
| | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | ||||||
| | exception is raised. | | exception is raised. | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| void softfloat_f16UIToCommonNaN(uint_fast16_t uiA, struct commonNaN* zPtr); | #define softfloat_f16UIToCommonNaN(uiA, zPtr)                                                                                              \ | ||||||
|  |     if(!((uiA)&0x0200))                                                                                                                    \ | ||||||
|  |     softfloat_raiseFlags(softfloat_flag_invalid) | ||||||
|  |  | ||||||
|  | /*---------------------------------------------------------------------------- | ||||||
|  | | Assuming 'uiA' has the bit pattern of a 16-bit BF16 floating-point NaN, converts | ||||||
|  | | this NaN to the common NaN form, and stores the resulting common NaN at the | ||||||
|  | | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | ||||||
|  | | exception is raised. | ||||||
|  | *----------------------------------------------------------------------------*/ | ||||||
|  | #define softfloat_bf16UIToCommonNaN(uiA, zPtr)                                                                                             \ | ||||||
|  |     if(!((uiA)&0x0040))                                                                                                                    \ | ||||||
|  |     softfloat_raiseFlags(softfloat_flag_invalid) | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | Converts the common NaN pointed to by 'aPtr' into a 16-bit floating-point | | Converts the common NaN pointed to by 'aPtr' into a 16-bit floating-point | ||||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. | | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| uint_fast16_t softfloat_commonNaNToF16UI(const struct commonNaN* aPtr); | #define softfloat_commonNaNToF16UI(aPtr) ((uint_fast16_t)defaultNaNF16UI) | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | Interpreting 'uiA' and 'uiB' as the bit patterns of two 16-bit floating- | | Interpreting 'uiA' and 'uiB' as the bit patterns of two 16-bit floating- | ||||||
| @@ -116,6 +130,17 @@ uint_fast16_t softfloat_commonNaNToF16UI(const struct commonNaN* aPtr); | |||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| uint_fast16_t softfloat_propagateNaNF16UI(uint_fast16_t uiA, uint_fast16_t uiB); | uint_fast16_t softfloat_propagateNaNF16UI(uint_fast16_t uiA, uint_fast16_t uiB); | ||||||
|  |  | ||||||
|  | /*---------------------------------------------------------------------------- | ||||||
|  | | The bit pattern for a default generated 16-bit BF16 floating-point NaN. | ||||||
|  | *----------------------------------------------------------------------------*/ | ||||||
|  | #define defaultNaNBF16UI 0x7FC0 | ||||||
|  |  | ||||||
|  | /*---------------------------------------------------------------------------- | ||||||
|  | | Converts the common NaN pointed to by 'aPtr' into a 16-bit floating-point | ||||||
|  | | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||||
|  | *----------------------------------------------------------------------------*/ | ||||||
|  | #define softfloat_commonNaNToBF16UI(aPtr) ((uint_fast16_t)defaultNaNBF16UI) | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | The bit pattern for a default generated 32-bit floating-point NaN. | | The bit pattern for a default generated 32-bit floating-point NaN. | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| @@ -134,13 +159,15 @@ uint_fast16_t softfloat_propagateNaNF16UI(uint_fast16_t uiA, uint_fast16_t uiB); | |||||||
| | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | ||||||
| | exception is raised. | | exception is raised. | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| void softfloat_f32UIToCommonNaN(uint_fast32_t uiA, struct commonNaN* zPtr); | #define softfloat_f32UIToCommonNaN(uiA, zPtr)                                                                                              \ | ||||||
|  |     if(!((uiA)&0x00400000))                                                                                                                \ | ||||||
|  |     softfloat_raiseFlags(softfloat_flag_invalid) | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | Converts the common NaN pointed to by 'aPtr' into a 32-bit floating-point | | Converts the common NaN pointed to by 'aPtr' into a 32-bit floating-point | ||||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. | | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| uint_fast32_t softfloat_commonNaNToF32UI(const struct commonNaN* aPtr); | #define softfloat_commonNaNToF32UI(aPtr) ((uint_fast32_t)defaultNaNF32UI) | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | Interpreting 'uiA' and 'uiB' as the bit patterns of two 32-bit floating- | | Interpreting 'uiA' and 'uiB' as the bit patterns of two 32-bit floating- | ||||||
| @@ -169,13 +196,15 @@ uint_fast32_t softfloat_propagateNaNF32UI(uint_fast32_t uiA, uint_fast32_t uiB); | |||||||
| | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | ||||||
| | exception is raised. | | exception is raised. | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| void softfloat_f64UIToCommonNaN(uint_fast64_t uiA, struct commonNaN* zPtr); | #define softfloat_f64UIToCommonNaN(uiA, zPtr)                                                                                              \ | ||||||
|  |     if(!((uiA)&UINT64_C(0x0008000000000000)))                                                                                              \ | ||||||
|  |     softfloat_raiseFlags(softfloat_flag_invalid) | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | Converts the common NaN pointed to by 'aPtr' into a 64-bit floating-point | | Converts the common NaN pointed to by 'aPtr' into a 64-bit floating-point | ||||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. | | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| uint_fast64_t softfloat_commonNaNToF64UI(const struct commonNaN* aPtr); | #define softfloat_commonNaNToF64UI(aPtr) ((uint_fast64_t)defaultNaNF64UI) | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | Interpreting 'uiA' and 'uiB' as the bit patterns of two 64-bit floating- | | Interpreting 'uiA' and 'uiB' as the bit patterns of two 64-bit floating- | ||||||
| @@ -188,7 +217,7 @@ uint_fast64_t softfloat_propagateNaNF64UI(uint_fast64_t uiA, uint_fast64_t uiB); | |||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | The bit pattern for a default generated 80-bit extended floating-point NaN. | | The bit pattern for a default generated 80-bit extended floating-point NaN. | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| #define defaultNaNExtF80UI64 0xFFFF | #define defaultNaNExtF80UI64 0x7FFF | ||||||
| #define defaultNaNExtF80UI0 UINT64_C(0xC000000000000000) | #define defaultNaNExtF80UI0 UINT64_C(0xC000000000000000) | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| @@ -214,14 +243,26 @@ uint_fast64_t softfloat_propagateNaNF64UI(uint_fast64_t uiA, uint_fast64_t uiB); | |||||||
| | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | ||||||
| | exception is raised. | | exception is raised. | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| void softfloat_extF80UIToCommonNaN(uint_fast16_t uiA64, uint_fast64_t uiA0, struct commonNaN* zPtr); | #define softfloat_extF80UIToCommonNaN(uiA64, uiA0, zPtr)                                                                                   \ | ||||||
|  |     if(!((uiA0)&UINT64_C(0x4000000000000000)))                                                                                             \ | ||||||
|  |     softfloat_raiseFlags(softfloat_flag_invalid) | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | Converts the common NaN pointed to by 'aPtr' into an 80-bit extended | | Converts the common NaN pointed to by 'aPtr' into an 80-bit extended | ||||||
| | floating-point NaN, and returns the bit pattern of this value as an unsigned | | floating-point NaN, and returns the bit pattern of this value as an unsigned | ||||||
| | integer. | | integer. | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
|  | #if defined INLINE && !defined softfloat_commonNaNToExtF80UI | ||||||
|  | INLINE | ||||||
|  | struct uint128 softfloat_commonNaNToExtF80UI(const struct commonNaN* aPtr) { | ||||||
|  |     struct uint128 uiZ; | ||||||
|  |     uiZ.v64 = defaultNaNExtF80UI64; | ||||||
|  |     uiZ.v0 = defaultNaNExtF80UI0; | ||||||
|  |     return uiZ; | ||||||
|  | } | ||||||
|  | #else | ||||||
| struct uint128 softfloat_commonNaNToExtF80UI(const struct commonNaN* aPtr); | struct uint128 softfloat_commonNaNToExtF80UI(const struct commonNaN* aPtr); | ||||||
|  | #endif | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | Interpreting the unsigned integer formed from concatenating 'uiA64' and | | Interpreting the unsigned integer formed from concatenating 'uiA64' and | ||||||
| @@ -237,7 +278,7 @@ struct uint128 softfloat_propagateNaNExtF80UI(uint_fast16_t uiA64, uint_fast64_t | |||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | The bit pattern for a default generated 128-bit floating-point NaN. | | The bit pattern for a default generated 128-bit floating-point NaN. | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| #define defaultNaNF128UI64 UINT64_C(0xFFFF800000000000) | #define defaultNaNF128UI64 UINT64_C(0x7FFF800000000000) | ||||||
| #define defaultNaNF128UI0 UINT64_C(0) | #define defaultNaNF128UI0 UINT64_C(0) | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| @@ -256,13 +297,25 @@ struct uint128 softfloat_propagateNaNExtF80UI(uint_fast16_t uiA64, uint_fast64_t | |||||||
| | pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid exception | | pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid exception | ||||||
| | is raised. | | is raised. | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| void softfloat_f128UIToCommonNaN(uint_fast64_t uiA64, uint_fast64_t uiA0, struct commonNaN* zPtr); | #define softfloat_f128UIToCommonNaN(uiA64, uiA0, zPtr)                                                                                     \ | ||||||
|  |     if(!((uiA64)&UINT64_C(0x0000800000000000)))                                                                                            \ | ||||||
|  |     softfloat_raiseFlags(softfloat_flag_invalid) | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | Converts the common NaN pointed to by 'aPtr' into a 128-bit floating-point | | Converts the common NaN pointed to by 'aPtr' into a 128-bit floating-point | ||||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. | | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
|  | #if defined INLINE && !defined softfloat_commonNaNToF128UI | ||||||
|  | INLINE | ||||||
|  | struct uint128 softfloat_commonNaNToF128UI(const struct commonNaN* aPtr) { | ||||||
|  |     struct uint128 uiZ; | ||||||
|  |     uiZ.v64 = defaultNaNF128UI64; | ||||||
|  |     uiZ.v0 = defaultNaNF128UI0; | ||||||
|  |     return uiZ; | ||||||
|  | } | ||||||
|  | #else | ||||||
| struct uint128 softfloat_commonNaNToF128UI(const struct commonNaN*); | struct uint128 softfloat_commonNaNToF128UI(const struct commonNaN*); | ||||||
|  | #endif | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | Interpreting the unsigned integer formed from concatenating 'uiA64' and | | Interpreting the unsigned integer formed from concatenating 'uiA64' and | ||||||
| @@ -288,14 +341,24 @@ struct uint128 softfloat_propagateNaNF128UI(uint_fast64_t uiA64, uint_fast64_t u | |||||||
| | common NaN at the location pointed to by 'zPtr'.  If the NaN is a signaling | | common NaN at the location pointed to by 'zPtr'.  If the NaN is a signaling | ||||||
| | NaN, the invalid exception is raised. | | NaN, the invalid exception is raised. | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| void softfloat_extF80MToCommonNaN(const struct extFloat80M* aSPtr, struct commonNaN* zPtr); | #define softfloat_extF80MToCommonNaN(aSPtr, zPtr)                                                                                          \ | ||||||
|  |     if(!((aSPtr)->signif & UINT64_C(0x4000000000000000)))                                                                                  \ | ||||||
|  |     softfloat_raiseFlags(softfloat_flag_invalid) | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | Converts the common NaN pointed to by 'aPtr' into an 80-bit extended | | Converts the common NaN pointed to by 'aPtr' into an 80-bit extended | ||||||
| | floating-point NaN, and stores this NaN at the location pointed to by | | floating-point NaN, and stores this NaN at the location pointed to by | ||||||
| | 'zSPtr'. | | 'zSPtr'. | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
|  | #if defined INLINE && !defined softfloat_commonNaNToExtF80M | ||||||
|  | INLINE | ||||||
|  | void softfloat_commonNaNToExtF80M(const struct commonNaN* aPtr, struct extFloat80M* zSPtr) { | ||||||
|  |     zSPtr->signExp = defaultNaNExtF80UI64; | ||||||
|  |     zSPtr->signif = defaultNaNExtF80UI0; | ||||||
|  | } | ||||||
|  | #else | ||||||
| void softfloat_commonNaNToExtF80M(const struct commonNaN* aPtr, struct extFloat80M* zSPtr); | void softfloat_commonNaNToExtF80M(const struct commonNaN* aPtr, struct extFloat80M* zSPtr); | ||||||
|  | #endif | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | Assuming at least one of the two 80-bit extended floating-point values | | Assuming at least one of the two 80-bit extended floating-point values | ||||||
| @@ -308,7 +371,7 @@ void softfloat_propagateNaNExtF80M(const struct extFloat80M* aSPtr, const struct | |||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | The bit pattern for a default generated 128-bit floating-point NaN. | | The bit pattern for a default generated 128-bit floating-point NaN. | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| #define defaultNaNF128UI96 0xFFFF8000 | #define defaultNaNF128UI96 0x7FFF8000 | ||||||
| #define defaultNaNF128UI64 0 | #define defaultNaNF128UI64 0 | ||||||
| #define defaultNaNF128UI32 0 | #define defaultNaNF128UI32 0 | ||||||
| #define defaultNaNF128UI0 0 | #define defaultNaNF128UI0 0 | ||||||
| @@ -321,7 +384,9 @@ void softfloat_propagateNaNExtF80M(const struct extFloat80M* aSPtr, const struct | |||||||
| | four 32-bit elements that concatenate in the platform's normal endian order | | four 32-bit elements that concatenate in the platform's normal endian order | ||||||
| | to form a 128-bit floating-point value. | | to form a 128-bit floating-point value. | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| void softfloat_f128MToCommonNaN(const uint32_t* aWPtr, struct commonNaN* zPtr); | #define softfloat_f128MToCommonNaN(aWPtr, zPtr)                                                                                            \ | ||||||
|  |     if(!((aWPtr)[indexWordHi(4)] & UINT64_C(0x0000800000000000)))                                                                          \ | ||||||
|  |     softfloat_raiseFlags(softfloat_flag_invalid) | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | Converts the common NaN pointed to by 'aPtr' into a 128-bit floating-point | | Converts the common NaN pointed to by 'aPtr' into a 128-bit floating-point | ||||||
| @@ -329,7 +394,17 @@ void softfloat_f128MToCommonNaN(const uint32_t* aWPtr, struct commonNaN* zPtr); | |||||||
| | 'zWPtr' points to an array of four 32-bit elements that concatenate in the | | 'zWPtr' points to an array of four 32-bit elements that concatenate in the | ||||||
| | platform's normal endian order to form a 128-bit floating-point value. | | platform's normal endian order to form a 128-bit floating-point value. | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
|  | #if defined INLINE && !defined softfloat_commonNaNToF128M | ||||||
|  | INLINE | ||||||
|  | void softfloat_commonNaNToF128M(const struct commonNaN* aPtr, uint32_t* zWPtr) { | ||||||
|  |     zWPtr[indexWord(4, 3)] = defaultNaNF128UI96; | ||||||
|  |     zWPtr[indexWord(4, 2)] = defaultNaNF128UI64; | ||||||
|  |     zWPtr[indexWord(4, 1)] = defaultNaNF128UI32; | ||||||
|  |     zWPtr[indexWord(4, 0)] = defaultNaNF128UI0; | ||||||
|  | } | ||||||
|  | #else | ||||||
| void softfloat_commonNaNToF128M(const struct commonNaN* aPtr, uint32_t* zWPtr); | void softfloat_commonNaNToF128M(const struct commonNaN* aPtr, uint32_t* zWPtr); | ||||||
|  | #endif | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | Assuming at least one of the two 128-bit floating-point values pointed to by | | Assuming at least one of the two 128-bit floating-point values pointed to by | ||||||
|   | |||||||
							
								
								
									
										51
									
								
								softfloat/source/bf16_isSignalingNaN.c
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										51
									
								
								softfloat/source/bf16_isSignalingNaN.c
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,51 @@ | |||||||
|  |  | ||||||
|  | /*============================================================================ | ||||||
|  |  | ||||||
|  | This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||||
|  | Package, Release 3e, by John R. Hauser. | ||||||
|  |  | ||||||
|  | Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of | ||||||
|  | California.  All rights reserved. | ||||||
|  |  | ||||||
|  | Redistribution and use in source and binary forms, with or without | ||||||
|  | modification, are permitted provided that the following conditions are met: | ||||||
|  |  | ||||||
|  |  1. Redistributions of source code must retain the above copyright notice, | ||||||
|  |     this list of conditions, and the following disclaimer. | ||||||
|  |  | ||||||
|  |  2. Redistributions in binary form must reproduce the above copyright notice, | ||||||
|  |     this list of conditions, and the following disclaimer in the documentation | ||||||
|  |     and/or other materials provided with the distribution. | ||||||
|  |  | ||||||
|  |  3. Neither the name of the University nor the names of its contributors may | ||||||
|  |     be used to endorse or promote products derived from this software without | ||||||
|  |     specific prior written permission. | ||||||
|  |  | ||||||
|  | THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY | ||||||
|  | EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | ||||||
|  | WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE | ||||||
|  | DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY | ||||||
|  | DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | ||||||
|  | (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | ||||||
|  | LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND | ||||||
|  | ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | ||||||
|  | (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||||
|  | SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||||
|  |  | ||||||
|  | =============================================================================*/ | ||||||
|  |  | ||||||
|  | #include <stdbool.h> | ||||||
|  | #include "platform.h" | ||||||
|  | #include "internals.h" | ||||||
|  | #include "specialize.h" | ||||||
|  | #include "softfloat.h" | ||||||
|  |  | ||||||
|  | bool bf16_isSignalingNaN( bfloat16_t a ) | ||||||
|  | { | ||||||
|  |     union ui16_bf16 uA; | ||||||
|  |  | ||||||
|  |     uA.f = a; | ||||||
|  |     return softfloat_isSigNaNBF16UI( uA.ui ); | ||||||
|  |  | ||||||
|  | } | ||||||
|  |  | ||||||
							
								
								
									
										90
									
								
								softfloat/source/bf16_to_f32.c
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										90
									
								
								softfloat/source/bf16_to_f32.c
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,90 @@ | |||||||
|  |  | ||||||
|  | /*============================================================================ | ||||||
|  |  | ||||||
|  | This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||||
|  | Package, Release 3e, by John R. Hauser. | ||||||
|  |  | ||||||
|  | Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of | ||||||
|  | California.  All rights reserved. | ||||||
|  |  | ||||||
|  | Redistribution and use in source and binary forms, with or without | ||||||
|  | modification, are permitted provided that the following conditions are met: | ||||||
|  |  | ||||||
|  |  1. Redistributions of source code must retain the above copyright notice, | ||||||
|  |     this list of conditions, and the following disclaimer. | ||||||
|  |  | ||||||
|  |  2. Redistributions in binary form must reproduce the above copyright notice, | ||||||
|  |     this list of conditions, and the following disclaimer in the documentation | ||||||
|  |     and/or other materials provided with the distribution. | ||||||
|  |  | ||||||
|  |  3. Neither the name of the University nor the names of its contributors may | ||||||
|  |     be used to endorse or promote products derived from this software without | ||||||
|  |     specific prior written permission. | ||||||
|  |  | ||||||
|  | THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY | ||||||
|  | EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | ||||||
|  | WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE | ||||||
|  | DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY | ||||||
|  | DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | ||||||
|  | (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | ||||||
|  | LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND | ||||||
|  | ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | ||||||
|  | (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||||
|  | SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||||
|  |  | ||||||
|  | =============================================================================*/ | ||||||
|  |  | ||||||
|  | #include <stdbool.h> | ||||||
|  | #include <stdint.h> | ||||||
|  | #include "platform.h" | ||||||
|  | #include "internals.h" | ||||||
|  | #include "specialize.h" | ||||||
|  | #include "softfloat.h" | ||||||
|  |  | ||||||
|  | float32_t bf16_to_f32( bfloat16_t a ) | ||||||
|  | { | ||||||
|  |     union ui16_bf16 uA; | ||||||
|  |     uint_fast16_t uiA; | ||||||
|  |     bool sign; | ||||||
|  |     int_fast16_t exp; | ||||||
|  |     uint_fast16_t frac; | ||||||
|  |     struct commonNaN commonNaN; | ||||||
|  |     uint_fast32_t uiZ; | ||||||
|  |     struct exp8_sig16 normExpSig; | ||||||
|  |     union ui32_f32 uZ; | ||||||
|  |  | ||||||
|  |     /*------------------------------------------------------------------------ | ||||||
|  |     *------------------------------------------------------------------------*/ | ||||||
|  |     uA.f = a; | ||||||
|  |     uiA = uA.ui; | ||||||
|  |     sign = signBF16UI( uiA ); | ||||||
|  |     exp  = expBF16UI( uiA ); | ||||||
|  |     frac = fracBF16UI( uiA ); | ||||||
|  |     /*------------------------------------------------------------------------ | ||||||
|  |     *------------------------------------------------------------------------*/ | ||||||
|  |     // NaN or Inf | ||||||
|  |     if ( exp == 0xFF ) { | ||||||
|  |         if ( frac ) { | ||||||
|  |             softfloat_bf16UIToCommonNaN( uiA, &commonNaN ); | ||||||
|  |             uiZ = softfloat_commonNaNToF32UI( &commonNaN ); | ||||||
|  |         } else { | ||||||
|  |             uiZ = packToF32UI( sign, 0xFF, 0 ); | ||||||
|  |         } | ||||||
|  |         goto uiZ; | ||||||
|  |     } | ||||||
|  |     /*------------------------------------------------------------------------ | ||||||
|  |     *------------------------------------------------------------------------*/ | ||||||
|  |     // packToF32UI simply packs bitfields without any numerical change | ||||||
|  |     // which means it can be used directly for any BF16 to f32 conversions which | ||||||
|  |     // does not require bits manipulation | ||||||
|  |     // (that is everything where the 16-bit are just padded right with 16 zeros, including | ||||||
|  |     //  subnormal numbers) | ||||||
|  |     uiZ = packToF32UI( sign, exp, ((uint_fast32_t) frac) <<16 ); | ||||||
|  |  uiZ: | ||||||
|  |     uZ.ui = uiZ; | ||||||
|  |     return uZ.f; | ||||||
|  |  | ||||||
|  | } | ||||||
|  |  | ||||||
|  |  | ||||||
|  |  | ||||||
							
								
								
									
										105
									
								
								softfloat/source/f32_to_bf16.c
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										105
									
								
								softfloat/source/f32_to_bf16.c
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,105 @@ | |||||||
|  |  | ||||||
|  | /*============================================================================ | ||||||
|  |  | ||||||
|  | This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||||
|  | Package, Release 3e, by John R. Hauser. | ||||||
|  |  | ||||||
|  | Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of | ||||||
|  | California.  All rights reserved. | ||||||
|  |  | ||||||
|  | Redistribution and use in source and binary forms, with or without | ||||||
|  | modification, are permitted provided that the following conditions are met: | ||||||
|  |  | ||||||
|  |  1. Redistributions of source code must retain the above copyright notice, | ||||||
|  |     this list of conditions, and the following disclaimer. | ||||||
|  |  | ||||||
|  |  2. Redistributions in binary form must reproduce the above copyright notice, | ||||||
|  |     this list of conditions, and the following disclaimer in the documentation | ||||||
|  |     and/or other materials provided with the distribution. | ||||||
|  |  | ||||||
|  |  3. Neither the name of the University nor the names of its contributors may | ||||||
|  |     be used to endorse or promote products derived from this software without | ||||||
|  |     specific prior written permission. | ||||||
|  |  | ||||||
|  | THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY | ||||||
|  | EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | ||||||
|  | WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE | ||||||
|  | DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY | ||||||
|  | DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | ||||||
|  | (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | ||||||
|  | LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND | ||||||
|  | ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | ||||||
|  | (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||||
|  | SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||||
|  |  | ||||||
|  | =============================================================================*/ | ||||||
|  |  | ||||||
|  | #include <stdbool.h> | ||||||
|  | #include <stdint.h> | ||||||
|  | #include "platform.h" | ||||||
|  | #include "internals.h" | ||||||
|  | #include "specialize.h" | ||||||
|  | #include "softfloat.h" | ||||||
|  |  | ||||||
|  | #include <inttypes.h> | ||||||
|  | #include <stdio.h> | ||||||
|  |  | ||||||
|  | bfloat16_t f32_to_bf16( float32_t a ) | ||||||
|  | { | ||||||
|  |     union ui32_f32 uA; | ||||||
|  |     uint_fast32_t uiA; | ||||||
|  |     bool sign; | ||||||
|  |     int_fast16_t exp; | ||||||
|  |     uint_fast32_t frac; | ||||||
|  |     struct commonNaN commonNaN; | ||||||
|  |     uint_fast16_t uiZ, frac16; | ||||||
|  |     union ui16_bf16 uZ; | ||||||
|  |  | ||||||
|  |     /*------------------------------------------------------------------------ | ||||||
|  |     *------------------------------------------------------------------------*/ | ||||||
|  |     uA.f = a; | ||||||
|  |     uiA = uA.ui; | ||||||
|  |     sign = signF32UI( uiA ); | ||||||
|  |     exp  = expF32UI( uiA ); | ||||||
|  |     frac = fracF32UI( uiA ); | ||||||
|  |     /*------------------------------------------------------------------------ | ||||||
|  |     *------------------------------------------------------------------------*/ | ||||||
|  |     // infinity or NaN cases | ||||||
|  |     if ( exp == 0xFF ) { | ||||||
|  |         if ( frac ) { | ||||||
|  |             // NaN case | ||||||
|  |             softfloat_f32UIToCommonNaN( uiA, &commonNaN ); | ||||||
|  |             uiZ = softfloat_commonNaNToBF16UI( &commonNaN ); | ||||||
|  |         } else { | ||||||
|  |             // infinity case | ||||||
|  |             uiZ = packToBF16UI( sign, 0xFF, 0 ); | ||||||
|  |         } | ||||||
|  |         goto uiZ; | ||||||
|  |     } | ||||||
|  |     /*------------------------------------------------------------------------ | ||||||
|  |     *------------------------------------------------------------------------*/ | ||||||
|  |     // frac is a 24-bit mantissa, right shifted by 9 | ||||||
|  |     // In the normal case, (24-9) = 15 are set  | ||||||
|  |     frac16 = frac>>9 | ((frac & 0x1FF) != 0); | ||||||
|  |     if ( ! (exp | frac16) ) { | ||||||
|  |         uiZ = packToBF16UI( sign, 0, 0 ); | ||||||
|  |         goto uiZ; | ||||||
|  |     } | ||||||
|  |     /*------------------------------------------------------------------------ | ||||||
|  |     *------------------------------------------------------------------------*/ | ||||||
|  |     // softfloat_roundPackToBF16 exponent argument (2nd argument) | ||||||
|  |     // must correspond to the exponent of fracIn[13] bits | ||||||
|  |     // (fracIn is the 3rd and last argument)  | ||||||
|  |     uint_fast32_t mask = exp ? 0x4000 : 0x0; // implicit one mask added if input is a normal number | ||||||
|  |     // exponent for the lowest normal and largest subnormal should be equal | ||||||
|  |     // but is not in IEEE encoding so mantissa must be partially normalized | ||||||
|  |     // (by one bit) for subnormal numbers. Such that (exp - 1) corresponds | ||||||
|  |     // to the exponent of frac16[13] | ||||||
|  |     frac16 = frac16 << (exp ? 0 : 1); | ||||||
|  |     return softfloat_roundPackToBF16( sign, exp - 1, frac16 | mask ); | ||||||
|  |  uiZ: | ||||||
|  |     uZ.ui = uiZ; | ||||||
|  |     return uZ.f; | ||||||
|  |  | ||||||
|  | } | ||||||
|  |  | ||||||
| @@ -72,6 +72,9 @@ float16_t f32_to_f16( float32_t a ) | |||||||
|     } |     } | ||||||
|     /*------------------------------------------------------------------------ |     /*------------------------------------------------------------------------ | ||||||
|     *------------------------------------------------------------------------*/ |     *------------------------------------------------------------------------*/ | ||||||
|  |     // frac is a 24-bit significand, the bottom 9 bits LSB are extracted and OR-red | ||||||
|  |     // into a sticky flag, the top 15 MSBs are extracted, the LSB of this top slice | ||||||
|  |     // is OR-red with the sticky  | ||||||
|     frac16 = frac>>9 | ((frac & 0x1FF) != 0); |     frac16 = frac>>9 | ((frac & 0x1FF) != 0); | ||||||
|     if ( ! (exp | frac16) ) { |     if ( ! (exp | frac16) ) { | ||||||
|         uiZ = packToF16UI( sign, 0, 0 ); |         uiZ = packToF16UI( sign, 0, 0 ); | ||||||
|   | |||||||
| @@ -46,6 +46,10 @@ union ui16_f16 { | |||||||
|     uint16_t ui; |     uint16_t ui; | ||||||
|     float16_t f; |     float16_t f; | ||||||
| }; | }; | ||||||
|  | union ui16_bf16 { | ||||||
|  |     uint16_t ui; | ||||||
|  |     bfloat16_t f; | ||||||
|  | }; | ||||||
| union ui32_f32 { | union ui32_f32 { | ||||||
|     uint32_t ui; |     uint32_t ui; | ||||||
|     float32_t f; |     float32_t f; | ||||||
| @@ -108,6 +112,18 @@ float16_t softfloat_addMagsF16(uint_fast16_t, uint_fast16_t); | |||||||
| float16_t softfloat_subMagsF16(uint_fast16_t, uint_fast16_t); | float16_t softfloat_subMagsF16(uint_fast16_t, uint_fast16_t); | ||||||
| float16_t softfloat_mulAddF16(uint_fast16_t, uint_fast16_t, uint_fast16_t, uint_fast8_t); | float16_t softfloat_mulAddF16(uint_fast16_t, uint_fast16_t, uint_fast16_t, uint_fast8_t); | ||||||
|  |  | ||||||
|  | /*---------------------------------------------------------------------------- | ||||||
|  |  *----------------------------------------------------------------------------*/ | ||||||
|  | #define signBF16UI(a) ((bool)((uint16_t)(a) >> 15)) | ||||||
|  | #define expBF16UI(a) ((int_fast16_t)((a) >> 7) & 0xFF) | ||||||
|  | #define fracBF16UI(a) ((a)&0x07F) | ||||||
|  | #define packToBF16UI(sign, exp, sig) (((uint16_t)(sign) << 15) + ((uint16_t)(exp) << 7) + (sig)) | ||||||
|  |  | ||||||
|  | #define isNaNBF16UI(a) (((~(a)&0x7FC0) == 0) && ((a)&0x07F)) | ||||||
|  |  | ||||||
|  | bfloat16_t softfloat_roundPackToBF16(bool, int_fast16_t, uint_fast16_t); | ||||||
|  | struct exp8_sig16 softfloat_normSubnormalBF16Sig(uint_fast16_t); | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
|  *----------------------------------------------------------------------------*/ |  *----------------------------------------------------------------------------*/ | ||||||
| #define signF32UI(a) ((bool)((uint32_t)(a) >> 31)) | #define signF32UI(a) ((bool)((uint32_t)(a) >> 31)) | ||||||
|   | |||||||
| @@ -76,13 +76,13 @@ enum { | |||||||
| | Software floating-point exception flags. | | Software floating-point exception flags. | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
| extern THREAD_LOCAL uint_fast8_t softfloat_exceptionFlags; | extern THREAD_LOCAL uint_fast8_t softfloat_exceptionFlags; | ||||||
| enum { | typedef enum { | ||||||
|     softfloat_flag_inexact = 1, |     softfloat_flag_inexact = 1, | ||||||
|     softfloat_flag_underflow = 2, |     softfloat_flag_underflow = 2, | ||||||
|     softfloat_flag_overflow = 4, |     softfloat_flag_overflow = 4, | ||||||
|     softfloat_flag_infinite = 8, |     softfloat_flag_infinite = 8, | ||||||
|     softfloat_flag_invalid = 16 |     softfloat_flag_invalid = 16 | ||||||
| }; | } exceptionFlag_t; | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | Routine to raise any or all of the software floating-point exception flags. | | Routine to raise any or all of the software floating-point exception flags. | ||||||
| @@ -164,6 +164,13 @@ bool f16_le_quiet(float16_t, float16_t); | |||||||
| bool f16_lt_quiet(float16_t, float16_t); | bool f16_lt_quiet(float16_t, float16_t); | ||||||
| bool f16_isSignalingNaN(float16_t); | bool f16_isSignalingNaN(float16_t); | ||||||
|  |  | ||||||
|  | /*---------------------------------------------------------------------------- | ||||||
|  | | 16-bit (brain float 16) floating-point operations. | ||||||
|  | *----------------------------------------------------------------------------*/ | ||||||
|  | float32_t bf16_to_f32(bfloat16_t); | ||||||
|  | bfloat16_t f32_to_bf16(float32_t); | ||||||
|  | bool bf16_isSignalingNaN(bfloat16_t); | ||||||
|  |  | ||||||
| /*---------------------------------------------------------------------------- | /*---------------------------------------------------------------------------- | ||||||
| | 32-bit (single-precision) floating-point operations. | | 32-bit (single-precision) floating-point operations. | ||||||
| *----------------------------------------------------------------------------*/ | *----------------------------------------------------------------------------*/ | ||||||
|   | |||||||
| @@ -50,6 +50,9 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |||||||
| typedef struct { | typedef struct { | ||||||
|     uint16_t v; |     uint16_t v; | ||||||
| } float16_t; | } float16_t; | ||||||
|  | typedef struct { | ||||||
|  |     uint16_t v; | ||||||
|  | } bfloat16_t; | ||||||
| typedef struct { | typedef struct { | ||||||
|     uint32_t v; |     uint32_t v; | ||||||
| } float32_t; | } float32_t; | ||||||
|   | |||||||
| @@ -221,4 +221,3 @@ float32_t | |||||||
|     return uZ.f; |     return uZ.f; | ||||||
|  |  | ||||||
| } | } | ||||||
|  |  | ||||||
|   | |||||||
							
								
								
									
										52
									
								
								softfloat/source/s_normSubnormalBF16Sig.c
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										52
									
								
								softfloat/source/s_normSubnormalBF16Sig.c
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,52 @@ | |||||||
|  |  | ||||||
|  | /*============================================================================ | ||||||
|  |  | ||||||
|  | This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||||
|  | Package, Release 3e, by John R. Hauser. | ||||||
|  |  | ||||||
|  | Copyright 2011, 2012, 2013, 2014, 2015, 2016 The Regents of the University of | ||||||
|  | California.  All rights reserved. | ||||||
|  |  | ||||||
|  | Redistribution and use in source and binary forms, with or without | ||||||
|  | modification, are permitted provided that the following conditions are met: | ||||||
|  |  | ||||||
|  |  1. Redistributions of source code must retain the above copyright notice, | ||||||
|  |     this list of conditions, and the following disclaimer. | ||||||
|  |  | ||||||
|  |  2. Redistributions in binary form must reproduce the above copyright notice, | ||||||
|  |     this list of conditions, and the following disclaimer in the documentation | ||||||
|  |     and/or other materials provided with the distribution. | ||||||
|  |  | ||||||
|  |  3. Neither the name of the University nor the names of its contributors may | ||||||
|  |     be used to endorse or promote products derived from this software without | ||||||
|  |     specific prior written permission. | ||||||
|  |  | ||||||
|  | THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY | ||||||
|  | EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | ||||||
|  | WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE | ||||||
|  | DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY | ||||||
|  | DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | ||||||
|  | (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | ||||||
|  | LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND | ||||||
|  | ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | ||||||
|  | (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||||
|  | SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||||
|  |  | ||||||
|  | =============================================================================*/ | ||||||
|  |  | ||||||
|  | #include <stdint.h> | ||||||
|  | #include "platform.h" | ||||||
|  | #include "internals.h" | ||||||
|  |  | ||||||
|  | struct exp8_sig16 softfloat_normSubnormalBF16Sig( uint_fast16_t sig ) | ||||||
|  | { | ||||||
|  |     int_fast8_t shiftDist; | ||||||
|  |     struct exp8_sig16 z; | ||||||
|  |  | ||||||
|  |     shiftDist = softfloat_countLeadingZeros16( sig ) - 8; | ||||||
|  |     z.exp = 1 - shiftDist; | ||||||
|  |     z.sig = sig<<shiftDist; | ||||||
|  |     return z; | ||||||
|  |  | ||||||
|  | } | ||||||
|  |  | ||||||
							
								
								
									
										114
									
								
								softfloat/source/s_roundPackToBF16.c
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										114
									
								
								softfloat/source/s_roundPackToBF16.c
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,114 @@ | |||||||
|  |  | ||||||
|  | /*============================================================================ | ||||||
|  |  | ||||||
|  | This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||||
|  | Package, Release 3e, by John R. Hauser. | ||||||
|  |  | ||||||
|  | Copyright 2011, 2012, 2013, 2014, 2015, 2017 The Regents of the University of | ||||||
|  | California.  All rights reserved. | ||||||
|  |  | ||||||
|  | Redistribution and use in source and binary forms, with or without | ||||||
|  | modification, are permitted provided that the following conditions are met: | ||||||
|  |  | ||||||
|  |  1. Redistributions of source code must retain the above copyright notice, | ||||||
|  |     this list of conditions, and the following disclaimer. | ||||||
|  |  | ||||||
|  |  2. Redistributions in binary form must reproduce the above copyright notice, | ||||||
|  |     this list of conditions, and the following disclaimer in the documentation | ||||||
|  |     and/or other materials provided with the distribution. | ||||||
|  |  | ||||||
|  |  3. Neither the name of the University nor the names of its contributors may | ||||||
|  |     be used to endorse or promote products derived from this software without | ||||||
|  |     specific prior written permission. | ||||||
|  |  | ||||||
|  | THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY | ||||||
|  | EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | ||||||
|  | WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE | ||||||
|  | DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY | ||||||
|  | DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | ||||||
|  | (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | ||||||
|  | LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND | ||||||
|  | ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | ||||||
|  | (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||||
|  | SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||||
|  |  | ||||||
|  | =============================================================================*/ | ||||||
|  |  | ||||||
|  | #include <stdbool.h> | ||||||
|  | #include <stdint.h> | ||||||
|  | #include "platform.h" | ||||||
|  | #include "internals.h" | ||||||
|  | #include "softfloat.h" | ||||||
|  |  | ||||||
|  | /** sig last significant bit is sig[7], the 7 LSBs will be used for rounding */ | ||||||
|  | bfloat16_t | ||||||
|  |  softfloat_roundPackToBF16( bool sign, int_fast16_t exp, uint_fast16_t sig ) | ||||||
|  | { | ||||||
|  |     uint_fast8_t roundingMode; | ||||||
|  |     bool roundNearEven; | ||||||
|  |     uint_fast8_t roundIncrement, roundBits; | ||||||
|  |     bool isTiny; | ||||||
|  |     uint_fast16_t uiZ; | ||||||
|  |     union ui16_bf16 uZ; | ||||||
|  |  | ||||||
|  |     /*------------------------------------------------------------------------ | ||||||
|  |     *------------------------------------------------------------------------*/ | ||||||
|  |     roundingMode = softfloat_roundingMode; | ||||||
|  |     roundNearEven = (roundingMode == softfloat_round_near_even); | ||||||
|  |     roundIncrement = 0x40; | ||||||
|  |     if ( ! roundNearEven && (roundingMode != softfloat_round_near_maxMag) ) { | ||||||
|  |         roundIncrement = | ||||||
|  |             (roundingMode | ||||||
|  |                  == (sign ? softfloat_round_min : softfloat_round_max)) | ||||||
|  |                 ? 0x7F | ||||||
|  |                 : 0; | ||||||
|  |     } | ||||||
|  |     roundBits = sig & 0x7F; | ||||||
|  |     /*------------------------------------------------------------------------ | ||||||
|  |     *------------------------------------------------------------------------*/ | ||||||
|  |     if ( 0xFD <= (unsigned int) exp ) { | ||||||
|  |         if ( exp < 0 ) { | ||||||
|  |             /*---------------------------------------------------------------- | ||||||
|  |             *----------------------------------------------------------------*/ | ||||||
|  |             isTiny = | ||||||
|  |                 (softfloat_detectTininess == softfloat_tininess_beforeRounding) | ||||||
|  |                     || (exp < -1) || (sig + roundIncrement < 0x8000); | ||||||
|  |             sig = softfloat_shiftRightJam32( sig, -exp ); | ||||||
|  |             exp = 0; | ||||||
|  |             roundBits = sig & 0x7F; | ||||||
|  |             if ( isTiny && roundBits ) { | ||||||
|  |                 softfloat_raiseFlags( softfloat_flag_underflow ); | ||||||
|  |             } | ||||||
|  |         } else if ( (0xFD < exp) || (0x8000 <= sig + roundIncrement) ) { | ||||||
|  |             /*---------------------------------------------------------------- | ||||||
|  |             *----------------------------------------------------------------*/ | ||||||
|  |             softfloat_raiseFlags( | ||||||
|  |                 softfloat_flag_overflow | softfloat_flag_inexact ); | ||||||
|  |             uiZ = packToBF16UI( sign, 0xFF, 0 ) - ! roundIncrement; | ||||||
|  |             goto uiZ; | ||||||
|  |         } | ||||||
|  |     } | ||||||
|  |     /*------------------------------------------------------------------------ | ||||||
|  |     *------------------------------------------------------------------------*/ | ||||||
|  |     sig = (sig + roundIncrement)>>7; | ||||||
|  |     if ( roundBits ) { | ||||||
|  |         softfloat_exceptionFlags |= softfloat_flag_inexact; | ||||||
|  | #ifdef SOFTFLOAT_ROUND_ODD | ||||||
|  |         if ( roundingMode == softfloat_round_odd ) { | ||||||
|  |             sig |= 1; | ||||||
|  |             goto packReturn; | ||||||
|  |         } | ||||||
|  | #endif | ||||||
|  |     } | ||||||
|  |     sig &= ~(uint_fast16_t) (! (roundBits ^ 0x40) & roundNearEven); | ||||||
|  |     if ( ! sig ) exp = 0; | ||||||
|  |     /*------------------------------------------------------------------------ | ||||||
|  |     *------------------------------------------------------------------------*/ | ||||||
|  |  packReturn: | ||||||
|  |     uiZ = packToBF16UI( sign, exp, sig ); | ||||||
|  |  uiZ: | ||||||
|  |     uZ.ui = uiZ; | ||||||
|  |     return uZ.f; | ||||||
|  |  | ||||||
|  | } | ||||||
|  |  | ||||||
							
								
								
									
										69
									
								
								src/elfio.cpp
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										69
									
								
								src/elfio.cpp
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,69 @@ | |||||||
|  | /******************************************************************************* | ||||||
|  |  * Copyright (C) 2024 MINRES Technologies GmbH | ||||||
|  |  * All rights reserved. | ||||||
|  |  * | ||||||
|  |  * Redistribution and use in source and binary forms, with or without | ||||||
|  |  * modification, are permitted provided that the following conditions are met: | ||||||
|  |  * | ||||||
|  |  * 1. Redistributions of source code must retain the above copyright notice, | ||||||
|  |  *    this list of conditions and the following disclaimer. | ||||||
|  |  * | ||||||
|  |  * 2. Redistributions in binary form must reproduce the above copyright notice, | ||||||
|  |  *    this list of conditions and the following disclaimer in the documentation | ||||||
|  |  *    and/or other materials provided with the distribution. | ||||||
|  |  * | ||||||
|  |  * 3. Neither the name of the copyright holder nor the names of its contributors | ||||||
|  |  *    may be used to endorse or promote products derived from this software | ||||||
|  |  *    without specific prior written permission. | ||||||
|  |  * | ||||||
|  |  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | ||||||
|  |  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | ||||||
|  |  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | ||||||
|  |  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE | ||||||
|  |  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR | ||||||
|  |  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF | ||||||
|  |  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS | ||||||
|  |  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN | ||||||
|  |  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) | ||||||
|  |  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE | ||||||
|  |  * POSSIBILITY OF SUCH DAMAGE. | ||||||
|  |  * | ||||||
|  |  * Contributors: | ||||||
|  |  *       eyck@minres.com - initial implementation | ||||||
|  |  ******************************************************************************/ | ||||||
|  |  | ||||||
|  | #ifdef _MSC_VER | ||||||
|  | #define _SCL_SECURE_NO_WARNINGS | ||||||
|  | #define ELFIO_NO_INTTYPES | ||||||
|  | #endif | ||||||
|  |  | ||||||
|  | #include <elfio/elfio_dump.hpp> | ||||||
|  | #include <iostream> | ||||||
|  |  | ||||||
|  | using namespace ELFIO; | ||||||
|  |  | ||||||
|  | int main(int argc, char** argv) { | ||||||
|  |     if(argc != 2) { | ||||||
|  |         printf("Usage: elfdump <file_name>\n"); | ||||||
|  |         return 1; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     elfio reader; | ||||||
|  |  | ||||||
|  |     if(!reader.load(argv[1])) { | ||||||
|  |         printf("File %s is not found or it is not an ELF file\n", argv[1]); | ||||||
|  |         return 1; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     dump::header(std::cout, reader); | ||||||
|  |     dump::section_headers(std::cout, reader); | ||||||
|  |     dump::segment_headers(std::cout, reader); | ||||||
|  |     dump::symbol_tables(std::cout, reader); | ||||||
|  |     dump::notes(std::cout, reader); | ||||||
|  |     dump::modinfo(std::cout, reader); | ||||||
|  |     dump::dynamic_tags(std::cout, reader); | ||||||
|  |     dump::section_datas(std::cout, reader); | ||||||
|  |     dump::segment_datas(std::cout, reader); | ||||||
|  |  | ||||||
|  |     return 0; | ||||||
|  | } | ||||||
| @@ -51,8 +51,8 @@ public: | |||||||
|     virtual ~hwl() = default; |     virtual ~hwl() = default; | ||||||
|  |  | ||||||
| protected: | protected: | ||||||
|     iss::status read_custom_csr_reg(unsigned addr, reg_t& val) override; |     iss::status read_custom_csr(unsigned addr, reg_t& val) override; | ||||||
|     iss::status write_custom_csr_reg(unsigned addr, reg_t val) override; |     iss::status write_custom_csr(unsigned addr, reg_t val) override; | ||||||
| }; | }; | ||||||
|  |  | ||||||
| template <typename BASE> | template <typename BASE> | ||||||
| @@ -68,7 +68,7 @@ inline hwl<BASE>::hwl(feature_config cfg) | |||||||
|     } |     } | ||||||
| } | } | ||||||
|  |  | ||||||
| template <typename BASE> inline iss::status iss::arch::hwl<BASE>::read_custom_csr_reg(unsigned addr, reg_t& val) { | template <typename BASE> inline iss::status iss::arch::hwl<BASE>::read_custom_csr(unsigned addr, reg_t& val) { | ||||||
|     switch(addr) { |     switch(addr) { | ||||||
|     case 0x800: |     case 0x800: | ||||||
|         val = this->reg.lpstart0; |         val = this->reg.lpstart0; | ||||||
| @@ -92,7 +92,7 @@ template <typename BASE> inline iss::status iss::arch::hwl<BASE>::read_custom_cs | |||||||
|     return iss::Ok; |     return iss::Ok; | ||||||
| } | } | ||||||
|  |  | ||||||
| template <typename BASE> inline iss::status iss::arch::hwl<BASE>::write_custom_csr_reg(unsigned addr, reg_t val) { | template <typename BASE> inline iss::status iss::arch::hwl<BASE>::write_custom_csr(unsigned addr, reg_t val) { | ||||||
|     switch(addr) { |     switch(addr) { | ||||||
|     case 0x800: |     case 0x800: | ||||||
|         this->reg.lpstart0 = val; |         this->reg.lpstart0 = val; | ||||||
|   | |||||||
							
								
								
									
										233
									
								
								src/iss/arch/mstatus.h
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										233
									
								
								src/iss/arch/mstatus.h
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,233 @@ | |||||||
|  | /******************************************************************************* | ||||||
|  |  * Copyright (C) 2025 MINRES Technologies GmbH | ||||||
|  |  * All rights reserved. | ||||||
|  |  * | ||||||
|  |  * Redistribution and use in source and binary forms, with or without | ||||||
|  |  * modification, are permitted provided that the following conditions are met: | ||||||
|  |  * | ||||||
|  |  * 1. Redistributions of source code must retain the above copyright notice, | ||||||
|  |  *    this list of conditions and the following disclaimer. | ||||||
|  |  * | ||||||
|  |  * 2. Redistributions in binary form must reproduce the above copyright notice, | ||||||
|  |  *    this list of conditions and the following disclaimer in the documentation | ||||||
|  |  *    and/or other materials provided with the distribution. | ||||||
|  |  * | ||||||
|  |  * 3. Neither the name of the copyright holder nor the names of its contributors | ||||||
|  |  *    may be used to endorse or promote products derived from this software | ||||||
|  |  *    without specific prior written permission. | ||||||
|  |  * | ||||||
|  |  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | ||||||
|  |  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | ||||||
|  |  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | ||||||
|  |  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE | ||||||
|  |  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR | ||||||
|  |  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF | ||||||
|  |  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS | ||||||
|  |  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN | ||||||
|  |  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) | ||||||
|  |  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE | ||||||
|  |  * POSSIBILITY OF SUCH DAMAGE. | ||||||
|  |  * | ||||||
|  |  * Contributors: | ||||||
|  |  *       eyck@minres.com - initial implementation | ||||||
|  |  ******************************************************************************/ | ||||||
|  | #ifndef _MSTATUS_TYPE | ||||||
|  | #define _MSTATUS_TYPE | ||||||
|  |  | ||||||
|  | #include <cstdint> | ||||||
|  | #include <type_traits> | ||||||
|  | #include <util/bit_field.h> | ||||||
|  | #include <util/ities.h> | ||||||
|  |  | ||||||
|  | namespace iss { | ||||||
|  | namespace arch { | ||||||
|  |  | ||||||
|  | template <class T, class Enable = void> struct status {}; | ||||||
|  | // specialization 32bit | ||||||
|  | template <typename T> struct status<T, typename std::enable_if<std::is_same<T, uint32_t>::value>::type> { | ||||||
|  |     static inline unsigned SD(T v) { return bit_sub<63, 1>(v); } | ||||||
|  |     // value of XLEN for S-mode | ||||||
|  |     static inline unsigned SXL(T v) { return bit_sub<34, 2>(v); }; | ||||||
|  |     // value of XLEN for U-mode | ||||||
|  |     static inline unsigned UXL(T v) { return bit_sub<32, 2>(v); }; | ||||||
|  |     // Trap SRET | ||||||
|  |     static inline unsigned TSR(T v) { return bit_sub<22, 1>(v); }; | ||||||
|  |     // Timeout Wait | ||||||
|  |     static inline unsigned TW(T v) { return bit_sub<21, 1>(v); }; | ||||||
|  |     // Trap Virtual Memory | ||||||
|  |     static inline unsigned TVM(T v) { return bit_sub<20, 1>(v); }; | ||||||
|  |     // Make eXecutable Readable | ||||||
|  |     static inline unsigned MXR(T v) { return bit_sub<19, 1>(v); }; | ||||||
|  |     // permit Supervisor User Memory access | ||||||
|  |     static inline unsigned SUM(T v) { return bit_sub<18, 1>(v); }; | ||||||
|  |     // Modify PRiVilege | ||||||
|  |     static inline unsigned MPRV(T v) { return bit_sub<17, 1>(v); }; | ||||||
|  |     // status of additional user-mode extensions and associated state, All off/None dirty or clean, some on/None | ||||||
|  |     // dirty, some clean/Some dirty | ||||||
|  |     static inline unsigned XS(T v) { return bit_sub<15, 2>(v); }; | ||||||
|  |     // floating-point unit status Off/Initial/Clean/Dirty | ||||||
|  |     static inline unsigned FS(T v) { return bit_sub<13, 2>(v); }; | ||||||
|  |     // machine previous privilege | ||||||
|  |     static inline unsigned MPP(T v) { return bit_sub<11, 2>(v); }; | ||||||
|  |     // supervisor previous privilege | ||||||
|  |     static inline unsigned SPP(T v) { return bit_sub<8, 1>(v); }; | ||||||
|  |     // previous machine interrupt-enable | ||||||
|  |     static inline unsigned MPIE(T v) { return bit_sub<7, 1>(v); }; | ||||||
|  |     // previous supervisor interrupt-enable | ||||||
|  |     static inline unsigned SPIE(T v) { return bit_sub<5, 1>(v); }; | ||||||
|  |     // previous user interrupt-enable | ||||||
|  |     static inline unsigned UPIE(T v) { return bit_sub<4, 1>(v); }; | ||||||
|  |     // machine interrupt-enable | ||||||
|  |     static inline unsigned MIE(T v) { return bit_sub<3, 1>(v); }; | ||||||
|  |     // supervisor interrupt-enable | ||||||
|  |     static inline unsigned SIE(T v) { return bit_sub<1, 1>(v); }; | ||||||
|  |     // user interrupt-enable | ||||||
|  |     static inline unsigned UIE(T v) { return bit_sub<0, 1>(v); }; | ||||||
|  | }; | ||||||
|  |  | ||||||
|  | template <typename T> struct status<T, typename std::enable_if<std::is_same<T, uint64_t>::value>::type> { | ||||||
|  | public: | ||||||
|  |     // SD bit is read-only and is set when either the FS or XS bits encode a Dirty state (i.e., SD=((FS==11) OR | ||||||
|  |     // XS==11))) | ||||||
|  |     static inline unsigned SD(T v) { return bit_sub<63, 1>(v); }; | ||||||
|  |     // value of XLEN for S-mode | ||||||
|  |     static inline unsigned SXL(T v) { return bit_sub<34, 2>(v); }; | ||||||
|  |     // value of XLEN for U-mode | ||||||
|  |     static inline unsigned UXL(T v) { return bit_sub<32, 2>(v); }; | ||||||
|  |     // Trap SRET | ||||||
|  |     static inline unsigned TSR(T v) { return bit_sub<22, 1>(v); }; | ||||||
|  |     // Timeout Wait | ||||||
|  |     static inline unsigned TW(T v) { return bit_sub<21, 1>(v); }; | ||||||
|  |     // Trap Virtual Memory | ||||||
|  |     static inline unsigned TVM(T v) { return bit_sub<20, 1>(v); }; | ||||||
|  |     // Make eXecutable Readable | ||||||
|  |     static inline unsigned MXR(T v) { return bit_sub<19, 1>(v); }; | ||||||
|  |     // permit Supervisor User Memory access | ||||||
|  |     static inline unsigned SUM(T v) { return bit_sub<18, 1>(v); }; | ||||||
|  |     // Modify PRiVilege | ||||||
|  |     static inline unsigned MPRV(T v) { return bit_sub<17, 1>(v); }; | ||||||
|  |     // status of additional user-mode extensions and associated state, All off/None dirty or clean, some on/None | ||||||
|  |     // dirty, some clean/Some dirty | ||||||
|  |     static inline unsigned XS(T v) { return bit_sub<15, 2>(v); }; | ||||||
|  |     // floating-point unit status Off/Initial/Clean/Dirty | ||||||
|  |     static inline unsigned FS(T v) { return bit_sub<13, 2>(v); }; | ||||||
|  |     // machine previous privilege | ||||||
|  |     static inline unsigned MPP(T v) { return bit_sub<11, 2>(v); }; | ||||||
|  |     // supervisor previous privilege | ||||||
|  |     static inline unsigned SPP(T v) { return bit_sub<8, 1>(v); }; | ||||||
|  |     // previous machine interrupt-enable | ||||||
|  |     static inline unsigned MPIE(T v) { return bit_sub<7, 1>(v); }; | ||||||
|  |     // previous supervisor interrupt-enable | ||||||
|  |     static inline unsigned SPIE(T v) { return bit_sub<5, 1>(v); }; | ||||||
|  |     // previous user interrupt-enable | ||||||
|  |     static inline unsigned UPIE(T v) { return bit_sub<4, 1>(v); }; | ||||||
|  |     // machine interrupt-enable | ||||||
|  |     static inline unsigned MIE(T v) { return bit_sub<3, 1>(v); }; | ||||||
|  |     // supervisor interrupt-enable | ||||||
|  |     static inline unsigned SIE(T v) { return bit_sub<1, 1>(v); }; | ||||||
|  |     // user interrupt-enable | ||||||
|  |     static inline unsigned UIE(T v) { return bit_sub<0, 1>(v); }; | ||||||
|  | }; | ||||||
|  |  | ||||||
|  | // primary template | ||||||
|  | template <class T, class Enable = void> struct hart_state {}; | ||||||
|  | // specialization 32bit | ||||||
|  | template <typename T> class hart_state<T, typename std::enable_if<std::is_same<T, uint32_t>::value>::type> { | ||||||
|  | public: | ||||||
|  |     BEGIN_BF_DECL(mstatus_t, T); | ||||||
|  |     // SD bit is read-only and is set when either the FS or XS bits encode a Dirty state (i.e., SD=((FS==11) OR | ||||||
|  |     // XS==11))) | ||||||
|  |     BF_FIELD(SD, 31, 1); | ||||||
|  |     // Trap SRET | ||||||
|  |     BF_FIELD(TSR, 22, 1); | ||||||
|  |     // Timeout Wait | ||||||
|  |     BF_FIELD(TW, 21, 1); | ||||||
|  |     // Trap Virtual Memory | ||||||
|  |     BF_FIELD(TVM, 20, 1); | ||||||
|  |     // Make eXecutable Readable | ||||||
|  |     BF_FIELD(MXR, 19, 1); | ||||||
|  |     // permit Supervisor User Memory access | ||||||
|  |     BF_FIELD(SUM, 18, 1); | ||||||
|  |     // Modify PRiVilege | ||||||
|  |     BF_FIELD(MPRV, 17, 1); | ||||||
|  |     // status of additional user-mode extensions and associated state, All off/None dirty or clean, some on/None | ||||||
|  |     // dirty, some clean/Some dirty | ||||||
|  |     BF_FIELD(XS, 15, 2); | ||||||
|  |     // floating-point unit status Off/Initial/Clean/Dirty | ||||||
|  |     BF_FIELD(FS, 13, 2); | ||||||
|  |     // machine previous privilege | ||||||
|  |     BF_FIELD(MPP, 11, 2); | ||||||
|  |     // supervisor previous privilege | ||||||
|  |     BF_FIELD(SPP, 8, 1); | ||||||
|  |     // previous machine interrupt-enable | ||||||
|  |     BF_FIELD(MPIE, 7, 1); | ||||||
|  |     // previous supervisor interrupt-enable | ||||||
|  |     BF_FIELD(SPIE, 5, 1); | ||||||
|  |     // previous user interrupt-enable | ||||||
|  |     BF_FIELD(UPIE, 4, 1); | ||||||
|  |     // machine interrupt-enable | ||||||
|  |     BF_FIELD(MIE, 3, 1); | ||||||
|  |     // supervisor interrupt-enable | ||||||
|  |     BF_FIELD(SIE, 1, 1); | ||||||
|  |     // user interrupt-enable | ||||||
|  |     BF_FIELD(UIE, 0, 1); | ||||||
|  |     END_BF_DECL(); | ||||||
|  |  | ||||||
|  |     mstatus_t mstatus; | ||||||
|  |  | ||||||
|  |     static const T mstatus_reset_val = 0x1800; | ||||||
|  | }; | ||||||
|  |  | ||||||
|  | // specialization 64bit | ||||||
|  | template <typename T> class hart_state<T, typename std::enable_if<std::is_same<T, uint64_t>::value>::type> { | ||||||
|  | public: | ||||||
|  |     BEGIN_BF_DECL(mstatus_t, T); | ||||||
|  |     // SD bit is read-only and is set when either the FS or XS bits encode a Dirty state (i.e., SD=((FS==11) OR | ||||||
|  |     // XS==11))) | ||||||
|  |     BF_FIELD(SD, 63, 1); | ||||||
|  |     // value of XLEN for S-mode | ||||||
|  |     BF_FIELD(SXL, 34, 2); | ||||||
|  |     // value of XLEN for U-mode | ||||||
|  |     BF_FIELD(UXL, 32, 2); | ||||||
|  |     // Trap SRET | ||||||
|  |     BF_FIELD(TSR, 22, 1); | ||||||
|  |     // Timeout Wait | ||||||
|  |     BF_FIELD(TW, 21, 1); | ||||||
|  |     // Trap Virtual Memory | ||||||
|  |     BF_FIELD(TVM, 20, 1); | ||||||
|  |     // Make eXecutable Readable | ||||||
|  |     BF_FIELD(MXR, 19, 1); | ||||||
|  |     // permit Supervisor User Memory access | ||||||
|  |     BF_FIELD(SUM, 18, 1); | ||||||
|  |     // Modify PRiVilege | ||||||
|  |     BF_FIELD(MPRV, 17, 1); | ||||||
|  |     // status of additional user-mode extensions and associated state, All off/None dirty or clean, some on/None | ||||||
|  |     // dirty, some clean/Some dirty | ||||||
|  |     BF_FIELD(XS, 15, 2); | ||||||
|  |     // floating-point unit status Off/Initial/Clean/Dirty | ||||||
|  |     BF_FIELD(FS, 13, 2); | ||||||
|  |     // machine previous privilege | ||||||
|  |     BF_FIELD(MPP, 11, 2); | ||||||
|  |     // supervisor previous privilege | ||||||
|  |     BF_FIELD(SPP, 8, 1); | ||||||
|  |     // previous machine interrupt-enable | ||||||
|  |     BF_FIELD(MPIE, 7, 1); | ||||||
|  |     // previous supervisor interrupt-enable | ||||||
|  |     BF_FIELD(SPIE, 5, 1); | ||||||
|  |     // previous user interrupt-enable | ||||||
|  |     BF_FIELD(UPIE, 4, 1); | ||||||
|  |     // machine interrupt-enable | ||||||
|  |     BF_FIELD(MIE, 3, 1); | ||||||
|  |     // supervisor interrupt-enable | ||||||
|  |     BF_FIELD(SIE, 1, 1); | ||||||
|  |     // user interrupt-enable | ||||||
|  |     BF_FIELD(UIE, 0, 1); | ||||||
|  |     END_BF_DECL(); | ||||||
|  |  | ||||||
|  |     mstatus_t mstatus; | ||||||
|  |  | ||||||
|  |     static const T mstatus_reset_val = 0x1800; | ||||||
|  | }; | ||||||
|  | } // namespace arch | ||||||
|  | } // namespace iss | ||||||
|  | #endif // _MSTATUS_TYPE | ||||||
| @@ -1,5 +1,5 @@ | |||||||
| /******************************************************************************* | /******************************************************************************* | ||||||
|  * Copyright (C) 2017, 2018, 2021 MINRES Technologies GmbH |  * Copyright (C) 2017 - 2025 MINRES Technologies GmbH | ||||||
|  * All rights reserved. |  * All rights reserved. | ||||||
|  * |  * | ||||||
|  * Redistribution and use in source and binary forms, with or without |  * Redistribution and use in source and binary forms, with or without | ||||||
| @@ -35,21 +35,38 @@ | |||||||
| #ifndef _RISCV_HART_COMMON | #ifndef _RISCV_HART_COMMON | ||||||
| #define _RISCV_HART_COMMON | #define _RISCV_HART_COMMON | ||||||
|  |  | ||||||
|  | #include "mstatus.h" | ||||||
|  | #include "util/delegate.h" | ||||||
|  | #include <absl/container/flat_hash_map.h> | ||||||
|  | #include <array> | ||||||
| #include <cstdint> | #include <cstdint> | ||||||
| #include <elfio/elfio.hpp> | #include <elfio/elfio.hpp> | ||||||
| #include <fmt/format.h> | #include <fmt/format.h> | ||||||
|  | #include <iss/arch/traits.h> | ||||||
| #include <iss/arch_if.h> | #include <iss/arch_if.h> | ||||||
| #include <iss/log_categories.h> | #include <iss/log_categories.h> | ||||||
|  | #include <iss/mem/memory_if.h> | ||||||
|  | #include <iss/semihosting/semihosting.h> | ||||||
|  | #include <iss/vm_types.h> | ||||||
|  | #include <limits> | ||||||
|  | #include <sstream> | ||||||
| #include <string> | #include <string> | ||||||
| #include <unordered_map> | #include <unordered_map> | ||||||
| #include <util/logging.h> | #include <util/logging.h> | ||||||
|  | #include <util/sparse_array.h> | ||||||
|  |  | ||||||
|  | #if defined(__GNUC__) | ||||||
|  | #define likely(x) ::__builtin_expect(!!(x), 1) | ||||||
|  | #define unlikely(x) ::__builtin_expect(!!(x), 0) | ||||||
|  | #else | ||||||
|  | #define likely(x) x | ||||||
|  | #define unlikely(x) x | ||||||
|  | #endif | ||||||
|  |  | ||||||
| namespace iss { | namespace iss { | ||||||
| namespace arch { | namespace arch { | ||||||
|  |  | ||||||
| enum { tohost_dflt = 0xF0001000, fromhost_dflt = 0xF0001040 }; | enum features_e { FEAT_NONE, FEAT_EXT_N = 1, FEAT_DEBUG = 2 }; | ||||||
|  |  | ||||||
| enum features_e { FEAT_NONE, FEAT_PMP = 1, FEAT_EXT_N = 2, FEAT_CLIC = 4, FEAT_DEBUG = 8, FEAT_TCM = 16 }; |  | ||||||
|  |  | ||||||
| enum riscv_csr { | enum riscv_csr { | ||||||
|     /* user-level CSR */ |     /* user-level CSR */ | ||||||
| @@ -178,26 +195,19 @@ enum riscv_csr { | |||||||
|     dcsr = 0x7B0, |     dcsr = 0x7B0, | ||||||
|     dpc = 0x7B1, |     dpc = 0x7B1, | ||||||
|     dscratch0 = 0x7B2, |     dscratch0 = 0x7B2, | ||||||
|     dscratch1 = 0x7B3 |     dscratch1 = 0x7B3, | ||||||
|  |     // vector CSR | ||||||
|  |     //  URW | ||||||
|  |     vstart = 0x008, | ||||||
|  |     vxsat = 0x009, | ||||||
|  |     vxrm = 0x00A, | ||||||
|  |     vcsr = 0x00F, | ||||||
|  |     // URO | ||||||
|  |     vl = 0xC20, | ||||||
|  |     vtype = 0xC21, | ||||||
|  |     vlenb = 0xC22, | ||||||
| }; | }; | ||||||
|  |  | ||||||
| enum { |  | ||||||
|     PGSHIFT = 12, |  | ||||||
|     PTE_PPN_SHIFT = 10, |  | ||||||
|     // page table entry (PTE) fields |  | ||||||
|     PTE_V = 0x001,   // Valid |  | ||||||
|     PTE_R = 0x002,   // Read |  | ||||||
|     PTE_W = 0x004,   // Write |  | ||||||
|     PTE_X = 0x008,   // Execute |  | ||||||
|     PTE_U = 0x010,   // User |  | ||||||
|     PTE_G = 0x020,   // Global |  | ||||||
|     PTE_A = 0x040,   // Accessed |  | ||||||
|     PTE_D = 0x080,   // Dirty |  | ||||||
|     PTE_SOFT = 0x300 // Reserved for Software |  | ||||||
| }; |  | ||||||
|  |  | ||||||
| template <typename T> inline bool PTE_TABLE(T PTE) { return (((PTE) & (PTE_V | PTE_R | PTE_W | PTE_X)) == PTE_V); } |  | ||||||
|  |  | ||||||
| enum { PRIV_U = 0, PRIV_S = 1, PRIV_M = 3, PRIV_D = 4 }; | enum { PRIV_U = 0, PRIV_S = 1, PRIV_M = 3, PRIV_D = 4 }; | ||||||
|  |  | ||||||
| enum { | enum { | ||||||
| @@ -216,25 +226,6 @@ enum { | |||||||
|     ISA_U = 1 << 20 |     ISA_U = 1 << 20 | ||||||
| }; | }; | ||||||
|  |  | ||||||
| struct vm_info { |  | ||||||
|     int levels; |  | ||||||
|     int idxbits; |  | ||||||
|     int ptesize; |  | ||||||
|     uint64_t ptbase; |  | ||||||
|     bool is_active() { return levels; } |  | ||||||
| }; |  | ||||||
|  |  | ||||||
| struct feature_config { |  | ||||||
|     uint64_t clic_base{0xc0000000}; |  | ||||||
|     unsigned clic_int_ctl_bits{4}; |  | ||||||
|     unsigned clic_num_irq{16}; |  | ||||||
|     unsigned clic_num_trigger{0}; |  | ||||||
|     uint64_t tcm_base{0x10000000}; |  | ||||||
|     uint64_t tcm_size{0x8000}; |  | ||||||
|     uint64_t io_address{0xf0000000}; |  | ||||||
|     uint64_t io_addr_mask{0xf0000000}; |  | ||||||
| }; |  | ||||||
|  |  | ||||||
| class trap_load_access_fault : public trap_access { | class trap_load_access_fault : public trap_access { | ||||||
| public: | public: | ||||||
|     trap_load_access_fault(uint64_t badaddr) |     trap_load_access_fault(uint64_t badaddr) | ||||||
| @@ -261,76 +252,189 @@ public: | |||||||
|     : trap_access(15 << 16, badaddr) {} |     : trap_access(15 << 16, badaddr) {} | ||||||
| }; | }; | ||||||
|  |  | ||||||
| inline void read_reg_uint32(uint64_t offs, uint32_t& reg, uint8_t* const data, unsigned length) { | template <typename WORD_TYPE> struct priv_if { | ||||||
|     auto reg_ptr = reinterpret_cast<uint8_t*>(®); |     using rd_csr_f = std::function<iss::status(unsigned addr, WORD_TYPE&)>; | ||||||
|     switch(offs & 0x3) { |     using wr_csr_f = std::function<iss::status(unsigned addr, WORD_TYPE)>; | ||||||
|     case 0: |  | ||||||
|         for(auto i = 0U; i < length; ++i) |     std::function<iss::status(unsigned, WORD_TYPE&)> read_csr; | ||||||
|             *(data + i) = *(reg_ptr + i); |     std::function<iss::status(unsigned, WORD_TYPE)> write_csr; | ||||||
|         break; |     std::function<iss::status(uint8_t const*)> exec_htif; | ||||||
|     case 1: |     std::function<void(uint16_t, uint16_t, WORD_TYPE)> raise_trap; // trap_id, cause, fault_data | ||||||
|         for(auto i = 0U; i < length; ++i) |     absl::flat_hash_map<unsigned, rd_csr_f>& csr_rd_cb; | ||||||
|             *(data + i) = *(reg_ptr + 1 + i); |     absl::flat_hash_map<unsigned, wr_csr_f>& csr_wr_cb; | ||||||
|         break; |     hart_state<WORD_TYPE>& state; | ||||||
|     case 2: |     uint8_t& PRIV; | ||||||
|         for(auto i = 0U; i < length; ++i) |     WORD_TYPE& PC; | ||||||
|             *(data + i) = *(reg_ptr + 2 + i); |     uint64_t& tohost; | ||||||
|         break; |     uint64_t& fromhost; | ||||||
|     case 3: |     unsigned& max_irq; | ||||||
|         *data = *(reg_ptr + 3); | }; | ||||||
|         break; |  | ||||||
|  | template <typename BASE, typename LOGCAT = logging::disass> struct riscv_hart_common : public BASE, public mem::memory_elem { | ||||||
|  |     const std::array<const char, 4> lvl = {{'U', 'S', 'H', 'M'}}; | ||||||
|  |     const std::array<const char*, 16> trap_str = {{"" | ||||||
|  |                                                    "Instruction address misaligned", // 0 | ||||||
|  |                                                    "Instruction access fault",       // 1 | ||||||
|  |                                                    "Illegal instruction",            // 2 | ||||||
|  |                                                    "Breakpoint",                     // 3 | ||||||
|  |                                                    "Load address misaligned",        // 4 | ||||||
|  |                                                    "Load access fault",              // 5 | ||||||
|  |                                                    "Store/AMO address misaligned",   // 6 | ||||||
|  |                                                    "Store/AMO access fault",         // 7 | ||||||
|  |                                                    "Environment call from U-mode",   // 8 | ||||||
|  |                                                    "Environment call from S-mode",   // 9 | ||||||
|  |                                                    "Reserved",                       // a | ||||||
|  |                                                    "Environment call from M-mode",   // b | ||||||
|  |                                                    "Instruction page fault",         // c | ||||||
|  |                                                    "Load page fault",                // d | ||||||
|  |                                                    "Reserved",                       // e | ||||||
|  |                                                    "Store/AMO page fault"}}; | ||||||
|  |     const std::array<const char*, 12> irq_str = {{"User software interrupt", "Supervisor software interrupt", "Reserved", | ||||||
|  |                                                   "Machine software interrupt", "User timer interrupt", "Supervisor timer interrupt", | ||||||
|  |                                                   "Reserved", "Machine timer interrupt", "User external interrupt", | ||||||
|  |                                                   "Supervisor external interrupt", "Reserved", "Machine external interrupt"}}; | ||||||
|  |     constexpr static unsigned MEM = traits<BASE>::MEM; | ||||||
|  |  | ||||||
|  |     using core = BASE; | ||||||
|  |     using this_class = riscv_hart_common<BASE, LOGCAT>; | ||||||
|  |     using phys_addr_t = typename core::phys_addr_t; | ||||||
|  |     using reg_t = typename core::reg_t; | ||||||
|  |     using addr_t = typename core::addr_t; | ||||||
|  |  | ||||||
|  |     using rd_csr_f = std::function<iss::status(unsigned addr, reg_t&)>; | ||||||
|  |     using wr_csr_f = std::function<iss::status(unsigned addr, reg_t)>; | ||||||
|  |  | ||||||
|  | #define MK_CSR_RD_CB(FCT) [this](unsigned a, reg_t& r) -> iss::status { return this->FCT(a, r); }; | ||||||
|  | #define MK_CSR_WR_CB(FCT) [this](unsigned a, reg_t r) -> iss::status { return this->FCT(a, r); }; | ||||||
|  |  | ||||||
|  |     riscv_hart_common() | ||||||
|  |     : state() | ||||||
|  |     , instr_if(*this) { | ||||||
|  |         // reset values | ||||||
|  |         csr[misa] = traits<BASE>::MISA_VAL; | ||||||
|  |         csr[mvendorid] = 0x669; | ||||||
|  |         csr[marchid] = traits<BASE>::MARCHID_VAL; | ||||||
|  |         csr[mimpid] = 1; | ||||||
|  |  | ||||||
|  |         if(traits<BASE>::FLEN > 0) { | ||||||
|  |             csr_rd_cb[fcsr] = MK_CSR_RD_CB(read_fcsr); | ||||||
|  |             csr_wr_cb[fcsr] = MK_CSR_WR_CB(write_fcsr); | ||||||
|  |             csr_rd_cb[fflags] = MK_CSR_RD_CB(read_fcsr); | ||||||
|  |             csr_wr_cb[fflags] = MK_CSR_WR_CB(write_fcsr); | ||||||
|  |             csr_rd_cb[frm] = MK_CSR_RD_CB(read_fcsr); | ||||||
|  |             csr_wr_cb[frm] = MK_CSR_WR_CB(write_fcsr); | ||||||
|  |         } | ||||||
|  |         if(traits<BASE>::V_REGS_SIZE > 0) { | ||||||
|  |             csr_rd_cb[vstart] = MK_CSR_RD_CB(read_vstart); | ||||||
|  |             csr_wr_cb[vstart] = MK_CSR_WR_CB(write_vstart); | ||||||
|  |             csr_rd_cb[vxsat] = MK_CSR_RD_CB(read_vxsat); | ||||||
|  |             csr_wr_cb[vxsat] = MK_CSR_WR_CB(write_vxsat); | ||||||
|  |             csr_rd_cb[vxrm] = MK_CSR_RD_CB(read_vxrm); | ||||||
|  |             csr_wr_cb[vxrm] = MK_CSR_WR_CB(write_vxrm); | ||||||
|  |             csr_rd_cb[vcsr] = MK_CSR_RD_CB(read_vcsr); | ||||||
|  |             csr_wr_cb[vcsr] = MK_CSR_WR_CB(write_vcsr); | ||||||
|  |             csr_rd_cb[vl] = MK_CSR_RD_CB(read_vl); | ||||||
|  |             csr_rd_cb[vtype] = MK_CSR_RD_CB(read_vtype); | ||||||
|  |             csr_rd_cb[vlenb] = MK_CSR_RD_CB(read_vlenb); | ||||||
|  |         } | ||||||
|  |         for(unsigned addr = mhpmcounter3; addr <= mhpmcounter31; ++addr) { | ||||||
|  |             csr_rd_cb[addr] = MK_CSR_RD_CB(read_null); | ||||||
|  |             csr_wr_cb[addr] = MK_CSR_WR_CB(write_plain); | ||||||
|  |         } | ||||||
|  |         if(traits<BASE>::XLEN == 32) | ||||||
|  |             for(unsigned addr = mhpmcounter3h; addr <= mhpmcounter31h; ++addr) { | ||||||
|  |                 csr_rd_cb[addr] = MK_CSR_RD_CB(read_null); | ||||||
|  |                 csr_wr_cb[addr] = MK_CSR_WR_CB(write_plain); | ||||||
|  |             } | ||||||
|  |         for(unsigned addr = mhpmevent3; addr <= mhpmevent31; ++addr) { | ||||||
|  |             csr_rd_cb[addr] = MK_CSR_RD_CB(read_null); | ||||||
|  |             csr_wr_cb[addr] = MK_CSR_WR_CB(write_plain); | ||||||
|  |         } | ||||||
|  |         for(unsigned addr = hpmcounter3; addr <= hpmcounter31; ++addr) { | ||||||
|  |             csr_rd_cb[addr] = MK_CSR_RD_CB(read_null); | ||||||
|  |         } | ||||||
|  |         if(traits<BASE>::XLEN == 32) | ||||||
|  |             for(unsigned addr = hpmcounter3h; addr <= hpmcounter31h; ++addr) { | ||||||
|  |                 csr_rd_cb[addr] = MK_CSR_RD_CB(read_null); | ||||||
|  |             } | ||||||
|  |         // common regs | ||||||
|  |         const std::array<unsigned, 4> roaddrs{{misa, mvendorid, marchid, mimpid}}; | ||||||
|  |         for(auto addr : roaddrs) { | ||||||
|  |             csr_rd_cb[addr] = MK_CSR_RD_CB(read_plain); | ||||||
|  |             csr_wr_cb[addr] = MK_CSR_WR_CB(write_null); | ||||||
|  |         } | ||||||
|  |         // special handling & overrides | ||||||
|  |         csr_rd_cb[time] = MK_CSR_RD_CB(read_time); | ||||||
|  |         if(traits<BASE>::XLEN == 32) | ||||||
|  |             csr_rd_cb[timeh] = MK_CSR_RD_CB(read_time); | ||||||
|  |         csr_rd_cb[cycle] = MK_CSR_RD_CB(read_cycle); | ||||||
|  |         if(traits<BASE>::XLEN == 32) | ||||||
|  |             csr_rd_cb[cycleh] = MK_CSR_RD_CB(read_cycle); | ||||||
|  |         csr_rd_cb[instret] = MK_CSR_RD_CB(read_instret); | ||||||
|  |         if(traits<BASE>::XLEN == 32) | ||||||
|  |             csr_rd_cb[instreth] = MK_CSR_RD_CB(read_instret); | ||||||
|  |  | ||||||
|  |         csr_rd_cb[mcycle] = MK_CSR_RD_CB(read_cycle); | ||||||
|  |         csr_wr_cb[mcycle] = MK_CSR_WR_CB(write_cycle); | ||||||
|  |         if(traits<BASE>::XLEN == 32) | ||||||
|  |             csr_rd_cb[mcycleh] = MK_CSR_RD_CB(read_cycle); | ||||||
|  |         if(traits<BASE>::XLEN == 32) | ||||||
|  |             csr_wr_cb[mcycleh] = MK_CSR_WR_CB(write_cycle); | ||||||
|  |         csr_rd_cb[minstret] = MK_CSR_RD_CB(read_instret); | ||||||
|  |         csr_wr_cb[minstret] = MK_CSR_WR_CB(write_instret); | ||||||
|  |         if(traits<BASE>::XLEN == 32) | ||||||
|  |             csr_rd_cb[minstreth] = MK_CSR_RD_CB(read_instret); | ||||||
|  |         if(traits<BASE>::XLEN == 32) | ||||||
|  |             csr_wr_cb[minstreth] = MK_CSR_WR_CB(write_instret); | ||||||
|  |         csr_rd_cb[mhartid] = MK_CSR_RD_CB(read_hartid); | ||||||
|  |     }; | ||||||
|  |  | ||||||
|  |     ~riscv_hart_common() { | ||||||
|  |         if(io_buf.str().length()) { | ||||||
|  |             CPPLOG(INFO) << "tohost send '" << io_buf.str() << "'"; | ||||||
|         } |         } | ||||||
|     } |     } | ||||||
|  |  | ||||||
| inline void write_reg_uint32(uint64_t offs, uint32_t& reg, const uint8_t* const data, unsigned length) { |  | ||||||
|     auto reg_ptr = reinterpret_cast<uint8_t*>(®); |  | ||||||
|     switch(offs & 0x3) { |  | ||||||
|     case 0: |  | ||||||
|         for(auto i = 0U; i < length; ++i) |  | ||||||
|             *(reg_ptr + i) = *(data + i); |  | ||||||
|         break; |  | ||||||
|     case 1: |  | ||||||
|         for(auto i = 0U; i < length; ++i) |  | ||||||
|             *(reg_ptr + 1 + i) = *(data + i); |  | ||||||
|         break; |  | ||||||
|     case 2: |  | ||||||
|         for(auto i = 0U; i < length; ++i) |  | ||||||
|             *(reg_ptr + 2 + i) = *(data + i); |  | ||||||
|         break; |  | ||||||
|     case 3: |  | ||||||
|         *(reg_ptr + 3) = *data; |  | ||||||
|         break; |  | ||||||
|     } |  | ||||||
| } |  | ||||||
| struct riscv_hart_common { |  | ||||||
|     riscv_hart_common(){}; |  | ||||||
|     ~riscv_hart_common(){}; |  | ||||||
|     std::unordered_map<std::string, uint64_t> symbol_table; |     std::unordered_map<std::string, uint64_t> symbol_table; | ||||||
|  |     uint64_t entry_address{0}; | ||||||
|  |     uint64_t tohost = std::numeric_limits<uint64_t>::max(); | ||||||
|  |     uint64_t fromhost = std::numeric_limits<uint64_t>::max(); | ||||||
|  |     std::stringstream io_buf; | ||||||
|  |  | ||||||
|     std::unordered_map<std::string, uint64_t> get_sym_table(std::string name) { |     void set_semihosting_callback(semihosting_cb_t<reg_t> cb) { semihosting_cb = cb; }; | ||||||
|         if(!symbol_table.empty()) |  | ||||||
|             return symbol_table; |     std::pair<uint64_t, bool> load_file(std::string name, int type) { | ||||||
|         FILE* fp = fopen(name.c_str(), "r"); |         return std::make_pair(entry_address, read_elf_file(name, sizeof(reg_t) == 4 ? ELFIO::ELFCLASS32 : ELFIO::ELFCLASS64)); | ||||||
|         if(fp) { |     } | ||||||
|             std::array<char, 5> buf; |  | ||||||
|             auto n = fread(buf.data(), 1, 4, fp); |     bool read_elf_file(std::string name, uint8_t expected_elf_class) { | ||||||
|             fclose(fp); |  | ||||||
|             if(n != 4) |  | ||||||
|                 throw std::runtime_error("input file has insufficient size"); |  | ||||||
|             buf[4] = 0; |  | ||||||
|             if(strcmp(buf.data() + 1, "ELF") == 0) { |  | ||||||
|         // Create elfio reader |         // Create elfio reader | ||||||
|         ELFIO::elfio reader; |         ELFIO::elfio reader; | ||||||
|         // Load ELF data |         // Load ELF data | ||||||
|                 if(!reader.load(name)) |         if(reader.load(name)) { | ||||||
|                     throw std::runtime_error("could not process elf file"); |  | ||||||
|             // check elf properties |             // check elf properties | ||||||
|                 if(reader.get_type() != ET_EXEC) |             if(reader.get_class() != expected_elf_class) { | ||||||
|                     throw std::runtime_error("wrong elf type in file"); |                 CPPLOG(ERR) << "ISA missmatch, selected XLEN does not match supplied file "; | ||||||
|                 if(reader.get_machine() != EM_RISCV) |                 return false; | ||||||
|                     throw std::runtime_error("wrong elf machine in file"); |             } | ||||||
|  |             if(reader.get_type() != ELFIO::ET_EXEC) | ||||||
|  |                 return false; | ||||||
|  |             if(reader.get_machine() != ELFIO::EM_RISCV) | ||||||
|  |                 return false; | ||||||
|  |             entry_address = reader.get_entry(); | ||||||
|  |             for(const auto& pseg : reader.segments) { | ||||||
|  |                 const auto fsize = pseg->get_file_size(); // 0x42c/0x0 | ||||||
|  |                 const auto seg_data = pseg->get_data(); | ||||||
|  |                 const auto type = pseg->get_type(); | ||||||
|  |                 if(type == ELFIO::PT_LOAD && fsize > 0) { | ||||||
|  |                     auto res = this->write(iss::address_type::PHYSICAL, iss::access_type::DEBUG_WRITE, traits<BASE>::MEM, | ||||||
|  |                                            pseg->get_physical_address(), fsize, reinterpret_cast<const uint8_t* const>(seg_data)); | ||||||
|  |                     if(res != iss::Ok) | ||||||
|  |                         CPPLOG(ERR) << "problem writing " << fsize << "bytes to 0x" << std::hex << pseg->get_physical_address(); | ||||||
|  |                 } | ||||||
|  |             } | ||||||
|             const auto sym_sec = reader.sections[".symtab"]; |             const auto sym_sec = reader.sections[".symtab"]; | ||||||
|                 if(SHT_SYMTAB == sym_sec->get_type() || SHT_DYNSYM == sym_sec->get_type()) { |             if(ELFIO::SHT_SYMTAB == sym_sec->get_type() || ELFIO::SHT_DYNSYM == sym_sec->get_type()) { | ||||||
|                 ELFIO::symbol_section_accessor symbols(reader, sym_sec); |                 ELFIO::symbol_section_accessor symbols(reader, sym_sec); | ||||||
|                 auto sym_no = symbols.get_symbols_num(); |                 auto sym_no = symbols.get_symbols_num(); | ||||||
|                 std::string name; |                 std::string name; | ||||||
| @@ -349,13 +453,459 @@ struct riscv_hart_common { | |||||||
| #endif | #endif | ||||||
|                     } |                     } | ||||||
|                 } |                 } | ||||||
|  |                 auto to_it = symbol_table.find("tohost"); | ||||||
|  |                 if(to_it != std::end(symbol_table)) | ||||||
|  |                     tohost = to_it->second; | ||||||
|  |                 auto from_it = symbol_table.find("tohost"); | ||||||
|  |                 if(from_it != std::end(symbol_table)) | ||||||
|  |                     tohost = from_it->second; | ||||||
|             } |             } | ||||||
|                 return symbol_table; |             return true; | ||||||
|         } |         } | ||||||
|             throw std::runtime_error(fmt::format("memory load file {} is not a valid elf file", name)); |         return false; | ||||||
|         } else |  | ||||||
|             throw std::runtime_error(fmt::format("memory load file not found, check if {} is a valid file", name)); |  | ||||||
|     }; |     }; | ||||||
|  |  | ||||||
|  |     iss::status execute_sys_write(arch_if* aif, const std::array<uint64_t, 8>& loaded_payload, unsigned mem_type) { | ||||||
|  |         uint64_t fd = loaded_payload[1]; | ||||||
|  |         uint64_t buf_ptr = loaded_payload[2]; | ||||||
|  |         uint64_t len = loaded_payload[3]; | ||||||
|  |         std::vector<char> buf(len); | ||||||
|  |         if(aif->read(address_type::PHYSICAL, access_type::DEBUG_READ, mem_type, buf_ptr, len, reinterpret_cast<uint8_t*>(buf.data()))) { | ||||||
|  |             CPPLOG(ERR) << "SYS_WRITE buffer read went wrong"; | ||||||
|  |             return iss::Err; | ||||||
|  |         } | ||||||
|  |         // we disregard the fd and just log to stdout | ||||||
|  |         for(size_t i = 0; i < len; i++) { | ||||||
|  |             if(buf[i] == '\n' || buf[i] == '\0') { | ||||||
|  |                 CPPLOG(INFO) << "tohost send '" << io_buf.str() << "'"; | ||||||
|  |                 io_buf.str(""); | ||||||
|  |             } else | ||||||
|  |                 io_buf << buf[i]; | ||||||
|  |         } | ||||||
|  |  | ||||||
|  |         // Not sure what the correct return value should be | ||||||
|  |         uint8_t ret_val = 1; | ||||||
|  |         if(fromhost != std::numeric_limits<uint64_t>::max()) | ||||||
|  |             if(aif->write(address_type::PHYSICAL, access_type::DEBUG_WRITE, mem_type, fromhost, 1, &ret_val)) { | ||||||
|  |                 CPPLOG(ERR) << "Fromhost write went wrong"; | ||||||
|  |                 return iss::Err; | ||||||
|  |             } | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     constexpr bool has_compressed() { return traits<BASE>::MISA_VAL & 0b0100; } | ||||||
|  |  | ||||||
|  |     constexpr reg_t get_pc_mask() { return has_compressed() ? (reg_t)~1 : (reg_t)~3; } | ||||||
|  |  | ||||||
|  |     void disass_output(uint64_t pc, const std::string instr) override { | ||||||
|  |         // NSCLOG(INFO, LOGCAT) << fmt::format("0x{:016x}    {:40} [p:{};s:0x{:x};c:{}]", pc, instr, lvl[this->reg.PRIV], | ||||||
|  |         // (reg_t)state.mstatus, | ||||||
|  |         //                                     this->reg.cycle + cycle_offset); | ||||||
|  |         NSCLOG(INFO, LOGCAT) << fmt::format("0x{:016x}    {:40} [p:{};c:{}]", pc, instr, lvl[this->reg.PRIV], | ||||||
|  |                                             this->reg.cycle + cycle_offset); | ||||||
|  |     }; | ||||||
|  |  | ||||||
|  |     void register_csr(unsigned addr, rd_csr_f f) { csr_rd_cb[addr] = f; } | ||||||
|  |     void register_csr(unsigned addr, wr_csr_f f) { csr_wr_cb[addr] = f; } | ||||||
|  |     void register_csr(unsigned addr, rd_csr_f rdf, wr_csr_f wrf) { | ||||||
|  |         csr_rd_cb[addr] = rdf; | ||||||
|  |         csr_wr_cb[addr] = wrf; | ||||||
|  |     } | ||||||
|  |     void unregister_csr_rd(unsigned addr) { csr_rd_cb.erase(addr); } | ||||||
|  |     void unregister_csr_wr(unsigned addr) { csr_wr_cb.erase(addr); } | ||||||
|  |  | ||||||
|  |     bool debug_mode_active() { return this->reg.PRIV & 0x4; } | ||||||
|  |  | ||||||
|  |     const reg_t& get_mhartid() const { return mhartid_reg; } | ||||||
|  |     void set_mhartid(reg_t mhartid) { mhartid_reg = mhartid; }; | ||||||
|  |  | ||||||
|  |     iss::status read_csr(unsigned addr, reg_t& val) { | ||||||
|  |         if(addr >= csr.size()) | ||||||
|  |             return iss::Err; | ||||||
|  |         auto req_priv_lvl = (addr >> 8) & 0x3; | ||||||
|  |         if(this->reg.PRIV < req_priv_lvl) // not having required privileges | ||||||
|  |             throw illegal_instruction_fault(this->fault_data); | ||||||
|  |         auto it = csr_rd_cb.find(addr); | ||||||
|  |         if(it == csr_rd_cb.end() || !it->second) // non existent register | ||||||
|  |             throw illegal_instruction_fault(this->fault_data); | ||||||
|  |         return it->second(addr, val); | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status write_csr(unsigned addr, reg_t val) { | ||||||
|  |         if(addr >= csr.size()) | ||||||
|  |             return iss::Err; | ||||||
|  |         auto req_priv_lvl = (addr >> 8) & 0x3; | ||||||
|  |         if(this->reg.PRIV < req_priv_lvl) // not having required privileges | ||||||
|  |             throw illegal_instruction_fault(this->fault_data); | ||||||
|  |         if((addr & 0xc00) == 0xc00) // writing to read-only region | ||||||
|  |             throw illegal_instruction_fault(this->fault_data); | ||||||
|  |         auto it = csr_wr_cb.find(addr); | ||||||
|  |         if(it == csr_wr_cb.end() || !it->second) // non existent register | ||||||
|  |             throw illegal_instruction_fault(this->fault_data); | ||||||
|  |         return it->second(addr, val); | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status read_null(unsigned addr, reg_t& val) { | ||||||
|  |         val = 0; | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status write_null(unsigned addr, reg_t val) { return iss::status::Ok; } | ||||||
|  |  | ||||||
|  |     iss::status read_plain(unsigned addr, reg_t& val) { | ||||||
|  |         val = csr[addr]; | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status write_plain(unsigned addr, reg_t val) { | ||||||
|  |         csr[addr] = val; | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status read_cycle(unsigned addr, reg_t& val) { | ||||||
|  |         auto cycle_val = this->reg.cycle + cycle_offset; | ||||||
|  |         if(addr == mcycle) { | ||||||
|  |             val = static_cast<reg_t>(cycle_val); | ||||||
|  |         } else if(addr == mcycleh) { | ||||||
|  |             val = static_cast<reg_t>(cycle_val >> 32); | ||||||
|  |         } | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status write_cycle(unsigned addr, reg_t val) { | ||||||
|  |         if(sizeof(typename traits<BASE>::reg_t) != 4) { | ||||||
|  |             mcycle_csr = static_cast<uint64_t>(val); | ||||||
|  |         } else { | ||||||
|  |             if(addr == mcycle) { | ||||||
|  |                 mcycle_csr = (mcycle_csr & 0xffffffff00000000) + val; | ||||||
|  |             } else { | ||||||
|  |                 mcycle_csr = (static_cast<uint64_t>(val) << 32) + (mcycle_csr & 0xffffffff); | ||||||
|  |             } | ||||||
|  |         } | ||||||
|  |         cycle_offset = mcycle_csr - this->reg.cycle; // TODO: relying on wrap-around | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status read_instret(unsigned addr, reg_t& val) { | ||||||
|  |         if((addr & 0xff) == (minstret & 0xff)) { | ||||||
|  |             val = static_cast<reg_t>(this->reg.instret); | ||||||
|  |         } else if((addr & 0xff) == (minstreth & 0xff)) { | ||||||
|  |             val = static_cast<reg_t>(this->reg.instret >> 32); | ||||||
|  |         } | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status write_instret(unsigned addr, reg_t val) { | ||||||
|  |         if(sizeof(typename traits<BASE>::reg_t) != 4) { | ||||||
|  |             this->reg.instret = static_cast<uint64_t>(val); | ||||||
|  |         } else { | ||||||
|  |             if((addr & 0xff) == (minstret & 0xff)) { | ||||||
|  |                 this->reg.instret = (this->reg.instret & 0xffffffff00000000) + val; | ||||||
|  |             } else { | ||||||
|  |                 this->reg.instret = (static_cast<uint64_t>(val) << 32) + (this->reg.instret & 0xffffffff); | ||||||
|  |             } | ||||||
|  |         } | ||||||
|  |         this->reg.instret--; | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status read_time(unsigned addr, reg_t& val) { | ||||||
|  |         uint64_t time_val = this->reg.cycle / (100000000 / 32768 - 1); //-> ~3052; | ||||||
|  |         if(addr == time) { | ||||||
|  |             val = static_cast<reg_t>(time_val); | ||||||
|  |         } else if(addr == timeh) { | ||||||
|  |             if(sizeof(typename traits<BASE>::reg_t) != 4) | ||||||
|  |                 return iss::Err; | ||||||
|  |             val = static_cast<reg_t>(time_val >> 32); | ||||||
|  |         } | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status read_tvec(unsigned addr, reg_t& val) { | ||||||
|  |         val = csr[addr] & ~2; | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status read_hartid(unsigned addr, reg_t& val) { | ||||||
|  |         val = mhartid_reg; | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status write_epc(unsigned addr, reg_t val) { | ||||||
|  |         csr[addr] = val & get_pc_mask(); | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status write_dcsr(unsigned addr, reg_t val) { | ||||||
|  |         if(!debug_mode_active()) | ||||||
|  |             throw illegal_instruction_fault(this->fault_data); | ||||||
|  |         //                  +-------------- ebreakm | ||||||
|  |         //                  |   +---------- stepi | ||||||
|  |         //                  |   |  +++----- cause | ||||||
|  |         //                  |   |  |||   +- step | ||||||
|  |         csr[addr] = val & 0b1000100111000100U; | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status read_debug(unsigned addr, reg_t& val) { | ||||||
|  |         if(!debug_mode_active()) | ||||||
|  |             throw illegal_instruction_fault(this->fault_data); | ||||||
|  |         val = csr[addr]; | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status write_dscratch(unsigned addr, reg_t val) { | ||||||
|  |         if(!debug_mode_active()) | ||||||
|  |             throw illegal_instruction_fault(this->fault_data); | ||||||
|  |         csr[addr] = val; | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status read_dpc(unsigned addr, reg_t& val) { | ||||||
|  |         if(!debug_mode_active()) | ||||||
|  |             throw illegal_instruction_fault(this->fault_data); | ||||||
|  |         val = this->reg.DPC; | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status write_dpc(unsigned addr, reg_t val) { | ||||||
|  |         if(!debug_mode_active()) | ||||||
|  |             throw illegal_instruction_fault(this->fault_data); | ||||||
|  |         this->reg.DPC = val; | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status read_fcsr(unsigned addr, reg_t& val) { | ||||||
|  |         switch(addr) { | ||||||
|  |         case 1: // fflags, 4:0 | ||||||
|  |             val = bit_sub<0, 5>(this->get_fcsr()); | ||||||
|  |             break; | ||||||
|  |         case 2: // frm, 7:5 | ||||||
|  |             val = bit_sub<5, 3>(this->get_fcsr()); | ||||||
|  |             break; | ||||||
|  |         case 3: // fcsr | ||||||
|  |             val = this->get_fcsr(); | ||||||
|  |             break; | ||||||
|  |         default: | ||||||
|  |             return iss::Err; | ||||||
|  |         } | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status write_fcsr(unsigned addr, reg_t val) { | ||||||
|  |         switch(addr) { | ||||||
|  |         case 1: // fflags, 4:0 | ||||||
|  |             this->set_fcsr((this->get_fcsr() & 0xffffffe0) | (val & 0x1f)); | ||||||
|  |             break; | ||||||
|  |         case 2: // frm, 7:5 | ||||||
|  |             this->set_fcsr((this->get_fcsr() & 0xffffff1f) | ((val & 0x7) << 5)); | ||||||
|  |             break; | ||||||
|  |         case 3: // fcsr | ||||||
|  |             this->set_fcsr(val & 0xff); | ||||||
|  |             break; | ||||||
|  |         default: | ||||||
|  |             return iss::Err; | ||||||
|  |         } | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status read_vstart(unsigned addr, reg_t& val) { | ||||||
|  |         val = this->get_vstart(); | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status write_vstart(unsigned addr, reg_t val) { | ||||||
|  |         this->set_vstart(val); | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status read_vxsat(unsigned addr, reg_t& val) { | ||||||
|  |         val = this->get_vxsat(); | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status write_vxsat(unsigned addr, reg_t val) { | ||||||
|  |         this->set_vxsat(val & 1); | ||||||
|  |         csr[vcsr] = (~1ULL & csr[vcsr]) | (val & 1); | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status read_vxrm(unsigned addr, reg_t& val) { | ||||||
|  |         val = this->get_vxrm(); | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status write_vxrm(unsigned addr, reg_t val) { | ||||||
|  |         this->set_vxrm(val & 0b11); | ||||||
|  |         csr[vcsr] = (~0b110ULL & csr[vcsr]) | ((val & 0b11) << 1); | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status read_vcsr(unsigned addr, reg_t& val) { | ||||||
|  |         val = csr[vcsr]; | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status write_vcsr(unsigned addr, reg_t val) { | ||||||
|  |         csr[vcsr] = val; | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status read_vl(unsigned addr, reg_t& val) { | ||||||
|  |         val = this->get_vl(); | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status read_vtype(unsigned addr, reg_t& val) { | ||||||
|  |         val = this->get_vtype(); | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status read_vlenb(unsigned addr, reg_t& val) { | ||||||
|  |         val = csr[vlenb]; | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     priv_if<reg_t> get_priv_if() { | ||||||
|  |         return priv_if<reg_t>{.read_csr = [this](unsigned addr, reg_t& val) -> iss::status { return read_csr(addr, val); }, | ||||||
|  |                               .write_csr = [this](unsigned addr, reg_t val) -> iss::status { return write_csr(addr, val); }, | ||||||
|  |                               .exec_htif = [this](uint8_t const* data) -> iss::status { return execute_htif(data); }, | ||||||
|  |                               .raise_trap = | ||||||
|  |                                   [this](uint16_t trap_id, uint16_t cause, reg_t fault_data) { | ||||||
|  |                                       this->reg.trap_state = 0x80ULL << 24 | (cause << 16) | trap_id; | ||||||
|  |                                       this->fault_data = fault_data; | ||||||
|  |                                   }, | ||||||
|  |                               .csr_rd_cb{this->csr_rd_cb}, | ||||||
|  |                               .csr_wr_cb{this->csr_wr_cb}, | ||||||
|  |                               .state{this->state}, | ||||||
|  |                               .PRIV{this->reg.PRIV}, | ||||||
|  |                               .PC{this->reg.PC}, | ||||||
|  |                               .tohost{this->tohost}, | ||||||
|  |                               .fromhost{this->fromhost}, | ||||||
|  |                               .max_irq{mcause_max_irq}}; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status execute_htif(uint8_t const* data) { | ||||||
|  |         reg_t cur_data = *reinterpret_cast<const reg_t*>(data); | ||||||
|  |         // Extract Device (bits 63:56) | ||||||
|  |         uint8_t device = traits<BASE>::XLEN == 32 ? 0 : (cur_data >> 56) & 0xFF; | ||||||
|  |         // Extract Command (bits 55:48) | ||||||
|  |         uint8_t command = traits<BASE>::XLEN == 32 ? 0 : (cur_data >> 48) & 0xFF; | ||||||
|  |         // Extract payload (bits 47:0) | ||||||
|  |         uint64_t payload_addr = cur_data & 0xFFFFFFFFFFFFULL; | ||||||
|  |         if(payload_addr & 1) { | ||||||
|  |             CPPLOG(FATAL) << "this->tohost value is 0x" << std::hex << payload_addr << std::dec << " (" << payload_addr | ||||||
|  |                           << "), stopping simulation"; | ||||||
|  |             this->reg.trap_state = std::numeric_limits<uint32_t>::max(); | ||||||
|  |             this->interrupt_sim = payload_addr; | ||||||
|  |             return iss::Ok; | ||||||
|  |         } else if(device == 0 && command == 0) { | ||||||
|  |             std::array<uint64_t, 8> loaded_payload; | ||||||
|  |             if(memory.rd_mem(access_type::DEBUG_READ, payload_addr, 8 * sizeof(uint64_t), | ||||||
|  |                              reinterpret_cast<uint8_t*>(loaded_payload.data())) == iss::Err) | ||||||
|  |                 CPPLOG(ERR) << "Syscall read went wrong"; | ||||||
|  |             uint64_t syscall_num = loaded_payload.at(0); | ||||||
|  |             if(syscall_num == 64) { // SYS_WRITE | ||||||
|  |                 return this->execute_sys_write(this, loaded_payload, traits<BASE>::MEM); | ||||||
|  |             } else { | ||||||
|  |                 CPPLOG(ERR) << "this->tohost syscall with number 0x" << std::hex << syscall_num << std::dec << " (" << syscall_num | ||||||
|  |                             << ") not implemented"; | ||||||
|  |                 this->reg.trap_state = std::numeric_limits<uint32_t>::max(); | ||||||
|  |                 this->interrupt_sim = payload_addr; | ||||||
|  |                 return iss::Ok; | ||||||
|  |             } | ||||||
|  |         } else { | ||||||
|  |             CPPLOG(ERR) << "this->tohost functionality not implemented for device " << device << " and command " << command; | ||||||
|  |             this->reg.trap_state = std::numeric_limits<uint32_t>::max(); | ||||||
|  |             this->interrupt_sim = payload_addr; | ||||||
|  |             return iss::Ok; | ||||||
|  |         } | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     mem::memory_hierarchy memories; | ||||||
|  |  | ||||||
|  |     mem::memory_if get_mem_if() override { | ||||||
|  |         assert(false || "This function should never be called"); | ||||||
|  |         return mem::memory_if{}; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     void set_next(mem::memory_if mem_if) override { memory = mem_if; }; | ||||||
|  |  | ||||||
|  |     void set_irq_num(unsigned i) { mcause_max_irq = 1 << util::ilog2(i); } | ||||||
|  |  | ||||||
|  | protected: | ||||||
|  |     hart_state<reg_t> state; | ||||||
|  |  | ||||||
|  |     static constexpr reg_t get_mstatus_mask_t(unsigned priv_lvl = PRIV_M) { | ||||||
|  |         if(sizeof(reg_t) == 4) { | ||||||
|  |             return priv_lvl == PRIV_U ? 0x80000011UL :   // 0b1...0 0001 0001 | ||||||
|  |                        priv_lvl == PRIV_S ? 0x800de133UL // 0b0...0 0001 1000 1001 1001; | ||||||
|  |                                           : 0x807ff9ddUL; | ||||||
|  |         } else { | ||||||
|  |             return priv_lvl == PRIV_U ? 0x011ULL : // 0b1...0 0001 0001 | ||||||
|  |                        priv_lvl == PRIV_S ? 0x000de133ULL | ||||||
|  |                                           : 0x007ff9ddULL; | ||||||
|  |         } | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     mem::memory_if memory; | ||||||
|  |     struct riscv_instrumentation_if : public iss::instrumentation_if { | ||||||
|  |  | ||||||
|  |         riscv_instrumentation_if(riscv_hart_common<BASE, LOGCAT>& arch) | ||||||
|  |         : arch(arch) {} | ||||||
|  |         /** | ||||||
|  |          * get the name of this architecture | ||||||
|  |          * | ||||||
|  |          * @return the name of this architecture | ||||||
|  |          */ | ||||||
|  |         const std::string core_type_name() const override { return traits<BASE>::core_type; } | ||||||
|  |  | ||||||
|  |         uint64_t get_pc() override { return arch.reg.PC; } | ||||||
|  |  | ||||||
|  |         uint64_t get_next_pc() override { return arch.reg.NEXT_PC; } | ||||||
|  |  | ||||||
|  |         uint64_t get_instr_word() override { return arch.reg.instruction; } | ||||||
|  |  | ||||||
|  |         uint64_t get_instr_count() override { return arch.reg.icount; } | ||||||
|  |  | ||||||
|  |         uint64_t get_pendig_traps() override { return arch.reg.trap_state; } | ||||||
|  |  | ||||||
|  |         uint64_t get_total_cycles() override { return arch.reg.cycle + arch.cycle_offset; } | ||||||
|  |  | ||||||
|  |         void update_last_instr_cycles(unsigned cycles) override { arch.cycle_offset += cycles - 1; } | ||||||
|  |  | ||||||
|  |         bool is_branch_taken() override { return arch.reg.last_branch; } | ||||||
|  |  | ||||||
|  |         unsigned get_reg_num() override { return traits<BASE>::NUM_REGS; } | ||||||
|  |  | ||||||
|  |         unsigned get_reg_size(unsigned num) override { return traits<BASE>::reg_bit_widths[num]; } | ||||||
|  |  | ||||||
|  |         std::unordered_map<std::string, uint64_t> const& get_symbol_table(std::string name) override { return arch.symbol_table; } | ||||||
|  |  | ||||||
|  |         riscv_hart_common<BASE, LOGCAT>& arch; | ||||||
|  |     }; | ||||||
|  |  | ||||||
|  |     friend struct riscv_instrumentation_if; | ||||||
|  |     riscv_instrumentation_if instr_if; | ||||||
|  |  | ||||||
|  |     instrumentation_if* get_instrumentation_if() override { return &instr_if; }; | ||||||
|  |  | ||||||
|  |     using csr_type = util::sparse_array<typename traits<BASE>::reg_t, 1ULL << 12, 12>; | ||||||
|  |     using csr_page_type = typename csr_type::page_type; | ||||||
|  |     csr_type csr; | ||||||
|  |  | ||||||
|  |     absl::flat_hash_map<unsigned, rd_csr_f> csr_rd_cb; | ||||||
|  |     absl::flat_hash_map<unsigned, wr_csr_f> csr_wr_cb; | ||||||
|  |  | ||||||
|  |     reg_t mhartid_reg{0x0}; | ||||||
|  |     uint64_t mcycle_csr{0}; | ||||||
|  |     uint64_t minstret_csr{0}; | ||||||
|  |     reg_t fault_data; | ||||||
|  |  | ||||||
|  |     int64_t cycle_offset{0}; | ||||||
|  |     int64_t instret_offset{0}; | ||||||
|  |     semihosting_cb_t<reg_t> semihosting_cb; | ||||||
|  |     unsigned mcause_max_irq{16U}; | ||||||
| }; | }; | ||||||
|  |  | ||||||
| } // namespace arch | } // namespace arch | ||||||
|   | |||||||
										
											
												File diff suppressed because it is too large
												Load Diff
											
										
									
								
							
										
											
												File diff suppressed because it is too large
												Load Diff
											
										
									
								
							
										
											
												File diff suppressed because it is too large
												Load Diff
											
										
									
								
							| @@ -1,5 +1,5 @@ | |||||||
| /******************************************************************************* | /******************************************************************************* | ||||||
|  * Copyright (C) 2017 - 2020 MINRES Technologies GmbH |  * Copyright (C) 2024 MINRES Technologies GmbH | ||||||
|  * All rights reserved. |  * All rights reserved. | ||||||
|  * |  * | ||||||
|  * Redistribution and use in source and binary forms, with or without |  * Redistribution and use in source and binary forms, with or without | ||||||
|   | |||||||
										
											
												File diff suppressed because one or more lines are too long
											
										
									
								
							| @@ -1,3 +1,37 @@ | |||||||
|  | /******************************************************************************* | ||||||
|  |  * Copyright (C) 2023 - 2025 MINRES Technologies GmbH | ||||||
|  |  * All rights reserved. | ||||||
|  |  * | ||||||
|  |  * Redistribution and use in source and binary forms, with or without | ||||||
|  |  * modification, are permitted provided that the following conditions are met: | ||||||
|  |  * | ||||||
|  |  * 1. Redistributions of source code must retain the above copyright notice, | ||||||
|  |  *    this list of conditions and the following disclaimer. | ||||||
|  |  * | ||||||
|  |  * 2. Redistributions in binary form must reproduce the above copyright notice, | ||||||
|  |  *    this list of conditions and the following disclaimer in the documentation | ||||||
|  |  *    and/or other materials provided with the distribution. | ||||||
|  |  * | ||||||
|  |  * 3. Neither the name of the copyright holder nor the names of its contributors | ||||||
|  |  *    may be used to endorse or promote products derived from this software | ||||||
|  |  *    without specific prior written permission. | ||||||
|  |  * | ||||||
|  |  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | ||||||
|  |  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | ||||||
|  |  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | ||||||
|  |  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE | ||||||
|  |  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR | ||||||
|  |  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF | ||||||
|  |  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS | ||||||
|  |  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN | ||||||
|  |  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) | ||||||
|  |  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE | ||||||
|  |  * POSSIBILITY OF SUCH DAMAGE. | ||||||
|  |  * | ||||||
|  |  * Contributors: | ||||||
|  |  *       eyck@minres.com - initial implementation | ||||||
|  |  ******************************************************************************/ | ||||||
|  |  | ||||||
| #ifndef _ISS_ARCH_TGC_MAPPER_H | #ifndef _ISS_ARCH_TGC_MAPPER_H | ||||||
| #define _ISS_ARCH_TGC_MAPPER_H | #define _ISS_ARCH_TGC_MAPPER_H | ||||||
|  |  | ||||||
| @@ -23,35 +57,29 @@ using tgc5c_xrb_nn_plat_type = iss::arch::hwl<iss::arch::riscv_hart_m_p<iss::arc | |||||||
| #ifdef CORE_TGC5D | #ifdef CORE_TGC5D | ||||||
| #include "riscv_hart_mu_p.h" | #include "riscv_hart_mu_p.h" | ||||||
| #include <iss/arch/tgc5d.h> | #include <iss/arch/tgc5d.h> | ||||||
| using tgc5d_plat_type = iss::arch::riscv_hart_mu_p<iss::arch::tgc5d, (iss::arch::features_e)(iss::arch::FEAT_PMP | iss::arch::FEAT_CLIC | | using tgc5d_plat_type = iss::arch::riscv_hart_mu_p<iss::arch::tgc5d, (iss::arch::features_e)(iss::arch::FEAT_EXT_N)>; | ||||||
|                                                                                              iss::arch::FEAT_EXT_N)>; |  | ||||||
| #endif | #endif | ||||||
| #ifdef CORE_TGC5D_XRB_MAC | #ifdef CORE_TGC5D_XRB_MAC | ||||||
| #include "riscv_hart_mu_p.h" | #include "riscv_hart_mu_p.h" | ||||||
| #include <iss/arch/tgc5d_xrb_mac.h> | #include <iss/arch/tgc5d_xrb_mac.h> | ||||||
| using tgc5d_xrb_mac_plat_type = | using tgc5d_xrb_mac_plat_type = iss::arch::riscv_hart_mu_p<iss::arch::tgc5d_xrb_mac(iss::arch::features_e)(iss::arch::FEAT_EXT_N)>; | ||||||
|     iss::arch::riscv_hart_mu_p<iss::arch::tgc5d_xrb_mac, |  | ||||||
|                                (iss::arch::features_e)(iss::arch::FEAT_PMP | iss::arch::FEAT_CLIC | iss::arch::FEAT_EXT_N)>; |  | ||||||
| #endif | #endif | ||||||
| #ifdef CORE_TGC5D_XRB_NN | #ifdef CORE_TGC5D_XRB_NN | ||||||
| #include "hwl.h" | #include "hwl.h" | ||||||
| #include "riscv_hart_mu_p.h" | #include "riscv_hart_mu_p.h" | ||||||
| #include <iss/arch/tgc5d_xrb_nn.h> | #include <iss/arch/tgc5d_xrb_nn.h> | ||||||
| using tgc5d_xrb_nn_plat_type = | using tgc5d_xrb_nn_plat_type = | ||||||
|     iss::arch::hwl<iss::arch::riscv_hart_mu_p<iss::arch::tgc5d_xrb_nn, |     iss::arch::hwl<iss::arch::riscv_hart_mu_p<iss::arch::tgc5d_xrb_nn, (iss::arch::features_e)(iss::arch::FEAT_EXT_N)>>; | ||||||
|                                               (iss::arch::features_e)(iss::arch::FEAT_PMP | iss::arch::FEAT_CLIC | iss::arch::FEAT_EXT_N)>>; |  | ||||||
| #endif | #endif | ||||||
| #ifdef CORE_TGC5E | #ifdef CORE_TGC5E | ||||||
| #include "riscv_hart_mu_p.h" | #include "riscv_hart_mu_p.h" | ||||||
| #include <iss/arch/tgc5e.h> | #include <iss/arch/tgc5e.h> | ||||||
| using tgc5e_plat_type = iss::arch::riscv_hart_mu_p<iss::arch::tgc5e, (iss::arch::features_e)(iss::arch::FEAT_PMP | iss::arch::FEAT_CLIC | | using tgc5e_plat_type = iss::arch::riscv_hart_mu_p<iss::arch::tgc5e, (iss::arch::features_e)(iss::arch::FEAT_EXT_N)>; | ||||||
|                                                                                              iss::arch::FEAT_EXT_N)>; |  | ||||||
| #endif | #endif | ||||||
| #ifdef CORE_TGC5X | #ifdef CORE_TGC5X | ||||||
| #include "riscv_hart_mu_p.h" | #include "riscv_hart_mu_p.h" | ||||||
| #include <iss/arch/tgc5x.h> | #include <iss/arch/tgc5x.h> | ||||||
| using tgc5x_plat_type = iss::arch::riscv_hart_mu_p<iss::arch::tgc5x, (iss::arch::features_e)(iss::arch::FEAT_PMP | iss::arch::FEAT_CLIC | | using tgc5x_plat_type = iss::arch::riscv_hart_mu_p<iss::arch::tgc5x, (iss::arch::features_e)(iss::arch::FEAT_EXT_N)>; | ||||||
|                                                                                              iss::arch::FEAT_EXT_N | iss::arch::FEAT_TCM)>; |  | ||||||
| #endif | #endif | ||||||
|  |  | ||||||
| #endif | #endif | ||||||
|   | |||||||
| @@ -87,7 +87,7 @@ public: | |||||||
|     virtual ~wt_cache() = default; |     virtual ~wt_cache() = default; | ||||||
|  |  | ||||||
|     unsigned size{4096}; |     unsigned size{4096}; | ||||||
|     unsigned line_sz{32}; |     unsigned line_sz{64}; | ||||||
|     unsigned ways{1}; |     unsigned ways{1}; | ||||||
|     uint64_t io_address{0xf0000000}; |     uint64_t io_address{0xf0000000}; | ||||||
|     uint64_t io_addr_mask{0xf0000000}; |     uint64_t io_addr_mask{0xf0000000}; | ||||||
| @@ -119,7 +119,7 @@ template <typename BASE> iss::status iss::arch::wt_cache<BASE>::read_cache(phys_ | |||||||
|         icache_ptr.reset(new cache::cache(size, line_sz, ways)); |         icache_ptr.reset(new cache::cache(size, line_sz, ways)); | ||||||
|         dcache_ptr.reset(new cache::cache(size, line_sz, ways)); |         dcache_ptr.reset(new cache::cache(size, line_sz, ways)); | ||||||
|     } |     } | ||||||
|     if((a.val & io_addr_mask) != io_address) { |     if((a.access & iss::access_type::FETCH) == iss::access_type::FETCH || (a.val & io_addr_mask) != io_address) { | ||||||
|         auto set_addr = (a.val & (size - 1)) >> util::ilog2(line_sz * ways); |         auto set_addr = (a.val & (size - 1)) >> util::ilog2(line_sz * ways); | ||||||
|         auto tag_addr = a.val >> util::ilog2(line_sz); |         auto tag_addr = a.val >> util::ilog2(line_sz); | ||||||
|         auto& set = (is_fetch(a.access) ? icache_ptr : dcache_ptr)->sets[set_addr]; |         auto& set = (is_fetch(a.access) ? icache_ptr : dcache_ptr)->sets[set_addr]; | ||||||
|   | |||||||
							
								
								
									
										4142
									
								
								src/iss/debugger/csr_names.cpp
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										4142
									
								
								src/iss/debugger/csr_names.cpp
									
									
									
									
									
										Normal file
									
								
							
										
											
												File diff suppressed because it is too large
												Load Diff
											
										
									
								
							| @@ -30,8 +30,8 @@ | |||||||
|  * |  * | ||||||
|  *******************************************************************************/ |  *******************************************************************************/ | ||||||
|  |  | ||||||
| #ifndef _ISS_DEBUGGER_RISCV_TARGET_ADAPTER_H_ | #ifndef _ISS_ARCH_DEBUGGER_RISCV_TARGET_ADAPTER_H_ | ||||||
| #define _ISS_DEBUGGER_RISCV_TARGET_ADAPTER_H_ | #define _ISS_ARCH_DEBUGGER_RISCV_TARGET_ADAPTER_H_ | ||||||
|  |  | ||||||
| #include "iss/arch_if.h" | #include "iss/arch_if.h" | ||||||
| #include <iss/arch/traits.h> | #include <iss/arch/traits.h> | ||||||
| @@ -48,6 +48,10 @@ | |||||||
|  |  | ||||||
| namespace iss { | namespace iss { | ||||||
| namespace debugger { | namespace debugger { | ||||||
|  |  | ||||||
|  | char const* const get_csr_name(unsigned); | ||||||
|  | constexpr auto csr_offset = 100U; | ||||||
|  |  | ||||||
| using namespace iss::arch; | using namespace iss::arch; | ||||||
| using namespace iss::debugger; | using namespace iss::debugger; | ||||||
|  |  | ||||||
| @@ -129,11 +133,17 @@ public: | |||||||
|  |  | ||||||
| protected: | protected: | ||||||
|     static inline constexpr addr_t map_addr(const addr_t& i) { return i; } |     static inline constexpr addr_t map_addr(const addr_t& i) { return i; } | ||||||
|  |     std::string csr_xml; | ||||||
|     iss::arch_if* core; |     iss::arch_if* core; | ||||||
|     rp_thread_ref thread_idx; |     rp_thread_ref thread_idx; | ||||||
| }; | }; | ||||||
|  |  | ||||||
|  | template <typename ARCH> typename std::enable_if<iss::arch::traits<ARCH>::FLEN != 0, unsigned>::type get_f0_offset() { | ||||||
|  |     return iss::arch::traits<ARCH>::F0; | ||||||
|  | } | ||||||
|  |  | ||||||
|  | template <typename ARCH> typename std::enable_if<iss::arch::traits<ARCH>::FLEN == 0, unsigned>::type get_f0_offset() { return 0; } | ||||||
|  |  | ||||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::set_gen_thread(rp_thread_ref& thread) { | template <typename ARCH> status riscv_target_adapter<ARCH>::set_gen_thread(rp_thread_ref& thread) { | ||||||
|     thread_idx = thread; |     thread_idx = thread; | ||||||
|     return Ok; |     return Ok; | ||||||
| @@ -175,12 +185,29 @@ template <typename ARCH> status riscv_target_adapter<ARCH>::current_thread_query | |||||||
|  |  | ||||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::read_registers(std::vector<uint8_t>& data, std::vector<uint8_t>& avail) { | template <typename ARCH> status riscv_target_adapter<ARCH>::read_registers(std::vector<uint8_t>& data, std::vector<uint8_t>& avail) { | ||||||
|     CPPLOG(TRACE) << "reading target registers"; |     CPPLOG(TRACE) << "reading target registers"; | ||||||
|     // return idx<0?:; |  | ||||||
|     data.clear(); |     data.clear(); | ||||||
|     avail.clear(); |     avail.clear(); | ||||||
|     const uint8_t* reg_base = core->get_regs_base_ptr(); |     const uint8_t* reg_base = core->get_regs_base_ptr(); | ||||||
|     auto start_reg = arch::traits<ARCH>::X0; |     auto start_reg = arch::traits<ARCH>::X0; | ||||||
|     for(size_t reg_no = start_reg; reg_no < start_reg + 33 /*arch::traits<ARCH>::NUM_REGS*/; ++reg_no) { |     for(size_t i = 0; i < 33; ++i) { | ||||||
|  |         if(i < arch::traits<ARCH>::RFS || i == arch::traits<ARCH>::PC) { | ||||||
|  |             auto reg_no = i < 32 ? start_reg + i : arch::traits<ARCH>::PC; | ||||||
|  |             unsigned offset = traits<ARCH>::reg_byte_offsets[reg_no]; | ||||||
|  |             for(size_t j = 0; j < arch::traits<ARCH>::XLEN / 8; ++j) { | ||||||
|  |                 data.push_back(*(reg_base + offset + j)); | ||||||
|  |                 avail.push_back(0xff); | ||||||
|  |             } | ||||||
|  |         } else { | ||||||
|  |             for(size_t j = 0; j < arch::traits<ARCH>::XLEN / 8; ++j) { | ||||||
|  |                 data.push_back(0); | ||||||
|  |                 avail.push_back(0); | ||||||
|  |             } | ||||||
|  |         } | ||||||
|  |     } | ||||||
|  |     if(iss::arch::traits<ARCH>::FLEN > 0) { | ||||||
|  |         auto fstart_reg = get_f0_offset<ARCH>(); | ||||||
|  |         for(size_t i = 0; i < 32; ++i) { | ||||||
|  |             auto reg_no = fstart_reg + i; | ||||||
|             auto reg_width = arch::traits<ARCH>::reg_bit_widths[reg_no] / 8; |             auto reg_width = arch::traits<ARCH>::reg_bit_widths[reg_no] / 8; | ||||||
|             unsigned offset = traits<ARCH>::reg_byte_offsets[reg_no]; |             unsigned offset = traits<ARCH>::reg_byte_offsets[reg_no]; | ||||||
|             for(size_t j = 0; j < reg_width; ++j) { |             for(size_t j = 0; j < reg_width; ++j) { | ||||||
| @@ -188,21 +215,7 @@ template <typename ARCH> status riscv_target_adapter<ARCH>::read_registers(std:: | |||||||
|                 avail.push_back(0xff); |                 avail.push_back(0xff); | ||||||
|             } |             } | ||||||
|         } |         } | ||||||
|     // work around fill with F type registers |     } | ||||||
|     //    if (arch::traits<ARCH>::NUM_REGS < 65) { |  | ||||||
|     //        auto reg_width = sizeof(typename arch::traits<ARCH>::reg_t); |  | ||||||
|     //        for (size_t reg_no = 0; reg_no < 33; ++reg_no) { |  | ||||||
|     //            for (size_t j = 0; j < reg_width; ++j) { |  | ||||||
|     //                data.push_back(0x0); |  | ||||||
|     //                avail.push_back(0x00); |  | ||||||
|     //            } |  | ||||||
|     //            // if(arch::traits<ARCH>::XLEN < 64) |  | ||||||
|     //            //     for(unsigned j=0; j<4; ++j){ |  | ||||||
|     //            //         data.push_back(0x0); |  | ||||||
|     //            //         avail.push_back(0x00); |  | ||||||
|     //            //     } |  | ||||||
|     //        } |  | ||||||
|     //    } |  | ||||||
|     return Ok; |     return Ok; | ||||||
| } | } | ||||||
|  |  | ||||||
| @@ -210,25 +223,25 @@ template <typename ARCH> status riscv_target_adapter<ARCH>::write_registers(cons | |||||||
|     auto start_reg = arch::traits<ARCH>::X0; |     auto start_reg = arch::traits<ARCH>::X0; | ||||||
|     auto* reg_base = core->get_regs_base_ptr(); |     auto* reg_base = core->get_regs_base_ptr(); | ||||||
|     auto iter = data.data(); |     auto iter = data.data(); | ||||||
|     bool e_ext = arch::traits<ARCH>::PC < 32; |     auto iter_end = data.data() + data.size(); | ||||||
|     for(size_t reg_no = 0; reg_no < start_reg + 33 /*arch::traits<ARCH>::NUM_REGS*/; ++reg_no) { |     for(size_t i = 0; i < 33 && iter < iter_end; ++i) { | ||||||
|         if(e_ext && reg_no > 15) { |         auto reg_width = arch::traits<ARCH>::XLEN / 8; | ||||||
|             if(reg_no == 32) { |         if(i < arch::traits<ARCH>::RFS) { | ||||||
|                 auto reg_width = arch::traits<ARCH>::reg_bit_widths[arch::traits<ARCH>::PC] / 8; |             auto offset = traits<ARCH>::reg_byte_offsets[start_reg + i]; | ||||||
|  |             std::copy(iter, iter + reg_width, reg_base + offset); | ||||||
|  |         } else if(i == 32) { | ||||||
|             auto offset = traits<ARCH>::reg_byte_offsets[arch::traits<ARCH>::PC]; |             auto offset = traits<ARCH>::reg_byte_offsets[arch::traits<ARCH>::PC]; | ||||||
|                 std::copy(iter, iter + reg_width, reg_base); |             std::copy(iter, iter + reg_width, reg_base + offset); | ||||||
|             } else { |  | ||||||
|                 const uint64_t zero_val = 0; |  | ||||||
|                 auto reg_width = arch::traits<ARCH>::reg_bit_widths[15] / 8; |  | ||||||
|                 auto iter = (uint8_t*)&zero_val; |  | ||||||
|                 std::copy(iter, iter + reg_width, reg_base); |  | ||||||
|         } |         } | ||||||
|         } else { |         iter += reg_width; | ||||||
|             auto reg_width = arch::traits<ARCH>::reg_bit_widths[reg_no] / 8; |     } | ||||||
|             auto offset = traits<ARCH>::reg_byte_offsets[reg_no]; |     if(iss::arch::traits<ARCH>::FLEN > 0) { | ||||||
|             std::copy(iter, iter + reg_width, reg_base); |         auto fstart_reg = get_f0_offset<ARCH>(); | ||||||
|             iter += 4; |         auto reg_width = arch::traits<ARCH>::FLEN / 8; | ||||||
|             reg_base += offset; |         for(size_t i = 0; i < 32 && iter < iter_end; ++i) { | ||||||
|  |             unsigned offset = traits<ARCH>::reg_byte_offsets[fstart_reg + i]; | ||||||
|  |             std::copy(iter, iter + reg_width, reg_base + offset); | ||||||
|  |             iter += reg_width; | ||||||
|         } |         } | ||||||
|     } |     } | ||||||
|     return Ok; |     return Ok; | ||||||
| @@ -236,7 +249,7 @@ template <typename ARCH> status riscv_target_adapter<ARCH>::write_registers(cons | |||||||
|  |  | ||||||
| template <typename ARCH> | template <typename ARCH> | ||||||
| status riscv_target_adapter<ARCH>::read_single_register(unsigned int reg_no, std::vector<uint8_t>& data, std::vector<uint8_t>& avail) { | status riscv_target_adapter<ARCH>::read_single_register(unsigned int reg_no, std::vector<uint8_t>& data, std::vector<uint8_t>& avail) { | ||||||
|     if(reg_no < 65) { |     if(reg_no < csr_offset) { | ||||||
|         // auto reg_size = arch::traits<ARCH>::reg_bit_width(static_cast<typename |         // auto reg_size = arch::traits<ARCH>::reg_bit_width(static_cast<typename | ||||||
|         // arch::traits<ARCH>::reg_e>(reg_no))/8; |         // arch::traits<ARCH>::reg_e>(reg_no))/8; | ||||||
|         auto* reg_base = core->get_regs_base_ptr(); |         auto* reg_base = core->get_regs_base_ptr(); | ||||||
| @@ -247,23 +260,24 @@ status riscv_target_adapter<ARCH>::read_single_register(unsigned int reg_no, std | |||||||
|         std::copy(reg_base + offset, reg_base + offset + reg_width, data.begin()); |         std::copy(reg_base + offset, reg_base + offset + reg_width, data.begin()); | ||||||
|         std::fill(avail.begin(), avail.end(), 0xff); |         std::fill(avail.begin(), avail.end(), 0xff); | ||||||
|     } else { |     } else { | ||||||
|         typed_addr_t<iss::address_type::PHYSICAL> a(iss::access_type::DEBUG_READ, traits<ARCH>::CSR, reg_no - 65); |         typed_addr_t<iss::address_type::PHYSICAL> a(iss::access_type::DEBUG_READ, traits<ARCH>::CSR, reg_no - csr_offset); | ||||||
|         data.resize(sizeof(typename traits<ARCH>::reg_t)); |         data.resize(sizeof(typename traits<ARCH>::reg_t)); | ||||||
|         avail.resize(sizeof(typename traits<ARCH>::reg_t)); |         avail.resize(sizeof(typename traits<ARCH>::reg_t)); | ||||||
|         std::fill(avail.begin(), avail.end(), 0xff); |         std::fill(avail.begin(), avail.end(), 0xff); | ||||||
|         core->read(a, data.size(), data.data()); |         core->read(a, data.size(), data.data()); | ||||||
|  |         std::fill(avail.begin(), avail.end(), 0xff); | ||||||
|     } |     } | ||||||
|     return data.size() > 0 ? Ok : Err; |     return data.size() > 0 ? Ok : Err; | ||||||
| } | } | ||||||
|  |  | ||||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::write_single_register(unsigned int reg_no, const std::vector<uint8_t>& data) { | template <typename ARCH> status riscv_target_adapter<ARCH>::write_single_register(unsigned int reg_no, const std::vector<uint8_t>& data) { | ||||||
|     if(reg_no < 65) { |     if(reg_no < csr_offset) { | ||||||
|         auto* reg_base = core->get_regs_base_ptr(); |         auto* reg_base = core->get_regs_base_ptr(); | ||||||
|         auto reg_width = arch::traits<ARCH>::reg_bit_widths[static_cast<typename arch::traits<ARCH>::reg_e>(reg_no)] / 8; |         auto reg_width = arch::traits<ARCH>::reg_bit_widths[static_cast<typename arch::traits<ARCH>::reg_e>(reg_no)] / 8; | ||||||
|         auto offset = traits<ARCH>::reg_byte_offsets[reg_no]; |         auto offset = traits<ARCH>::reg_byte_offsets[reg_no]; | ||||||
|         std::copy(data.begin(), data.begin() + reg_width, reg_base + offset); |         std::copy(data.begin(), data.begin() + reg_width, reg_base + offset); | ||||||
|     } else { |     } else { | ||||||
|         typed_addr_t<iss::address_type::PHYSICAL> a(iss::access_type::DEBUG_WRITE, traits<ARCH>::CSR, reg_no - 65); |         typed_addr_t<iss::address_type::PHYSICAL> a(iss::access_type::DEBUG_WRITE, traits<ARCH>::CSR, reg_no - csr_offset); | ||||||
|         core->write(a, data.size(), data.data()); |         core->write(a, data.size(), data.data()); | ||||||
|     } |     } | ||||||
|     return Ok; |     return Ok; | ||||||
| @@ -276,7 +290,7 @@ template <typename ARCH> status riscv_target_adapter<ARCH>::read_mem(uint64_t ad | |||||||
| } | } | ||||||
|  |  | ||||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::write_mem(uint64_t addr, const std::vector<uint8_t>& data) { | template <typename ARCH> status riscv_target_adapter<ARCH>::write_mem(uint64_t addr, const std::vector<uint8_t>& data) { | ||||||
|     auto a = map_addr({iss::access_type::DEBUG_READ, iss::address_type::VIRTUAL, 0, addr}); |     auto a = map_addr({iss::access_type::DEBUG_WRITE, iss::address_type::VIRTUAL, 0, addr}); | ||||||
|     auto f = [&]() -> status { return core->write(a, data.size(), data.data()); }; |     auto f = [&]() -> status { return core->write(a, data.size(), data.data()); }; | ||||||
|     return srv->execute_syncronized(f); |     return srv->execute_syncronized(f); | ||||||
| } | } | ||||||
| @@ -369,93 +383,57 @@ status riscv_target_adapter<ARCH>::resume_from_addr(bool step, int sig, uint64_t | |||||||
| } | } | ||||||
|  |  | ||||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::target_xml_query(std::string& out_buf) { | template <typename ARCH> status riscv_target_adapter<ARCH>::target_xml_query(std::string& out_buf) { | ||||||
|     const std::string res{"<?xml version=\"1.0\"?><!DOCTYPE target SYSTEM \"gdb-target.dtd\">" |     if(!csr_xml.size()) { | ||||||
|                           "<target><architecture>riscv:rv32</architecture>" |         std::ostringstream oss; | ||||||
|                           //"  <feature name=\"org.gnu.gdb.riscv.rv32i\">\n" |         oss << "<?xml version=\"1.0\"?><!DOCTYPE feature SYSTEM \"gdb-target.dtd\"><target version=\"1.0\">\n"; | ||||||
|                           //"    <reg name=\"x0\"  bitsize=\"32\" group=\"general\"/>\n" |         if(iss::arch::traits<ARCH>::XLEN == 32) | ||||||
|                           //"    <reg name=\"x1\"  bitsize=\"32\" group=\"general\"/>\n" |             oss << "<architecture>riscv:rv32</architecture>\n"; | ||||||
|                           //"    <reg name=\"x2\"  bitsize=\"32\" group=\"general\"/>\n" |         else if(iss::arch::traits<ARCH>::XLEN == 64) | ||||||
|                           //"    <reg name=\"x3\"  bitsize=\"32\" group=\"general\"/>\n" |             oss << "  <architectureriscv:rv64</architecture>\n"; | ||||||
|                           //"    <reg name=\"x4\"  bitsize=\"32\" group=\"general\"/>\n" |         oss << "  <feature name=\"org.gnu.gdb.riscv.cpu\">\n"; | ||||||
|                           //"    <reg name=\"x5\"  bitsize=\"32\" group=\"general\"/>\n" |         auto reg_base_num = iss::arch::traits<ARCH>::X0; | ||||||
|                           //"    <reg name=\"x6\"  bitsize=\"32\" group=\"general\"/>\n" |         for(auto i = 0U; i < iss::arch::traits<ARCH>::RFS; ++i) { | ||||||
|                           //"    <reg name=\"x7\"  bitsize=\"32\" group=\"general\"/>\n" |             oss << "    <reg name=\"x" << i << "\" bitsize=\"" << iss::arch::traits<ARCH>::reg_bit_widths[reg_base_num + i] | ||||||
|                           //"    <reg name=\"x8\"  bitsize=\"32\" group=\"general\"/>\n" |                 << "\" type=\"int\" regnum=\"" << i << "\"/>\n"; | ||||||
|                           //"    <reg name=\"x9\"  bitsize=\"32\" group=\"general\"/>\n" |         } | ||||||
|                           //"    <reg name=\"x10\" bitsize=\"32\" group=\"general\"/>\n" |         oss << "    <reg name=\"pc\" bitsize=\"" << iss::arch::traits<ARCH>::reg_bit_widths[iss::arch::traits<ARCH>::PC] | ||||||
|                           //"    <reg name=\"x11\" bitsize=\"32\" group=\"general\"/>\n" |             << "\" type=\"code_ptr\" regnum=\"" << 32U << "\"/>\n"; | ||||||
|                           //"    <reg name=\"x12\" bitsize=\"32\" group=\"general\"/>\n" |         oss << "  </feature>\n"; | ||||||
|                           //"    <reg name=\"x13\" bitsize=\"32\" group=\"general\"/>\n" |         if(iss::arch::traits<ARCH>::FLEN > 0) { | ||||||
|                           //"    <reg name=\"x14\" bitsize=\"32\" group=\"general\"/>\n" |             oss << "  <feature name=\"org.gnu.gdb.riscv.fpu\">\n"; | ||||||
|                           //"    <reg name=\"x15\" bitsize=\"32\" group=\"general\"/>\n" |             auto reg_base_num = get_f0_offset<ARCH>(); | ||||||
|                           //"    <reg name=\"x16\" bitsize=\"32\" group=\"general\"/>\n" |             auto type = iss::arch::traits<ARCH>::FLEN == 32 ? "ieee_single" : "riscv_double"; | ||||||
|                           //"    <reg name=\"x17\" bitsize=\"32\" group=\"general\"/>\n" |             for(auto i = 0U; i < 32; ++i) { | ||||||
|                           //"    <reg name=\"x18\" bitsize=\"32\" group=\"general\"/>\n" |                 oss << "    <reg name=\"f" << i << "\" bitsize=\"" << iss::arch::traits<ARCH>::reg_bit_widths[reg_base_num + i] | ||||||
|                           //"    <reg name=\"x19\" bitsize=\"32\" group=\"general\"/>\n" |                     << "\" type=\"" << type << "\" regnum=\"" << i + 33 << "\"/>\n"; | ||||||
|                           //"    <reg name=\"x20\" bitsize=\"32\" group=\"general\"/>\n" |             } | ||||||
|                           //"    <reg name=\"x21\" bitsize=\"32\" group=\"general\"/>\n" |             oss << "    <reg name=\"fcsr\" bitsize=\"" << iss::arch::traits<ARCH>::XLEN << "\" regnum=\"103\" type int/>\n"; | ||||||
|                           //"    <reg name=\"x22\" bitsize=\"32\" group=\"general\"/>\n" |             oss << "    <reg name=\"fflags\" bitsize=\"" << iss::arch::traits<ARCH>::XLEN << "\" regnum=\"101\" type int/>\n"; | ||||||
|                           //"    <reg name=\"x23\" bitsize=\"32\" group=\"general\"/>\n" |             oss << "    <reg name=\"frm\" bitsize=\"" << iss::arch::traits<ARCH>::XLEN << "\" regnum=\"102\" type int/>\n"; | ||||||
|                           //"    <reg name=\"x24\" bitsize=\"32\" group=\"general\"/>\n" |             oss << "  </feature>\n"; | ||||||
|                           //"    <reg name=\"x25\" bitsize=\"32\" group=\"general\"/>\n" |         } | ||||||
|                           //"    <reg name=\"x26\" bitsize=\"32\" group=\"general\"/>\n" |         oss << "  <feature name=\"org.gnu.gdb.riscv.csr\">\n"; | ||||||
|                           //"    <reg name=\"x27\" bitsize=\"32\" group=\"general\"/>\n" |         std::vector<uint8_t> data; | ||||||
|                           //"    <reg name=\"x28\" bitsize=\"32\" group=\"general\"/>\n" |         std::vector<uint8_t> avail; | ||||||
|                           //"    <reg name=\"x29\" bitsize=\"32\" group=\"general\"/>\n" |         data.resize(sizeof(typename traits<ARCH>::reg_t)); | ||||||
|                           //"    <reg name=\"x30\" bitsize=\"32\" group=\"general\"/>\n" |         avail.resize(sizeof(typename traits<ARCH>::reg_t)); | ||||||
|                           //"    <reg name=\"x31\" bitsize=\"32\" group=\"general\"/>\n" |         for(auto i = 0U; i < 4096; ++i) { | ||||||
|                           //"  </feature>\n" |             typed_addr_t<iss::address_type::PHYSICAL> a(iss::access_type::DEBUG_READ, traits<ARCH>::CSR, i); | ||||||
|                           "</target>"}; |             std::fill(avail.begin(), avail.end(), 0xff); | ||||||
|     out_buf = res; |             auto res = core->read(a, data.size(), data.data()); | ||||||
|  |             if(res == iss::Ok) { | ||||||
|  |                 oss << "    <reg name=\"" << get_csr_name(i) << "\" bitsize=\"" << iss::arch::traits<ARCH>::XLEN | ||||||
|  |                     << "\"  type=\"int\" regnum=\"" << (i + csr_offset) << "\"/>\n"; | ||||||
|  |             } | ||||||
|  |         } | ||||||
|  |         oss << "  </feature>\n"; | ||||||
|  |         oss << "</target>\n"; | ||||||
|  |         csr_xml = oss.str(); | ||||||
|  |     } | ||||||
|  |     out_buf = csr_xml; | ||||||
|     return Ok; |     return Ok; | ||||||
| } | } | ||||||
|  |  | ||||||
| /* |  | ||||||
|  * |  | ||||||
| <?xml version="1.0"?> |  | ||||||
| <!DOCTYPE target SYSTEM "gdb-target.dtd"> |  | ||||||
| <target> |  | ||||||
|   <architecture>riscv:rv32</architecture> |  | ||||||
|  |  | ||||||
|   <feature name="org.gnu.gdb.riscv.rv32i"> |  | ||||||
|     <reg name="x0"  bitsize="32" group="general"/> |  | ||||||
|     <reg name="x1"  bitsize="32" group="general"/> |  | ||||||
|     <reg name="x2"  bitsize="32" group="general"/> |  | ||||||
|     <reg name="x3"  bitsize="32" group="general"/> |  | ||||||
|     <reg name="x4"  bitsize="32" group="general"/> |  | ||||||
|     <reg name="x5"  bitsize="32" group="general"/> |  | ||||||
|     <reg name="x6"  bitsize="32" group="general"/> |  | ||||||
|     <reg name="x7"  bitsize="32" group="general"/> |  | ||||||
|     <reg name="x8"  bitsize="32" group="general"/> |  | ||||||
|     <reg name="x9"  bitsize="32" group="general"/> |  | ||||||
|     <reg name="x10" bitsize="32" group="general"/> |  | ||||||
|     <reg name="x11" bitsize="32" group="general"/> |  | ||||||
|     <reg name="x12" bitsize="32" group="general"/> |  | ||||||
|     <reg name="x13" bitsize="32" group="general"/> |  | ||||||
|     <reg name="x14" bitsize="32" group="general"/> |  | ||||||
|     <reg name="x15" bitsize="32" group="general"/> |  | ||||||
|     <reg name="x16" bitsize="32" group="general"/> |  | ||||||
|     <reg name="x17" bitsize="32" group="general"/> |  | ||||||
|     <reg name="x18" bitsize="32" group="general"/> |  | ||||||
|     <reg name="x19" bitsize="32" group="general"/> |  | ||||||
|     <reg name="x20" bitsize="32" group="general"/> |  | ||||||
|     <reg name="x21" bitsize="32" group="general"/> |  | ||||||
|     <reg name="x22" bitsize="32" group="general"/> |  | ||||||
|     <reg name="x23" bitsize="32" group="general"/> |  | ||||||
|     <reg name="x24" bitsize="32" group="general"/> |  | ||||||
|     <reg name="x25" bitsize="32" group="general"/> |  | ||||||
|     <reg name="x26" bitsize="32" group="general"/> |  | ||||||
|     <reg name="x27" bitsize="32" group="general"/> |  | ||||||
|     <reg name="x28" bitsize="32" group="general"/> |  | ||||||
|     <reg name="x29" bitsize="32" group="general"/> |  | ||||||
|     <reg name="x30" bitsize="32" group="general"/> |  | ||||||
|     <reg name="x31" bitsize="32" group="general"/> |  | ||||||
|   </feature> |  | ||||||
|  |  | ||||||
| </target> |  | ||||||
|  |  | ||||||
|  */ |  | ||||||
| } // namespace debugger | } // namespace debugger | ||||||
| } // namespace iss | } // namespace iss | ||||||
|  |  | ||||||
| #endif /* _ISS_DEBUGGER_RISCV_TARGET_ADAPTER_H_ */ | #endif /* _ISS_ARCH_DEBUGGER_RISCV_TARGET_ADAPTER_H_ */ | ||||||
|   | |||||||
							
								
								
									
										285
									
								
								src/iss/mem/clic.h
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										285
									
								
								src/iss/mem/clic.h
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,285 @@ | |||||||
|  | /******************************************************************************* | ||||||
|  |  * Copyright (C) 2025 MINRES Technologies GmbH | ||||||
|  |  * All rights reserved. | ||||||
|  |  * | ||||||
|  |  * Redistribution and use in source and binary forms, with or without | ||||||
|  |  * modification, are permitted provided that the following conditions are met: | ||||||
|  |  * | ||||||
|  |  * 1. Redistributions of source code must retain the above copyright notice, | ||||||
|  |  *    this list of conditions and the following disclaimer. | ||||||
|  |  * | ||||||
|  |  * 2. Redistributions in binary form must reproduce the above copyright notice, | ||||||
|  |  *    this list of conditions and the following disclaimer in the documentation | ||||||
|  |  *    and/or other materials provided with the distribution. | ||||||
|  |  * | ||||||
|  |  * 3. Neither the name of the copyright holder nor the names of its contributors | ||||||
|  |  *    may be used to endorse or promote products derived from this software | ||||||
|  |  *    without specific prior written permission. | ||||||
|  |  * | ||||||
|  |  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | ||||||
|  |  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | ||||||
|  |  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | ||||||
|  |  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE | ||||||
|  |  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR | ||||||
|  |  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF | ||||||
|  |  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS | ||||||
|  |  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN | ||||||
|  |  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) | ||||||
|  |  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE | ||||||
|  |  * POSSIBILITY OF SUCH DAMAGE. | ||||||
|  |  * | ||||||
|  |  * Contributors: | ||||||
|  |  *       eyck@minres.com - initial implementation | ||||||
|  |  ******************************************************************************/ | ||||||
|  |  | ||||||
|  | #include "memory_if.h" | ||||||
|  | #include "iss/arch/riscv_hart_common.h" | ||||||
|  | #include "iss/vm_types.h" | ||||||
|  | #include <util/logging.h> | ||||||
|  |  | ||||||
|  | namespace iss { | ||||||
|  | namespace mem { | ||||||
|  | struct clic_config { | ||||||
|  |     uint64_t clic_base{0xc0000000}; | ||||||
|  |     unsigned clic_int_ctl_bits{4}; | ||||||
|  |     unsigned clic_num_irq{16}; | ||||||
|  |     unsigned clic_num_trigger{0}; | ||||||
|  |     bool nmode{false}; | ||||||
|  | }; | ||||||
|  |  | ||||||
|  | inline void read_reg_with_offset(uint32_t reg, uint8_t offs, uint8_t* const data, unsigned length) { | ||||||
|  |     auto reg_ptr = reinterpret_cast<uint8_t*>(®); | ||||||
|  |     switch(offs) { | ||||||
|  |     default: | ||||||
|  |         for(auto i = 0U; i < length; ++i) | ||||||
|  |             *(data + i) = *(reg_ptr + i); | ||||||
|  |         break; | ||||||
|  |     case 1: | ||||||
|  |         for(auto i = 0U; i < length; ++i) | ||||||
|  |             *(data + i) = *(reg_ptr + 1 + i); | ||||||
|  |         break; | ||||||
|  |     case 2: | ||||||
|  |         for(auto i = 0U; i < length; ++i) | ||||||
|  |             *(data + i) = *(reg_ptr + 2 + i); | ||||||
|  |         break; | ||||||
|  |     case 3: | ||||||
|  |         *data = *(reg_ptr + 3); | ||||||
|  |         break; | ||||||
|  |     } | ||||||
|  | } | ||||||
|  |  | ||||||
|  | inline void write_reg_with_offset(uint32_t& reg, uint8_t offs, const uint8_t* const data, unsigned length) { | ||||||
|  |     auto reg_ptr = reinterpret_cast<uint8_t*>(®); | ||||||
|  |     switch(offs) { | ||||||
|  |     default: | ||||||
|  |         for(auto i = 0U; i < length; ++i) | ||||||
|  |             *(reg_ptr + i) = *(data + i); | ||||||
|  |         break; | ||||||
|  |     case 1: | ||||||
|  |         for(auto i = 0U; i < length; ++i) | ||||||
|  |             *(reg_ptr + 1 + i) = *(data + i); | ||||||
|  |         break; | ||||||
|  |     case 2: | ||||||
|  |         for(auto i = 0U; i < length; ++i) | ||||||
|  |             *(reg_ptr + 2 + i) = *(data + i); | ||||||
|  |         break; | ||||||
|  |     case 3: | ||||||
|  |         *(reg_ptr + 3) = *data; | ||||||
|  |         break; | ||||||
|  |     } | ||||||
|  | } | ||||||
|  |  | ||||||
|  | template <typename WORD_TYPE> struct clic : public memory_elem { | ||||||
|  |     using this_class = clic<WORD_TYPE>; | ||||||
|  |     using reg_t = WORD_TYPE; | ||||||
|  |     constexpr static unsigned WORD_LEN = sizeof(WORD_TYPE) * 8; | ||||||
|  |  | ||||||
|  |     clic(arch::priv_if<WORD_TYPE> hart_if, clic_config cfg) | ||||||
|  |     : hart_if(hart_if) | ||||||
|  |     , cfg(cfg) { | ||||||
|  |         clic_int_reg.resize(cfg.clic_num_irq, clic_int_reg_t{.raw = 0}); | ||||||
|  |         clic_cfg_reg = 0x30; | ||||||
|  |         clic_mact_lvl = clic_mprev_lvl = (1 << (cfg.clic_int_ctl_bits)) - 1; | ||||||
|  |         clic_uact_lvl = clic_uprev_lvl = (1 << (cfg.clic_int_ctl_bits)) - 1; | ||||||
|  |         hart_if.csr_rd_cb[arch::mtvt] = MK_CSR_RD_CB(read_plain); | ||||||
|  |         hart_if.csr_wr_cb[arch::mtvt] = MK_CSR_WR_CB(write_xtvt); | ||||||
|  |         //        hart_if.csr_rd_cb[mxnti] = MK_CSR_RD_CB(read_plain(a,r);}; | ||||||
|  |         //        hart_if.csr_wr_cb[mxnti] = MK_CSR_WR_CB(write_plain(a,r);}; | ||||||
|  |         hart_if.csr_rd_cb[arch::mintstatus] = MK_CSR_RD_CB(read_intstatus); | ||||||
|  |         hart_if.csr_wr_cb[arch::mintstatus] = MK_CSR_WR_CB(write_null); | ||||||
|  |         //        hart_if.csr_rd_cb[mscratchcsw] = MK_CSR_RD_CB(read_plain(a,r);}; | ||||||
|  |         //        hart_if.csr_wr_cb[mscratchcsw] = MK_CSR_WR_CB(write_plain(a,r);}; | ||||||
|  |         //        hart_if.csr_rd_cb[mscratchcswl] = MK_CSR_RD_CB(read_plain(a,r);}; | ||||||
|  |         //        hart_if.csr_wr_cb[mscratchcswl] = MK_CSR_WR_CB(write_plain(a,r);}; | ||||||
|  |         hart_if.csr_rd_cb[arch::mintthresh] = MK_CSR_RD_CB(read_plain); | ||||||
|  |         hart_if.csr_wr_cb[arch::mintthresh] = MK_CSR_WR_CB(write_intthresh); | ||||||
|  |         if(cfg.nmode) { | ||||||
|  |             hart_if.csr_rd_cb[arch::utvt] = MK_CSR_RD_CB(read_plain); | ||||||
|  |             hart_if.csr_wr_cb[arch::utvt] = MK_CSR_WR_CB(write_xtvt); | ||||||
|  |             hart_if.csr_rd_cb[arch::uintstatus] = MK_CSR_RD_CB(read_intstatus); | ||||||
|  |             hart_if.csr_wr_cb[arch::uintstatus] = MK_CSR_WR_CB(write_null); | ||||||
|  |             hart_if.csr_rd_cb[arch::uintthresh] = MK_CSR_RD_CB(read_plain); | ||||||
|  |             hart_if.csr_wr_cb[arch::uintthresh] = MK_CSR_WR_CB(write_intthresh); | ||||||
|  |         } | ||||||
|  |         hart_if.csr[arch::mintthresh] = (1 << (cfg.clic_int_ctl_bits)) - 1; | ||||||
|  |         hart_if.csr[arch::uintthresh] = (1 << (cfg.clic_int_ctl_bits)) - 1; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     ~clic() = default; | ||||||
|  |  | ||||||
|  |     memory_if get_mem_if() override { | ||||||
|  |         return memory_if{.rd_mem{util::delegate<rd_mem_func_sig>::from<this_class, &this_class::read_mem>(this)}, | ||||||
|  |                          .wr_mem{util::delegate<wr_mem_func_sig>::from<this_class, &this_class::write_mem>(this)}}; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     void set_next(memory_if mem) override { down_stream_mem = mem; } | ||||||
|  |  | ||||||
|  |     std::tuple<uint64_t, uint64_t> get_range() override { return {cfg.clic_base, cfg.clic_base + 0x7fff}; } | ||||||
|  |  | ||||||
|  | private: | ||||||
|  |     iss::status read_mem(iss::access_type access, uint64_t addr, unsigned length, uint8_t* data) { | ||||||
|  |         if(addr >= cfg.clic_base && (addr + length) < (cfg.clic_base + 0x8000)) | ||||||
|  |             return read_clic(addr, length, data); | ||||||
|  |         return down_stream_mem.rd_mem(access, addr, length, data); | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status write_mem(iss::access_type access, uint64_t addr, unsigned length, uint8_t const* data) { | ||||||
|  |         if(addr >= cfg.clic_base && (addr + length) < (cfg.clic_base + 0x8000)) | ||||||
|  |             return write_clic(addr, length, data); | ||||||
|  |         return down_stream_mem.wr_mem(access, addr, length, data); | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status read_clic(uint64_t addr, unsigned length, uint8_t* data); | ||||||
|  |  | ||||||
|  |     iss::status write_clic(uint64_t addr, unsigned length, uint8_t const* data); | ||||||
|  |  | ||||||
|  |     iss::status write_null(unsigned addr, reg_t val) { return iss::status::Ok; } | ||||||
|  |  | ||||||
|  |     iss::status read_plain(unsigned addr, reg_t& val) { | ||||||
|  |         val = hart_if.csr[addr]; | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status write_xtvt(unsigned addr, reg_t val) { | ||||||
|  |         hart_if.csr[addr] = val & ~0x3fULL; | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status read_cause(unsigned addr, reg_t& val); | ||||||
|  |     iss::status write_cause(unsigned addr, reg_t val); | ||||||
|  |  | ||||||
|  |     iss::status read_intstatus(unsigned addr, reg_t& val); | ||||||
|  |     iss::status write_intthresh(unsigned addr, reg_t val); | ||||||
|  |  | ||||||
|  | protected: | ||||||
|  |     arch::priv_if<WORD_TYPE> hart_if; | ||||||
|  |     memory_if down_stream_mem; | ||||||
|  |     clic_config cfg; | ||||||
|  |     uint8_t clic_cfg_reg{0}; | ||||||
|  |     std::array<uint32_t, 32> clic_inttrig_reg; | ||||||
|  |     union clic_int_reg_t { | ||||||
|  |         struct { | ||||||
|  |             uint8_t ip; | ||||||
|  |             uint8_t ie; | ||||||
|  |             uint8_t attr; | ||||||
|  |             uint8_t ctl; | ||||||
|  |         }; | ||||||
|  |         uint32_t raw; | ||||||
|  |     }; | ||||||
|  |     std::vector<clic_int_reg_t> clic_int_reg; | ||||||
|  |     uint8_t clic_mprev_lvl{0}, clic_uprev_lvl{0}; | ||||||
|  |     uint8_t clic_mact_lvl{0}, clic_uact_lvl{0}; | ||||||
|  | }; | ||||||
|  |  | ||||||
|  | template <typename WORD_TYPE> iss::status clic<WORD_TYPE>::read_clic(uint64_t addr, unsigned length, uint8_t* const data) { | ||||||
|  |     if(addr == cfg.clic_base) { // cliccfg | ||||||
|  |         *data = clic_cfg_reg; | ||||||
|  |         for(auto i = 1; i < length; ++i) | ||||||
|  |             *(data + i) = 0; | ||||||
|  |     } else if(addr >= (cfg.clic_base + 0x40) && (addr + length) <= (cfg.clic_base + 0x40 + cfg.clic_num_trigger * 4)) { // clicinttrig | ||||||
|  |         auto offset = ((addr & 0x7fff) - 0x40) / 4; | ||||||
|  |         read_reg_with_offset(clic_inttrig_reg[offset], addr & 0x3, data, length); | ||||||
|  |     } else if(addr >= (cfg.clic_base + 0x1000) && | ||||||
|  |               (addr + length) <= (cfg.clic_base + 0x1000 + cfg.clic_num_irq * 4)) { // clicintip/clicintie/clicintattr/clicintctl | ||||||
|  |         auto offset = ((addr & 0x7fff) - 0x1000) / 4; | ||||||
|  |         read_reg_with_offset(clic_int_reg[offset].raw, addr & 0x3, data, length); | ||||||
|  |     } else { | ||||||
|  |         for(auto i = 0U; i < length; ++i) | ||||||
|  |             *(data + i) = 0; | ||||||
|  |     } | ||||||
|  |     return iss::Ok; | ||||||
|  | } | ||||||
|  |  | ||||||
|  | template <typename WORD_TYPE> iss::status clic<WORD_TYPE>::write_clic(uint64_t addr, unsigned length, const uint8_t* const data) { | ||||||
|  |     if(addr == cfg.clic_base) { // cliccfg | ||||||
|  |         clic_cfg_reg = (clic_cfg_reg & ~0x1e) | (*data & 0x1e); | ||||||
|  |     } else if(addr >= (cfg.clic_base + 0x40) && (addr + length) <= (cfg.clic_base + 0x40 + cfg.clic_num_trigger * 4)) { // clicinttrig | ||||||
|  |         auto offset = ((addr & 0x7fff) - 0x40) / 4; | ||||||
|  |         write_reg_with_offset(clic_inttrig_reg[offset], addr & 0x3, data, length); | ||||||
|  |     } else if(addr >= (cfg.clic_base + 0x1000) && | ||||||
|  |               (addr + length) <= (cfg.clic_base + 0x1000 + cfg.clic_num_irq * 4)) { // clicintip/clicintie/clicintattr/clicintctl | ||||||
|  |         auto offset = ((addr & 0x7fff) - 0x1000) / 4; | ||||||
|  |         write_reg_with_offset(clic_int_reg[offset].raw, addr & 0x3, data, length); | ||||||
|  |         clic_int_reg[offset].raw &= 0xf0c70101; // clicIntCtlBits->0xf0, clicintattr->0xc7, clicintie->0x1, clicintip->0x1 | ||||||
|  |     } | ||||||
|  |     return iss::Ok; | ||||||
|  | } | ||||||
|  |  | ||||||
|  | template <typename WORD_TYPE> iss::status clic<WORD_TYPE>::read_cause(unsigned addr, reg_t& val) { | ||||||
|  |     if((hart_if.csr[arch::mtvec] & 0x3) == 3) { | ||||||
|  |         val = hart_if.csr[addr] & (1UL << (sizeof(reg_t) * 8) | (hart_if.mcause_max_irq - 1) | (0xfUL << 16)); | ||||||
|  |         auto mode = (addr >> 8) & 0x3; | ||||||
|  |         switch(mode) { | ||||||
|  |         case 0: | ||||||
|  |             val |= clic_uprev_lvl << 16; | ||||||
|  |             val |= hart_if.state.mstatus.UPIE << 27; | ||||||
|  |             break; | ||||||
|  |         default: | ||||||
|  |             val |= clic_mprev_lvl << 16; | ||||||
|  |             val |= hart_if.state.mstatus.MPIE << 27; | ||||||
|  |             val |= hart_if.state.mstatus.MPP << 28; | ||||||
|  |             break; | ||||||
|  |         } | ||||||
|  |     } else | ||||||
|  |         val = hart_if.csr[addr] & ((1UL << (sizeof(WORD_TYPE) * 8 - 1)) | (hart_if.mcause_max_irq - 1)); | ||||||
|  |     return iss::Ok; | ||||||
|  | } | ||||||
|  |  | ||||||
|  | template <typename WORD_TYPE> iss::status clic<WORD_TYPE>::write_cause(unsigned addr, reg_t val) { | ||||||
|  |     if((hart_if.csr[arch::mtvec] & 0x3) == 3) { | ||||||
|  |         auto mask = ((1UL << (sizeof(WORD_TYPE) * 8 - 1)) | (hart_if.mcause_max_irq - 1) | (0xfUL << 16)); | ||||||
|  |         hart_if.csr[addr] = (val & mask) | (hart_if.csr[addr] & ~mask); | ||||||
|  |         auto mode = (addr >> 8) & 0x3; | ||||||
|  |         switch(mode) { | ||||||
|  |         case 0: | ||||||
|  |             clic_uprev_lvl = ((val >> 16) & 0xff) | (1 << (8 - cfg.clic_int_ctl_bits)) - 1; | ||||||
|  |             hart_if.state.mstatus.UPIE = (val >> 27) & 0x1; | ||||||
|  |             break; | ||||||
|  |         default: | ||||||
|  |             clic_mprev_lvl = ((val >> 16) & 0xff) | (1 << (8 - cfg.clic_int_ctl_bits)) - 1; | ||||||
|  |             hart_if.state.mstatus.MPIE = (val >> 27) & 0x1; | ||||||
|  |             hart_if.state.mstatus.MPP = (val >> 28) & 0x3; | ||||||
|  |             break; | ||||||
|  |         } | ||||||
|  |     } else { | ||||||
|  |         auto mask = ((1UL << (sizeof(WORD_TYPE) * 8 - 1)) | (hart_if.mcause_max_irq - 1)); | ||||||
|  |         hart_if.csr[addr] = (val & mask) | (hart_if.csr[addr] & ~mask); | ||||||
|  |     } | ||||||
|  |     return iss::Ok; | ||||||
|  | } | ||||||
|  |  | ||||||
|  | template <typename WORD_TYPE> iss::status clic<WORD_TYPE>::read_intstatus(unsigned addr, reg_t& val) { | ||||||
|  |     auto mode = (addr >> 8) & 0x3; | ||||||
|  |     val = clic_uact_lvl & 0xff; | ||||||
|  |     if(mode == 0x3) | ||||||
|  |         val += (clic_mact_lvl & 0xff) << 24; | ||||||
|  |     return iss::Ok; | ||||||
|  | } | ||||||
|  |  | ||||||
|  | template <typename WORD_TYPE> iss::status clic<WORD_TYPE>::write_intthresh(unsigned addr, reg_t val) { | ||||||
|  |     hart_if.csr[addr] = (val & 0xff) | (1 << (cfg.clic_int_ctl_bits)) - 1; | ||||||
|  |     return iss::Ok; | ||||||
|  | } | ||||||
|  |  | ||||||
|  | } // namespace mem | ||||||
|  | } // namespace iss | ||||||
							
								
								
									
										101
									
								
								src/iss/mem/memory_if.cpp
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										101
									
								
								src/iss/mem/memory_if.cpp
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,101 @@ | |||||||
|  | /******************************************************************************* | ||||||
|  |  * Copyright (C) 2025 MINRES Technologies GmbH | ||||||
|  |  * All rights reserved. | ||||||
|  |  * | ||||||
|  |  * Redistribution and use in source and binary forms, with or without | ||||||
|  |  * modification, are permitted provided that the following conditions are met: | ||||||
|  |  * | ||||||
|  |  * 1. Redistributions of source code must retain the above copyright notice, | ||||||
|  |  *    this list of conditions and the following disclaimer. | ||||||
|  |  * | ||||||
|  |  * 2. Redistributions in binary form must reproduce the above copyright notice, | ||||||
|  |  *    this list of conditions and the following disclaimer in the documentation | ||||||
|  |  *    and/or other materials provided with the distribution. | ||||||
|  |  * | ||||||
|  |  * 3. Neither the name of the copyright holder nor the names of its contributors | ||||||
|  |  *    may be used to endorse or promote products derived from this software | ||||||
|  |  *    without specific prior written permission. | ||||||
|  |  * | ||||||
|  |  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | ||||||
|  |  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | ||||||
|  |  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | ||||||
|  |  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE | ||||||
|  |  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR | ||||||
|  |  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF | ||||||
|  |  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS | ||||||
|  |  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN | ||||||
|  |  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) | ||||||
|  |  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE | ||||||
|  |  * POSSIBILITY OF SUCH DAMAGE. | ||||||
|  |  * | ||||||
|  |  * Contributors: | ||||||
|  |  *       eyck@minres.com - initial implementation | ||||||
|  |  ******************************************************************************/ | ||||||
|  |  | ||||||
|  | #include "memory_if.h" | ||||||
|  | #include <algorithm> | ||||||
|  |  | ||||||
|  | namespace iss { | ||||||
|  | namespace mem { | ||||||
|  | void memory_hierarchy::root(memory_elem& e) { | ||||||
|  |     hierarchy.push_front(&e); | ||||||
|  |     root_set = true; | ||||||
|  |     update_chain(); | ||||||
|  | } | ||||||
|  | void memory_hierarchy::prepend(memory_elem& e) { | ||||||
|  |     if(root_set) | ||||||
|  |         hierarchy.insert(hierarchy.begin() + 1, &e); | ||||||
|  |     else | ||||||
|  |         hierarchy.push_front(&e); | ||||||
|  |     update_chain(); | ||||||
|  | } | ||||||
|  | void memory_hierarchy::append(memory_elem& e) { | ||||||
|  |     hierarchy.push_back(&e); | ||||||
|  |     update_chain(); | ||||||
|  | } | ||||||
|  | void memory_hierarchy::insert_before(memory_elem&) {} | ||||||
|  | void memory_hierarchy::insert_after(memory_elem&) {} | ||||||
|  | void memory_hierarchy::replace_last(memory_elem& e) { | ||||||
|  |     auto old = hierarchy.back(); | ||||||
|  |     auto it = std::find_if(std::begin(owned_elems), std::end(owned_elems), | ||||||
|  |                            [old](std::unique_ptr<memory_elem> const& p) { return p.get() == old; }); | ||||||
|  |     hierarchy.pop_back(); | ||||||
|  |     if(it != std::end(owned_elems)) | ||||||
|  |         owned_elems.erase(it); | ||||||
|  |     hierarchy.push_back(&e); | ||||||
|  |     update_chain(); | ||||||
|  | } | ||||||
|  | void memory_hierarchy::update_chain() { | ||||||
|  |     bool tail = false; | ||||||
|  |     for(size_t i = 1; i < hierarchy.size(); ++i) { | ||||||
|  |         hierarchy[i - 1]->set_next(hierarchy[i]->get_mem_if()); | ||||||
|  |     } | ||||||
|  | } | ||||||
|  |  | ||||||
|  | void memory_hierarchy::prepend(std::unique_ptr<memory_elem>&& p) { | ||||||
|  |     prepend(*p); | ||||||
|  |     owned_elems.push_back(std::move(p)); | ||||||
|  | } | ||||||
|  |  | ||||||
|  | void memory_hierarchy::append(std::unique_ptr<memory_elem>&& p) { | ||||||
|  |     append(*p); | ||||||
|  |     owned_elems.push_back(std::move(p)); | ||||||
|  | } | ||||||
|  |  | ||||||
|  | void memory_hierarchy::insert_before(std::unique_ptr<memory_elem>&& p) { | ||||||
|  |     insert_before(*p); | ||||||
|  |     owned_elems.push_back(std::move(p)); | ||||||
|  | } | ||||||
|  |  | ||||||
|  | void memory_hierarchy::insert_after(std::unique_ptr<memory_elem>&& p) { | ||||||
|  |     insert_after(*p); | ||||||
|  |     owned_elems.push_back(std::move(p)); | ||||||
|  | } | ||||||
|  |  | ||||||
|  | void memory_hierarchy::replace_last(std::unique_ptr<memory_elem>&& p) { | ||||||
|  |     replace_last(*p); | ||||||
|  |     owned_elems.push_back(std::move(p)); | ||||||
|  | } | ||||||
|  |  | ||||||
|  | } // namespace mem | ||||||
|  | } // namespace iss | ||||||
							
								
								
									
										86
									
								
								src/iss/mem/memory_if.h
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										86
									
								
								src/iss/mem/memory_if.h
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,86 @@ | |||||||
|  | /******************************************************************************* | ||||||
|  |  * Copyright (C) 2025 MINRES Technologies GmbH | ||||||
|  |  * All rights reserved. | ||||||
|  |  * | ||||||
|  |  * Redistribution and use in source and binary forms, with or without | ||||||
|  |  * modification, are permitted provided that the following conditions are met: | ||||||
|  |  * | ||||||
|  |  * 1. Redistributions of source code must retain the above copyright notice, | ||||||
|  |  *    this list of conditions and the following disclaimer. | ||||||
|  |  * | ||||||
|  |  * 2. Redistributions in binary form must reproduce the above copyright notice, | ||||||
|  |  *    this list of conditions and the following disclaimer in the documentation | ||||||
|  |  *    and/or other materials provided with the distribution. | ||||||
|  |  * | ||||||
|  |  * 3. Neither the name of the copyright holder nor the names of its contributors | ||||||
|  |  *    may be used to endorse or promote products derived from this software | ||||||
|  |  *    without specific prior written permission. | ||||||
|  |  * | ||||||
|  |  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | ||||||
|  |  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | ||||||
|  |  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | ||||||
|  |  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE | ||||||
|  |  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR | ||||||
|  |  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF | ||||||
|  |  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS | ||||||
|  |  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN | ||||||
|  |  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) | ||||||
|  |  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE | ||||||
|  |  * POSSIBILITY OF SUCH DAMAGE. | ||||||
|  |  * | ||||||
|  |  * Contributors: | ||||||
|  |  *       eyck@minres.com - initial implementation | ||||||
|  |  ******************************************************************************/ | ||||||
|  |  | ||||||
|  | #ifndef _MEMORY_MEMORY_IF_ | ||||||
|  | #define _MEMORY_MEMORY_IF_ | ||||||
|  |  | ||||||
|  | #include "iss/vm_types.h" | ||||||
|  | #include <deque> | ||||||
|  | #include <functional> | ||||||
|  | #include <limits> | ||||||
|  | #include <memory> | ||||||
|  | #include <util/delegate.h> | ||||||
|  | #include <vector> | ||||||
|  |  | ||||||
|  | namespace iss { | ||||||
|  | namespace mem { | ||||||
|  |  | ||||||
|  | using rd_mem_func_sig = iss::status(iss::access_type, uint64_t, unsigned, uint8_t*); | ||||||
|  | using wr_mem_func_sig = iss::status(iss::access_type, uint64_t, unsigned, uint8_t const*); | ||||||
|  |  | ||||||
|  | struct memory_if { | ||||||
|  |     util::delegate<iss::status(access_type, uint64_t, unsigned, uint8_t*)> rd_mem; | ||||||
|  |     util::delegate<iss::status(access_type, uint64_t, unsigned, uint8_t const*)> wr_mem; | ||||||
|  | }; | ||||||
|  |  | ||||||
|  | struct memory_elem { | ||||||
|  |     virtual ~memory_elem() = default; | ||||||
|  |     virtual memory_if get_mem_if() = 0; | ||||||
|  |     virtual void set_next(memory_if) = 0; | ||||||
|  |     virtual std::tuple<uint64_t, uint64_t> get_range() { return {0, std::numeric_limits<uint64_t>::max()}; } | ||||||
|  | }; | ||||||
|  |  | ||||||
|  | struct memory_hierarchy { | ||||||
|  |     void root(memory_elem&); | ||||||
|  |     void prepend(memory_elem&); | ||||||
|  |     void append(memory_elem&); | ||||||
|  |     void insert_before(memory_elem&); | ||||||
|  |     void insert_after(memory_elem&); | ||||||
|  |     void replace_last(memory_elem&); | ||||||
|  |     void prepend(std::unique_ptr<memory_elem>&&); | ||||||
|  |     void append(std::unique_ptr<memory_elem>&&); | ||||||
|  |     void insert_before(std::unique_ptr<memory_elem>&&); | ||||||
|  |     void insert_after(std::unique_ptr<memory_elem>&&); | ||||||
|  |     void replace_last(std::unique_ptr<memory_elem>&&); | ||||||
|  |  | ||||||
|  | protected: | ||||||
|  |     void update_chain(); | ||||||
|  |     std::deque<memory_elem*> hierarchy; | ||||||
|  |     std::vector<std::unique_ptr<memory_elem>> owned_elems; | ||||||
|  |     bool root_set{false}; | ||||||
|  | }; | ||||||
|  |  | ||||||
|  | } // namespace mem | ||||||
|  | } // namespace iss | ||||||
|  | #endif | ||||||
							
								
								
									
										90
									
								
								src/iss/mem/memory_with_htif.h
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										90
									
								
								src/iss/mem/memory_with_htif.h
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,90 @@ | |||||||
|  | /******************************************************************************* | ||||||
|  |  * Copyright (C) 2025 MINRES Technologies GmbH | ||||||
|  |  * All rights reserved. | ||||||
|  |  * | ||||||
|  |  * Redistribution and use in source and binary forms, with or without | ||||||
|  |  * modification, are permitted provided that the following conditions are met: | ||||||
|  |  * | ||||||
|  |  * 1. Redistributions of source code must retain the above copyright notice, | ||||||
|  |  *    this list of conditions and the following disclaimer. | ||||||
|  |  * | ||||||
|  |  * 2. Redistributions in binary form must reproduce the above copyright notice, | ||||||
|  |  *    this list of conditions and the following disclaimer in the documentation | ||||||
|  |  *    and/or other materials provided with the distribution. | ||||||
|  |  * | ||||||
|  |  * 3. Neither the name of the copyright holder nor the names of its contributors | ||||||
|  |  *    may be used to endorse or promote products derived from this software | ||||||
|  |  *    without specific prior written permission. | ||||||
|  |  * | ||||||
|  |  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | ||||||
|  |  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | ||||||
|  |  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | ||||||
|  |  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE | ||||||
|  |  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR | ||||||
|  |  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF | ||||||
|  |  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS | ||||||
|  |  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN | ||||||
|  |  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) | ||||||
|  |  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE | ||||||
|  |  * POSSIBILITY OF SUCH DAMAGE. | ||||||
|  |  * | ||||||
|  |  * Contributors: | ||||||
|  |  *       eyck@minres.com - initial implementation | ||||||
|  |  ******************************************************************************/ | ||||||
|  |  | ||||||
|  | #ifndef _MEMORY_WITH_HTIF_ | ||||||
|  | #define _MEMORY_WITH_HTIF_ | ||||||
|  |  | ||||||
|  | #include "memory_if.h" | ||||||
|  | #include "iss/arch/riscv_hart_common.h" | ||||||
|  | #include "iss/vm_types.h" | ||||||
|  | #include <util/logging.h> | ||||||
|  | #include <util/sparse_array.h> | ||||||
|  |  | ||||||
|  | namespace iss { | ||||||
|  | namespace mem { | ||||||
|  | template <typename WORD_TYPE> struct memory_with_htif : public memory_elem { | ||||||
|  |     using this_class = memory_with_htif<WORD_TYPE>; | ||||||
|  |     constexpr static unsigned WORD_LEN = sizeof(WORD_TYPE) * 8; | ||||||
|  |  | ||||||
|  |     memory_with_htif(arch::priv_if<WORD_TYPE> hart_if) | ||||||
|  |     : hart_if(hart_if) {} | ||||||
|  |  | ||||||
|  |     ~memory_with_htif() = default; | ||||||
|  |  | ||||||
|  |     memory_if get_mem_if() override { | ||||||
|  |         return memory_if{.rd_mem{util::delegate<rd_mem_func_sig>::from<this_class, &this_class::read_mem>(this)}, | ||||||
|  |                          .wr_mem{util::delegate<wr_mem_func_sig>::from<this_class, &this_class::write_mem>(this)}}; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     void set_next(memory_if) override { | ||||||
|  |         // intenrionally left empty, leaf element | ||||||
|  |     } | ||||||
|  |  | ||||||
|  | private: | ||||||
|  |     iss::status read_mem(iss::access_type access, uint64_t addr, unsigned length, uint8_t* data) { | ||||||
|  |         for(auto offs = 0U; offs < length; ++offs) { | ||||||
|  |             *(data + offs) = mem[(addr + offs) % mem.size()]; | ||||||
|  |         } | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status write_mem(iss::access_type access, uint64_t addr, unsigned length, uint8_t const* data) { | ||||||
|  |         mem_type::page_type& p = mem(addr / mem.page_size); | ||||||
|  |         std::copy(data, data + length, p.data() + (addr & mem.page_addr_mask)); | ||||||
|  |         // this->tohost handling in case of riscv-test | ||||||
|  |         // according to https://github.com/riscv-software-src/riscv-isa-sim/issues/364#issuecomment-607657754: | ||||||
|  |         if(access && iss::access_type::FUNC && addr == hart_if.tohost) { | ||||||
|  |             return hart_if.exec_htif(data); | ||||||
|  |         } | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  | protected: | ||||||
|  |     using mem_type = util::sparse_array<uint8_t, 1ULL << 32>; | ||||||
|  |     mem_type mem; | ||||||
|  |     arch::priv_if<WORD_TYPE> hart_if; | ||||||
|  | }; | ||||||
|  | } // namespace mem | ||||||
|  | } // namespace iss | ||||||
|  | #endif // _MEMORY_WITH_HTIF_ | ||||||
							
								
								
									
										353
									
								
								src/iss/mem/mmu.h
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										353
									
								
								src/iss/mem/mmu.h
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,353 @@ | |||||||
|  | /******************************************************************************* | ||||||
|  |  * Copyright (C) 2025 MINRES Technologies GmbH | ||||||
|  |  * All rights reserved. | ||||||
|  |  * | ||||||
|  |  * Redistribution and use in source and binary forms, with or without | ||||||
|  |  * modification, are permitted provided that the following conditions are met: | ||||||
|  |  * | ||||||
|  |  * 1. Redistributions of source code must retain the above copyright notice, | ||||||
|  |  *    this list of conditions and the following disclaimer. | ||||||
|  |  * | ||||||
|  |  * 2. Redistributions in binary form must reproduce the above copyright notice, | ||||||
|  |  *    this list of conditions and the following disclaimer in the documentation | ||||||
|  |  *    and/or other materials provided with the distribution. | ||||||
|  |  * | ||||||
|  |  * 3. Neither the name of the copyright holder nor the names of its contributors | ||||||
|  |  *    may be used to endorse or promote products derived from this software | ||||||
|  |  *    without specific prior written permission. | ||||||
|  |  * | ||||||
|  |  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | ||||||
|  |  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | ||||||
|  |  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | ||||||
|  |  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE | ||||||
|  |  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR | ||||||
|  |  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF | ||||||
|  |  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS | ||||||
|  |  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN | ||||||
|  |  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) | ||||||
|  |  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE | ||||||
|  |  * POSSIBILITY OF SUCH DAMAGE. | ||||||
|  |  * | ||||||
|  |  * Contributors: | ||||||
|  |  *       eyck@minres.com - initial implementation | ||||||
|  |  ******************************************************************************/ | ||||||
|  |  | ||||||
|  | #include "iss/arch/riscv_hart_common.h" | ||||||
|  | #include "iss/vm_types.h" | ||||||
|  | #include "memory_if.h" | ||||||
|  | #include <util/logging.h> | ||||||
|  |  | ||||||
|  | namespace iss { | ||||||
|  | namespace mem { | ||||||
|  | enum { | ||||||
|  |     PGSHIFT = 12, | ||||||
|  |     PTE_PPN_SHIFT = 10, | ||||||
|  |     // page table entry (PTE) fields | ||||||
|  |     PTE_V = 0x001,   // Valid | ||||||
|  |     PTE_R = 0x002,   // Read | ||||||
|  |     PTE_W = 0x004,   // Write | ||||||
|  |     PTE_X = 0x008,   // Execute | ||||||
|  |     PTE_U = 0x010,   // User | ||||||
|  |     PTE_G = 0x020,   // Global | ||||||
|  |     PTE_A = 0x040,   // Accessed | ||||||
|  |     PTE_D = 0x080,   // Dirty | ||||||
|  |     PTE_SOFT = 0x300 // Reserved for Software | ||||||
|  | }; | ||||||
|  |  | ||||||
|  | template <typename T> inline bool PTE_TABLE(T PTE) { return (((PTE) & (PTE_V | PTE_R | PTE_W | PTE_X)) == PTE_V); } | ||||||
|  |  | ||||||
|  | struct vm_info { | ||||||
|  |     int levels; | ||||||
|  |     int idxbits; | ||||||
|  |     int ptesize; | ||||||
|  |     uint64_t ptbase; | ||||||
|  |     bool is_active() { return levels; } | ||||||
|  | }; | ||||||
|  |  | ||||||
|  | inline void read_reg_with_offset(uint32_t reg, uint8_t offs, uint8_t* const data, unsigned length) { | ||||||
|  |     auto reg_ptr = reinterpret_cast<uint8_t*>(®); | ||||||
|  |     switch(offs) { | ||||||
|  |     default: | ||||||
|  |         for(auto i = 0U; i < length; ++i) | ||||||
|  |             *(data + i) = *(reg_ptr + i); | ||||||
|  |         break; | ||||||
|  |     case 1: | ||||||
|  |         for(auto i = 0U; i < length; ++i) | ||||||
|  |             *(data + i) = *(reg_ptr + 1 + i); | ||||||
|  |         break; | ||||||
|  |     case 2: | ||||||
|  |         for(auto i = 0U; i < length; ++i) | ||||||
|  |             *(data + i) = *(reg_ptr + 2 + i); | ||||||
|  |         break; | ||||||
|  |     case 3: | ||||||
|  |         *data = *(reg_ptr + 3); | ||||||
|  |         break; | ||||||
|  |     } | ||||||
|  | } | ||||||
|  |  | ||||||
|  | inline void write_reg_with_offset(uint32_t& reg, uint8_t offs, const uint8_t* const data, unsigned length) { | ||||||
|  |     auto reg_ptr = reinterpret_cast<uint8_t*>(®); | ||||||
|  |     switch(offs) { | ||||||
|  |     default: | ||||||
|  |         for(auto i = 0U; i < length; ++i) | ||||||
|  |             *(reg_ptr + i) = *(data + i); | ||||||
|  |         break; | ||||||
|  |     case 1: | ||||||
|  |         for(auto i = 0U; i < length; ++i) | ||||||
|  |             *(reg_ptr + 1 + i) = *(data + i); | ||||||
|  |         break; | ||||||
|  |     case 2: | ||||||
|  |         for(auto i = 0U; i < length; ++i) | ||||||
|  |             *(reg_ptr + 2 + i) = *(data + i); | ||||||
|  |         break; | ||||||
|  |     case 3: | ||||||
|  |         *(reg_ptr + 3) = *data; | ||||||
|  |         break; | ||||||
|  |     } | ||||||
|  | } | ||||||
|  | // TODO: update vminfo on trap enter and leave as well as mstatus write, reset | ||||||
|  | template <typename WORD_TYPE> struct mmu : public memory_elem { | ||||||
|  |     using this_class = mmu<WORD_TYPE>; | ||||||
|  |     using reg_t = WORD_TYPE; | ||||||
|  |     constexpr static unsigned WORD_LEN = sizeof(WORD_TYPE) * 8; | ||||||
|  |  | ||||||
|  |     constexpr static reg_t PGSIZE = 1 << PGSHIFT; | ||||||
|  |     constexpr static reg_t PGMASK = PGSIZE - 1; | ||||||
|  |  | ||||||
|  |     mmu(arch::priv_if<WORD_TYPE> hart_if) | ||||||
|  |     : hart_if(hart_if) { | ||||||
|  |         hart_if.csr_rd_cb[satp] = MK_CSR_RD_CB(read_satp); | ||||||
|  |         hart_if.csr_wr_cb[satp] = MK_CSR_WR_CB(write_satp); | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     virtual ~mmu() = default; | ||||||
|  |  | ||||||
|  |     memory_if get_mem_if() override { | ||||||
|  |         return memory_if{.rd_mem{util::delegate<rd_mem_func_sig>::from<this_class, &this_class::read_mem>(this)}, | ||||||
|  |                          .wr_mem{util::delegate<wr_mem_func_sig>::from<this_class, &this_class::write_mem>(this)}}; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     void set_next(memory_if mem) override { down_stream_mem = mem; } | ||||||
|  |  | ||||||
|  | private: | ||||||
|  |     iss::status read_mem(iss::access_type access, uint64_t addr, unsigned length, uint8_t* data) { | ||||||
|  |         if(unlikely((addr & ~PGMASK) != ((addr + length - 1) & ~PGMASK))) { // we may cross a page boundary | ||||||
|  |             vm_info vm = decode_vm_info(hart_if.PRIV, satp); | ||||||
|  |             if(vm.levels != 0) { // VM is active | ||||||
|  |                 auto split_addr = (addr + length) & ~PGMASK; | ||||||
|  |                 auto len1 = split_addr - addr; | ||||||
|  |                 auto res = down_stream_mem.rd_mem(access, addr, len1, data); | ||||||
|  |                 if(res == iss::Ok) | ||||||
|  |                     res = down_stream_mem.rd_mem(access, split_addr, length - len1, data + len1); | ||||||
|  |                 return res; | ||||||
|  |             } | ||||||
|  |         } | ||||||
|  |         return down_stream_mem.rd_mem(access, addr, length, data); | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status write_mem(iss::access_type access, uint64_t addr, unsigned length, uint8_t const* data) { | ||||||
|  |         if(unlikely((addr & ~PGMASK) != ((addr + length - 1) & ~PGMASK))) { // we may cross a page boundary | ||||||
|  |             vm_info vm = decode_vm_info(hart_if.PRIV, satp); | ||||||
|  |             if(vm.levels != 0) { // VM is active | ||||||
|  |                 auto split_addr = (addr + length) & ~PGMASK; | ||||||
|  |                 auto len1 = split_addr - addr; | ||||||
|  |                 auto res = down_stream_mem.wr_mem(access, addr, len1, data); | ||||||
|  |                 if(res == iss::Ok) | ||||||
|  |                     res = down_stream_mem.wr_mem(access, split_addr, length - len1, data + len1); | ||||||
|  |                 return res; | ||||||
|  |             } | ||||||
|  |         } | ||||||
|  |         return down_stream_mem.wr_mem(access, virt2phys(access, addr), length, data); | ||||||
|  |     } | ||||||
|  |     void update_vm_info(); | ||||||
|  |  | ||||||
|  |     iss::status read_plain(unsigned addr, reg_t& val) { | ||||||
|  |         val = hart_if.csr[addr]; | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status write_plain(unsigned addr, reg_t const& val) { | ||||||
|  |         hart_if.csr[addr] = val; | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status read_satp(unsigned addr, reg_t& val) { | ||||||
|  |         auto tvm = bit_sub<20, 1>(hart_if.state.mstatus()); | ||||||
|  |         if(hart_if.PRIV == arch::PRIV_S & tvm != 0) { | ||||||
|  |             hart_if.raise_trap(2, 0, hart_if.PC); | ||||||
|  |             //            hart_if.reg.trap_state = (1 << 31) | (2 << 16); | ||||||
|  |             //            hart_if.fault_data = hart_if.reg.PC; | ||||||
|  |             return iss::Err; | ||||||
|  |         } | ||||||
|  |         val = satp; | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status write_satp(unsigned addr, reg_t val) { | ||||||
|  |         reg_t tvm = hart_if.state.mstatus.TVM; | ||||||
|  |         if(hart_if.PRIV == arch::PRIV_S & tvm != 0) { | ||||||
|  |             hart_if.raise_trap(2, 0, hart_if.PC); | ||||||
|  |             //            hart_if.reg.trap_state = (1 << 31) | (2 << 16); | ||||||
|  |             //            hart_if.fault_data = hart_if.reg.PC; | ||||||
|  |             return iss::Err; | ||||||
|  |         } | ||||||
|  |         satp = val; | ||||||
|  |         update_vm_info(); | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     uint64_t virt2phys(iss::access_type access, uint64_t addr); | ||||||
|  |  | ||||||
|  |     static inline vm_info decode_vm_info(uint32_t state, uint32_t sptbr) { | ||||||
|  |         if(state == arch::PRIV_M) | ||||||
|  |             return {0, 0, 0, 0}; | ||||||
|  |         if(state <= arch::PRIV_S) | ||||||
|  |             switch(bit_sub<31, 1>(sptbr)) { | ||||||
|  |             case 0: | ||||||
|  |                 return {0, 0, 0, 0}; // off | ||||||
|  |             case 1: | ||||||
|  |                 return {2, 10, 4, bit_sub<0, 22>(sptbr) << PGSHIFT}; // SV32 | ||||||
|  |             default: | ||||||
|  |                 abort(); | ||||||
|  |             } | ||||||
|  |         abort(); | ||||||
|  |         return {0, 0, 0, 0}; // dummy | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     static inline vm_info decode_vm_info(uint32_t state, uint64_t sptbr) { | ||||||
|  |         if(state == arch::PRIV_M) | ||||||
|  |             return {0, 0, 0, 0}; | ||||||
|  |         if(state <= arch::PRIV_S) | ||||||
|  |             switch(bit_sub<60, 4>(sptbr)) { | ||||||
|  |             case 0: | ||||||
|  |                 return {0, 0, 0, 0}; // off | ||||||
|  |             case 8: | ||||||
|  |                 return {3, 9, 8, bit_sub<0, 44>(sptbr) << PGSHIFT}; // SV39 | ||||||
|  |             case 9: | ||||||
|  |                 return {4, 9, 8, bit_sub<0, 44>(sptbr) << PGSHIFT}; // SV48 | ||||||
|  |             case 10: | ||||||
|  |                 return {5, 9, 8, bit_sub<0, 44>(sptbr) << PGSHIFT}; // SV57 | ||||||
|  |             case 11: | ||||||
|  |                 return {6, 9, 8, bit_sub<0, 44>(sptbr) << PGSHIFT}; // SV64 | ||||||
|  |             default: | ||||||
|  |                 abort(); | ||||||
|  |             } | ||||||
|  |         abort(); | ||||||
|  |         return {0, 0, 0, 0}; // dummy | ||||||
|  |     } | ||||||
|  |  | ||||||
|  | protected: | ||||||
|  |     reg_t satp; | ||||||
|  |     absl::flat_hash_map<reg_t, uint64_t> ptw; | ||||||
|  |     std::array<vm_info, 2> vmt; | ||||||
|  |     std::array<address_type, 4> addr_mode; | ||||||
|  |  | ||||||
|  |     arch::priv_if<WORD_TYPE> hart_if; | ||||||
|  |     memory_if down_stream_mem; | ||||||
|  | }; | ||||||
|  |  | ||||||
|  | template <typename WORD_TYPE> uint64_t mmu<WORD_TYPE>::virt2phys(iss::access_type access, uint64_t addr) { | ||||||
|  |     const auto type = access & iss::access_type::FUNC; | ||||||
|  |     auto it = ptw.find(addr >> PGSHIFT); | ||||||
|  |     if(it != ptw.end()) { | ||||||
|  |         const reg_t pte = it->second; | ||||||
|  |         const reg_t ad = PTE_A | (type == iss::access_type::WRITE) * PTE_D; | ||||||
|  | #ifdef RISCV_ENABLE_DIRTY | ||||||
|  |         // set accessed and possibly dirty bits. | ||||||
|  |         *(uint32_t*)ppte |= ad; | ||||||
|  |         return {addr.getAccessType(), addr.space, (pte & (~PGMASK)) | (addr.val & PGMASK)}; | ||||||
|  | #else | ||||||
|  |         // take exception if access or possibly dirty bit is not set. | ||||||
|  |         if((pte & ad) == ad) | ||||||
|  |             return {(pte & (~PGMASK)) | (addr & PGMASK)}; | ||||||
|  |         else | ||||||
|  |             ptw.erase(it); // throw an exception | ||||||
|  | #endif | ||||||
|  |     } else { | ||||||
|  |         uint32_t mode = type != iss::access_type::FETCH && hart_if.state.mstatus.MPRV ? // MPRV | ||||||
|  |                             hart_if.state.mstatus.MPP | ||||||
|  |                                                                                       : hart_if.PRIV; | ||||||
|  |  | ||||||
|  |         const vm_info& vm = vmt[static_cast<uint16_t>(type) / 2]; | ||||||
|  |  | ||||||
|  |         const bool s_mode = mode == arch::PRIV_S; | ||||||
|  |         const bool sum = hart_if.state.mstatus.SUM; | ||||||
|  |         const bool mxr = hart_if.state.mstatus.MXR; | ||||||
|  |  | ||||||
|  |         // verify bits xlen-1:va_bits-1 are all equal | ||||||
|  |         const int va_bits = PGSHIFT + vm.levels * vm.idxbits; | ||||||
|  |         const reg_t mask = (reg_t(1) << (sizeof(reg_t) * 8 - (va_bits - 1))) - 1; | ||||||
|  |         const reg_t masked_msbs = (addr >> (va_bits - 1)) & mask; | ||||||
|  |         const int levels = (masked_msbs != 0 && masked_msbs != mask) ? 0 : vm.levels; | ||||||
|  |  | ||||||
|  |         reg_t base = vm.ptbase; | ||||||
|  |         for(int i = levels - 1; i >= 0; i--) { | ||||||
|  |             const int ptshift = i * vm.idxbits; | ||||||
|  |             const reg_t idx = (addr >> (PGSHIFT + ptshift)) & ((1 << vm.idxbits) - 1); | ||||||
|  |  | ||||||
|  |             // check that physical address of PTE is legal | ||||||
|  |             reg_t pte = 0; | ||||||
|  |             const uint8_t res = down_stream_mem.rd_mem(iss::access_type::READ, base + idx * vm.ptesize, vm.ptesize, (uint8_t*)&pte); | ||||||
|  |             if(res != 0) | ||||||
|  |                 throw arch::trap_load_access_fault(addr); | ||||||
|  |             const reg_t ppn = pte >> PTE_PPN_SHIFT; | ||||||
|  |  | ||||||
|  |             if(PTE_TABLE(pte)) { // next level of page table | ||||||
|  |                 base = ppn << PGSHIFT; | ||||||
|  |             } else if((pte & PTE_U) ? s_mode && (type == iss::access_type::FETCH || !sum) : !s_mode) { | ||||||
|  |                 break; | ||||||
|  |             } else if(!(pte & PTE_V) || (!(pte & PTE_R) && (pte & PTE_W))) { | ||||||
|  |                 break; | ||||||
|  |             } else if(type == (type == iss::access_type::FETCH  ? !(pte & PTE_X) | ||||||
|  |                                : type == iss::access_type::READ ? !(pte & PTE_R) && !(mxr && (pte & PTE_X)) | ||||||
|  |                                                                 : !((pte & PTE_R) && (pte & PTE_W)))) { | ||||||
|  |                 break; | ||||||
|  |             } else if((ppn & ((reg_t(1) << ptshift) - 1)) != 0) { | ||||||
|  |                 break; | ||||||
|  |             } else { | ||||||
|  |                 const reg_t ad = PTE_A | ((type == iss::access_type::WRITE) * PTE_D); | ||||||
|  | #ifdef RISCV_ENABLE_DIRTY | ||||||
|  |                 // set accessed and possibly dirty bits. | ||||||
|  |                 *(uint32_t*)ppte |= ad; | ||||||
|  | #else | ||||||
|  |                 // take exception if access or possibly dirty bit is not set. | ||||||
|  |                 if((pte & ad) != ad) | ||||||
|  |                     break; | ||||||
|  | #endif | ||||||
|  |                 // for superpage mappings, make a fake leaf PTE for the TLB's benefit. | ||||||
|  |                 const reg_t vpn = addr >> PGSHIFT; | ||||||
|  |                 const reg_t value = (ppn | (vpn & ((reg_t(1) << ptshift) - 1))) << PGSHIFT; | ||||||
|  |                 const reg_t offset = addr & PGMASK; | ||||||
|  |                 ptw[vpn] = value | (pte & 0xff); | ||||||
|  |                 return value | offset; | ||||||
|  |             } | ||||||
|  |         } | ||||||
|  |     } | ||||||
|  |     switch(type) { | ||||||
|  |     case access_type::FETCH: | ||||||
|  |         hart_if.raise_trap(12, 0, addr); | ||||||
|  |         throw arch::trap_instruction_page_fault(addr); | ||||||
|  |     case access_type::READ: | ||||||
|  |         hart_if.raise_trap(13, 0, addr); | ||||||
|  |         throw arch::trap_load_page_fault(addr); | ||||||
|  |     case access_type::WRITE: | ||||||
|  |         hart_if.raise_trap(15, 0, addr); | ||||||
|  |         throw arch::trap_store_page_fault(addr); | ||||||
|  |     default: | ||||||
|  |         abort(); | ||||||
|  |     } | ||||||
|  | } | ||||||
|  |  | ||||||
|  | template <typename WORD_TYPE> inline void mmu<WORD_TYPE>::update_vm_info() { | ||||||
|  |     vmt[1] = decode_vm_info(hart_if.PRIV, satp); | ||||||
|  |     addr_mode[3] = addr_mode[2] = vmt[1].is_active() ? iss::address_type::VIRTUAL : iss::address_type::PHYSICAL; | ||||||
|  |     if(hart_if.state.mstatus.MPRV) | ||||||
|  |         vmt[0] = decode_vm_info(hart_if.state.mstatus.MPP, satp); | ||||||
|  |     else | ||||||
|  |         vmt[0] = vmt[1]; | ||||||
|  |     addr_mode[1] = addr_mode[0] = vmt[0].is_active() ? iss::address_type::VIRTUAL : iss::address_type::PHYSICAL; | ||||||
|  |     ptw.clear(); | ||||||
|  | } | ||||||
|  |  | ||||||
|  | } // namespace mem | ||||||
|  | } // namespace iss | ||||||
							
								
								
									
										244
									
								
								src/iss/mem/pmp.h
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										244
									
								
								src/iss/mem/pmp.h
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,244 @@ | |||||||
|  | /******************************************************************************* | ||||||
|  |  * Copyright (C) 2025 MINRES Technologies GmbH | ||||||
|  |  * All rights reserved. | ||||||
|  |  * | ||||||
|  |  * Redistribution and use in source and binary forms, with or without | ||||||
|  |  * modification, are permitted provided that the following conditions are met: | ||||||
|  |  * | ||||||
|  |  * 1. Redistributions of source code must retain the above copyright notice, | ||||||
|  |  *    this list of conditions and the following disclaimer. | ||||||
|  |  * | ||||||
|  |  * 2. Redistributions in binary form must reproduce the above copyright notice, | ||||||
|  |  *    this list of conditions and the following disclaimer in the documentation | ||||||
|  |  *    and/or other materials provided with the distribution. | ||||||
|  |  * | ||||||
|  |  * 3. Neither the name of the copyright holder nor the names of its contributors | ||||||
|  |  *    may be used to endorse or promote products derived from this software | ||||||
|  |  *    without specific prior written permission. | ||||||
|  |  * | ||||||
|  |  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | ||||||
|  |  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | ||||||
|  |  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | ||||||
|  |  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE | ||||||
|  |  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR | ||||||
|  |  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF | ||||||
|  |  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS | ||||||
|  |  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN | ||||||
|  |  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) | ||||||
|  |  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE | ||||||
|  |  * POSSIBILITY OF SUCH DAMAGE. | ||||||
|  |  * | ||||||
|  |  * Contributors: | ||||||
|  |  *       eyck@minres.com - initial implementation | ||||||
|  |  ******************************************************************************/ | ||||||
|  |  | ||||||
|  | #include "memory_if.h" | ||||||
|  | #include "iss/arch/riscv_hart_common.h" | ||||||
|  | #include "iss/vm_types.h" | ||||||
|  | #include <util/logging.h> | ||||||
|  |  | ||||||
|  | namespace iss { | ||||||
|  | namespace mem { | ||||||
|  | struct clic_config { | ||||||
|  |     uint64_t clic_base{0xc0000000}; | ||||||
|  |     unsigned clic_int_ctl_bits{4}; | ||||||
|  |     unsigned clic_num_irq{16}; | ||||||
|  |     unsigned clic_num_trigger{0}; | ||||||
|  |     bool nmode{false}; | ||||||
|  | }; | ||||||
|  |  | ||||||
|  | inline void read_reg_with_offset(uint32_t reg, uint8_t offs, uint8_t* const data, unsigned length) { | ||||||
|  |     auto reg_ptr = reinterpret_cast<uint8_t*>(®); | ||||||
|  |     switch(offs) { | ||||||
|  |     default: | ||||||
|  |         for(auto i = 0U; i < length; ++i) | ||||||
|  |             *(data + i) = *(reg_ptr + i); | ||||||
|  |         break; | ||||||
|  |     case 1: | ||||||
|  |         for(auto i = 0U; i < length; ++i) | ||||||
|  |             *(data + i) = *(reg_ptr + 1 + i); | ||||||
|  |         break; | ||||||
|  |     case 2: | ||||||
|  |         for(auto i = 0U; i < length; ++i) | ||||||
|  |             *(data + i) = *(reg_ptr + 2 + i); | ||||||
|  |         break; | ||||||
|  |     case 3: | ||||||
|  |         *data = *(reg_ptr + 3); | ||||||
|  |         break; | ||||||
|  |     } | ||||||
|  | } | ||||||
|  |  | ||||||
|  | inline void write_reg_with_offset(uint32_t& reg, uint8_t offs, const uint8_t* const data, unsigned length) { | ||||||
|  |     auto reg_ptr = reinterpret_cast<uint8_t*>(®); | ||||||
|  |     switch(offs) { | ||||||
|  |     default: | ||||||
|  |         for(auto i = 0U; i < length; ++i) | ||||||
|  |             *(reg_ptr + i) = *(data + i); | ||||||
|  |         break; | ||||||
|  |     case 1: | ||||||
|  |         for(auto i = 0U; i < length; ++i) | ||||||
|  |             *(reg_ptr + 1 + i) = *(data + i); | ||||||
|  |         break; | ||||||
|  |     case 2: | ||||||
|  |         for(auto i = 0U; i < length; ++i) | ||||||
|  |             *(reg_ptr + 2 + i) = *(data + i); | ||||||
|  |         break; | ||||||
|  |     case 3: | ||||||
|  |         *(reg_ptr + 3) = *data; | ||||||
|  |         break; | ||||||
|  |     } | ||||||
|  | } | ||||||
|  |  | ||||||
|  | template <typename WORD_TYPE> struct pmp : public memory_elem { | ||||||
|  |     using this_class = pmp<WORD_TYPE>; | ||||||
|  |     using reg_t = WORD_TYPE; | ||||||
|  |     constexpr static unsigned WORD_LEN = sizeof(WORD_TYPE) * 8; | ||||||
|  |  | ||||||
|  |     pmp(arch::priv_if<WORD_TYPE> hart_if) | ||||||
|  |     : hart_if(hart_if) { | ||||||
|  |         for(size_t i = arch::pmpaddr0; i <= arch::pmpaddr15; ++i) { | ||||||
|  |             hart_if.csr_rd_cb[i] = MK_CSR_RD_CB(read_plain); | ||||||
|  |             hart_if.csr_wr_cb[i] = MK_CSR_WR_CB(write_plain); | ||||||
|  |         } | ||||||
|  |         for(size_t i = arch::pmpcfg0; i < arch::pmpcfg0 + 16 / sizeof(reg_t); ++i) { | ||||||
|  |             hart_if.csr_rd_cb[i] = MK_CSR_RD_CB(read_plain); | ||||||
|  |             hart_if.csr_wr_cb[i] = MK_CSR_WR_CB(write_pmpcfg); | ||||||
|  |         } | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     virtual ~pmp() = default; | ||||||
|  |  | ||||||
|  |     memory_if get_mem_if() override { | ||||||
|  |         return memory_if{.rd_mem{util::delegate<rd_mem_func_sig>::from<this_class, &this_class::read_mem>(this)}, | ||||||
|  |                          .wr_mem{util::delegate<wr_mem_func_sig>::from<this_class, &this_class::write_mem>(this)}}; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     void set_next(memory_if mem) override { down_stream_mem = mem; } | ||||||
|  |  | ||||||
|  | private: | ||||||
|  |     iss::status read_mem(iss::access_type access, uint64_t addr, unsigned length, uint8_t* data) { | ||||||
|  |         if(!pmp_check(access, addr, length) && !is_debug(access)) { | ||||||
|  |             hart_if.fault_data = addr; | ||||||
|  |             if(is_debug(access)) | ||||||
|  |                 throw trap_access(0, addr); | ||||||
|  |             hart_if.reg.trap_state = (1UL << 31) | ((access == access_type::FETCH ? 1 : 5) << 16); // issue trap 1 | ||||||
|  |             return iss::Err; | ||||||
|  |         } | ||||||
|  |         return down_stream_mem.rd_mem(access, addr, length, data); | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status write_mem(iss::access_type access, uint64_t addr, unsigned length, uint8_t const* data) { | ||||||
|  |         if(!pmp_check(access, addr, length) && !is_debug(access)) { | ||||||
|  |             hart_if.fault_data = addr; | ||||||
|  |             if(is_debug(access)) | ||||||
|  |                 throw trap_access(0, addr); | ||||||
|  |             hart_if.reg.trap_state = (1UL << 31) | (7 << 16); // issue trap 1 | ||||||
|  |             return iss::Err; | ||||||
|  |         } | ||||||
|  |         return down_stream_mem.wr_mem(access, addr, length, data); | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status read_plain(unsigned addr, reg_t& val) { | ||||||
|  |         val = hart_if.csr[addr]; | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status write_plain(unsigned addr, reg_t const& val) { | ||||||
|  |         hart_if.csr[addr] = val; | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status write_pmpcfg(unsigned addr, reg_t val) { | ||||||
|  |         hart_if.csr[addr] = val & 0x9f9f9f9f; | ||||||
|  |         return iss::Ok; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     bool pmp_check(const access_type type, const uint64_t addr, const unsigned len); | ||||||
|  |  | ||||||
|  | protected: | ||||||
|  |     arch::priv_if<WORD_TYPE> hart_if; | ||||||
|  |     memory_if down_stream_mem; | ||||||
|  | }; | ||||||
|  |  | ||||||
|  | template <typename WORD_TYPE> bool pmp<WORD_TYPE>::pmp_check(const access_type type, const uint64_t addr, const unsigned len) { | ||||||
|  |     constexpr auto PMP_SHIFT = 2U; | ||||||
|  |     constexpr auto PMP_R = 0x1U; | ||||||
|  |     constexpr auto PMP_W = 0x2U; | ||||||
|  |     constexpr auto PMP_X = 0x4U; | ||||||
|  |     constexpr auto PMP_A = 0x18U; | ||||||
|  |     constexpr auto PMP_L = 0x80U; | ||||||
|  |     constexpr auto PMP_TOR = 0x1U; | ||||||
|  |     constexpr auto PMP_NA4 = 0x2U; | ||||||
|  |     constexpr auto PMP_NAPOT = 0x3U; | ||||||
|  |     reg_t base = 0; | ||||||
|  |     auto any_active = false; | ||||||
|  |     auto const cfg_reg_size = sizeof(reg_t); | ||||||
|  |     for(size_t i = 0; i < 16; i++) { | ||||||
|  |         reg_t tor = hart_if.csr[arch::pmpaddr0 + i] << PMP_SHIFT; | ||||||
|  |         uint8_t cfg = hart_if.csr[arch::pmpcfg0 + (i / cfg_reg_size)] >> (i % cfg_reg_size); | ||||||
|  |         if(cfg & PMP_A) { | ||||||
|  |             any_active = true; | ||||||
|  |             auto pmp_a = (cfg & PMP_A) >> 3; | ||||||
|  |             auto is_tor = pmp_a == PMP_TOR; | ||||||
|  |             auto is_na4 = pmp_a == PMP_NA4; | ||||||
|  |  | ||||||
|  |             reg_t mask = (hart_if.csr[arch::pmpaddr0 + i] << 1) | (!is_na4); | ||||||
|  |             mask = ~(mask & ~(mask + 1)) << PMP_SHIFT; | ||||||
|  |  | ||||||
|  |             // Check each 4-byte sector of the access | ||||||
|  |             auto any_match = false; | ||||||
|  |             auto all_match = true; | ||||||
|  |             for(reg_t offset = 0; offset < len; offset += 1 << PMP_SHIFT) { | ||||||
|  |                 reg_t cur_addr = addr + offset; | ||||||
|  |                 auto napot_match = ((cur_addr ^ tor) & mask) == 0; | ||||||
|  |                 auto tor_match = base <= (cur_addr + len - 1) && cur_addr < tor; | ||||||
|  |                 auto match = is_tor ? tor_match : napot_match; | ||||||
|  |                 any_match |= match; | ||||||
|  |                 all_match &= match; | ||||||
|  |             } | ||||||
|  |             if(any_match) { | ||||||
|  |                 // If the PMP matches only a strict subset of the access, fail it | ||||||
|  |                 if(!all_match) | ||||||
|  |                     return false; | ||||||
|  |                 return (hart_if.reg.PRIV == arch::PRIV_M && !(cfg & PMP_L)) || (type == access_type::READ && (cfg & PMP_R)) || | ||||||
|  |                        (type == access_type::WRITE && (cfg & PMP_W)) || (type == access_type::FETCH && (cfg & PMP_X)); | ||||||
|  |             } | ||||||
|  |         } | ||||||
|  |         base = tor; | ||||||
|  |     } | ||||||
|  |     //    constexpr auto pmp_num_regs = 16; | ||||||
|  |     //    reg_t tor_base = 0; | ||||||
|  |     //    auto any_active = false; | ||||||
|  |     //    auto lower_addr = addr >>2; | ||||||
|  |     //    auto upper_addr = (addr+len-1)>>2; | ||||||
|  |     //    for (size_t i = 0; i < pmp_num_regs; i++) { | ||||||
|  |     //        uint8_t cfg = csr[pmpcfg0+(i/4)]>>(i%4); | ||||||
|  |     //        uint8_t cfg_next = i==(pmp_num_regs-1)? 0 : csr[pmpcfg0+((i+1)/4)]>>((i+1)%4); | ||||||
|  |     //        auto pmpaddr = csr[pmpaddr0+i]; | ||||||
|  |     //        if (cfg & PMP_A) { | ||||||
|  |     //            any_active=true; | ||||||
|  |     //            auto is_tor = bit_sub<3, 2>(cfg) == PMP_TOR; | ||||||
|  |     //            auto is_napot = bit_sub<4, 1>(cfg) && bit_sub<3, 2>(cfg_next)!= PMP_TOR; | ||||||
|  |     //            if(is_napot) { | ||||||
|  |     //                reg_t mask = bit_sub<3, 1>(cfg)?~( pmpaddr & ~(pmpaddr + 1)): 0x3fffffff; | ||||||
|  |     //                auto mpmpaddr = pmpaddr & mask; | ||||||
|  |     //                if((lower_addr&mask) == mpmpaddr && (upper_addr&mask)==mpmpaddr) | ||||||
|  |     //                    return  (hart_if.reg.PRIV == PRIV_M && !(cfg & PMP_L)) || | ||||||
|  |     //                            (type == access_type::READ && (cfg & PMP_R)) || | ||||||
|  |     //                            (type == access_type::WRITE && (cfg & PMP_W)) || | ||||||
|  |     //                            (type == access_type::FETCH && (cfg & PMP_X)); | ||||||
|  |     //            } else if(is_tor) { | ||||||
|  |     //                if(lower_addr>=tor_base && upper_addr<=pmpaddr) | ||||||
|  |     //                    return  (hart_if.reg.PRIV == PRIV_M && !(cfg & PMP_L)) || | ||||||
|  |     //                            (type == access_type::READ && (cfg & PMP_R)) || | ||||||
|  |     //                            (type == access_type::WRITE && (cfg & PMP_W)) || | ||||||
|  |     //                            (type == access_type::FETCH && (cfg & PMP_X)); | ||||||
|  |     //            } | ||||||
|  |     //        } | ||||||
|  |     //        tor_base = pmpaddr; | ||||||
|  |     //    } | ||||||
|  |     return !any_active || hart_if.reg.PRIV == arch::PRIV_M; | ||||||
|  | } | ||||||
|  |  | ||||||
|  | } // namespace mem | ||||||
|  | } // namespace iss | ||||||
| @@ -1,3 +1,37 @@ | |||||||
|  | /******************************************************************************* | ||||||
|  |  * Copyright (C) 2025 MINRES Technologies GmbH | ||||||
|  |  * All rights reserved. | ||||||
|  |  * | ||||||
|  |  * Redistribution and use in source and binary forms, with or without | ||||||
|  |  * modification, are permitted provided that the following conditions are met: | ||||||
|  |  * | ||||||
|  |  * 1. Redistributions of source code must retain the above copyright notice, | ||||||
|  |  *    this list of conditions and the following disclaimer. | ||||||
|  |  * | ||||||
|  |  * 2. Redistributions in binary form must reproduce the above copyright notice, | ||||||
|  |  *    this list of conditions and the following disclaimer in the documentation | ||||||
|  |  *    and/or other materials provided with the distribution. | ||||||
|  |  * | ||||||
|  |  * 3. Neither the name of the copyright holder nor the names of its contributors | ||||||
|  |  *    may be used to endorse or promote products derived from this software | ||||||
|  |  *    without specific prior written permission. | ||||||
|  |  * | ||||||
|  |  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | ||||||
|  |  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | ||||||
|  |  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | ||||||
|  |  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE | ||||||
|  |  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR | ||||||
|  |  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF | ||||||
|  |  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS | ||||||
|  |  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN | ||||||
|  |  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) | ||||||
|  |  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE | ||||||
|  |  * POSSIBILITY OF SUCH DAMAGE. | ||||||
|  |  * | ||||||
|  |  * Contributors: | ||||||
|  |  *       eyck@minres.com - initial implementation | ||||||
|  |  ******************************************************************************/ | ||||||
|  |  | ||||||
| #include "semihosting.h" | #include "semihosting.h" | ||||||
| #include <chrono> | #include <chrono> | ||||||
| #include <cstdint> | #include <cstdint> | ||||||
|   | |||||||
| @@ -1,3 +1,37 @@ | |||||||
|  | /******************************************************************************* | ||||||
|  |  * Copyright (C) 2025 MINRES Technologies GmbH | ||||||
|  |  * All rights reserved. | ||||||
|  |  * | ||||||
|  |  * Redistribution and use in source and binary forms, with or without | ||||||
|  |  * modification, are permitted provided that the following conditions are met: | ||||||
|  |  * | ||||||
|  |  * 1. Redistributions of source code must retain the above copyright notice, | ||||||
|  |  *    this list of conditions and the following disclaimer. | ||||||
|  |  * | ||||||
|  |  * 2. Redistributions in binary form must reproduce the above copyright notice, | ||||||
|  |  *    this list of conditions and the following disclaimer in the documentation | ||||||
|  |  *    and/or other materials provided with the distribution. | ||||||
|  |  * | ||||||
|  |  * 3. Neither the name of the copyright holder nor the names of its contributors | ||||||
|  |  *    may be used to endorse or promote products derived from this software | ||||||
|  |  *    without specific prior written permission. | ||||||
|  |  * | ||||||
|  |  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | ||||||
|  |  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | ||||||
|  |  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | ||||||
|  |  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE | ||||||
|  |  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR | ||||||
|  |  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF | ||||||
|  |  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS | ||||||
|  |  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN | ||||||
|  |  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) | ||||||
|  |  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE | ||||||
|  |  * POSSIBILITY OF SUCH DAMAGE. | ||||||
|  |  * | ||||||
|  |  * Contributors: | ||||||
|  |  *       eyck@minres.com - initial implementation | ||||||
|  |  ******************************************************************************/ | ||||||
|  |  | ||||||
| #ifndef _SEMIHOSTING_H_ | #ifndef _SEMIHOSTING_H_ | ||||||
| #define _SEMIHOSTING_H_ | #define _SEMIHOSTING_H_ | ||||||
| #include <chrono> | #include <chrono> | ||||||
|   | |||||||
							
								
								
									
										33
									
								
								src/main.cpp
									
									
									
									
									
								
							
							
						
						
									
										33
									
								
								src/main.cpp
									
									
									
									
									
								
							| @@ -40,6 +40,7 @@ | |||||||
| #include <vector> | #include <vector> | ||||||
|  |  | ||||||
| #include "iss/arch/tgc_mapper.h" | #include "iss/arch/tgc_mapper.h" | ||||||
|  | #include "util/logging.h" | ||||||
| #include <boost/lexical_cast.hpp> | #include <boost/lexical_cast.hpp> | ||||||
| #include <boost/program_options.hpp> | #include <boost/program_options.hpp> | ||||||
| #ifdef WITH_LLVM | #ifdef WITH_LLVM | ||||||
| @@ -69,7 +70,8 @@ int main(int argc, char* argv[]) { | |||||||
|         ("logfile,l", po::value<std::string>(), "Sets default log file.") |         ("logfile,l", po::value<std::string>(), "Sets default log file.") | ||||||
|         ("disass,d", po::value<std::string>()->implicit_value(""), "Enables disassembly") |         ("disass,d", po::value<std::string>()->implicit_value(""), "Enables disassembly") | ||||||
|         ("gdb-port,g", po::value<unsigned>()->default_value(0), "enable gdb server and specify port to use") |         ("gdb-port,g", po::value<unsigned>()->default_value(0), "enable gdb server and specify port to use") | ||||||
|         ("instructions,i", po::value<uint64_t>()->default_value(std::numeric_limits<uint64_t>::max()), "max. number of instructions to simulate") |         ("ilimit,i", po::value<uint64_t>()->default_value(std::numeric_limits<uint64_t>::max()), "max. number of instructions to simulate") | ||||||
|  |         ("flimit", po::value<uint64_t>()->default_value(std::numeric_limits<uint64_t>::max()), "max. number of fetches to simulate") | ||||||
|         ("reset,r", po::value<std::string>(), "reset address") |         ("reset,r", po::value<std::string>(), "reset address") | ||||||
|         ("dump-ir", "dump the intermediate representation") |         ("dump-ir", "dump the intermediate representation") | ||||||
|         ("elf,f", po::value<std::vector<std::string>>(), "ELF file(s) to load") |         ("elf,f", po::value<std::vector<std::string>>(), "ELF file(s) to load") | ||||||
| @@ -140,7 +142,10 @@ int main(int argc, char* argv[]) { | |||||||
|             std::tie(cpu, vm) = f.create(isa_opt, clim["gdb-port"].as<unsigned>(), &semihosting_cb); |             std::tie(cpu, vm) = f.create(isa_opt, clim["gdb-port"].as<unsigned>(), &semihosting_cb); | ||||||
|         } |         } | ||||||
|         if(!cpu) { |         if(!cpu) { | ||||||
|             CPPLOG(ERR) << "Could not create cpu for isa " << isa_opt << " and backend " << clim["backend"].as<std::string>() << std::endl; |             auto list = f.get_names(); | ||||||
|  |             std::sort(std::begin(list), std::end(list)); | ||||||
|  |             CPPLOG(ERR) << "Could not create cpu for isa " << isa_opt << " and backend " << clim["backend"].as<std::string>() << "\n" | ||||||
|  |                         << "Available implementations (core|platform|backend):\n  - " << util::join(list, "\n  - ") << std::endl; | ||||||
|             return 127; |             return 127; | ||||||
|         } |         } | ||||||
|         if(!vm) { |         if(!vm) { | ||||||
| @@ -202,21 +207,36 @@ int main(int argc, char* argv[]) { | |||||||
|         if(clim.count("elf")) |         if(clim.count("elf")) | ||||||
|             for(std::string input : clim["elf"].as<std::vector<std::string>>()) { |             for(std::string input : clim["elf"].as<std::vector<std::string>>()) { | ||||||
|                 auto start_addr = vm->get_arch()->load_file(input); |                 auto start_addr = vm->get_arch()->load_file(input); | ||||||
|                 if(start_addr.second) // FIXME: this always evaluates to true as load file always returns <sth, true> |                 if(start_addr.second) | ||||||
|                     start_address = start_addr.first; |                     start_address = start_addr.first; | ||||||
|  |                 else { | ||||||
|  |                     LOG(ERR) << "Error occured while loading file " << input << std::endl; | ||||||
|  |                     return 1; | ||||||
|  |                 } | ||||||
|             } |             } | ||||||
|         for(std::string input : args) { |         for(std::string input : args) { | ||||||
|             auto start_addr = vm->get_arch()->load_file(input); // treat remaining arguments as elf files |             auto start_addr = vm->get_arch()->load_file(input); // treat remaining arguments as elf files | ||||||
|             if(start_addr.second) // FIXME: this always evaluates to true as load file always returns <sth, true> |             if(start_addr.second) | ||||||
|                 start_address = start_addr.first; |                 start_address = start_addr.first; | ||||||
|  |             else { | ||||||
|  |                 LOG(ERR) << "Error occured while loading file " << input << std::endl; | ||||||
|  |                 return 1; | ||||||
|  |             } | ||||||
|         } |         } | ||||||
|         if(clim.count("reset")) { |         if(clim.count("reset")) { | ||||||
|             auto str = clim["reset"].as<std::string>(); |             auto str = clim["reset"].as<std::string>(); | ||||||
|             start_address = str.find("0x") == 0 ? std::stoull(str.substr(2), nullptr, 16) : std::stoull(str, nullptr, 10); |             start_address = str.find("0x") == 0 ? std::stoull(str.substr(2), nullptr, 16) : std::stoull(str, nullptr, 10); | ||||||
|         } |         } | ||||||
|         vm->reset(start_address); |         vm->reset(start_address); | ||||||
|         auto cycles = clim["instructions"].as<uint64_t>(); |         auto limit = clim["ilimit"].as<uint64_t>(); | ||||||
|         res = vm->start(cycles, dump); |         auto cond = iss::finish_cond_e::JUMP_TO_SELF; | ||||||
|  |         if(clim.count("flimit")) { | ||||||
|  |             cond = cond | iss::finish_cond_e::FCOUNT_LIMIT; | ||||||
|  |             limit = clim["flimit"].as<uint64_t>(); | ||||||
|  |         } else { | ||||||
|  |             cond = cond | iss::finish_cond_e::ICOUNT_LIMIT; | ||||||
|  |         } | ||||||
|  |         res = vm->start(limit, dump, cond); | ||||||
|  |  | ||||||
|         auto instr_if = vm->get_arch()->get_instrumentation_if(); |         auto instr_if = vm->get_arch()->get_instrumentation_if(); | ||||||
|         // this assumes a single input file |         // this assumes a single input file | ||||||
| @@ -239,6 +259,7 @@ int main(int argc, char* argv[]) { | |||||||
|                 LOG(ERR) << "Error opening file " << filename << std::endl; |                 LOG(ERR) << "Error opening file " << filename << std::endl; | ||||||
|                 return 1; |                 return 1; | ||||||
|             } |             } | ||||||
|  |             LOGGER(DEFAULT)::reporting_level() = logging::ERR; | ||||||
|             for(auto addr = start_addr; addr < end_addr; addr += data.size()) { |             for(auto addr = start_addr; addr < end_addr; addr += data.size()) { | ||||||
|                 vm->get_arch()->read(iss::address_type::PHYSICAL, iss::access_type::DEBUG_READ, 0 /*MEM*/, addr, data.size(), |                 vm->get_arch()->read(iss::address_type::PHYSICAL, iss::access_type::DEBUG_READ, 0 /*MEM*/, addr, data.size(), | ||||||
|                                      data.data()); // FIXME: get space from iss::arch::traits<ARCH>::mem_type_e::MEM |                                      data.data()); // FIXME: get space from iss::arch::traits<ARCH>::mem_type_e::MEM | ||||||
|   | |||||||
| @@ -1,5 +1,5 @@ | |||||||
| /******************************************************************************* | /******************************************************************************* | ||||||
|  * Copyright (C) 2017, 2018 MINRES Technologies GmbH |  * Copyright (C) 2017 - 2025 MINRES Technologies GmbH | ||||||
|  * All rights reserved. |  * All rights reserved. | ||||||
|  * |  * | ||||||
|  * Redistribution and use in source and binary forms, with or without |  * Redistribution and use in source and binary forms, with or without | ||||||
| @@ -42,7 +42,6 @@ | |||||||
| #include <iss/plugin/loader.h> | #include <iss/plugin/loader.h> | ||||||
| #endif | #endif | ||||||
| #include "sc_core_adapter_if.h" | #include "sc_core_adapter_if.h" | ||||||
| #include <iss/arch/tgc_mapper.h> |  | ||||||
| #include <scc/report.h> | #include <scc/report.h> | ||||||
| #include <util/ities.h> | #include <util/ities.h> | ||||||
| #include <iostream> | #include <iostream> | ||||||
| @@ -125,7 +124,7 @@ using vm_ptr = std::unique_ptr<iss::vm_if>; | |||||||
|  |  | ||||||
| class core_wrapper { | class core_wrapper { | ||||||
| public: | public: | ||||||
|     core_wrapper(core_complex* owner) |     core_wrapper(core_complex_if* owner) | ||||||
|     : owner(owner) {} |     : owner(owner) {} | ||||||
|  |  | ||||||
|     void reset(uint64_t addr) { vm->reset(addr); } |     void reset(uint64_t addr) { vm->reset(addr); } | ||||||
| @@ -181,7 +180,7 @@ public: | |||||||
|                                              "SystemC sub-commands: break <time>, print_time"}); |                                              "SystemC sub-commands: break <time>, print_time"}); | ||||||
|     } |     } | ||||||
|  |  | ||||||
|     core_complex* const owner; |     core_complex_if* const owner; | ||||||
|     vm_ptr vm{nullptr}; |     vm_ptr vm{nullptr}; | ||||||
|     sc_cpu_ptr cpu{nullptr}; |     sc_cpu_ptr cpu{nullptr}; | ||||||
|     iss::debugger::target_adapter_if* tgt_adapter{nullptr}; |     iss::debugger::target_adapter_if* tgt_adapter{nullptr}; | ||||||
| @@ -197,9 +196,9 @@ struct core_trace { | |||||||
|     scv_tr_handle tr_handle; |     scv_tr_handle tr_handle; | ||||||
| }; | }; | ||||||
|  |  | ||||||
| SC_HAS_PROCESS(core_complex); // NOLINT |  | ||||||
| #ifndef CWR_SYSTEMC | #ifndef CWR_SYSTEMC | ||||||
| core_complex::core_complex(sc_module_name const& name) | template <unsigned int BUSWIDTH> | ||||||
|  | core_complex<BUSWIDTH>::core_complex(sc_module_name const& name) | ||||||
| : sc_module(name) | : sc_module(name) | ||||||
| , fetch_lut(tlm_dmi_ext()) | , fetch_lut(tlm_dmi_ext()) | ||||||
| , read_lut(tlm_dmi_ext()) | , read_lut(tlm_dmi_ext()) | ||||||
| @@ -208,7 +207,7 @@ core_complex::core_complex(sc_module_name const& name) | |||||||
| } | } | ||||||
| #endif | #endif | ||||||
|  |  | ||||||
| void core_complex::init() { | template <unsigned int BUSWIDTH> void core_complex<BUSWIDTH>::init() { | ||||||
|     trc = new core_trace(); |     trc = new core_trace(); | ||||||
|     ibus.register_invalidate_direct_mem_ptr([=](uint64_t start, uint64_t end) -> void { |     ibus.register_invalidate_direct_mem_ptr([=](uint64_t start, uint64_t end) -> void { | ||||||
|         auto lut_entry = fetch_lut.getEntry(start); |         auto lut_entry = fetch_lut.getEntry(start); | ||||||
| @@ -227,6 +226,7 @@ void core_complex::init() { | |||||||
|         } |         } | ||||||
|     }); |     }); | ||||||
|  |  | ||||||
|  |     SC_HAS_PROCESS(core_complex<BUSWIDTH>); // NOLINT | ||||||
|     SC_THREAD(run); |     SC_THREAD(run); | ||||||
|     SC_METHOD(rst_cb); |     SC_METHOD(rst_cb); | ||||||
|     sensitive << rst_i; |     sensitive << rst_i; | ||||||
| @@ -252,16 +252,16 @@ void core_complex::init() { | |||||||
| #endif | #endif | ||||||
| } | } | ||||||
|  |  | ||||||
| core_complex::~core_complex() { | template <unsigned int BUSWIDTH> core_complex<BUSWIDTH>::~core_complex() { | ||||||
|     delete cpu; |     delete cpu; | ||||||
|     delete trc; |     delete trc; | ||||||
|     for(auto* p : plugin_list) |     for(auto* p : plugin_list) | ||||||
|         delete p; |         delete p; | ||||||
| } | } | ||||||
|  |  | ||||||
| void core_complex::trace(sc_trace_file* trf) const {} | template <unsigned int BUSWIDTH> void core_complex<BUSWIDTH>::trace(sc_trace_file* trf) const {} | ||||||
|  |  | ||||||
| void core_complex::before_end_of_elaboration() { | template <unsigned int BUSWIDTH> void core_complex<BUSWIDTH>::before_end_of_elaboration() { | ||||||
|     SCCDEBUG(SCMOD) << "instantiating iss::arch::tgf with " << GET_PROP_VALUE(backend) << " backend"; |     SCCDEBUG(SCMOD) << "instantiating iss::arch::tgf with " << GET_PROP_VALUE(backend) << " backend"; | ||||||
|     // cpu = scc::make_unique<core_wrapper>(this); |     // cpu = scc::make_unique<core_wrapper>(this); | ||||||
|     cpu = new core_wrapper(this); |     cpu = new core_wrapper(this); | ||||||
| @@ -302,7 +302,7 @@ void core_complex::before_end_of_elaboration() { | |||||||
|     } |     } | ||||||
| } | } | ||||||
|  |  | ||||||
| void core_complex::start_of_simulation() { | template <unsigned int BUSWIDTH> void core_complex<BUSWIDTH>::start_of_simulation() { | ||||||
|     // quantum_keeper.reset(); |     // quantum_keeper.reset(); | ||||||
|     if(GET_PROP_VALUE(elf_file).size() > 0) { |     if(GET_PROP_VALUE(elf_file).size() > 0) { | ||||||
|         istringstream is(GET_PROP_VALUE(elf_file)); |         istringstream is(GET_PROP_VALUE(elf_file)); | ||||||
| @@ -325,7 +325,7 @@ void core_complex::start_of_simulation() { | |||||||
|     } |     } | ||||||
| } | } | ||||||
|  |  | ||||||
| bool core_complex::disass_output(uint64_t pc, const std::string instr_str) { | template <unsigned int BUSWIDTH> bool core_complex<BUSWIDTH>::disass_output(uint64_t pc, const std::string instr_str) { | ||||||
|     if(trc->m_db == nullptr) |     if(trc->m_db == nullptr) | ||||||
|         return false; |         return false; | ||||||
|     if(trc->tr_handle.is_active()) |     if(trc->tr_handle.is_active()) | ||||||
| @@ -339,7 +339,7 @@ bool core_complex::disass_output(uint64_t pc, const std::string instr_str) { | |||||||
|     return true; |     return true; | ||||||
| } | } | ||||||
|  |  | ||||||
| void core_complex::forward() { | template <unsigned int BUSWIDTH> void core_complex<BUSWIDTH>::forward() { | ||||||
| #ifndef CWR_SYSTEMC | #ifndef CWR_SYSTEMC | ||||||
|     set_clock_period(clk_i.read()); |     set_clock_period(clk_i.read()); | ||||||
| #else | #else | ||||||
| @@ -348,24 +348,24 @@ void core_complex::forward() { | |||||||
| #endif | #endif | ||||||
| } | } | ||||||
|  |  | ||||||
| void core_complex::set_clock_period(sc_core::sc_time period) { | template <unsigned int BUSWIDTH> void core_complex<BUSWIDTH>::set_clock_period(sc_core::sc_time period) { | ||||||
|     curr_clk = period; |     curr_clk = period; | ||||||
|     if(period == SC_ZERO_TIME) |     if(period == SC_ZERO_TIME) | ||||||
|         cpu->set_interrupt_execution(true); |         cpu->set_interrupt_execution(true); | ||||||
| } | } | ||||||
|  |  | ||||||
| void core_complex::rst_cb() { | template <unsigned int BUSWIDTH> void core_complex<BUSWIDTH>::rst_cb() { | ||||||
|     if(rst_i.read()) |     if(rst_i.read()) | ||||||
|         cpu->set_interrupt_execution(true); |         cpu->set_interrupt_execution(true); | ||||||
| } | } | ||||||
|  |  | ||||||
| void core_complex::sw_irq_cb() { cpu->local_irq(3, sw_irq_i.read()); } | template <unsigned int BUSWIDTH> void core_complex<BUSWIDTH>::sw_irq_cb() { cpu->local_irq(3, sw_irq_i.read()); } | ||||||
|  |  | ||||||
| void core_complex::timer_irq_cb() { cpu->local_irq(7, timer_irq_i.read()); } | template <unsigned int BUSWIDTH> void core_complex<BUSWIDTH>::timer_irq_cb() { cpu->local_irq(7, timer_irq_i.read()); } | ||||||
|  |  | ||||||
| void core_complex::ext_irq_cb() { cpu->local_irq(11, ext_irq_i.read()); } | template <unsigned int BUSWIDTH> void core_complex<BUSWIDTH>::ext_irq_cb() { cpu->local_irq(11, ext_irq_i.read()); } | ||||||
|  |  | ||||||
| void core_complex::local_irq_cb() { | template <unsigned int BUSWIDTH> void core_complex<BUSWIDTH>::local_irq_cb() { | ||||||
|     for(auto i = 0U; i < local_irq_i.size(); ++i) { |     for(auto i = 0U; i < local_irq_i.size(); ++i) { | ||||||
|         if(local_irq_i[i].event()) { |         if(local_irq_i[i].event()) { | ||||||
|             cpu->local_irq(16 + i, local_irq_i[i].read()); |             cpu->local_irq(16 + i, local_irq_i[i].read()); | ||||||
| @@ -373,7 +373,7 @@ void core_complex::local_irq_cb() { | |||||||
|     } |     } | ||||||
| } | } | ||||||
|  |  | ||||||
| void core_complex::run() { | template <unsigned int BUSWIDTH> void core_complex<BUSWIDTH>::run() { | ||||||
|     wait(SC_ZERO_TIME); // separate from elaboration phase |     wait(SC_ZERO_TIME); // separate from elaboration phase | ||||||
|     do { |     do { | ||||||
|         wait(SC_ZERO_TIME); |         wait(SC_ZERO_TIME); | ||||||
| @@ -387,11 +387,11 @@ void core_complex::run() { | |||||||
|         quantum_keeper.reset(); |         quantum_keeper.reset(); | ||||||
|         cpu->set_interrupt_execution(false); |         cpu->set_interrupt_execution(false); | ||||||
|         cpu->start(dump_ir); |         cpu->start(dump_ir); | ||||||
|     } while(cpu->get_interrupt_execution()); |     } while(!cpu->get_interrupt_execution()); | ||||||
|     sc_stop(); |     sc_stop(); | ||||||
| } | } | ||||||
|  |  | ||||||
| bool core_complex::read_mem(uint64_t addr, unsigned length, uint8_t* const data, bool is_fetch) { | template <unsigned int BUSWIDTH> bool core_complex<BUSWIDTH>::read_mem(uint64_t addr, unsigned length, uint8_t* const data, bool is_fetch) { | ||||||
|     auto& dmi_lut = is_fetch ? fetch_lut : read_lut; |     auto& dmi_lut = is_fetch ? fetch_lut : read_lut; | ||||||
|     auto lut_entry = dmi_lut.getEntry(addr); |     auto lut_entry = dmi_lut.getEntry(addr); | ||||||
|     if(lut_entry.get_granted_access() != tlm::tlm_dmi::DMI_ACCESS_NONE && addr + length <= lut_entry.get_end_address() + 1) { |     if(lut_entry.get_granted_access() != tlm::tlm_dmi::DMI_ACCESS_NONE && addr + length <= lut_entry.get_end_address() + 1) { | ||||||
| @@ -419,7 +419,7 @@ bool core_complex::read_mem(uint64_t addr, unsigned length, uint8_t* const data, | |||||||
|             gp.set_extension(preExt); |             gp.set_extension(preExt); | ||||||
|         } |         } | ||||||
|         auto pre_delay = delay; |         auto pre_delay = delay; | ||||||
|         dbus->b_transport(gp, delay); |         sckt->b_transport(gp, delay); | ||||||
|         if(pre_delay > delay) { |         if(pre_delay > delay) { | ||||||
|             quantum_keeper.reset(); |             quantum_keeper.reset(); | ||||||
|         } else { |         } else { | ||||||
| @@ -449,7 +449,7 @@ bool core_complex::read_mem(uint64_t addr, unsigned length, uint8_t* const data, | |||||||
|     } |     } | ||||||
| } | } | ||||||
|  |  | ||||||
| bool core_complex::write_mem(uint64_t addr, unsigned length, const uint8_t* const data) { | template <unsigned int BUSWIDTH> bool core_complex<BUSWIDTH>::write_mem(uint64_t addr, unsigned length, const uint8_t* const data) { | ||||||
|     auto lut_entry = write_lut.getEntry(addr); |     auto lut_entry = write_lut.getEntry(addr); | ||||||
|     if(lut_entry.get_granted_access() != tlm::tlm_dmi::DMI_ACCESS_NONE && addr + length <= lut_entry.get_end_address() + 1) { |     if(lut_entry.get_granted_access() != tlm::tlm_dmi::DMI_ACCESS_NONE && addr + length <= lut_entry.get_end_address() + 1) { | ||||||
|         auto offset = addr - lut_entry.get_start_address(); |         auto offset = addr - lut_entry.get_start_address(); | ||||||
| @@ -497,7 +497,7 @@ bool core_complex::write_mem(uint64_t addr, unsigned length, const uint8_t* cons | |||||||
|     } |     } | ||||||
| } | } | ||||||
|  |  | ||||||
| bool core_complex::read_mem_dbg(uint64_t addr, unsigned length, uint8_t* const data) { | template <unsigned int BUSWIDTH> bool core_complex<BUSWIDTH>::read_mem_dbg(uint64_t addr, unsigned length, uint8_t* const data) { | ||||||
|     tlm::tlm_generic_payload gp; |     tlm::tlm_generic_payload gp; | ||||||
|     gp.set_command(tlm::TLM_READ_COMMAND); |     gp.set_command(tlm::TLM_READ_COMMAND); | ||||||
|     gp.set_address(addr); |     gp.set_address(addr); | ||||||
| @@ -507,7 +507,7 @@ bool core_complex::read_mem_dbg(uint64_t addr, unsigned length, uint8_t* const d | |||||||
|     return dbus->transport_dbg(gp) == length; |     return dbus->transport_dbg(gp) == length; | ||||||
| } | } | ||||||
|  |  | ||||||
| bool core_complex::write_mem_dbg(uint64_t addr, unsigned length, const uint8_t* const data) { | template <unsigned int BUSWIDTH> bool core_complex<BUSWIDTH>::write_mem_dbg(uint64_t addr, unsigned length, const uint8_t* const data) { | ||||||
|     write_buf.resize(length); |     write_buf.resize(length); | ||||||
|     std::copy(data, data + length, write_buf.begin()); // need to copy as TLM does not guarantee data integrity |     std::copy(data, data + length, write_buf.begin()); // need to copy as TLM does not guarantee data integrity | ||||||
|     tlm::tlm_generic_payload gp; |     tlm::tlm_generic_payload gp; | ||||||
| @@ -518,5 +518,10 @@ bool core_complex::write_mem_dbg(uint64_t addr, unsigned length, const uint8_t* | |||||||
|     gp.set_streaming_width(length); |     gp.set_streaming_width(length); | ||||||
|     return dbus->transport_dbg(gp) == length; |     return dbus->transport_dbg(gp) == length; | ||||||
| } | } | ||||||
|  |  | ||||||
|  | template class core_complex<scc::LT>; | ||||||
|  | template class core_complex<32>; | ||||||
|  | template class core_complex<64>; | ||||||
|  |  | ||||||
| } /* namespace tgfs */ | } /* namespace tgfs */ | ||||||
| } /* namespace sysc */ | } /* namespace sysc */ | ||||||
|   | |||||||
| @@ -1,5 +1,5 @@ | |||||||
| /******************************************************************************* | /******************************************************************************* | ||||||
|  * Copyright (C) 2017-2021 MINRES Technologies GmbH |  * Copyright (C) 2017 - 2025 MINRES Technologies GmbH | ||||||
|  * All rights reserved. |  * All rights reserved. | ||||||
|  * |  * | ||||||
|  * Redistribution and use in source and binary forms, with or without |  * Redistribution and use in source and binary forms, with or without | ||||||
| @@ -33,6 +33,7 @@ | |||||||
| #ifndef _SYSC_CORE_COMPLEX_H_ | #ifndef _SYSC_CORE_COMPLEX_H_ | ||||||
| #define _SYSC_CORE_COMPLEX_H_ | #define _SYSC_CORE_COMPLEX_H_ | ||||||
|  |  | ||||||
|  | #include <scc/signal_opt_ports.h> | ||||||
| #include <scc/tick2time.h> | #include <scc/tick2time.h> | ||||||
| #include <scc/traceable.h> | #include <scc/traceable.h> | ||||||
| #include <scc/utilities.h> | #include <scc/utilities.h> | ||||||
| @@ -40,10 +41,8 @@ | |||||||
| #include <tlm/scc/scv/tlm_rec_initiator_socket.h> | #include <tlm/scc/scv/tlm_rec_initiator_socket.h> | ||||||
| #ifdef CWR_SYSTEMC | #ifdef CWR_SYSTEMC | ||||||
| #include <scmlinc/scml_property.h> | #include <scmlinc/scml_property.h> | ||||||
| #define SOCKET_WIDTH 32 |  | ||||||
| #else | #else | ||||||
| #include <cci_configuration> | #include <cci_configuration> | ||||||
| #define SOCKET_WIDTH scc::LT |  | ||||||
| #endif | #endif | ||||||
| #include <memory> | #include <memory> | ||||||
| #include <tlm> | #include <tlm> | ||||||
| @@ -68,12 +67,35 @@ public: | |||||||
| namespace tgfs { | namespace tgfs { | ||||||
| class core_wrapper; | class core_wrapper; | ||||||
| struct core_trace; | struct core_trace; | ||||||
|  | struct core_complex_if { | ||||||
|  |  | ||||||
| class core_complex : public sc_core::sc_module, public scc::traceable { |     virtual ~core_complex_if() = default; | ||||||
|  |  | ||||||
|  |     virtual bool read_mem(uint64_t addr, unsigned length, uint8_t* const data, bool is_fetch) = 0; | ||||||
|  |  | ||||||
|  |     virtual bool write_mem(uint64_t addr, unsigned length, const uint8_t* const data) = 0; | ||||||
|  |  | ||||||
|  |     virtual bool read_mem_dbg(uint64_t addr, unsigned length, uint8_t* const data) = 0; | ||||||
|  |  | ||||||
|  |     virtual bool write_mem_dbg(uint64_t addr, unsigned length, const uint8_t* const data) = 0; | ||||||
|  |  | ||||||
|  |     virtual bool disass_output(uint64_t pc, const std::string instr) = 0; | ||||||
|  |  | ||||||
|  |     virtual unsigned get_last_bus_cycles() = 0; | ||||||
|  |  | ||||||
|  |     //! Allow quantum keeper handling | ||||||
|  |     virtual void sync(uint64_t) = 0; | ||||||
|  |  | ||||||
|  |     virtual char const* hier_name() = 0; | ||||||
|  |  | ||||||
|  |     scc::sc_in_opt<uint64_t> mtime_i{"mtime_i"}; | ||||||
|  | }; | ||||||
|  |  | ||||||
|  | template <unsigned int BUSWIDTH = scc::LT> class core_complex : public sc_core::sc_module, public scc::traceable, public core_complex_if { | ||||||
| public: | public: | ||||||
|     tlm::scc::initiator_mixin<tlm::tlm_initiator_socket<SOCKET_WIDTH>> ibus{"ibus"}; |     tlm::scc::initiator_mixin<tlm::tlm_initiator_socket<BUSWIDTH>> ibus{"ibus"}; | ||||||
|  |  | ||||||
|     tlm::scc::initiator_mixin<tlm::tlm_initiator_socket<SOCKET_WIDTH>> dbus{"dbus"}; |     tlm::scc::initiator_mixin<tlm::tlm_initiator_socket<BUSWIDTH>> dbus{"dbus"}; | ||||||
|  |  | ||||||
|     sc_core::sc_in<bool> rst_i{"rst_i"}; |     sc_core::sc_in<bool> rst_i{"rst_i"}; | ||||||
|  |  | ||||||
| @@ -88,8 +110,6 @@ public: | |||||||
| #ifndef CWR_SYSTEMC | #ifndef CWR_SYSTEMC | ||||||
|     sc_core::sc_in<sc_core::sc_time> clk_i{"clk_i"}; |     sc_core::sc_in<sc_core::sc_time> clk_i{"clk_i"}; | ||||||
|  |  | ||||||
|     sc_core::sc_port<tlm::tlm_peek_if<uint64_t>, 1, sc_core::SC_ZERO_OR_MORE_BOUND> mtime_o{"mtime_o"}; |  | ||||||
|  |  | ||||||
|     cci::cci_param<std::string> elf_file{"elf_file", ""}; |     cci::cci_param<std::string> elf_file{"elf_file", ""}; | ||||||
|  |  | ||||||
|     cci::cci_param<bool> enable_disass{"enable_disass", false}; |     cci::cci_param<bool> enable_disass{"enable_disass", false}; | ||||||
| @@ -115,8 +135,6 @@ public: | |||||||
| #else | #else | ||||||
|     sc_core::sc_in<bool> clk_i{"clk_i"}; |     sc_core::sc_in<bool> clk_i{"clk_i"}; | ||||||
|  |  | ||||||
|     sc_core::sc_in<uint64_t> mtime_i{"mtime_i"}; |  | ||||||
|  |  | ||||||
|     scml_property<std::string> elf_file{"elf_file", ""}; |     scml_property<std::string> elf_file{"elf_file", ""}; | ||||||
|  |  | ||||||
|     scml_property<bool> enable_disass{"enable_disass", false}; |     scml_property<bool> enable_disass{"enable_disass", false}; | ||||||
| @@ -159,13 +177,13 @@ public: | |||||||
|  |  | ||||||
|     ~core_complex(); |     ~core_complex(); | ||||||
|  |  | ||||||
|     inline unsigned get_last_bus_cycles() { |     unsigned get_last_bus_cycles() override { | ||||||
|         auto mem_incr = std::max(ibus_inc, dbus_inc); |         auto mem_incr = std::max(ibus_inc, dbus_inc); | ||||||
|         ibus_inc = dbus_inc = 0; |         ibus_inc = dbus_inc = 0; | ||||||
|         return mem_incr > 1 ? mem_incr : 1; |         return mem_incr > 1 ? mem_incr : 1; | ||||||
|     } |     } | ||||||
|  |  | ||||||
|     inline void sync(uint64_t cycle) { |     void sync(uint64_t cycle) override { | ||||||
|         auto core_inc = curr_clk * (cycle - last_sync_cycle); |         auto core_inc = curr_clk * (cycle - last_sync_cycle); | ||||||
|         quantum_keeper.inc(core_inc); |         quantum_keeper.inc(core_inc); | ||||||
|         if(quantum_keeper.need_sync()) { |         if(quantum_keeper.need_sync()) { | ||||||
| @@ -175,20 +193,22 @@ public: | |||||||
|         last_sync_cycle = cycle; |         last_sync_cycle = cycle; | ||||||
|     } |     } | ||||||
|  |  | ||||||
|     bool read_mem(uint64_t addr, unsigned length, uint8_t* const data, bool is_fetch); |     bool read_mem(uint64_t addr, unsigned length, uint8_t* const data, bool is_fetch) override; | ||||||
|  |  | ||||||
|     bool write_mem(uint64_t addr, unsigned length, const uint8_t* const data); |     bool write_mem(uint64_t addr, unsigned length, const uint8_t* const data) override; | ||||||
|  |  | ||||||
|     bool read_mem_dbg(uint64_t addr, unsigned length, uint8_t* const data); |     bool read_mem_dbg(uint64_t addr, unsigned length, uint8_t* const data) override; | ||||||
|  |  | ||||||
|     bool write_mem_dbg(uint64_t addr, unsigned length, const uint8_t* const data); |     bool write_mem_dbg(uint64_t addr, unsigned length, const uint8_t* const data) override; | ||||||
|  |  | ||||||
|     void trace(sc_core::sc_trace_file* trf) const override; |     void trace(sc_core::sc_trace_file* trf) const override; | ||||||
|  |  | ||||||
|     bool disass_output(uint64_t pc, const std::string instr); |     bool disass_output(uint64_t pc, const std::string instr) override; | ||||||
|  |  | ||||||
|     void set_clock_period(sc_core::sc_time period); |     void set_clock_period(sc_core::sc_time period); | ||||||
|  |  | ||||||
|  |     char const* hier_name() override { return name(); } | ||||||
|  |  | ||||||
| protected: | protected: | ||||||
|     void before_end_of_elaboration() override; |     void before_end_of_elaboration() override; | ||||||
|     void start_of_simulation() override; |     void start_of_simulation() override; | ||||||
|   | |||||||
| @@ -46,12 +46,12 @@ using namespace sysc; | |||||||
| volatile std::array<bool, 2> tgc_init = { | volatile std::array<bool, 2> tgc_init = { | ||||||
|     iss_factory::instance().register_creator("tgc5c|m_p|interp", |     iss_factory::instance().register_creator("tgc5c|m_p|interp", | ||||||
|                                              [](unsigned gdb_port, void* data) -> iss_factory::base_t { |                                              [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||||
|                                                  auto cc = reinterpret_cast<sysc::tgfs::core_complex*>(data); |                                                  auto cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||||
|                                                  auto* cpu = new sc_core_adapter<arch::riscv_hart_m_p<arch::tgc5c>>(cc); |                                                  auto* cpu = new sc_core_adapter<arch::riscv_hart_m_p<arch::tgc5c>>(cc); | ||||||
|                                                  return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::tgc5c*>(cpu), gdb_port)}}; |                                                  return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::tgc5c*>(cpu), gdb_port)}}; | ||||||
|                                              }), |                                              }), | ||||||
|     iss_factory::instance().register_creator("tgc5c|mu_p|interp", [](unsigned gdb_port, void* data) -> iss_factory::base_t { |     iss_factory::instance().register_creator("tgc5c|mu_p|interp", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||||
|         auto cc = reinterpret_cast<sysc::tgfs::core_complex*>(data); |         auto cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||||
|         auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::tgc5c>>(cc); |         auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::tgc5c>>(cc); | ||||||
|         return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::tgc5c*>(cpu), gdb_port)}}; |         return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::tgc5c*>(cpu), gdb_port)}}; | ||||||
|     })}; |     })}; | ||||||
| @@ -62,12 +62,12 @@ using namespace sysc; | |||||||
| volatile std::array<bool, 2> tgc_init = { | volatile std::array<bool, 2> tgc_init = { | ||||||
|     iss_factory::instance().register_creator("tgc5c|m_p|llvm", |     iss_factory::instance().register_creator("tgc5c|m_p|llvm", | ||||||
|                                              [](unsigned gdb_port, void* data) -> iss_factory::base_t { |                                              [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||||
|                                                  auto cc = reinterpret_cast<sysc::tgfs::core_complex*>(data); |                                                  auto cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||||
|                                                  auto* cpu = new sc_core_adapter<arch::riscv_hart_m_p<arch::tgc5c>>(cc); |                                                  auto* cpu = new sc_core_adapter<arch::riscv_hart_m_p<arch::tgc5c>>(cc); | ||||||
|                                                  return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::tgc5c*>(cpu), gdb_port)}}; |                                                  return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::tgc5c*>(cpu), gdb_port)}}; | ||||||
|                                              }), |                                              }), | ||||||
|     iss_factory::instance().register_creator("tgc5c|mu_p|llvm", [](unsigned gdb_port, void* data) -> iss_factory::base_t { |     iss_factory::instance().register_creator("tgc5c|mu_p|llvm", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||||
|         auto cc = reinterpret_cast<sysc::tgfs::core_complex*>(data); |         auto cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||||
|         auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::tgc5c>>(cc); |         auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::tgc5c>>(cc); | ||||||
|         return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::tgc5c*>(cpu), gdb_port)}}; |         return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::tgc5c*>(cpu), gdb_port)}}; | ||||||
|     })}; |     })}; | ||||||
| @@ -79,12 +79,12 @@ using namespace sysc; | |||||||
| volatile std::array<bool, 2> tgc_init = { | volatile std::array<bool, 2> tgc_init = { | ||||||
|     iss_factory::instance().register_creator("tgc5c|m_p|tcc", |     iss_factory::instance().register_creator("tgc5c|m_p|tcc", | ||||||
|                                              [](unsigned gdb_port, void* data) -> iss_factory::base_t { |                                              [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||||
|                                                  auto cc = reinterpret_cast<sysc::tgfs::core_complex*>(data); |                                                  auto cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||||
|                                                  auto* cpu = new sc_core_adapter<arch::riscv_hart_m_p<arch::tgc5c>>(cc); |                                                  auto* cpu = new sc_core_adapter<arch::riscv_hart_m_p<arch::tgc5c>>(cc); | ||||||
|                                                  return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::tgc5c*>(cpu), gdb_port)}}; |                                                  return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::tgc5c*>(cpu), gdb_port)}}; | ||||||
|                                              }), |                                              }), | ||||||
|     iss_factory::instance().register_creator("tgc5c|mu_p|tcc", [](unsigned gdb_port, void* data) -> iss_factory::base_t { |     iss_factory::instance().register_creator("tgc5c|mu_p|tcc", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||||
|         auto cc = reinterpret_cast<sysc::tgfs::core_complex*>(data); |         auto cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||||
|         auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::tgc5c>>(cc); |         auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::tgc5c>>(cc); | ||||||
|         return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::tgc5c*>(cpu), gdb_port)}}; |         return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::tgc5c*>(cpu), gdb_port)}}; | ||||||
|     })}; |     })}; | ||||||
| @@ -96,12 +96,12 @@ using namespace sysc; | |||||||
| volatile std::array<bool, 2> tgc_init = { | volatile std::array<bool, 2> tgc_init = { | ||||||
|     iss_factory::instance().register_creator("tgc5c|m_p|asmjit", |     iss_factory::instance().register_creator("tgc5c|m_p|asmjit", | ||||||
|                                              [](unsigned gdb_port, void* data) -> iss_factory::base_t { |                                              [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||||
|                                                  auto cc = reinterpret_cast<sysc::tgfs::core_complex*>(data); |                                                  auto cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||||
|                                                  auto* cpu = new sc_core_adapter<arch::riscv_hart_m_p<arch::tgc5c>>(cc); |                                                  auto* cpu = new sc_core_adapter<arch::riscv_hart_m_p<arch::tgc5c>>(cc); | ||||||
|                                                  return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::tgc5c*>(cpu), gdb_port)}}; |                                                  return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::tgc5c*>(cpu), gdb_port)}}; | ||||||
|                                              }), |                                              }), | ||||||
|     iss_factory::instance().register_creator("tgc5c|mu_p|asmjit", [](unsigned gdb_port, void* data) -> iss_factory::base_t { |     iss_factory::instance().register_creator("tgc5c|mu_p|asmjit", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||||
|         auto cc = reinterpret_cast<sysc::tgfs::core_complex*>(data); |         auto cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||||
|         auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::tgc5c>>(cc); |         auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::tgc5c>>(cc); | ||||||
|         return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::tgc5c*>(cpu), gdb_port)}}; |         return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::tgc5c*>(cpu), gdb_port)}}; | ||||||
|     })}; |     })}; | ||||||
|   | |||||||
| @@ -1,9 +1,36 @@ | |||||||
| /* | /******************************************************************************* | ||||||
|  * sc_core_adapter.h |  * Copyright (C) 2023 - 2025 MINRES Technologies GmbH | ||||||
|  |  * All rights reserved. | ||||||
|  * |  * | ||||||
|  *  Created on: Jul 5, 2023 |  * Redistribution and use in source and binary forms, with or without | ||||||
|  *      Author: eyck |  * modification, are permitted provided that the following conditions are met: | ||||||
|  */ |  * | ||||||
|  |  * 1. Redistributions of source code must retain the above copyright notice, | ||||||
|  |  *    this list of conditions and the following disclaimer. | ||||||
|  |  * | ||||||
|  |  * 2. Redistributions in binary form must reproduce the above copyright notice, | ||||||
|  |  *    this list of conditions and the following disclaimer in the documentation | ||||||
|  |  *    and/or other materials provided with the distribution. | ||||||
|  |  * | ||||||
|  |  * 3. Neither the name of the copyright holder nor the names of its contributors | ||||||
|  |  *    may be used to endorse or promote products derived from this software | ||||||
|  |  *    without specific prior written permission. | ||||||
|  |  * | ||||||
|  |  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | ||||||
|  |  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | ||||||
|  |  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | ||||||
|  |  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE | ||||||
|  |  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR | ||||||
|  |  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF | ||||||
|  |  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS | ||||||
|  |  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN | ||||||
|  |  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) | ||||||
|  |  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE | ||||||
|  |  * POSSIBILITY OF SUCH DAMAGE. | ||||||
|  |  * | ||||||
|  |  * Contributors: | ||||||
|  |  *       eyck@minres.com - initial implementation | ||||||
|  |  ******************************************************************************/ | ||||||
|  |  | ||||||
| #ifndef _SYSC_SC_CORE_ADAPTER_H_ | #ifndef _SYSC_SC_CORE_ADAPTER_H_ | ||||||
| #define _SYSC_SC_CORE_ADAPTER_H_ | #define _SYSC_SC_CORE_ADAPTER_H_ | ||||||
| @@ -11,6 +38,7 @@ | |||||||
| #include "sc_core_adapter_if.h" | #include "sc_core_adapter_if.h" | ||||||
| #include <iostream> | #include <iostream> | ||||||
| #include <iss/iss.h> | #include <iss/iss.h> | ||||||
|  | #include <iss/mem/memory_if.h> | ||||||
| #include <iss/vm_types.h> | #include <iss/vm_types.h> | ||||||
| #include <scc/report.h> | #include <scc/report.h> | ||||||
| #include <util/ities.h> | #include <util/ities.h> | ||||||
| @@ -18,11 +46,16 @@ | |||||||
| namespace sysc { | namespace sysc { | ||||||
| template <typename PLAT> class sc_core_adapter : public PLAT, public sc_core_adapter_if { | template <typename PLAT> class sc_core_adapter : public PLAT, public sc_core_adapter_if { | ||||||
| public: | public: | ||||||
|  |     using this_class = sc_core_adapter<PLAT>; | ||||||
|     using reg_t = typename iss::arch::traits<typename PLAT::core>::reg_t; |     using reg_t = typename iss::arch::traits<typename PLAT::core>::reg_t; | ||||||
|     using phys_addr_t = typename iss::arch::traits<typename PLAT::core>::phys_addr_t; |     using phys_addr_t = typename iss::arch::traits<typename PLAT::core>::phys_addr_t; | ||||||
|     using heart_state_t = typename PLAT::hart_state_type; |     sc_core_adapter(sysc::tgfs::core_complex_if* owner) | ||||||
|     sc_core_adapter(sysc::tgfs::core_complex* owner) |     : owner(owner) { | ||||||
|     : owner(owner) {} |         this->csr_rd_cb[iss::arch::time] = MK_CSR_RD_CB(read_time); | ||||||
|  |         if(sizeof(reg_t) == 4) | ||||||
|  |             this->csr_rd_cb[iss::arch::timeh] = MK_CSR_RD_CB(read_time); | ||||||
|  |         this->memories.replace_last(*this); | ||||||
|  |     } | ||||||
|  |  | ||||||
|     iss::arch_if* get_arch_if() override { return this; } |     iss::arch_if* get_arch_if() override { return this; } | ||||||
|  |  | ||||||
| @@ -54,79 +87,77 @@ public: | |||||||
|             std::stringstream s; |             std::stringstream s; | ||||||
|             s << "[p:" << lvl[this->reg.PRIV] << ";s:0x" << std::hex << std::setfill('0') << std::setw(sizeof(reg_t) * 2) |             s << "[p:" << lvl[this->reg.PRIV] << ";s:0x" << std::hex << std::setfill('0') << std::setw(sizeof(reg_t) * 2) | ||||||
|               << (reg_t)this->state.mstatus << std::dec << ";c:" << this->reg.icount + this->cycle_offset << "]"; |               << (reg_t)this->state.mstatus << std::dec << ";c:" << this->reg.icount + this->cycle_offset << "]"; | ||||||
|             SCCDEBUG(owner->name()) << "disass: " |             SCCDEBUG(owner->hier_name()) << "disass: " | ||||||
|                                     << "0x" << std::setw(16) << std::right << std::setfill('0') << std::hex << pc << "\t\t" << std::setw(40) |                                          << "0x" << std::setw(16) << std::right << std::setfill('0') << std::hex << pc << "\t\t" | ||||||
|                                     << std::setfill(' ') << std::left << instr << s.str(); |                                          << std::setw(40) << std::setfill(' ') << std::left << instr << s.str(); | ||||||
|         } |         } | ||||||
|     }; |     }; | ||||||
|  |  | ||||||
|     iss::status read_mem(phys_addr_t addr, unsigned length, uint8_t* const data) override { |     iss::mem::memory_if get_mem_if() override { | ||||||
|         if(addr.access && iss::access_type::DEBUG) |         return iss::mem::memory_if{.rd_mem{util::delegate<iss::mem::rd_mem_func_sig>::from<this_class, &this_class::read_mem>(this)}, | ||||||
|             return owner->read_mem_dbg(addr.val, length, data) ? iss::Ok : iss::Err; |                                    .wr_mem{util::delegate<iss::mem::wr_mem_func_sig>::from<this_class, &this_class::write_mem>(this)}}; | ||||||
|  |     } | ||||||
|  |  | ||||||
|  |     iss::status read_mem(iss::access_type access, uint64_t addr, unsigned length, uint8_t* data) { | ||||||
|  |         if(access && iss::access_type::DEBUG) | ||||||
|  |             return owner->read_mem_dbg(addr, length, data) ? iss::Ok : iss::Err; | ||||||
|         else { |         else { | ||||||
|             return owner->read_mem(addr.val, length, data, is_fetch(addr.access)) ? iss::Ok : iss::Err; |             return owner->read_mem(addr, length, data, is_fetch(access)) ? iss::Ok : iss::Err; | ||||||
|         } |         } | ||||||
|     } |     } | ||||||
|  |  | ||||||
|     iss::status write_mem(phys_addr_t addr, unsigned length, const uint8_t* const data) override { |     iss::status write_mem(iss::access_type access, uint64_t addr, unsigned length, uint8_t const* data) { | ||||||
|         if(addr.access && iss::access_type::DEBUG) |         if(access && iss::access_type::DEBUG) | ||||||
|             return owner->write_mem_dbg(addr.val, length, data) ? iss::Ok : iss::Err; |             return owner->write_mem_dbg(addr, length, data) ? iss::Ok : iss::Err; | ||||||
|         else { |         if(addr == this->tohost) { | ||||||
|             auto tohost_upper = (sizeof(reg_t) == 4 && addr.val == (this->tohost + 4)) || (sizeof(reg_t) == 8 && addr.val == this->tohost); |             reg_t cur_data = *reinterpret_cast<const reg_t*>(data); | ||||||
|             auto tohost_lower = (sizeof(reg_t) == 4 && addr.val == this->tohost) || (sizeof(reg_t) == 64 && addr.val == this->tohost); |             // Extract Device (bits 63:56) | ||||||
|             if(tohost_lower || tohost_upper) { |             uint8_t device = sizeof(reg_t) == 4 ? 0 : (cur_data >> 56) & 0xFF; | ||||||
|                 if(tohost_upper || (tohost_lower && to_host_wr_cnt > 0)) { |             // Extract Command (bits 55:48) | ||||||
|                     switch(hostvar >> 48) { |             uint8_t command = sizeof(reg_t) == 4 ? 0 : (cur_data >> 48) & 0xFF; | ||||||
|                     case 0: |             // Extract payload (bits 47:0) | ||||||
|                         if(hostvar != 0x1) { |             uint64_t payload_addr = cur_data & 0xFFFFFFFFFFFFULL; // 24bits | ||||||
|                             SCCINFO(owner->name()) |             if(payload_addr & 1) { | ||||||
|                                 << "tohost value is 0x" << std::hex << hostvar << std::dec << " (" << hostvar << "), stopping simulation"; |                 if(payload_addr != 0x1) { | ||||||
|  |                     SCCERR(owner->hier_name()) << "tohost value is 0x" << std::hex << payload_addr << std::dec << " (" << payload_addr | ||||||
|  |                                                << "), stopping simulation"; | ||||||
|                 } else { |                 } else { | ||||||
|                             SCCINFO(owner->name()) |                     SCCINFO(owner->hier_name()) | ||||||
|                                 << "tohost value is 0x" << std::hex << hostvar << std::dec << " (" << hostvar << "), stopping simulation"; |                         << "tohost value is 0x" << std::hex << payload_addr << std::dec << " (" << payload_addr << "), stopping simulation"; | ||||||
|                 } |                 } | ||||||
|                 this->reg.trap_state = std::numeric_limits<uint32_t>::max(); |                 this->reg.trap_state = std::numeric_limits<uint32_t>::max(); | ||||||
|                         this->interrupt_sim = hostvar; |                 this->interrupt_sim = payload_addr; | ||||||
| #ifndef WITH_TCC |  | ||||||
|                         throw(iss::simulation_stopped(hostvar)); |  | ||||||
| #endif |  | ||||||
|                         break; |  | ||||||
|                     default: |  | ||||||
|                         break; |  | ||||||
|                     } |  | ||||||
|                 } else if(tohost_lower) |  | ||||||
|                     to_host_wr_cnt++; |  | ||||||
|                 return iss::Ok; |                 return iss::Ok; | ||||||
|             } else { |  | ||||||
|                 auto res = owner->write_mem(addr.val, length, data) ? iss::Ok : iss::Err; |  | ||||||
|                 // clear MTIP on mtimecmp write |  | ||||||
|                 if(addr.val == 0x2004000) { |  | ||||||
|                     reg_t val; |  | ||||||
|                     this->read_csr(iss::arch::mip, val); |  | ||||||
|                     if(val & (1ULL << 7)) |  | ||||||
|                         this->write_csr(iss::arch::mip, val & ~(1ULL << 7)); |  | ||||||
|             } |             } | ||||||
|  |             if(device == 0 && command == 0) { | ||||||
|  |                 std::array<uint64_t, 8> loaded_payload; | ||||||
|  |                 auto res = owner->read_mem(payload_addr, 8 * sizeof(uint64_t), reinterpret_cast<uint8_t*>(loaded_payload.data()), false) | ||||||
|  |                                ? iss::Ok | ||||||
|  |                                : iss::Err; | ||||||
|  |                 if(res == iss::Err) { | ||||||
|  |                     SCCERR(owner->hier_name()) << "Syscall read went wrong"; | ||||||
|  |                     return iss::Ok; | ||||||
|  |                 } | ||||||
|  |                 uint64_t syscall_num = loaded_payload.at(0); | ||||||
|  |                 if(syscall_num == 64) // SYS_WRITE | ||||||
|  |                     return this->execute_sys_write(this, loaded_payload, PLAT::MEM); | ||||||
|  |                 SCCERR(owner->hier_name()) << "tohost syscall with number 0x" << std::hex << syscall_num << std::dec << " (" << syscall_num | ||||||
|  |                                            << ") not implemented"; | ||||||
|  |                 this->reg.trap_state = std::numeric_limits<uint32_t>::max(); | ||||||
|  |                 this->interrupt_sim = payload_addr; | ||||||
|  |                 return iss::Ok; | ||||||
|  |             } | ||||||
|  |             SCCERR(owner->hier_name()) << "tohost functionality not implemented for device " << device << " and command " << command; | ||||||
|  |             this->reg.trap_state = std::numeric_limits<uint32_t>::max(); | ||||||
|  |             this->interrupt_sim = payload_addr; | ||||||
|  |             return iss::Ok; | ||||||
|  |         } | ||||||
|  |         auto res = owner->write_mem(addr, length, data) ? iss::Ok : iss::Err; | ||||||
|         return res; |         return res; | ||||||
|     } |     } | ||||||
|         } |  | ||||||
|     } |  | ||||||
|  |  | ||||||
|     iss::status read_csr(unsigned addr, reg_t& val) override { |     iss::status read_time(unsigned addr, reg_t& val) { | ||||||
| #ifndef CWR_SYSTEMC |         uint64_t time_val = owner->mtime_i.get_interface() ? owner->mtime_i.read() : 0; | ||||||
|         if((addr == iss::arch::time || addr == iss::arch::timeh) && owner->mtime_o.get_interface(0)) { |  | ||||||
|             uint64_t time_val; |  | ||||||
|             bool ret = owner->mtime_o->nb_peek(time_val); |  | ||||||
|             if(addr == iss::arch::time) { |  | ||||||
|                 val = static_cast<reg_t>(time_val); |  | ||||||
|             } else if(addr == iss::arch::timeh) { |  | ||||||
|                 if(sizeof(reg_t) != 4) |  | ||||||
|                     return iss::Err; |  | ||||||
|                 val = static_cast<reg_t>(time_val >> 32); |  | ||||||
|             } |  | ||||||
|             return ret ? iss::Ok : iss::Err; |  | ||||||
| #else |  | ||||||
|         if((addr == iss::arch::time || addr == iss::arch::timeh)) { |  | ||||||
|             uint64_t time_val = owner->mtime_i.read(); |  | ||||||
|         if(addr == iss::arch::time) { |         if(addr == iss::arch::time) { | ||||||
|             val = static_cast<reg_t>(time_val); |             val = static_cast<reg_t>(time_val); | ||||||
|         } else if(addr == iss::arch::timeh) { |         } else if(addr == iss::arch::timeh) { | ||||||
| @@ -135,18 +166,14 @@ public: | |||||||
|             val = static_cast<reg_t>(time_val >> 32); |             val = static_cast<reg_t>(time_val >> 32); | ||||||
|         } |         } | ||||||
|         return iss::Ok; |         return iss::Ok; | ||||||
| #endif |  | ||||||
|         } else { |  | ||||||
|             return PLAT::read_csr(addr, val); |  | ||||||
|         } |  | ||||||
|     } |     } | ||||||
|  |  | ||||||
|     void wait_until(uint64_t flags) override { |     void wait_until(uint64_t flags) override { | ||||||
|         SCCDEBUG(owner->name()) << "Sleeping until interrupt"; |         SCCDEBUG(owner->hier_name()) << "Sleeping until interrupt"; | ||||||
|  |         PLAT::wait_until(flags); | ||||||
|         while(this->reg.pending_trap == 0 && (this->csr[iss::arch::mip] & this->csr[iss::arch::mie]) == 0) { |         while(this->reg.pending_trap == 0 && (this->csr[iss::arch::mip] & this->csr[iss::arch::mie]) == 0) { | ||||||
|             sc_core::wait(wfi_evt); |             sc_core::wait(wfi_evt); | ||||||
|         } |         } | ||||||
|         PLAT::wait_until(flags); |  | ||||||
|     } |     } | ||||||
|  |  | ||||||
|     void local_irq(short id, bool value) override { |     void local_irq(short id, bool value) override { | ||||||
| @@ -173,13 +200,12 @@ public: | |||||||
|             this->csr[iss::arch::mip] &= ~mask; |             this->csr[iss::arch::mip] &= ~mask; | ||||||
|         this->check_interrupt(); |         this->check_interrupt(); | ||||||
|         if(value) |         if(value) | ||||||
|             SCCTRACE(owner->name()) << "Triggering interrupt " << id << " Pending trap: " << this->reg.pending_trap; |             SCCTRACE(owner->hier_name()) << "Triggering interrupt " << id << " Pending trap: " << this->reg.pending_trap; | ||||||
|     } |     } | ||||||
|  |  | ||||||
| private: | private: | ||||||
|     sysc::tgfs::core_complex* const owner; |     sysc::tgfs::core_complex_if* const owner{nullptr}; | ||||||
|     sc_core::sc_event wfi_evt; |     sc_core::sc_event wfi_evt; | ||||||
|     uint64_t hostvar{std::numeric_limits<uint64_t>::max()}; |  | ||||||
|     unsigned to_host_wr_cnt = 0; |     unsigned to_host_wr_cnt = 0; | ||||||
|     bool first{true}; |     bool first{true}; | ||||||
| }; | }; | ||||||
|   | |||||||
| @@ -1,9 +1,36 @@ | |||||||
| /* | /******************************************************************************* | ||||||
|  * sc_core_adapter.h |  * Copyright (C) 2023 MINRES Technologies GmbH | ||||||
|  |  * All rights reserved. | ||||||
|  * |  * | ||||||
|  *  Created on: Jul 5, 2023 |  * Redistribution and use in source and binary forms, with or without | ||||||
|  *      Author: eyck |  * modification, are permitted provided that the following conditions are met: | ||||||
|  */ |  * | ||||||
|  |  * 1. Redistributions of source code must retain the above copyright notice, | ||||||
|  |  *    this list of conditions and the following disclaimer. | ||||||
|  |  * | ||||||
|  |  * 2. Redistributions in binary form must reproduce the above copyright notice, | ||||||
|  |  *    this list of conditions and the following disclaimer in the documentation | ||||||
|  |  *    and/or other materials provided with the distribution. | ||||||
|  |  * | ||||||
|  |  * 3. Neither the name of the copyright holder nor the names of its contributors | ||||||
|  |  *    may be used to endorse or promote products derived from this software | ||||||
|  |  *    without specific prior written permission. | ||||||
|  |  * | ||||||
|  |  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | ||||||
|  |  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | ||||||
|  |  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | ||||||
|  |  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE | ||||||
|  |  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR | ||||||
|  |  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF | ||||||
|  |  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS | ||||||
|  |  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN | ||||||
|  |  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) | ||||||
|  |  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE | ||||||
|  |  * POSSIBILITY OF SUCH DAMAGE. | ||||||
|  |  * | ||||||
|  |  * Contributors: | ||||||
|  |  *       eyck@minres.com - initial implementation | ||||||
|  |  ******************************************************************************/ | ||||||
|  |  | ||||||
| #ifndef _SYSC_SC_CORE_ADAPTER_IF_H_ | #ifndef _SYSC_SC_CORE_ADAPTER_IF_H_ | ||||||
| #define _SYSC_SC_CORE_ADAPTER_IF_H_ | #define _SYSC_SC_CORE_ADAPTER_IF_H_ | ||||||
|   | |||||||
							
								
								
									
										70
									
								
								src/vm/aes_sbox.h
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										70
									
								
								src/vm/aes_sbox.h
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,70 @@ | |||||||
|  | //////////////////////////////////////////////////////////////////////////////// | ||||||
|  | // Copyright (C) 2025, MINRES Technologies GmbH | ||||||
|  | // All rights reserved. | ||||||
|  | // | ||||||
|  | // Redistribution and use in source and binary forms, with or without | ||||||
|  | // modification, are permitted provided that the following conditions are met: | ||||||
|  | // | ||||||
|  | // 1. Redistributions of source code must retain the above copyright notice, | ||||||
|  | //    this list of conditions and the following disclaimer. | ||||||
|  | // | ||||||
|  | // 2. Redistributions in binary form must reproduce the above copyright notice, | ||||||
|  | //    this list of conditions and the following disclaimer in the documentation | ||||||
|  | //    and/or other materials provided with the distribution. | ||||||
|  | // | ||||||
|  | // 3. Neither the name of the copyright holder nor the names of its contributors | ||||||
|  | //    may be used to endorse or promote products derived from this software | ||||||
|  | //    without specific prior written permission. | ||||||
|  | // | ||||||
|  | // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | ||||||
|  | // AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | ||||||
|  | // IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | ||||||
|  | // ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE | ||||||
|  | // LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR | ||||||
|  | // CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF | ||||||
|  | // SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS | ||||||
|  | // INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN | ||||||
|  | // CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) | ||||||
|  | // ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE | ||||||
|  | // POSSIBILITY OF SUCH DAMAGE. | ||||||
|  | // | ||||||
|  | // Contributors: | ||||||
|  | //       ales@minres.com - initial API and implementation | ||||||
|  | //////////////////////////////////////////////////////////////////////////////// | ||||||
|  |  | ||||||
|  | #ifndef _VM_AES_SBOX_H_ | ||||||
|  | #define _VM_AES_SBOX_H_ | ||||||
|  | #include <cstdint> | ||||||
|  | extern "C" { | ||||||
|  | const uint8_t AES_ENC_SBOX[] = { | ||||||
|  |     0x63, 0x7C, 0x77, 0x7B, 0xF2, 0x6B, 0x6F, 0xC5, 0x30, 0x01, 0x67, 0x2B, 0xFE, 0xD7, 0xAB, 0x76, 0xCA, 0x82, 0xC9, 0x7D, 0xFA, 0x59, | ||||||
|  |     0x47, 0xF0, 0xAD, 0xD4, 0xA2, 0xAF, 0x9C, 0xA4, 0x72, 0xC0, 0xB7, 0xFD, 0x93, 0x26, 0x36, 0x3F, 0xF7, 0xCC, 0x34, 0xA5, 0xE5, 0xF1, | ||||||
|  |     0x71, 0xD8, 0x31, 0x15, 0x04, 0xC7, 0x23, 0xC3, 0x18, 0x96, 0x05, 0x9A, 0x07, 0x12, 0x80, 0xE2, 0xEB, 0x27, 0xB2, 0x75, 0x09, 0x83, | ||||||
|  |     0x2C, 0x1A, 0x1B, 0x6E, 0x5A, 0xA0, 0x52, 0x3B, 0xD6, 0xB3, 0x29, 0xE3, 0x2F, 0x84, 0x53, 0xD1, 0x00, 0xED, 0x20, 0xFC, 0xB1, 0x5B, | ||||||
|  |     0x6A, 0xCB, 0xBE, 0x39, 0x4A, 0x4C, 0x58, 0xCF, 0xD0, 0xEF, 0xAA, 0xFB, 0x43, 0x4D, 0x33, 0x85, 0x45, 0xF9, 0x02, 0x7F, 0x50, 0x3C, | ||||||
|  |     0x9F, 0xA8, 0x51, 0xA3, 0x40, 0x8F, 0x92, 0x9D, 0x38, 0xF5, 0xBC, 0xB6, 0xDA, 0x21, 0x10, 0xFF, 0xF3, 0xD2, 0xCD, 0x0C, 0x13, 0xEC, | ||||||
|  |     0x5F, 0x97, 0x44, 0x17, 0xC4, 0xA7, 0x7E, 0x3D, 0x64, 0x5D, 0x19, 0x73, 0x60, 0x81, 0x4F, 0xDC, 0x22, 0x2A, 0x90, 0x88, 0x46, 0xEE, | ||||||
|  |     0xB8, 0x14, 0xDE, 0x5E, 0x0B, 0xDB, 0xE0, 0x32, 0x3A, 0x0A, 0x49, 0x06, 0x24, 0x5C, 0xC2, 0xD3, 0xAC, 0x62, 0x91, 0x95, 0xE4, 0x79, | ||||||
|  |     0xE7, 0xC8, 0x37, 0x6D, 0x8D, 0xD5, 0x4E, 0xA9, 0x6C, 0x56, 0xF4, 0xEA, 0x65, 0x7A, 0xAE, 0x08, 0xBA, 0x78, 0x25, 0x2E, 0x1C, 0xA6, | ||||||
|  |     0xB4, 0xC6, 0xE8, 0xDD, 0x74, 0x1F, 0x4B, 0xBD, 0x8B, 0x8A, 0x70, 0x3E, 0xB5, 0x66, 0x48, 0x03, 0xF6, 0x0E, 0x61, 0x35, 0x57, 0xB9, | ||||||
|  |     0x86, 0xC1, 0x1D, 0x9E, 0xE1, 0xF8, 0x98, 0x11, 0x69, 0xD9, 0x8E, 0x94, 0x9B, 0x1E, 0x87, 0xE9, 0xCE, 0x55, 0x28, 0xDF, 0x8C, 0xA1, | ||||||
|  |     0x89, 0x0D, 0xBF, 0xE6, 0x42, 0x68, 0x41, 0x99, 0x2D, 0x0F, 0xB0, 0x54, 0xBB, 0x16}; | ||||||
|  | uint8_t inline aes_sbox_fwd(uint8_t index) { return AES_ENC_SBOX[index]; } | ||||||
|  |  | ||||||
|  | const uint8_t AES_DEC_SBOX[] = { | ||||||
|  |     0x52, 0x09, 0x6A, 0xD5, 0x30, 0x36, 0xA5, 0x38, 0xBF, 0x40, 0xA3, 0x9E, 0x81, 0xF3, 0xD7, 0xFB, 0x7C, 0xE3, 0x39, 0x82, 0x9B, 0x2F, | ||||||
|  |     0xFF, 0x87, 0x34, 0x8E, 0x43, 0x44, 0xC4, 0xDE, 0xE9, 0xCB, 0x54, 0x7B, 0x94, 0x32, 0xA6, 0xC2, 0x23, 0x3D, 0xEE, 0x4C, 0x95, 0x0B, | ||||||
|  |     0x42, 0xFA, 0xC3, 0x4E, 0x08, 0x2E, 0xA1, 0x66, 0x28, 0xD9, 0x24, 0xB2, 0x76, 0x5B, 0xA2, 0x49, 0x6D, 0x8B, 0xD1, 0x25, 0x72, 0xF8, | ||||||
|  |     0xF6, 0x64, 0x86, 0x68, 0x98, 0x16, 0xD4, 0xA4, 0x5C, 0xCC, 0x5D, 0x65, 0xB6, 0x92, 0x6C, 0x70, 0x48, 0x50, 0xFD, 0xED, 0xB9, 0xDA, | ||||||
|  |     0x5E, 0x15, 0x46, 0x57, 0xA7, 0x8D, 0x9D, 0x84, 0x90, 0xD8, 0xAB, 0x00, 0x8C, 0xBC, 0xD3, 0x0A, 0xF7, 0xE4, 0x58, 0x05, 0xB8, 0xB3, | ||||||
|  |     0x45, 0x06, 0xD0, 0x2C, 0x1E, 0x8F, 0xCA, 0x3F, 0x0F, 0x02, 0xC1, 0xAF, 0xBD, 0x03, 0x01, 0x13, 0x8A, 0x6B, 0x3A, 0x91, 0x11, 0x41, | ||||||
|  |     0x4F, 0x67, 0xDC, 0xEA, 0x97, 0xF2, 0xCF, 0xCE, 0xF0, 0xB4, 0xE6, 0x73, 0x96, 0xAC, 0x74, 0x22, 0xE7, 0xAD, 0x35, 0x85, 0xE2, 0xF9, | ||||||
|  |     0x37, 0xE8, 0x1C, 0x75, 0xDF, 0x6E, 0x47, 0xF1, 0x1A, 0x71, 0x1D, 0x29, 0xC5, 0x89, 0x6F, 0xB7, 0x62, 0x0E, 0xAA, 0x18, 0xBE, 0x1B, | ||||||
|  |     0xFC, 0x56, 0x3E, 0x4B, 0xC6, 0xD2, 0x79, 0x20, 0x9A, 0xDB, 0xC0, 0xFE, 0x78, 0xCD, 0x5A, 0xF4, 0x1F, 0xDD, 0xA8, 0x33, 0x88, 0x07, | ||||||
|  |     0xC7, 0x31, 0xB1, 0x12, 0x10, 0x59, 0x27, 0x80, 0xEC, 0x5F, 0x60, 0x51, 0x7F, 0xA9, 0x19, 0xB5, 0x4A, 0x0D, 0x2D, 0xE5, 0x7A, 0x9F, | ||||||
|  |     0x93, 0xC9, 0x9C, 0xEF, 0xA0, 0xE0, 0x3B, 0x4D, 0xAE, 0x2A, 0xF5, 0xB0, 0xC8, 0xEB, 0xBB, 0x3C, 0x83, 0x53, 0x99, 0x61, 0x17, 0x2B, | ||||||
|  |     0x04, 0x7E, 0xBA, 0x77, 0xD6, 0x26, 0xE1, 0x69, 0x14, 0x63, 0x55, 0x21, 0x0C, 0x7D}; | ||||||
|  | uint8_t inline aes_sbox_inv(uint8_t index) { return AES_DEC_SBOX[index]; } | ||||||
|  | } | ||||||
|  |  | ||||||
|  | #endif /* _VM_AES_SBOX_H_ */ | ||||||
										
											
												File diff suppressed because it is too large
												Load Diff
											
										
									
								
							| @@ -33,6 +33,9 @@ | |||||||
| //////////////////////////////////////////////////////////////////////////////// | //////////////////////////////////////////////////////////////////////////////// | ||||||
|  |  | ||||||
| #include "fp_functions.h" | #include "fp_functions.h" | ||||||
|  | #include "softfloat_types.h" | ||||||
|  | #include <array> | ||||||
|  | #include <cstdint> | ||||||
|  |  | ||||||
| extern "C" { | extern "C" { | ||||||
| #include "internals.h" | #include "internals.h" | ||||||
| @@ -43,20 +46,375 @@ extern "C" { | |||||||
| #include <limits> | #include <limits> | ||||||
|  |  | ||||||
| using this_t = uint8_t*; | using this_t = uint8_t*; | ||||||
| const uint8_t rmm_map[] = { | template <typename T> T constexpr defaultNaN(); | ||||||
|     softfloat_round_near_even /*RNE*/,   softfloat_round_minMag /*RTZ*/, softfloat_round_min /*RDN*/, softfloat_round_max /*RUP?*/, | template <> uint16_t constexpr defaultNaN<uint16_t>() { return defaultNaNF16UI; } | ||||||
|     softfloat_round_near_maxMag /*RMM*/, softfloat_round_max /*RTZ*/,    softfloat_round_max /*RTZ*/, softfloat_round_max /*RTZ*/, | template <> uint32_t constexpr defaultNaN<uint32_t>() { return defaultNaNF32UI; } | ||||||
| }; | template <> uint64_t constexpr defaultNaN<uint64_t>() { return defaultNaNF64UI; } | ||||||
|  | template <typename T> T constexpr posInf(); | ||||||
|  | template <> uint16_t constexpr posInf<uint16_t>() { return 0x7C00; } | ||||||
|  | template <> uint32_t constexpr posInf<uint32_t>() { return 0x7F800000; } | ||||||
|  | template <> uint64_t constexpr posInf<uint64_t>() { return 0x7FF0000000000000; } | ||||||
|  | template <typename T> T constexpr negInf(); | ||||||
|  | template <> uint16_t constexpr negInf<uint16_t>() { return 0xFC00; } | ||||||
|  | template <> uint32_t constexpr negInf<uint32_t>() { return 0xFF800000; } | ||||||
|  | template <> uint64_t constexpr negInf<uint64_t>() { return 0xFFF0000000000000; } | ||||||
|  | template <typename T> T constexpr negZero(); | ||||||
|  | template <> uint16_t constexpr negZero<uint16_t>() { return 0x8000; } | ||||||
|  | template <> uint32_t constexpr negZero<uint32_t>() { return 0x80000000; } | ||||||
|  | template <> uint64_t constexpr negZero<uint64_t>() { return 0x8000000000000000; } | ||||||
|  |  | ||||||
| const uint32_t quiet_nan32 = 0x7fC00000; | template <typename T> bool rsqrt_check(T fclass_val, bool& subnormal, T& ret_val) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     switch(fclass_val) { | ||||||
|  |     case 0x0001: { | ||||||
|  |         softfloat_exceptionFlags |= softfloat_flag_invalid; | ||||||
|  |         ret_val = defaultNaN<T>(); | ||||||
|  |         return true; | ||||||
|  |     } | ||||||
|  |     case 0x0002: { | ||||||
|  |         softfloat_exceptionFlags |= softfloat_flag_invalid; | ||||||
|  |         ret_val = defaultNaN<T>(); | ||||||
|  |         return true; | ||||||
|  |     } | ||||||
|  |     case 0x0004: { | ||||||
|  |         softfloat_exceptionFlags |= softfloat_flag_invalid; | ||||||
|  |         ret_val = defaultNaN<T>(); | ||||||
|  |         return true; | ||||||
|  |     } | ||||||
|  |     case 0x0100: { | ||||||
|  |         softfloat_exceptionFlags |= softfloat_flag_invalid; | ||||||
|  |         ret_val = defaultNaN<T>(); | ||||||
|  |         return true; | ||||||
|  |     } | ||||||
|  |     case 0x0200: { | ||||||
|  |         ret_val = defaultNaN<T>(); | ||||||
|  |         return true; | ||||||
|  |     } | ||||||
|  |     case 0x0008: { | ||||||
|  |         softfloat_exceptionFlags |= softfloat_flag_infinite; | ||||||
|  |         ret_val = negInf<T>(); | ||||||
|  |         return true; | ||||||
|  |     } | ||||||
|  |     case 0x0010: { | ||||||
|  |         softfloat_exceptionFlags |= softfloat_flag_infinite; | ||||||
|  |         ret_val = posInf<T>(); | ||||||
|  |         return true; | ||||||
|  |     } | ||||||
|  |     case 0x0080: { | ||||||
|  |         ret_val = 0; | ||||||
|  |         return true; | ||||||
|  |     } | ||||||
|  |     case 0x0020: { | ||||||
|  |         subnormal = true; | ||||||
|  |     } | ||||||
|  |     default: | ||||||
|  |         return false; | ||||||
|  |     } | ||||||
|  | } | ||||||
|  | static constexpr std::array<std::array<uint64_t, 64>, 2> rsqrt_table{ | ||||||
|  |     {{ | ||||||
|  |          52, 51, 50, 48, 47, 46, 44, 43, 42, 41, 40, 39, 38, 36, 35, 34, 33, 32, 31, 30, 30, 29, 28, 27, 26, 25, 24, 23, 23, 22, 21, 20, | ||||||
|  |          19, 19, 18, 17, 16, 16, 15, 14, 14, 13, 12, 12, 11, 10, 10, 9,  9,  8,  7,  7,  6,  6,  5,  4,  4,  3,  3,  2,  2,  1,  1,  0, | ||||||
|  |      }, | ||||||
|  |      {127, 125, 123, 121, 119, 118, 116, 114, 113, 111, 109, 108, 106, 105, 103, 102, 100, 99, 97, 96, 95, 93, | ||||||
|  |       92,  91,  90,  88,  87,  86,  85,  84,  83,  82,  80,  79,  78,  77,  76,  75,  74,  73, 72, 71, 70, 70, | ||||||
|  |       69,  68,  67,  66,  65,  64,  63,  63,  62,  61,  60,  59,  59,  58,  57,  56,  56,  55, 54, 53}}}; | ||||||
|  |  | ||||||
|  | uint64_t constexpr frsqrt7_general(const unsigned s, const unsigned e, const uint64_t sign, const int64_t exp, const uint64_t sig, | ||||||
|  |                                    const bool subnormal) { | ||||||
|  |     int64_t normalized_exp = exp; | ||||||
|  |     uint64_t normalized_sig = sig; | ||||||
|  |     if(subnormal) { | ||||||
|  |         signed nr_leadingzeros = __builtin_clzll(sig) - (64 - s); | ||||||
|  |         normalized_exp = -nr_leadingzeros; | ||||||
|  |         normalized_sig = (sig << (1 + nr_leadingzeros)) & ((1ULL << s) - 1); | ||||||
|  |     } | ||||||
|  |     unsigned exp_idx = normalized_exp & 1; | ||||||
|  |     unsigned sig_idx = (normalized_sig >> (s - 6)) & 0x3f; | ||||||
|  |     // The output of the table becomes the seven high bits of the result significand (after the leading one); the remainder of the | ||||||
|  |     // result significand is zero. | ||||||
|  |     uint64_t out_sig = rsqrt_table[exp_idx][sig_idx] << (s - 7); | ||||||
|  |     // The output exponent equals floor((3*B - 1 - the normalized input exponent) / 2), where B is the exponent bias. | ||||||
|  |     unsigned bias = (1UL << (e - 1)) - 1; | ||||||
|  |     uint64_t out_exp = (3 * bias - 1 - normalized_exp) / 2; | ||||||
|  |     // The output sign equals the input sign. | ||||||
|  |     return (sign << (s + e)) | (out_exp << s) | out_sig; | ||||||
|  | } | ||||||
|  | template <typename T> bool recip_check(T fclass_val, bool& subnormal, uint64_t& ret_val) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     switch(fclass_val) { | ||||||
|  |     case 0x0001: { | ||||||
|  |         ret_val = negZero<T>(); | ||||||
|  |         return true; | ||||||
|  |     } | ||||||
|  |     case 0x0080: { | ||||||
|  |         ret_val = 0; | ||||||
|  |         return true; | ||||||
|  |     } | ||||||
|  |     case 0x0008: { | ||||||
|  |         softfloat_exceptionFlags |= softfloat_flag_infinite; | ||||||
|  |         ret_val = negInf<T>(); | ||||||
|  |         return true; | ||||||
|  |     } | ||||||
|  |     case 0x0010: { | ||||||
|  |         softfloat_exceptionFlags |= softfloat_flag_infinite; | ||||||
|  |         ret_val = posInf<T>(); | ||||||
|  |         return true; | ||||||
|  |     } | ||||||
|  |     case 0x0100: { | ||||||
|  |         softfloat_exceptionFlags |= softfloat_flag_invalid; | ||||||
|  |         ret_val = defaultNaN<T>(); | ||||||
|  |         return true; | ||||||
|  |     } | ||||||
|  |     case 0x0200: { | ||||||
|  |         ret_val = defaultNaN<T>(); | ||||||
|  |         return true; | ||||||
|  |     } | ||||||
|  |     case 0x0004: { | ||||||
|  |         subnormal = true; | ||||||
|  |         return false; | ||||||
|  |     } | ||||||
|  |     case 0x0020: { | ||||||
|  |         subnormal = true; | ||||||
|  |         return false; | ||||||
|  |     } | ||||||
|  |     default: { | ||||||
|  |         subnormal = false; | ||||||
|  |         return false; | ||||||
|  |     } | ||||||
|  |     } | ||||||
|  | } | ||||||
|  | static constexpr std::array<uint64_t, 128> rec_table{ | ||||||
|  |     {127, 125, 123, 121, 119, 117, 116, 114, 112, 110, 109, 107, 105, 104, 102, 100, 99, 97, 96, 94, 93, 91, 90, 88, 87, 85, | ||||||
|  |      84,  83,  81,  80,  79,  77,  76,  75,  74,  72,  71,  70,  69,  68,  66,  65,  64, 63, 62, 61, 60, 59, 58, 57, 56, 55, | ||||||
|  |      54,  53,  52,  51,  50,  49,  48,  47,  46,  45,  44,  43,  42,  41,  40,  40,  39, 38, 37, 36, 35, 35, 34, 33, 32, 31, | ||||||
|  |      31,  30,  29,  28,  28,  27,  26,  25,  25,  24,  23,  23,  22,  21,  21,  20,  19, 19, 18, 17, 17, 16, 15, 15, 14, 14, | ||||||
|  |      13,  12,  12,  11,  11,  10,  9,   9,   8,   8,   7,   7,   6,   5,   5,   4,   4,  3,  3,  2,  2,  1,  1,  0}}; | ||||||
|  | bool frec_general(uint64_t& res, const unsigned s, const unsigned e, const uint64_t sign, const int64_t exp, const uint64_t sig, | ||||||
|  |                   const bool subnormal, uint8_t mode) { | ||||||
|  |     int nr_leadingzeros = __builtin_clzll(sig) - (64 - s); | ||||||
|  |     int64_t normalized_exp = subnormal ? -nr_leadingzeros : exp; | ||||||
|  |     uint64_t normalized_sig = subnormal ? ((sig << (1 + nr_leadingzeros)) & ((1ULL << s) - 1)) : sig; | ||||||
|  |     unsigned idx = (normalized_sig >> (s - 7)) & 0x7f; | ||||||
|  |     unsigned bias = (1UL << (e - 1)) - 1; | ||||||
|  |     uint64_t mid_exp = 2 * (bias)-1 - normalized_exp; | ||||||
|  |     uint64_t mid_sig = rec_table[idx] << (s - 7); | ||||||
|  |  | ||||||
|  |     uint64_t out_exp = mid_exp; | ||||||
|  |     uint64_t out_sig = mid_sig; | ||||||
|  |     if(mid_exp == 0) { | ||||||
|  |         out_exp = mid_exp; | ||||||
|  |         out_sig = (mid_sig >> 1) | (1ULL << (s - 1)); | ||||||
|  |     } else if(mid_exp == (1ULL << e) - 1) { | ||||||
|  |         out_exp = 0; | ||||||
|  |         out_sig = (mid_sig >> 2) | (1ULL << (s - 2)); | ||||||
|  |     } | ||||||
|  |     if(subnormal && nr_leadingzeros > 1) { | ||||||
|  |         if((mode == 0b001) || (mode == 0b010 && sign == 0b0) || (mode == 0b011 && sign == 0b1)) { | ||||||
|  |             res = (sign << (s + e)) | ((1ULL << (e - 1)) - 1) << s | ((1ULL << s) - 1); | ||||||
|  |             return true; | ||||||
|  |         } else { | ||||||
|  |             res = (sign << (s + e)) | ((1ULL << e) - 1) << s; | ||||||
|  |             return true; | ||||||
|  |         } | ||||||
|  |     } | ||||||
|  |     res = (sign << (s + e)) | (out_exp << s) | out_sig; | ||||||
|  |     return false; | ||||||
|  | } | ||||||
|  |  | ||||||
| extern "C" { | extern "C" { | ||||||
|  |  | ||||||
| uint32_t fget_flags() { return softfloat_exceptionFlags & 0x1f; } | uint32_t fget_flags() { return softfloat_exceptionFlags & 0x1f; } | ||||||
|  | uint16_t fadd_h(uint16_t v1, uint16_t v2, uint8_t mode) { | ||||||
|  |     float16_t v1f{v1}, v2f{v2}; | ||||||
|  |     softfloat_roundingMode = mode; | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     float16_t r = f16_add(v1f, v2f); | ||||||
|  |     return r.v; | ||||||
|  | } | ||||||
|  |  | ||||||
|  | uint16_t fsub_h(uint16_t v1, uint16_t v2, uint8_t mode) { | ||||||
|  |     float16_t v1f{v1}, v2f{v2}; | ||||||
|  |     softfloat_roundingMode = mode; | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     float16_t r = f16_sub(v1f, v2f); | ||||||
|  |     return r.v; | ||||||
|  | } | ||||||
|  |  | ||||||
|  | uint16_t fmul_h(uint16_t v1, uint16_t v2, uint8_t mode) { | ||||||
|  |     float16_t v1f{v1}, v2f{v2}; | ||||||
|  |     softfloat_roundingMode = mode; | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     float16_t r = f16_mul(v1f, v2f); | ||||||
|  |     return r.v; | ||||||
|  | } | ||||||
|  |  | ||||||
|  | uint16_t fdiv_h(uint16_t v1, uint16_t v2, uint8_t mode) { | ||||||
|  |     float16_t v1f{v1}, v2f{v2}; | ||||||
|  |     softfloat_roundingMode = mode; | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     float16_t r = f16_div(v1f, v2f); | ||||||
|  |     return r.v; | ||||||
|  | } | ||||||
|  |  | ||||||
|  | uint16_t fsqrt_h(uint16_t v1, uint8_t mode) { | ||||||
|  |     float16_t v1f{v1}; | ||||||
|  |     softfloat_roundingMode = mode; | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     float16_t r = f16_sqrt(v1f); | ||||||
|  |     return r.v; | ||||||
|  | } | ||||||
|  |  | ||||||
|  | uint16_t fcmp_h(uint16_t v1, uint16_t v2, uint16_t op) { | ||||||
|  |     float16_t v1f{v1}, v2f{v2}; | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     bool nan = v1 == defaultNaNF16UI || v2 & defaultNaNF16UI; | ||||||
|  |     bool snan = softfloat_isSigNaNF16UI(v1) || softfloat_isSigNaNF16UI(v2); | ||||||
|  |     switch(op) { | ||||||
|  |     case 0: | ||||||
|  |         if(nan | snan) { | ||||||
|  |             if(snan) | ||||||
|  |                 softfloat_raiseFlags(softfloat_flag_invalid); | ||||||
|  |             return 0; | ||||||
|  |         } else | ||||||
|  |             return f16_eq(v1f, v2f) ? 1 : 0; | ||||||
|  |     case 1: | ||||||
|  |         if(nan | snan) { | ||||||
|  |             softfloat_raiseFlags(softfloat_flag_invalid); | ||||||
|  |             return 0; | ||||||
|  |         } else | ||||||
|  |             return f16_le(v1f, v2f) ? 1 : 0; | ||||||
|  |     case 2: | ||||||
|  |         if(nan | snan) { | ||||||
|  |             softfloat_raiseFlags(softfloat_flag_invalid); | ||||||
|  |             return 0; | ||||||
|  |         } else | ||||||
|  |             return f16_lt(v1f, v2f) ? 1 : 0; | ||||||
|  |     default: | ||||||
|  |         break; | ||||||
|  |     } | ||||||
|  |     return -1; | ||||||
|  | } | ||||||
|  |  | ||||||
|  | uint16_t fmadd_h(uint16_t v1, uint16_t v2, uint16_t v3, uint16_t op, uint8_t mode) { | ||||||
|  |     uint16_t F16_SIGN = 1UL << 15; | ||||||
|  |     switch(op) { | ||||||
|  |     case 0: // FMADD_S | ||||||
|  |         break; | ||||||
|  |     case 1: // FMSUB_S | ||||||
|  |         v3 ^= F16_SIGN; | ||||||
|  |         break; | ||||||
|  |     case 2: // FNMADD_S | ||||||
|  |         v1 ^= F16_SIGN; | ||||||
|  |         v3 ^= F16_SIGN; | ||||||
|  |         break; | ||||||
|  |     case 3: // FNMSUB_S | ||||||
|  |         v1 ^= F16_SIGN; | ||||||
|  |         break; | ||||||
|  |     } | ||||||
|  |     softfloat_roundingMode = mode; | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     float16_t res = softfloat_mulAddF16(v1, v2, v3, 0); | ||||||
|  |     return res.v; | ||||||
|  | } | ||||||
|  |  | ||||||
|  | uint16_t fsel_h(uint16_t v1, uint16_t v2, uint16_t op) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     bool v1_nan = (v1 & defaultNaNF16UI) == defaultNaNF16UI; | ||||||
|  |     bool v2_nan = (v2 & defaultNaNF16UI) == defaultNaNF16UI; | ||||||
|  |     bool v1_snan = softfloat_isSigNaNF16UI(v1); | ||||||
|  |     bool v2_snan = softfloat_isSigNaNF16UI(v2); | ||||||
|  |     if(v1_snan || v2_snan) | ||||||
|  |         softfloat_raiseFlags(softfloat_flag_invalid); | ||||||
|  |     if(v1_nan || v1_snan) | ||||||
|  |         return (v2_nan || v2_snan) ? defaultNaNF16UI : v2; | ||||||
|  |     else if(v2_nan || v2_snan) | ||||||
|  |         return v1; | ||||||
|  |     else { | ||||||
|  |         if((v1 & 0x7fff) == 0 && (v2 & 0x7fff) == 0) { | ||||||
|  |             return op == 0 ? ((v1 & 0x8000) ? v1 : v2) : ((v1 & 0x8000) ? v2 : v1); | ||||||
|  |         } else { | ||||||
|  |             float16_t v1f{v1}, v2f{v2}; | ||||||
|  |             return op == 0 ? (f16_lt(v1f, v2f) ? v1 : v2) : (f16_lt(v1f, v2f) ? v2 : v1); | ||||||
|  |         } | ||||||
|  |     } | ||||||
|  | } | ||||||
|  |  | ||||||
|  | uint16_t fclass_h(uint16_t v1) { | ||||||
|  |  | ||||||
|  |     float16_t a{v1}; | ||||||
|  |     union ui16_f16 uA; | ||||||
|  |     uint_fast16_t uiA; | ||||||
|  |  | ||||||
|  |     uA.f = a; | ||||||
|  |     uiA = uA.ui; | ||||||
|  |  | ||||||
|  |     bool infOrNaN = expF16UI(uiA) == 0x1F; | ||||||
|  |     bool subnormalOrZero = expF16UI(uiA) == 0; | ||||||
|  |     bool sign = signF16UI(uiA); | ||||||
|  |     bool fracZero = fracF16UI(uiA) == 0; | ||||||
|  |     bool isNaN = isNaNF16UI(uiA); | ||||||
|  |     bool isSNaN = softfloat_isSigNaNF16UI(uiA); | ||||||
|  |  | ||||||
|  |     return (sign && infOrNaN && fracZero) << 0 | (sign && !infOrNaN && !subnormalOrZero) << 1 | | ||||||
|  |            (sign && subnormalOrZero && !fracZero) << 2 | (sign && subnormalOrZero && fracZero) << 3 | (!sign && infOrNaN && fracZero) << 7 | | ||||||
|  |            (!sign && !infOrNaN && !subnormalOrZero) << 6 | (!sign && subnormalOrZero && !fracZero) << 5 | | ||||||
|  |            (!sign && subnormalOrZero && fracZero) << 4 | (isNaN && isSNaN) << 8 | (isNaN && !isSNaN) << 9; | ||||||
|  | } | ||||||
|  |  | ||||||
|  | uint16_t frsqrt7_h(uint16_t v) { | ||||||
|  |     bool subnormal = false; | ||||||
|  |     uint16_t ret_val = 0; | ||||||
|  |     if(rsqrt_check(fclass_h(v), subnormal, ret_val)) { | ||||||
|  |         return ret_val; | ||||||
|  |     } | ||||||
|  |     uint16_t sig = fracF64UI(v); | ||||||
|  |     int16_t exp = expF64UI(v); | ||||||
|  |     uint16_t sign = signF64UI(v); | ||||||
|  |     unsigned constexpr e = 5; | ||||||
|  |     unsigned constexpr s = 10; | ||||||
|  |     return frsqrt7_general(s, e, sign, exp, sig, subnormal); | ||||||
|  | } | ||||||
|  |  | ||||||
|  | uint16_t frec7_h(uint16_t v, uint8_t mode) { | ||||||
|  |     bool subnormal = false; | ||||||
|  |     uint64_t ret_val = 0; | ||||||
|  |     if(recip_check(fclass_h(v), subnormal, ret_val)) { | ||||||
|  |         return ret_val; | ||||||
|  |     } | ||||||
|  |     uint16_t sig = fracF16UI(v); | ||||||
|  |     int exp = expF16UI(v); | ||||||
|  |     uint16_t sign = signF16UI(v); | ||||||
|  |     unsigned constexpr e = 5; | ||||||
|  |     unsigned constexpr s = 10; | ||||||
|  |     if(frec_general(ret_val, s, e, sign, exp, sig, subnormal, mode)) | ||||||
|  |         softfloat_exceptionFlags |= (softfloat_flag_inexact | softfloat_flag_overflow); | ||||||
|  |     return ret_val; | ||||||
|  | } | ||||||
|  |  | ||||||
|  | uint16_t unbox_h(uint8_t FLEN, uint64_t v) { | ||||||
|  |     uint64_t mask = 0; | ||||||
|  |     switch(FLEN) { | ||||||
|  |     case 32: { | ||||||
|  |         mask = std::numeric_limits<uint32_t>::max() & ~((uint64_t)std::numeric_limits<uint16_t>::max()); | ||||||
|  |         break; | ||||||
|  |     } | ||||||
|  |     case 64: { | ||||||
|  |         mask = std::numeric_limits<uint64_t>::max() & ~((uint64_t)std::numeric_limits<uint16_t>::max()); | ||||||
|  |         break; | ||||||
|  |     } | ||||||
|  |     default: | ||||||
|  |         break; | ||||||
|  |     } | ||||||
|  |     if((v & mask) != mask) | ||||||
|  |         return defaultNaNF16UI; | ||||||
|  |     else | ||||||
|  |         return v & std::numeric_limits<uint32_t>::max(); | ||||||
|  | } | ||||||
|  |  | ||||||
| uint32_t fadd_s(uint32_t v1, uint32_t v2, uint8_t mode) { | uint32_t fadd_s(uint32_t v1, uint32_t v2, uint8_t mode) { | ||||||
|     float32_t v1f{v1}, v2f{v2}; |     float32_t v1f{v1}, v2f{v2}; | ||||||
|     softfloat_roundingMode = rmm_map[mode & 0x7]; |     softfloat_roundingMode = mode; | ||||||
|     softfloat_exceptionFlags = 0; |     softfloat_exceptionFlags = 0; | ||||||
|     float32_t r = f32_add(v1f, v2f); |     float32_t r = f32_add(v1f, v2f); | ||||||
|     return r.v; |     return r.v; | ||||||
| @@ -64,7 +422,7 @@ uint32_t fadd_s(uint32_t v1, uint32_t v2, uint8_t mode) { | |||||||
|  |  | ||||||
| uint32_t fsub_s(uint32_t v1, uint32_t v2, uint8_t mode) { | uint32_t fsub_s(uint32_t v1, uint32_t v2, uint8_t mode) { | ||||||
|     float32_t v1f{v1}, v2f{v2}; |     float32_t v1f{v1}, v2f{v2}; | ||||||
|     softfloat_roundingMode = rmm_map[mode & 0x7]; |     softfloat_roundingMode = mode; | ||||||
|     softfloat_exceptionFlags = 0; |     softfloat_exceptionFlags = 0; | ||||||
|     float32_t r = f32_sub(v1f, v2f); |     float32_t r = f32_sub(v1f, v2f); | ||||||
|     return r.v; |     return r.v; | ||||||
| @@ -72,7 +430,7 @@ uint32_t fsub_s(uint32_t v1, uint32_t v2, uint8_t mode) { | |||||||
|  |  | ||||||
| uint32_t fmul_s(uint32_t v1, uint32_t v2, uint8_t mode) { | uint32_t fmul_s(uint32_t v1, uint32_t v2, uint8_t mode) { | ||||||
|     float32_t v1f{v1}, v2f{v2}; |     float32_t v1f{v1}, v2f{v2}; | ||||||
|     softfloat_roundingMode = rmm_map[mode & 0x7]; |     softfloat_roundingMode = mode; | ||||||
|     softfloat_exceptionFlags = 0; |     softfloat_exceptionFlags = 0; | ||||||
|     float32_t r = f32_mul(v1f, v2f); |     float32_t r = f32_mul(v1f, v2f); | ||||||
|     return r.v; |     return r.v; | ||||||
| @@ -80,7 +438,7 @@ uint32_t fmul_s(uint32_t v1, uint32_t v2, uint8_t mode) { | |||||||
|  |  | ||||||
| uint32_t fdiv_s(uint32_t v1, uint32_t v2, uint8_t mode) { | uint32_t fdiv_s(uint32_t v1, uint32_t v2, uint8_t mode) { | ||||||
|     float32_t v1f{v1}, v2f{v2}; |     float32_t v1f{v1}, v2f{v2}; | ||||||
|     softfloat_roundingMode = rmm_map[mode & 0x7]; |     softfloat_roundingMode = mode; | ||||||
|     softfloat_exceptionFlags = 0; |     softfloat_exceptionFlags = 0; | ||||||
|     float32_t r = f32_div(v1f, v2f); |     float32_t r = f32_div(v1f, v2f); | ||||||
|     return r.v; |     return r.v; | ||||||
| @@ -88,7 +446,7 @@ uint32_t fdiv_s(uint32_t v1, uint32_t v2, uint8_t mode) { | |||||||
|  |  | ||||||
| uint32_t fsqrt_s(uint32_t v1, uint8_t mode) { | uint32_t fsqrt_s(uint32_t v1, uint8_t mode) { | ||||||
|     float32_t v1f{v1}; |     float32_t v1f{v1}; | ||||||
|     softfloat_roundingMode = rmm_map[mode & 0x7]; |     softfloat_roundingMode = mode; | ||||||
|     softfloat_exceptionFlags = 0; |     softfloat_exceptionFlags = 0; | ||||||
|     float32_t r = f32_sqrt(v1f); |     float32_t r = f32_sqrt(v1f); | ||||||
|     return r.v; |     return r.v; | ||||||
| @@ -97,7 +455,7 @@ uint32_t fsqrt_s(uint32_t v1, uint8_t mode) { | |||||||
| uint32_t fcmp_s(uint32_t v1, uint32_t v2, uint32_t op) { | uint32_t fcmp_s(uint32_t v1, uint32_t v2, uint32_t op) { | ||||||
|     float32_t v1f{v1}, v2f{v2}; |     float32_t v1f{v1}, v2f{v2}; | ||||||
|     softfloat_exceptionFlags = 0; |     softfloat_exceptionFlags = 0; | ||||||
|     bool nan = (v1 & defaultNaNF32UI) == quiet_nan32 || (v2 & defaultNaNF32UI) == quiet_nan32; |     bool nan = v1 == defaultNaNF32UI || v2 == defaultNaNF32UI; | ||||||
|     bool snan = softfloat_isSigNaNF32UI(v1) || softfloat_isSigNaNF32UI(v2); |     bool snan = softfloat_isSigNaNF32UI(v1) || softfloat_isSigNaNF32UI(v2); | ||||||
|     switch(op) { |     switch(op) { | ||||||
|     case 0: |     case 0: | ||||||
| @@ -125,36 +483,25 @@ uint32_t fcmp_s(uint32_t v1, uint32_t v2, uint32_t op) { | |||||||
|     return -1; |     return -1; | ||||||
| } | } | ||||||
|  |  | ||||||
| uint32_t fcvt_s(uint32_t v1, uint32_t op, uint8_t mode) { |  | ||||||
|     float32_t v1f{v1}; |  | ||||||
|     softfloat_exceptionFlags = 0; |  | ||||||
|     float32_t r; |  | ||||||
|     switch(op) { |  | ||||||
|     case 0: { // w->s, fp to int32 |  | ||||||
|         uint_fast32_t res = f32_to_i32(v1f, rmm_map[mode & 0x7], true); |  | ||||||
|         return (uint32_t)res; |  | ||||||
|     } |  | ||||||
|     case 1: { // wu->s |  | ||||||
|         uint_fast32_t res = f32_to_ui32(v1f, rmm_map[mode & 0x7], true); |  | ||||||
|         return (uint32_t)res; |  | ||||||
|     } |  | ||||||
|     case 2: // s->w |  | ||||||
|         r = i32_to_f32(v1); |  | ||||||
|         return r.v; |  | ||||||
|     case 3: // s->wu |  | ||||||
|         r = ui32_to_f32(v1); |  | ||||||
|         return r.v; |  | ||||||
|     } |  | ||||||
|     return 0; |  | ||||||
| } |  | ||||||
|  |  | ||||||
| uint32_t fmadd_s(uint32_t v1, uint32_t v2, uint32_t v3, uint32_t op, uint8_t mode) { | uint32_t fmadd_s(uint32_t v1, uint32_t v2, uint32_t v3, uint32_t op, uint8_t mode) { | ||||||
|     // op should be {softfloat_mulAdd_subProd(2), softfloat_mulAdd_subC(1)} |     uint32_t F32_SIGN = 1UL << 31; | ||||||
|     softfloat_roundingMode = rmm_map[mode & 0x7]; |     switch(op) { | ||||||
|  |     case 0: // FMADD_S | ||||||
|  |         break; | ||||||
|  |     case 1: // FMSUB_S | ||||||
|  |         v3 ^= F32_SIGN; | ||||||
|  |         break; | ||||||
|  |     case 2: // FNMADD_S | ||||||
|  |         v1 ^= F32_SIGN; | ||||||
|  |         v3 ^= F32_SIGN; | ||||||
|  |         break; | ||||||
|  |     case 3: // FNMSUB_S | ||||||
|  |         v1 ^= F32_SIGN; | ||||||
|  |         break; | ||||||
|  |     } | ||||||
|  |     softfloat_roundingMode = mode; | ||||||
|     softfloat_exceptionFlags = 0; |     softfloat_exceptionFlags = 0; | ||||||
|     float32_t res = softfloat_mulAddF32(v1, v2, v3, op & 0x1); |     float32_t res = softfloat_mulAddF32(v1, v2, v3, 0); | ||||||
|     if(op > 1) |  | ||||||
|         res.v ^= 1ULL << 31; |  | ||||||
|     return res.v; |     return res.v; | ||||||
| } | } | ||||||
|  |  | ||||||
| @@ -189,8 +536,8 @@ uint32_t fclass_s(uint32_t v1) { | |||||||
|     uA.f = a; |     uA.f = a; | ||||||
|     uiA = uA.ui; |     uiA = uA.ui; | ||||||
|  |  | ||||||
|     uint_fast16_t infOrNaN = expF32UI(uiA) == 0xFF; |     bool infOrNaN = expF32UI(uiA) == 0xFF; | ||||||
|     uint_fast16_t subnormalOrZero = expF32UI(uiA) == 0; |     bool subnormalOrZero = expF32UI(uiA) == 0; | ||||||
|     bool sign = signF32UI(uiA); |     bool sign = signF32UI(uiA); | ||||||
|     bool fracZero = fracF32UI(uiA) == 0; |     bool fracZero = fracF32UI(uiA) == 0; | ||||||
|     bool isNaN = isNaNF32UI(uiA); |     bool isNaN = isNaNF32UI(uiA); | ||||||
| @@ -202,33 +549,60 @@ uint32_t fclass_s(uint32_t v1) { | |||||||
|            (!sign && subnormalOrZero && fracZero) << 4 | (isNaN && isSNaN) << 8 | (isNaN && !isSNaN) << 9; |            (!sign && subnormalOrZero && fracZero) << 4 | (isNaN && isSNaN) << 8 | (isNaN && !isSNaN) << 9; | ||||||
| } | } | ||||||
|  |  | ||||||
| uint32_t fconv_d2f(uint64_t v1, uint8_t mode) { | uint32_t frsqrt7_s(uint32_t v) { | ||||||
|     softfloat_roundingMode = rmm_map[mode & 0x7]; |     bool subnormal = false; | ||||||
|     bool nan = (v1 & defaultNaNF64UI) == defaultNaNF64UI; |     uint32_t ret_val = 0; | ||||||
|     if(nan) { |     if(rsqrt_check(fclass_s(v), subnormal, ret_val)) { | ||||||
|         return defaultNaNF32UI; |         return ret_val; | ||||||
|     } else { |  | ||||||
|         float32_t res = f64_to_f32(float64_t{v1}); |  | ||||||
|         return res.v; |  | ||||||
|     } |     } | ||||||
|  |     uint32_t sig = fracF32UI(v); | ||||||
|  |     int exp = expF32UI(v); | ||||||
|  |     uint32_t sign = signF32UI(v); | ||||||
|  |     unsigned constexpr e = 8; | ||||||
|  |     unsigned constexpr s = 23; | ||||||
|  |     return frsqrt7_general(s, e, sign, exp, sig, subnormal); | ||||||
| } | } | ||||||
|  |  | ||||||
| uint64_t fconv_f2d(uint32_t v1, uint8_t mode) { | uint32_t frec7_s(uint32_t v, uint8_t mode) { | ||||||
|     bool nan = (v1 & defaultNaNF32UI) == defaultNaNF32UI; |     bool subnormal = false; | ||||||
|     if(nan) { |     uint64_t ret_val = 0; | ||||||
|         return defaultNaNF64UI; |     if(recip_check(fclass_s(v), subnormal, ret_val)) { | ||||||
|     } else { |         return ret_val; | ||||||
|         softfloat_roundingMode = rmm_map[mode & 0x7]; |  | ||||||
|         float64_t res = f32_to_f64(float32_t{v1}); |  | ||||||
|         return res.v; |  | ||||||
|     } |     } | ||||||
|  |     uint32_t sig = fracF32UI(v); | ||||||
|  |     int exp = expF32UI(v); | ||||||
|  |     uint32_t sign = signF32UI(v); | ||||||
|  |     unsigned constexpr e = 8; | ||||||
|  |     unsigned constexpr s = 23; | ||||||
|  |     if(frec_general(ret_val, s, e, sign, exp, sig, subnormal, mode)) | ||||||
|  |         softfloat_exceptionFlags |= (softfloat_flag_inexact | softfloat_flag_overflow); | ||||||
|  |     return ret_val; | ||||||
|  | } | ||||||
|  |  | ||||||
|  | uint32_t unbox_s(uint8_t FLEN, uint64_t v) { | ||||||
|  |     uint64_t mask = 0; | ||||||
|  |     switch(FLEN) { | ||||||
|  |     case 32: { | ||||||
|  |         return v; | ||||||
|  |     } | ||||||
|  |     case 64: { | ||||||
|  |         mask = std::numeric_limits<uint64_t>::max() & ~((uint64_t)std::numeric_limits<uint32_t>::max()); | ||||||
|  |         break; | ||||||
|  |     } | ||||||
|  |     default: | ||||||
|  |         break; | ||||||
|  |     } | ||||||
|  |     if((v & mask) != mask) | ||||||
|  |         return defaultNaNF32UI; | ||||||
|  |     else | ||||||
|  |         return v & std::numeric_limits<uint32_t>::max(); | ||||||
| } | } | ||||||
|  |  | ||||||
| uint64_t fadd_d(uint64_t v1, uint64_t v2, uint8_t mode) { | uint64_t fadd_d(uint64_t v1, uint64_t v2, uint8_t mode) { | ||||||
|     bool nan = (v1 & defaultNaNF32UI) == quiet_nan32; |     bool nan = v1 == defaultNaNF32UI; | ||||||
|     bool snan = softfloat_isSigNaNF32UI(v1); |     bool snan = softfloat_isSigNaNF32UI(v1); | ||||||
|     float64_t v1f{v1}, v2f{v2}; |     float64_t v1f{v1}, v2f{v2}; | ||||||
|     softfloat_roundingMode = rmm_map[mode & 0x7]; |     softfloat_roundingMode = mode; | ||||||
|     softfloat_exceptionFlags = 0; |     softfloat_exceptionFlags = 0; | ||||||
|     float64_t r = f64_add(v1f, v2f); |     float64_t r = f64_add(v1f, v2f); | ||||||
|     return r.v; |     return r.v; | ||||||
| @@ -236,7 +610,7 @@ uint64_t fadd_d(uint64_t v1, uint64_t v2, uint8_t mode) { | |||||||
|  |  | ||||||
| uint64_t fsub_d(uint64_t v1, uint64_t v2, uint8_t mode) { | uint64_t fsub_d(uint64_t v1, uint64_t v2, uint8_t mode) { | ||||||
|     float64_t v1f{v1}, v2f{v2}; |     float64_t v1f{v1}, v2f{v2}; | ||||||
|     softfloat_roundingMode = rmm_map[mode & 0x7]; |     softfloat_roundingMode = mode; | ||||||
|     softfloat_exceptionFlags = 0; |     softfloat_exceptionFlags = 0; | ||||||
|     float64_t r = f64_sub(v1f, v2f); |     float64_t r = f64_sub(v1f, v2f); | ||||||
|     return r.v; |     return r.v; | ||||||
| @@ -244,7 +618,7 @@ uint64_t fsub_d(uint64_t v1, uint64_t v2, uint8_t mode) { | |||||||
|  |  | ||||||
| uint64_t fmul_d(uint64_t v1, uint64_t v2, uint8_t mode) { | uint64_t fmul_d(uint64_t v1, uint64_t v2, uint8_t mode) { | ||||||
|     float64_t v1f{v1}, v2f{v2}; |     float64_t v1f{v1}, v2f{v2}; | ||||||
|     softfloat_roundingMode = rmm_map[mode & 0x7]; |     softfloat_roundingMode = mode; | ||||||
|     softfloat_exceptionFlags = 0; |     softfloat_exceptionFlags = 0; | ||||||
|     float64_t r = f64_mul(v1f, v2f); |     float64_t r = f64_mul(v1f, v2f); | ||||||
|     return r.v; |     return r.v; | ||||||
| @@ -252,7 +626,7 @@ uint64_t fmul_d(uint64_t v1, uint64_t v2, uint8_t mode) { | |||||||
|  |  | ||||||
| uint64_t fdiv_d(uint64_t v1, uint64_t v2, uint8_t mode) { | uint64_t fdiv_d(uint64_t v1, uint64_t v2, uint8_t mode) { | ||||||
|     float64_t v1f{v1}, v2f{v2}; |     float64_t v1f{v1}, v2f{v2}; | ||||||
|     softfloat_roundingMode = rmm_map[mode & 0x7]; |     softfloat_roundingMode = mode; | ||||||
|     softfloat_exceptionFlags = 0; |     softfloat_exceptionFlags = 0; | ||||||
|     float64_t r = f64_div(v1f, v2f); |     float64_t r = f64_div(v1f, v2f); | ||||||
|     return r.v; |     return r.v; | ||||||
| @@ -260,7 +634,7 @@ uint64_t fdiv_d(uint64_t v1, uint64_t v2, uint8_t mode) { | |||||||
|  |  | ||||||
| uint64_t fsqrt_d(uint64_t v1, uint8_t mode) { | uint64_t fsqrt_d(uint64_t v1, uint8_t mode) { | ||||||
|     float64_t v1f{v1}; |     float64_t v1f{v1}; | ||||||
|     softfloat_roundingMode = rmm_map[mode & 0x7]; |     softfloat_roundingMode = mode; | ||||||
|     softfloat_exceptionFlags = 0; |     softfloat_exceptionFlags = 0; | ||||||
|     float64_t r = f64_sqrt(v1f); |     float64_t r = f64_sqrt(v1f); | ||||||
|     return r.v; |     return r.v; | ||||||
| @@ -269,7 +643,7 @@ uint64_t fsqrt_d(uint64_t v1, uint8_t mode) { | |||||||
| uint64_t fcmp_d(uint64_t v1, uint64_t v2, uint32_t op) { | uint64_t fcmp_d(uint64_t v1, uint64_t v2, uint32_t op) { | ||||||
|     float64_t v1f{v1}, v2f{v2}; |     float64_t v1f{v1}, v2f{v2}; | ||||||
|     softfloat_exceptionFlags = 0; |     softfloat_exceptionFlags = 0; | ||||||
|     bool nan = (v1 & defaultNaNF64UI) == quiet_nan32 || (v2 & defaultNaNF64UI) == quiet_nan32; |     bool nan = v1 == defaultNaNF64UI || v2 == defaultNaNF64UI; | ||||||
|     bool snan = softfloat_isSigNaNF64UI(v1) || softfloat_isSigNaNF64UI(v2); |     bool snan = softfloat_isSigNaNF64UI(v1) || softfloat_isSigNaNF64UI(v2); | ||||||
|     switch(op) { |     switch(op) { | ||||||
|     case 0: |     case 0: | ||||||
| @@ -297,36 +671,25 @@ uint64_t fcmp_d(uint64_t v1, uint64_t v2, uint32_t op) { | |||||||
|     return -1; |     return -1; | ||||||
| } | } | ||||||
|  |  | ||||||
| uint64_t fcvt_d(uint64_t v1, uint32_t op, uint8_t mode) { |  | ||||||
|     float64_t v1f{v1}; |  | ||||||
|     softfloat_exceptionFlags = 0; |  | ||||||
|     float64_t r; |  | ||||||
|     switch(op) { |  | ||||||
|     case 0: { // l->d, fp to int32 |  | ||||||
|         int64_t res = f64_to_i64(v1f, rmm_map[mode & 0x7], true); |  | ||||||
|         return (uint64_t)res; |  | ||||||
|     } |  | ||||||
|     case 1: { // lu->s |  | ||||||
|         uint64_t res = f64_to_ui64(v1f, rmm_map[mode & 0x7], true); |  | ||||||
|         return res; |  | ||||||
|     } |  | ||||||
|     case 2: // s->l |  | ||||||
|         r = i64_to_f64(v1); |  | ||||||
|         return r.v; |  | ||||||
|     case 3: // s->lu |  | ||||||
|         r = ui64_to_f64(v1); |  | ||||||
|         return r.v; |  | ||||||
|     } |  | ||||||
|     return 0; |  | ||||||
| } |  | ||||||
|  |  | ||||||
| uint64_t fmadd_d(uint64_t v1, uint64_t v2, uint64_t v3, uint32_t op, uint8_t mode) { | uint64_t fmadd_d(uint64_t v1, uint64_t v2, uint64_t v3, uint32_t op, uint8_t mode) { | ||||||
|     // op should be {softfloat_mulAdd_subProd(2), softfloat_mulAdd_subC(1)} |     uint64_t F64_SIGN = 1ULL << 63; | ||||||
|     softfloat_roundingMode = rmm_map[mode & 0x7]; |     switch(op) { | ||||||
|  |     case 0: // FMADD_D | ||||||
|  |         break; | ||||||
|  |     case 1: // FMSUB_D | ||||||
|  |         v3 ^= F64_SIGN; | ||||||
|  |         break; | ||||||
|  |     case 2: // FNMADD_D | ||||||
|  |         v1 ^= F64_SIGN; | ||||||
|  |         v3 ^= F64_SIGN; | ||||||
|  |         break; | ||||||
|  |     case 3: // FNMSUB_D | ||||||
|  |         v1 ^= F64_SIGN; | ||||||
|  |         break; | ||||||
|  |     } | ||||||
|  |     softfloat_roundingMode = mode; | ||||||
|     softfloat_exceptionFlags = 0; |     softfloat_exceptionFlags = 0; | ||||||
|     float64_t res = softfloat_mulAddF64(v1, v2, v3, op & 0x1); |     float64_t res = softfloat_mulAddF64(v1, v2, v3, 0); | ||||||
|     if(op > 1) |  | ||||||
|         res.v ^= 1ULL << 63; |  | ||||||
|     return res.v; |     return res.v; | ||||||
| } | } | ||||||
|  |  | ||||||
| @@ -362,8 +725,8 @@ uint64_t fclass_d(uint64_t v1) { | |||||||
|     uA.f = a; |     uA.f = a; | ||||||
|     uiA = uA.ui; |     uiA = uA.ui; | ||||||
|  |  | ||||||
|     uint_fast16_t infOrNaN = expF64UI(uiA) == 0x7FF; |     bool infOrNaN = expF64UI(uiA) == 0x7FF; | ||||||
|     uint_fast16_t subnormalOrZero = expF64UI(uiA) == 0; |     bool subnormalOrZero = expF64UI(uiA) == 0; | ||||||
|     bool sign = signF64UI(uiA); |     bool sign = signF64UI(uiA); | ||||||
|     bool fracZero = fracF64UI(uiA) == 0; |     bool fracZero = fracF64UI(uiA) == 0; | ||||||
|     bool isNaN = isNaNF64UI(uiA); |     bool isNaN = isNaNF64UI(uiA); | ||||||
| @@ -375,52 +738,211 @@ uint64_t fclass_d(uint64_t v1) { | |||||||
|            (!sign && subnormalOrZero && fracZero) << 4 | (isNaN && isSNaN) << 8 | (isNaN && !isSNaN) << 9; |            (!sign && subnormalOrZero && fracZero) << 4 | (isNaN && isSNaN) << 8 | (isNaN && !isSNaN) << 9; | ||||||
| } | } | ||||||
|  |  | ||||||
| uint64_t fcvt_32_64(uint32_t v1, uint32_t op, uint8_t mode) { | uint64_t frsqrt7_d(uint64_t v) { | ||||||
|     float32_t v1f{v1}; |     bool subnormal = false; | ||||||
|     softfloat_exceptionFlags = 0; |     uint64_t ret_val = 0; | ||||||
|     float64_t r; |     if(rsqrt_check(fclass_d(v), subnormal, ret_val)) { | ||||||
|     switch(op) { |         return ret_val; | ||||||
|     case 0: // l->s, fp to int32 |  | ||||||
|         return f32_to_i64(v1f, rmm_map[mode & 0x7], true); |  | ||||||
|     case 1: // wu->s |  | ||||||
|         return f32_to_ui64(v1f, rmm_map[mode & 0x7], true); |  | ||||||
|     case 2: // s->w |  | ||||||
|         r = i32_to_f64(v1); |  | ||||||
|         return r.v; |  | ||||||
|     case 3: // s->wu |  | ||||||
|         r = ui32_to_f64(v1); |  | ||||||
|         return r.v; |  | ||||||
|     } |     } | ||||||
|     return 0; |     uint64_t sig = fracF64UI(v); | ||||||
|  |     int exp = expF64UI(v); | ||||||
|  |     uint64_t sign = signF64UI(v); | ||||||
|  |     unsigned constexpr e = 11; | ||||||
|  |     unsigned constexpr s = 52; | ||||||
|  |     return frsqrt7_general(s, e, sign, exp, sig, subnormal); | ||||||
| } | } | ||||||
|  |  | ||||||
| uint32_t fcvt_64_32(uint64_t v1, uint32_t op, uint8_t mode) { | uint64_t frec7_d(uint64_t v, uint8_t mode) { | ||||||
|     softfloat_exceptionFlags = 0; |     bool subnormal = false; | ||||||
|     float32_t r; |     uint64_t ret_val = 0; | ||||||
|     switch(op) { |     if(recip_check(fclass_d(v), subnormal, ret_val)) { | ||||||
|     case 0: { // wu->s |         return ret_val; | ||||||
|         int32_t r = f64_to_i32(float64_t{v1}, rmm_map[mode & 0x7], true); |  | ||||||
|         return r; |  | ||||||
|     } |     } | ||||||
|     case 1: { // wu->s |     uint64_t sig = fracF64UI(v); | ||||||
|         uint32_t r = f64_to_ui32(float64_t{v1}, rmm_map[mode & 0x7], true); |     int exp = expF64UI(v); | ||||||
|         return r; |     uint64_t sign = signF64UI(v); | ||||||
|     } |     unsigned constexpr e = 11; | ||||||
|     case 2: // l->s, fp to int32 |     unsigned constexpr s = 52; | ||||||
|         r = i64_to_f32(v1); |     if(frec_general(ret_val, s, e, sign, exp, sig, subnormal, mode)) | ||||||
|         return r.v; |         softfloat_exceptionFlags |= (softfloat_flag_inexact | softfloat_flag_overflow); | ||||||
|     case 3: // wu->s |     return ret_val; | ||||||
|         r = ui64_to_f32(v1); |  | ||||||
|         return r.v; |  | ||||||
|     } |  | ||||||
|     return 0; |  | ||||||
| } | } | ||||||
|  |  | ||||||
| uint32_t unbox_s(uint64_t v) { | uint64_t unbox_d(uint8_t FLEN, uint64_t v) { | ||||||
|     constexpr uint64_t mask = std::numeric_limits<uint64_t>::max() & ~((uint64_t)std::numeric_limits<uint32_t>::max()); |     uint64_t mask = 0; | ||||||
|  |     switch(FLEN) { | ||||||
|  |     case 64: { | ||||||
|  |         return v; | ||||||
|  |         break; | ||||||
|  |     } | ||||||
|  |     default: | ||||||
|  |         break; | ||||||
|  |     } | ||||||
|     if((v & mask) != mask) |     if((v & mask) != mask) | ||||||
|         return 0x7fc00000; |         return defaultNaNF64UI; | ||||||
|     else |     else | ||||||
|         return v & std::numeric_limits<uint32_t>::max(); |         return v & std::numeric_limits<uint32_t>::max(); | ||||||
| } | } | ||||||
|  |  | ||||||
|  | // conversion: float to float | ||||||
|  | uint32_t f16tof32(uint16_t val, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return f16_to_f32(float16_t{val}).v; | ||||||
|  | } | ||||||
|  | uint64_t f16tof64(uint16_t val, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return f16_to_f64(float16_t{val}).v; | ||||||
|  | } | ||||||
|  |  | ||||||
|  | uint16_t f32tof16(uint32_t val, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return f32_to_f16(float32_t{val}).v; | ||||||
|  | } | ||||||
|  | uint64_t f32tof64(uint32_t val, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return f32_to_f64(float32_t{val}).v; | ||||||
|  | } | ||||||
|  |  | ||||||
|  | uint16_t f64tof16(uint64_t val, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return f64_to_f16(float64_t{val}).v; | ||||||
|  | } | ||||||
|  | uint32_t f64tof32(uint64_t val, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return f64_to_f32(float64_t{val}).v; | ||||||
|  | } | ||||||
|  |  | ||||||
|  | // conversions: float to unsigned | ||||||
|  | uint32_t f16toui32(uint16_t v, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return f16_to_ui32(float16_t{v}, rm, true); | ||||||
|  | } | ||||||
|  | uint64_t f16toui64(uint16_t v, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return f16_to_ui64(float16_t{v}, rm, true); | ||||||
|  | } | ||||||
|  | uint32_t f32toui32(uint32_t v, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return f32_to_ui32(float32_t{v}, rm, true); | ||||||
|  | } | ||||||
|  | uint64_t f32toui64(uint32_t v, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return f32_to_ui64(float32_t{v}, rm, true); | ||||||
|  | } | ||||||
|  | uint32_t f64toui32(uint64_t v, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return f64_to_ui32(float64_t{v}, rm, true); | ||||||
|  | } | ||||||
|  | uint64_t f64toui64(uint64_t v, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return f64_to_ui64(float64_t{v}, rm, true); | ||||||
|  | } | ||||||
|  |  | ||||||
|  | // conversions: float to signed | ||||||
|  | uint32_t f16toi32(uint16_t v, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return f16_to_i32(float16_t{v}, rm, true); | ||||||
|  | } | ||||||
|  | uint64_t f16toi64(uint16_t v, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return f16_to_i64(float16_t{v}, rm, true); | ||||||
|  | } | ||||||
|  | uint32_t f32toi32(uint32_t v, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return f32_to_i32(float32_t{v}, rm, true); | ||||||
|  | } | ||||||
|  | uint64_t f32toi64(uint32_t v, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return f32_to_i64(float32_t{v}, rm, true); | ||||||
|  | } | ||||||
|  | uint32_t f64toi32(uint64_t v, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return f64_to_i32(float64_t{v}, rm, true); | ||||||
|  | } | ||||||
|  | uint64_t f64toi64(uint64_t v, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return f64_to_i64(float64_t{v}, rm, true); | ||||||
|  | } | ||||||
|  |  | ||||||
|  | // conversions: unsigned to float | ||||||
|  | uint16_t ui32tof16(uint32_t v, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return ui32_to_f16(v).v; | ||||||
|  | } | ||||||
|  | uint16_t ui64tof16(uint64_t v, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return ui64_to_f16(v).v; | ||||||
|  | } | ||||||
|  | uint32_t ui32tof32(uint32_t v, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return ui32_to_f32(v).v; | ||||||
|  | } | ||||||
|  | uint32_t ui64tof32(uint64_t v, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return ui64_to_f32(v).v; | ||||||
|  | } | ||||||
|  | uint64_t ui32tof64(uint32_t v, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return ui32_to_f64(v).v; | ||||||
|  | } | ||||||
|  | uint64_t ui64tof64(uint64_t v, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return ui64_to_f64(v).v; | ||||||
|  | } | ||||||
|  |  | ||||||
|  | // conversions: signed to float | ||||||
|  | uint16_t i32tof16(uint32_t v, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return i32_to_f16(v).v; | ||||||
|  | } | ||||||
|  | uint16_t i64tof16(uint64_t v, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return i64_to_f16(v).v; | ||||||
|  | } | ||||||
|  | uint32_t i32tof32(uint32_t v, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return i32_to_f32(v).v; | ||||||
|  | } | ||||||
|  | uint32_t i64tof32(uint64_t v, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return i64_to_f32(v).v; | ||||||
|  | } | ||||||
|  | uint64_t i32tof64(uint32_t v, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return i32_to_f64(v).v; | ||||||
|  | } | ||||||
|  | uint64_t i64tof64(uint64_t v, uint8_t rm) { | ||||||
|  |     softfloat_exceptionFlags = 0; | ||||||
|  |     softfloat_roundingMode = rm; | ||||||
|  |     return i64_to_f64(v).v; | ||||||
|  | } | ||||||
| } | } | ||||||
| @@ -39,30 +39,87 @@ | |||||||
|  |  | ||||||
| extern "C" { | extern "C" { | ||||||
| uint32_t fget_flags(); | uint32_t fget_flags(); | ||||||
|  |  | ||||||
|  | // half precision | ||||||
|  | uint16_t fadd_h(uint16_t v1, uint16_t v2, uint8_t mode); | ||||||
|  | uint16_t fsub_h(uint16_t v1, uint16_t v2, uint8_t mode); | ||||||
|  | uint16_t fmul_h(uint16_t v1, uint16_t v2, uint8_t mode); | ||||||
|  | uint16_t fdiv_h(uint16_t v1, uint16_t v2, uint8_t mode); | ||||||
|  | uint16_t fsqrt_h(uint16_t v1, uint8_t mode); | ||||||
|  | uint16_t fcmp_h(uint16_t v1, uint16_t v2, uint16_t op); | ||||||
|  | uint16_t fmadd_h(uint16_t v1, uint16_t v2, uint16_t v3, uint16_t op, uint8_t mode); | ||||||
|  | uint16_t fsel_h(uint16_t v1, uint16_t v2, uint16_t op); | ||||||
|  | uint16_t fclass_h(uint16_t v1); | ||||||
|  | uint16_t frsqrt7_h(uint16_t v); | ||||||
|  | uint16_t frec7_h(uint16_t v, uint8_t mode); | ||||||
|  | uint16_t unbox_h(uint8_t FLEN, uint64_t v); | ||||||
|  |  | ||||||
|  | // single precision | ||||||
| uint32_t fadd_s(uint32_t v1, uint32_t v2, uint8_t mode); | uint32_t fadd_s(uint32_t v1, uint32_t v2, uint8_t mode); | ||||||
| uint32_t fsub_s(uint32_t v1, uint32_t v2, uint8_t mode); | uint32_t fsub_s(uint32_t v1, uint32_t v2, uint8_t mode); | ||||||
| uint32_t fmul_s(uint32_t v1, uint32_t v2, uint8_t mode); | uint32_t fmul_s(uint32_t v1, uint32_t v2, uint8_t mode); | ||||||
| uint32_t fdiv_s(uint32_t v1, uint32_t v2, uint8_t mode); | uint32_t fdiv_s(uint32_t v1, uint32_t v2, uint8_t mode); | ||||||
| uint32_t fsqrt_s(uint32_t v1, uint8_t mode); | uint32_t fsqrt_s(uint32_t v1, uint8_t mode); | ||||||
| uint32_t fcmp_s(uint32_t v1, uint32_t v2, uint32_t op); | uint32_t fcmp_s(uint32_t v1, uint32_t v2, uint32_t op); | ||||||
| uint32_t fcvt_s(uint32_t v1, uint32_t op, uint8_t mode); |  | ||||||
| uint32_t fmadd_s(uint32_t v1, uint32_t v2, uint32_t v3, uint32_t op, uint8_t mode); | uint32_t fmadd_s(uint32_t v1, uint32_t v2, uint32_t v3, uint32_t op, uint8_t mode); | ||||||
| uint32_t fsel_s(uint32_t v1, uint32_t v2, uint32_t op); | uint32_t fsel_s(uint32_t v1, uint32_t v2, uint32_t op); | ||||||
| uint32_t fclass_s(uint32_t v1); | uint32_t fclass_s(uint32_t v1); | ||||||
| uint32_t fconv_d2f(uint64_t v1, uint8_t mode); | uint32_t frsqrt7_s(uint32_t v); | ||||||
| uint64_t fconv_f2d(uint32_t v1, uint8_t mode); | uint32_t frec7_s(uint32_t v, uint8_t mode); | ||||||
|  | uint32_t unbox_s(uint8_t FLEN, uint64_t v); | ||||||
|  |  | ||||||
|  | // double precision | ||||||
| uint64_t fadd_d(uint64_t v1, uint64_t v2, uint8_t mode); | uint64_t fadd_d(uint64_t v1, uint64_t v2, uint8_t mode); | ||||||
| uint64_t fsub_d(uint64_t v1, uint64_t v2, uint8_t mode); | uint64_t fsub_d(uint64_t v1, uint64_t v2, uint8_t mode); | ||||||
| uint64_t fmul_d(uint64_t v1, uint64_t v2, uint8_t mode); | uint64_t fmul_d(uint64_t v1, uint64_t v2, uint8_t mode); | ||||||
| uint64_t fdiv_d(uint64_t v1, uint64_t v2, uint8_t mode); | uint64_t fdiv_d(uint64_t v1, uint64_t v2, uint8_t mode); | ||||||
| uint64_t fsqrt_d(uint64_t v1, uint8_t mode); | uint64_t fsqrt_d(uint64_t v1, uint8_t mode); | ||||||
| uint64_t fcmp_d(uint64_t v1, uint64_t v2, uint32_t op); | uint64_t fcmp_d(uint64_t v1, uint64_t v2, uint32_t op); | ||||||
| uint64_t fcvt_d(uint64_t v1, uint32_t op, uint8_t mode); |  | ||||||
| uint64_t fmadd_d(uint64_t v1, uint64_t v2, uint64_t v3, uint32_t op, uint8_t mode); | uint64_t fmadd_d(uint64_t v1, uint64_t v2, uint64_t v3, uint32_t op, uint8_t mode); | ||||||
| uint64_t fsel_d(uint64_t v1, uint64_t v2, uint32_t op); | uint64_t fsel_d(uint64_t v1, uint64_t v2, uint32_t op); | ||||||
| uint64_t fclass_d(uint64_t v1); | uint64_t fclass_d(uint64_t v1); | ||||||
| uint64_t fcvt_32_64(uint32_t v1, uint32_t op, uint8_t mode); | uint64_t frsqrt7_d(uint64_t v); | ||||||
| uint32_t fcvt_64_32(uint64_t v1, uint32_t op, uint8_t mode); | uint64_t frec7_d(uint64_t v, uint8_t mode); | ||||||
| uint32_t unbox_s(uint64_t v); | uint64_t unbox_d(uint8_t FLEN, uint64_t v); | ||||||
|  |  | ||||||
|  | // conversion: float to float | ||||||
|  | uint32_t f16tof32(uint16_t val, uint8_t rm); | ||||||
|  | uint64_t f16tof64(uint16_t val, uint8_t rm); | ||||||
|  | uint16_t f32tof16(uint32_t val, uint8_t rm); | ||||||
|  | uint64_t f32tof64(uint32_t val, uint8_t rm); | ||||||
|  | uint16_t f64tof16(uint64_t val, uint8_t rm); | ||||||
|  | uint32_t f64tof32(uint64_t val, uint8_t rm); | ||||||
|  |  | ||||||
|  | // conversions: float to unsigned | ||||||
|  | uint32_t f16toui32(uint16_t v, uint8_t rm); | ||||||
|  | uint64_t f16toui64(uint16_t v, uint8_t rm); | ||||||
|  | uint32_t f32toui32(uint32_t v, uint8_t rm); | ||||||
|  | uint64_t f32toui64(uint32_t v, uint8_t rm); | ||||||
|  | uint32_t f64toui32(uint64_t v, uint8_t rm); | ||||||
|  | uint64_t f64toui64(uint64_t v, uint8_t rm); | ||||||
|  |  | ||||||
|  | // conversions: float to signed | ||||||
|  | uint32_t f16toi32(uint16_t v, uint8_t rm); | ||||||
|  | uint64_t f16toi64(uint16_t v, uint8_t rm); | ||||||
|  | uint32_t f32toi32(uint32_t v, uint8_t rm); | ||||||
|  | uint64_t f32toi64(uint32_t v, uint8_t rm); | ||||||
|  | uint32_t f64toi32(uint64_t v, uint8_t rm); | ||||||
|  | uint64_t f64toi64(uint64_t v, uint8_t rm); | ||||||
|  |  | ||||||
|  | // conversions: unsigned to float | ||||||
|  | uint16_t ui32tof16(uint32_t v, uint8_t rm); | ||||||
|  | uint16_t ui64tof16(uint64_t v, uint8_t rm); | ||||||
|  | uint32_t ui32tof32(uint32_t v, uint8_t rm); | ||||||
|  | uint32_t ui64tof32(uint64_t v, uint8_t rm); | ||||||
|  | uint64_t ui32tof64(uint32_t v, uint8_t rm); | ||||||
|  | uint64_t ui64tof64(uint64_t v, uint8_t rm); | ||||||
|  |  | ||||||
|  | // conversions: signed to float | ||||||
|  | uint16_t i32tof16(uint32_t v, uint8_t rm); | ||||||
|  | uint16_t i64tof16(uint64_t v, uint8_t rm); | ||||||
|  | uint32_t i32tof32(uint32_t v, uint8_t rm); | ||||||
|  | uint32_t i64tof32(uint64_t v, uint8_t rm); | ||||||
|  | uint64_t i32tof64(uint32_t v, uint8_t rm); | ||||||
|  | uint64_t i64tof64(uint64_t v, uint8_t rm); | ||||||
| } | } | ||||||
| #endif /* RISCV_SRC_VM_FP_FUNCTIONS_H_ */ | #endif /* _VM_FP_FUNCTIONS_H_ */ | ||||||
|   | |||||||
										
											
												File diff suppressed because it is too large
												Load Diff
											
										
									
								
							| @@ -72,32 +72,70 @@ using namespace ::llvm; | |||||||
| void add_fp_functions_2_module(Module* mod, uint32_t flen, uint32_t xlen) { | void add_fp_functions_2_module(Module* mod, uint32_t flen, uint32_t xlen) { | ||||||
|     if(flen) { |     if(flen) { | ||||||
|         FDECL(fget_flags, INT_TYPE(32)); |         FDECL(fget_flags, INT_TYPE(32)); | ||||||
|  |  | ||||||
|  |         FDECL(fadd_h, INT_TYPE(16), INT_TYPE(16), INT_TYPE(16), INT_TYPE(8)); | ||||||
|  |         FDECL(fsub_h, INT_TYPE(16), INT_TYPE(16), INT_TYPE(16), INT_TYPE(8)); | ||||||
|  |         FDECL(fmul_h, INT_TYPE(16), INT_TYPE(16), INT_TYPE(16), INT_TYPE(8)); | ||||||
|  |         FDECL(fdiv_h, INT_TYPE(16), INT_TYPE(16), INT_TYPE(16), INT_TYPE(8)); | ||||||
|  |         FDECL(fsqrt_h, INT_TYPE(16), INT_TYPE(16), INT_TYPE(8)); | ||||||
|  |         FDECL(fcmp_h, INT_TYPE(16), INT_TYPE(16), INT_TYPE(16), INT_TYPE(16)); | ||||||
|  |         FDECL(fmadd_h, INT_TYPE(16), INT_TYPE(16), INT_TYPE(16), INT_TYPE(16), INT_TYPE(16), INT_TYPE(8)); | ||||||
|  |         FDECL(fsel_h, INT_TYPE(16), INT_TYPE(16), INT_TYPE(16), INT_TYPE(16)); | ||||||
|  |         FDECL(fclass_h, INT_TYPE(16), INT_TYPE(16)); | ||||||
|  |         FDECL(unbox_h, INT_TYPE(16), INT_TYPE(32), INT_TYPE(64)); // technically the first arg is only 8 bits | ||||||
|  |  | ||||||
|  |         FDECL(f16toi32, INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)) | ||||||
|  |         FDECL(f16toui32, INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)) | ||||||
|  |         FDECL(i32tof16, INT_TYPE(16), INT_TYPE(32), INT_TYPE(8)) | ||||||
|  |         FDECL(ui32tof16, INT_TYPE(16), INT_TYPE(32), INT_TYPE(8)) | ||||||
|  |         FDECL(f16toi64, INT_TYPE(64), INT_TYPE(32), INT_TYPE(8)) | ||||||
|  |         FDECL(f16toui64, INT_TYPE(64), INT_TYPE(32), INT_TYPE(8)) | ||||||
|  |         FDECL(i64tof16, INT_TYPE(16), INT_TYPE(64), INT_TYPE(8)) | ||||||
|  |         FDECL(ui64tof16, INT_TYPE(16), INT_TYPE(64), INT_TYPE(8)) | ||||||
|  |  | ||||||
|         FDECL(fadd_s, INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); |         FDECL(fadd_s, INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); | ||||||
|         FDECL(fsub_s, INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); |         FDECL(fsub_s, INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); | ||||||
|         FDECL(fmul_s, INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); |         FDECL(fmul_s, INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); | ||||||
|         FDECL(fdiv_s, INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); |         FDECL(fdiv_s, INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); | ||||||
|         FDECL(fsqrt_s, INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); |         FDECL(fsqrt_s, INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); | ||||||
|         FDECL(fcmp_s, INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(32)); |         FDECL(fcmp_s, INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(32)); | ||||||
|         FDECL(fcvt_s, INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); |  | ||||||
|         FDECL(fmadd_s, INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); |         FDECL(fmadd_s, INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); | ||||||
|         FDECL(fsel_s, INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(32)); |         FDECL(fsel_s, INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(32)); | ||||||
|         FDECL(fclass_s, INT_TYPE(32), INT_TYPE(32)); |         FDECL(fclass_s, INT_TYPE(32), INT_TYPE(32)); | ||||||
|         FDECL(fcvt_32_64, INT_TYPE(64), INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); |         FDECL(unbox_s, INT_TYPE(32), INT_TYPE(32), INT_TYPE(64)); // technically the first arg is only 8 bits | ||||||
|         FDECL(fcvt_64_32, INT_TYPE(32), INT_TYPE(64), INT_TYPE(32), INT_TYPE(8)); |  | ||||||
|  |         FDECL(f32toi32, INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); | ||||||
|  |         FDECL(f32toui32, INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); | ||||||
|  |         FDECL(i32tof32, INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); | ||||||
|  |         FDECL(ui32tof32, INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); | ||||||
|  |         FDECL(f32toi64, INT_TYPE(64), INT_TYPE(32), INT_TYPE(8)); | ||||||
|  |         FDECL(f32toui64, INT_TYPE(64), INT_TYPE(32), INT_TYPE(8)); | ||||||
|  |         FDECL(i64tof32, INT_TYPE(32), INT_TYPE(64), INT_TYPE(8)); | ||||||
|  |         FDECL(ui64tof32, INT_TYPE(32), INT_TYPE(64), INT_TYPE(8)); | ||||||
|         if(flen > 32) { |         if(flen > 32) { | ||||||
|             FDECL(fconv_d2f, INT_TYPE(32), INT_TYPE(64), INT_TYPE(8)); |  | ||||||
|             FDECL(fconv_f2d, INT_TYPE(64), INT_TYPE(32), INT_TYPE(8)); |  | ||||||
|             FDECL(fadd_d, INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(8)); |             FDECL(fadd_d, INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(8)); | ||||||
|             FDECL(fsub_d, INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(8)); |             FDECL(fsub_d, INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(8)); | ||||||
|             FDECL(fmul_d, INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(8)); |             FDECL(fmul_d, INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(8)); | ||||||
|             FDECL(fdiv_d, INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(8)); |             FDECL(fdiv_d, INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(8)); | ||||||
|             FDECL(fsqrt_d, INT_TYPE(64), INT_TYPE(64), INT_TYPE(8)); |             FDECL(fsqrt_d, INT_TYPE(64), INT_TYPE(64), INT_TYPE(8)); | ||||||
|             FDECL(fcmp_d, INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(32)); |             FDECL(fcmp_d, INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(32)); | ||||||
|             FDECL(fcvt_d, INT_TYPE(64), INT_TYPE(64), INT_TYPE(32), INT_TYPE(8)); |  | ||||||
|             FDECL(fmadd_d, INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(32), INT_TYPE(8)); |             FDECL(fmadd_d, INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(32), INT_TYPE(8)); | ||||||
|             FDECL(fsel_d, INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(32)); |             FDECL(fsel_d, INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(32)); | ||||||
|             FDECL(fclass_d, INT_TYPE(64), INT_TYPE(64)); |             FDECL(fclass_d, INT_TYPE(64), INT_TYPE(64)); | ||||||
|             FDECL(unbox_s, INT_TYPE(32), INT_TYPE(64)); |  | ||||||
|  |             FDECL(f64tof32, INT_TYPE(32), INT_TYPE(64), INT_TYPE(8)); | ||||||
|  |             FDECL(f32tof64, INT_TYPE(64), INT_TYPE(32), INT_TYPE(8)); | ||||||
|  |             FDECL(f64toi64, INT_TYPE(64), INT_TYPE(64), INT_TYPE(8)); | ||||||
|  |             FDECL(f64toui64, INT_TYPE(64), INT_TYPE(64), INT_TYPE(8)); | ||||||
|  |             FDECL(i64tof64, INT_TYPE(64), INT_TYPE(64), INT_TYPE(8)); | ||||||
|  |             FDECL(ui64tof64, INT_TYPE(64), INT_TYPE(64), INT_TYPE(8)); | ||||||
|  |             FDECL(i32tof64, INT_TYPE(64), INT_TYPE(32), INT_TYPE(8)); | ||||||
|  |             FDECL(ui32tof64, INT_TYPE(64), INT_TYPE(32), INT_TYPE(8)); | ||||||
|  |             FDECL(f64toi32, INT_TYPE(32), INT_TYPE(64), INT_TYPE(8)); | ||||||
|  |             FDECL(f64toui32, INT_TYPE(32), INT_TYPE(64), INT_TYPE(8)); | ||||||
|  |  | ||||||
|  |             FDECL(unbox_d, INT_TYPE(64), INT_TYPE(32), INT_TYPE(64)); // technically the first arg is only 8 bits | ||||||
|         } |         } | ||||||
|     } |     } | ||||||
| } | } | ||||||
|   | |||||||
										
											
												File diff suppressed because it is too large
												Load Diff
											
										
									
								
							
										
											
												File diff suppressed because it is too large
												Load Diff
											
										
									
								
							
							
								
								
									
										101
									
								
								src/vm/vector_functions.cpp
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										101
									
								
								src/vm/vector_functions.cpp
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,101 @@ | |||||||
|  | //////////////////////////////////////////////////////////////////////////////// | ||||||
|  | // Copyright (C) 2025, MINRES Technologies GmbH | ||||||
|  | // All rights reserved. | ||||||
|  | // | ||||||
|  | // Redistribution and use in source and binary forms, with or without | ||||||
|  | // modification, are permitted provided that the following conditions are met: | ||||||
|  | // | ||||||
|  | // 1. Redistributions of source code must retain the above copyright notice, | ||||||
|  | //    this list of conditions and the following disclaimer. | ||||||
|  | // | ||||||
|  | // 2. Redistributions in binary form must reproduce the above copyright notice, | ||||||
|  | //    this list of conditions and the following disclaimer in the documentation | ||||||
|  | //    and/or other materials provided with the distribution. | ||||||
|  | // | ||||||
|  | // 3. Neither the name of the copyright holder nor the names of its contributors | ||||||
|  | //    may be used to endorse or promote products derived from this software | ||||||
|  | //    without specific prior written permission. | ||||||
|  | // | ||||||
|  | // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | ||||||
|  | // AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | ||||||
|  | // IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | ||||||
|  | // ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE | ||||||
|  | // LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR | ||||||
|  | // CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF | ||||||
|  | // SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS | ||||||
|  | // INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN | ||||||
|  | // CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) | ||||||
|  | // ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE | ||||||
|  | // POSSIBILITY OF SUCH DAMAGE. | ||||||
|  | // | ||||||
|  | // Contributors: | ||||||
|  | //       alex@minres.com - initial API and implementation | ||||||
|  | //////////////////////////////////////////////////////////////////////////////// | ||||||
|  |  | ||||||
|  | #include "vector_functions.h" | ||||||
|  | #include "iss/vm_types.h" | ||||||
|  | #include <algorithm> | ||||||
|  | #include <cassert> | ||||||
|  | #include <cstddef> | ||||||
|  | #include <cstdint> | ||||||
|  | #include <functional> | ||||||
|  | #include <limits> | ||||||
|  | #include <math.h> | ||||||
|  | #include <stdexcept> | ||||||
|  | #include <vector> | ||||||
|  |  | ||||||
|  | namespace softvector { | ||||||
|  |  | ||||||
|  | bool softvec_read(void* core, uint64_t addr, uint64_t length, uint8_t* data) { | ||||||
|  |     // Read length bytes from addr into *data | ||||||
|  |     iss::status status = static_cast<iss::arch_if*>(core)->read(iss::address_type::PHYSICAL, iss::access_type::READ, | ||||||
|  |                                                                 0 /*traits<ARCH>::MEM*/, addr, length, data); | ||||||
|  |     return status == iss::Ok; | ||||||
|  | } | ||||||
|  | bool softvec_write(void* core, uint64_t addr, uint64_t length, uint8_t* data) { | ||||||
|  |     // Write length bytes from addr into *data | ||||||
|  |     iss::status status = static_cast<iss::arch_if*>(core)->write(iss::address_type::PHYSICAL, iss::access_type::READ, | ||||||
|  |                                                                  0 /*traits<ARCH>::MEM*/, addr, length, data); | ||||||
|  |     return status == iss::Ok; | ||||||
|  | } | ||||||
|  |  | ||||||
|  | vtype_t::vtype_t(uint32_t vtype_val) { underlying = (vtype_val & 0x8000) << 32 | (vtype_val & ~0x8000); } | ||||||
|  | vtype_t::vtype_t(uint64_t vtype_val) { underlying = vtype_val; } | ||||||
|  | bool vtype_t::vill() { return underlying >> 63; } | ||||||
|  | bool vtype_t::vma() { return (underlying >> 7) & 1; } | ||||||
|  | bool vtype_t::vta() { return (underlying >> 6) & 1; } | ||||||
|  | unsigned vtype_t::sew() { | ||||||
|  |     uint8_t vsew = (underlying >> 3) & 0b111; | ||||||
|  |     // pow(2, 3 + vsew); | ||||||
|  |     return 1 << (3 + vsew); | ||||||
|  | } | ||||||
|  | double vtype_t::lmul() { | ||||||
|  |     uint8_t vlmul = underlying & 0b111; | ||||||
|  |     assert(vlmul != 0b100); // reserved encoding | ||||||
|  |     int8_t signed_vlmul = (vlmul >> 2) ? 0b11111000 | vlmul : vlmul; | ||||||
|  |     return pow(2, signed_vlmul); | ||||||
|  | } | ||||||
|  |  | ||||||
|  | mask_bit_reference& mask_bit_reference::operator=(const bool new_value) { | ||||||
|  |     *start = *start & ~(1U << pos) | static_cast<unsigned>(new_value) << pos; | ||||||
|  |     return *this; | ||||||
|  | } | ||||||
|  |  | ||||||
|  | mask_bit_reference::mask_bit_reference(uint8_t* start, uint8_t pos) | ||||||
|  | : start(start) | ||||||
|  | , pos(pos) { | ||||||
|  |     assert(pos < 8 && "Bit reference can only be initialized for bytes"); | ||||||
|  | }; | ||||||
|  | mask_bit_reference::operator bool() const { return *(start) & (1U << (pos)); } | ||||||
|  |  | ||||||
|  | mask_bit_reference vmask_view::operator[](size_t idx) const { | ||||||
|  |     assert(idx < elem_count); | ||||||
|  |     return {start + idx / 8, static_cast<uint8_t>(idx % 8)}; | ||||||
|  | } | ||||||
|  |  | ||||||
|  | vmask_view read_vmask(uint8_t* V, uint16_t VLEN, uint16_t elem_count, uint8_t reg_idx) { | ||||||
|  |     uint8_t* mask_start = V + VLEN / 8 * reg_idx; | ||||||
|  |     assert(mask_start + elem_count / 8 <= V + VLEN * RFS / 8); | ||||||
|  |     return {mask_start, elem_count}; | ||||||
|  | } | ||||||
|  | } // namespace softvector | ||||||
							
								
								
									
										172
									
								
								src/vm/vector_functions.h
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										172
									
								
								src/vm/vector_functions.h
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,172 @@ | |||||||
|  | //////////////////////////////////////////////////////////////////////////////// | ||||||
|  | // Copyright (C) 2025, MINRES Technologies GmbH | ||||||
|  | // All rights reserved. | ||||||
|  | // | ||||||
|  | // Redistribution and use in source and binary forms, with or without | ||||||
|  | // modification, are permitted provided that the following conditions are met: | ||||||
|  | // | ||||||
|  | // 1. Redistributions of source code must retain the above copyright notice, | ||||||
|  | //    this list of conditions and the following disclaimer. | ||||||
|  | // | ||||||
|  | // 2. Redistributions in binary form must reproduce the above copyright notice, | ||||||
|  | //    this list of conditions and the following disclaimer in the documentation | ||||||
|  | //    and/or other materials provided with the distribution. | ||||||
|  | // | ||||||
|  | // 3. Neither the name of the copyright holder nor the names of its contributors | ||||||
|  | //    may be used to endorse or promote products derived from this software | ||||||
|  | //    without specific prior written permission. | ||||||
|  | // | ||||||
|  | // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | ||||||
|  | // AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | ||||||
|  | // IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | ||||||
|  | // ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE | ||||||
|  | // LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR | ||||||
|  | // CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF | ||||||
|  | // SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS | ||||||
|  | // INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN | ||||||
|  | // CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) | ||||||
|  | // ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE | ||||||
|  | // POSSIBILITY OF SUCH DAMAGE. | ||||||
|  | // | ||||||
|  | // Contributors: | ||||||
|  | //       alex@minres.com - initial API and implementation | ||||||
|  | //////////////////////////////////////////////////////////////////////////////// | ||||||
|  |  | ||||||
|  | #ifndef _VM_VECTOR_FUNCTIONS_H_ | ||||||
|  | #define _VM_VECTOR_FUNCTIONS_H_ | ||||||
|  |  | ||||||
|  | #include "iss/arch_if.h" | ||||||
|  | #include "iss/vm_types.h" | ||||||
|  | #include <cstdint> | ||||||
|  | #include <functional> | ||||||
|  | #include <stdint.h> | ||||||
|  | namespace softvector { | ||||||
|  | const unsigned RFS = 32; | ||||||
|  |  | ||||||
|  | struct vtype_t { | ||||||
|  |     uint64_t underlying; | ||||||
|  |     vtype_t(uint32_t vtype_val); | ||||||
|  |     vtype_t(uint64_t vtype_val); | ||||||
|  |     unsigned sew(); | ||||||
|  |     double lmul(); | ||||||
|  |     bool vill(); | ||||||
|  |     bool vma(); | ||||||
|  |     bool vta(); | ||||||
|  | }; | ||||||
|  | class mask_bit_reference { | ||||||
|  |     uint8_t* start; | ||||||
|  |     uint8_t pos; | ||||||
|  |  | ||||||
|  | public: | ||||||
|  |     mask_bit_reference& operator=(const bool new_value); | ||||||
|  |     mask_bit_reference(uint8_t* start, uint8_t pos); | ||||||
|  |     operator bool() const; | ||||||
|  | }; | ||||||
|  |  | ||||||
|  | struct vmask_view { | ||||||
|  |     uint8_t* start; | ||||||
|  |     size_t elem_count; | ||||||
|  |     mask_bit_reference operator[](size_t) const; | ||||||
|  | }; | ||||||
|  | vmask_view read_vmask(uint8_t* V, uint16_t VLEN, uint16_t elem_count, uint8_t reg_idx = 0); | ||||||
|  | template <unsigned VLEN> vmask_view read_vmask(uint8_t* V, uint16_t elem_count, uint8_t reg_idx = 0); | ||||||
|  |  | ||||||
|  | bool softvec_read(void* core, uint64_t addr, uint64_t length, uint8_t* data); | ||||||
|  | bool softvec_write(void* core, uint64_t addr, uint64_t length, uint8_t* data); | ||||||
|  | template <unsigned VLEN, typename eew_t> | ||||||
|  | uint64_t vector_load_store(void* core, std::function<bool(void*, uint64_t, uint64_t, uint8_t*)> load_store_fn, uint8_t* V, uint64_t vl, | ||||||
|  |                            uint64_t vstart, vtype_t vtype, bool vm, uint8_t vd, uint64_t rs1, uint8_t segment_size, int64_t stride = 0, | ||||||
|  |                            bool use_stride = false); | ||||||
|  | template <unsigned XLEN, unsigned VLEN, typename eew_t, typename sew_t> | ||||||
|  | uint64_t vector_load_store_index(void* core, std::function<bool(void*, uint64_t, uint64_t, uint8_t*)> load_store_fn, uint8_t* V, | ||||||
|  |                                  uint64_t vl, uint64_t vstart, vtype_t vtype, bool vm, uint8_t vd, uint64_t rs1, uint8_t vs2, | ||||||
|  |                                  uint8_t segment_size); | ||||||
|  | template <unsigned VLEN, typename dest_elem_t, typename src2_elem_t = dest_elem_t, typename src1_elem_t = src2_elem_t> | ||||||
|  | void vector_vector_op(uint8_t* V, unsigned funct6, unsigned funct3, uint64_t vl, uint64_t vstart, vtype_t vtype, bool vm, unsigned vd, | ||||||
|  |                       unsigned vs2, unsigned vs1); | ||||||
|  | template <unsigned VLEN, typename dest_elem_t, typename src2_elem_t = dest_elem_t, typename src1_elem_t = src2_elem_t> | ||||||
|  | void vector_imm_op(uint8_t* V, unsigned funct6, unsigned funct3, uint64_t vl, uint64_t vstart, vtype_t vtype, bool vm, unsigned vd, | ||||||
|  |                    unsigned vs2, typename std::make_signed<src1_elem_t>::type imm); | ||||||
|  | template <unsigned VLEN, typename elem_t> | ||||||
|  | void vector_vector_carry(uint8_t* V, unsigned funct6, unsigned funct3, uint64_t vl, uint64_t vstart, vtype_t vtype, unsigned vd, | ||||||
|  |                          unsigned vs2, unsigned vs1, signed carry); | ||||||
|  | template <unsigned VLEN, typename elem_t> | ||||||
|  | void vector_imm_carry(uint8_t* V, unsigned funct6, unsigned funct3, uint64_t vl, uint64_t vstart, vtype_t vtype, unsigned vd, unsigned vs2, | ||||||
|  |                       typename std::make_signed<elem_t>::type imm, signed carry); | ||||||
|  | template <unsigned VLEN, typename scr_elem_t> | ||||||
|  | void vector_vector_merge(uint8_t* V, uint64_t vl, uint64_t vstart, vtype_t vtype, bool vm, unsigned vd, unsigned vs2, unsigned vs1); | ||||||
|  | template <unsigned VLEN, typename scr_elem_t> | ||||||
|  | void vector_imm_merge(uint8_t* V, uint64_t vl, uint64_t vstart, vtype_t vtype, bool vm, unsigned vd, unsigned vs2, uint64_t imm); | ||||||
|  | template <unsigned VLEN, typename dest_elem_t, typename src2_elem_t = dest_elem_t> | ||||||
|  | void vector_unary_op(uint8_t* V, unsigned unary_op, uint64_t vl, uint64_t vstart, vtype_t vtype, bool vm, unsigned vd, unsigned vs2); | ||||||
|  | template <unsigned VLEN, typename elem_t> | ||||||
|  | void mask_vector_vector_op(uint8_t* V, unsigned funct, unsigned funct3, uint64_t vl, uint64_t vstart, vtype_t vtype, bool vm, unsigned vd, | ||||||
|  |                            unsigned vs2, unsigned vs1); | ||||||
|  | template <unsigned VLEN, typename elem_t> | ||||||
|  | void mask_vector_imm_op(uint8_t* V, unsigned funct, unsigned funct3, uint64_t vl, uint64_t vstart, vtype_t vtype, bool vm, unsigned vd, | ||||||
|  |                         unsigned vs2, typename std::make_signed<elem_t>::type imm); | ||||||
|  | void carry_vector_vector_op(uint8_t* V, unsigned funct, uint64_t vl, uint64_t vstart, vtype_t vtype, bool vm, unsigned vd, unsigned vs2, | ||||||
|  |                             unsigned vs1); | ||||||
|  | template <unsigned VLEN, typename elem_t> | ||||||
|  | void carry_vector_imm_op(uint8_t* V, unsigned funct, uint64_t vl, uint64_t vstart, vtype_t vtype, bool vm, unsigned vd, unsigned vs2, | ||||||
|  |                          typename std::make_signed<elem_t>::type imm); | ||||||
|  | template <unsigned VLEN, typename dest_elem_t, typename src2_elem_t = dest_elem_t, typename src1_elem_t = dest_elem_t> | ||||||
|  | bool sat_vector_vector_op(uint8_t* V, unsigned funct6, unsigned funct3, uint64_t vl, uint64_t vstart, vtype_t vtype, int64_t vxrm, bool vm, | ||||||
|  |                           unsigned vd, unsigned vs2, unsigned vs1); | ||||||
|  | template <unsigned VLEN, typename dest_elem_t, typename src2_elem_t = dest_elem_t, typename src1_elem_t = dest_elem_t> | ||||||
|  | bool sat_vector_imm_op(uint8_t* V, unsigned funct6, unsigned funct3, uint64_t vl, uint64_t vstart, vtype_t vtype, int64_t vxrm, bool vm, | ||||||
|  |                        unsigned vd, unsigned vs2, typename std::make_signed<src1_elem_t>::type imm); | ||||||
|  | template <unsigned VLEN, typename dest_elem_t, typename src_elem_t = dest_elem_t> | ||||||
|  | void vector_red_op(uint8_t* V, unsigned funct6, unsigned funct3, uint64_t vl, uint64_t vstart, vtype_t vtype, bool vm, unsigned vd, | ||||||
|  |                    unsigned vs2, unsigned vs1); | ||||||
|  | template <unsigned VLEN> | ||||||
|  | void mask_mask_op(uint8_t* V, unsigned funct6, unsigned funct3, uint64_t vl, uint64_t vstart, unsigned vd, unsigned vs2, unsigned vs1); | ||||||
|  | template <unsigned VLEN> uint64_t vcpop(uint8_t* V, uint64_t vl, uint64_t vstart, bool vm, unsigned vs2); | ||||||
|  | template <unsigned VLEN> uint64_t vfirst(uint8_t* V, uint64_t vl, uint64_t vstart, bool vm, unsigned vs2); | ||||||
|  | template <unsigned VLEN> void mask_set_op(uint8_t* V, unsigned enc, uint64_t vl, uint64_t vstart, bool vm, unsigned vd, unsigned vs2); | ||||||
|  | template <unsigned VLEN, typename src_elem_t> | ||||||
|  | void viota(uint8_t* V, uint64_t vl, uint64_t vstart, vtype_t vtype, bool vm, unsigned vd, unsigned vs2); | ||||||
|  | template <unsigned VLEN, typename src_elem_t> void vid(uint8_t* V, uint64_t vl, uint64_t vstart, vtype_t vtype, bool vm, unsigned vd); | ||||||
|  | template <unsigned VLEN, typename src_elem_t> uint64_t scalar_move(uint8_t* V, vtype_t vtype, unsigned vd, uint64_t val, bool to_vector); | ||||||
|  | template <unsigned VLEN, typename src_elem_t> | ||||||
|  | void vector_slideup(uint8_t* V, uint64_t vl, uint64_t vstart, vtype_t vtype, bool vm, unsigned vd, unsigned vs2, uint64_t imm); | ||||||
|  | template <unsigned VLEN, typename src_elem_t> | ||||||
|  | void vector_slidedown(uint8_t* V, uint64_t vl, uint64_t vstart, vtype_t vtype, bool vm, unsigned vd, unsigned vs2, uint64_t imm); | ||||||
|  | template <unsigned VLEN, typename src_elem_t> | ||||||
|  | void vector_slide1up(uint8_t* V, uint64_t vl, uint64_t vstart, vtype_t vtype, bool vm, unsigned vd, unsigned vs2, uint64_t imm); | ||||||
|  | template <unsigned VLEN, typename src_elem_t> | ||||||
|  | void vector_slide1down(uint8_t* V, uint64_t vl, uint64_t vstart, vtype_t vtype, bool vm, unsigned vd, unsigned vs2, uint64_t imm); | ||||||
|  | template <unsigned VLEN, typename dest_elem_t, typename scr_elem_t = dest_elem_t> | ||||||
|  | void vector_vector_gather(uint8_t* V, uint64_t vl, uint64_t vstart, vtype_t vtype, bool vm, unsigned vd, unsigned vs2, unsigned vs1); | ||||||
|  | template <unsigned VLEN, typename scr_elem_t> | ||||||
|  | void vector_imm_gather(uint8_t* V, uint64_t vl, uint64_t vstart, vtype_t vtype, bool vm, unsigned vd, unsigned vs2, uint64_t imm); | ||||||
|  | template <unsigned VLEN, typename scr_elem_t> | ||||||
|  | void vector_compress(uint8_t* V, uint64_t vl, uint64_t vstart, vtype_t vtype, unsigned vd, unsigned vs2, unsigned vs1); | ||||||
|  | template <unsigned VLEN> void vector_whole_move(uint8_t* V, unsigned vd, unsigned vs2, unsigned count); | ||||||
|  | template <unsigned VLEN, typename dest_elem_t, typename src_elem_t = dest_elem_t> | ||||||
|  | void fp_vector_red_op(uint8_t* V, unsigned funct6, unsigned funct3, uint64_t vl, uint64_t vstart, vtype_t vtype, bool vm, unsigned vd, | ||||||
|  |                       unsigned vs2, unsigned vs1, uint8_t rm); | ||||||
|  | template <unsigned VLEN, typename dest_elem_t, typename src2_elem_t = dest_elem_t, typename src1_elem_t = src2_elem_t> | ||||||
|  | void fp_vector_vector_op(uint8_t* V, unsigned funct6, unsigned funct3, uint64_t vl, uint64_t vstart, vtype_t vtype, bool vm, unsigned vd, | ||||||
|  |                          unsigned vs2, unsigned vs1, uint8_t rm); | ||||||
|  | template <unsigned VLEN, typename dest_elem_t, typename src2_elem_t = dest_elem_t, typename src1_elem_t = src2_elem_t> | ||||||
|  | void fp_vector_imm_op(uint8_t* V, unsigned funct6, unsigned funct3, uint64_t vl, uint64_t vstart, vtype_t vtype, bool vm, unsigned vd, | ||||||
|  |                       unsigned vs2, src1_elem_t imm, uint8_t rm); | ||||||
|  | template <unsigned VLEN, typename elem_t> | ||||||
|  | void fp_vector_unary_op(uint8_t* V, unsigned encoding_space, unsigned unary_op, uint64_t vl, uint64_t vstart, vtype_t vtype, bool vm, | ||||||
|  |                         unsigned vd, unsigned vs2, uint8_t rm); | ||||||
|  | template <unsigned VLEN, typename dest_elem_t, typename src_elem_t> | ||||||
|  | void fp_vector_unary_w(uint8_t* V, unsigned unary_op, uint64_t vl, uint64_t vstart, vtype_t vtype, bool vm, unsigned vd, unsigned vs2, | ||||||
|  |                        uint8_t rm); | ||||||
|  | template <unsigned VLEN, typename dest_elem_t, typename src_elem_t> | ||||||
|  | void fp_vector_unary_n(uint8_t* V, unsigned unary_op, uint64_t vl, uint64_t vstart, vtype_t vtype, bool vm, unsigned vd, unsigned vs2, | ||||||
|  |                        uint8_t rm); | ||||||
|  | template <unsigned VLEN, typename elem_t> | ||||||
|  | void mask_fp_vector_vector_op(uint8_t* V, unsigned funct6, uint64_t vl, uint64_t vstart, vtype_t vtype, bool vm, unsigned vd, unsigned vs2, | ||||||
|  |                               unsigned vs1, uint8_t rm); | ||||||
|  | template <unsigned VLEN, typename elem_t> | ||||||
|  | void mask_fp_vector_imm_op(uint8_t* V, unsigned funct6, uint64_t vl, uint64_t vstart, vtype_t vtype, bool vm, unsigned vd, unsigned vs2, | ||||||
|  |                            elem_t imm, uint8_t rm); | ||||||
|  | } // namespace softvector | ||||||
|  | #include "vm/vector_functions.hpp" | ||||||
|  | #endif /* _VM_VECTOR_FUNCTIONS_H_ */ | ||||||
							
								
								
									
										1942
									
								
								src/vm/vector_functions.hpp
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										1942
									
								
								src/vm/vector_functions.hpp
									
									
									
									
									
										Normal file
									
								
							
										
											
												File diff suppressed because it is too large
												Load Diff
											
										
									
								
							
		Reference in New Issue
	
	Block a user