Compare commits
	
		
			175 Commits
		
	
	
		
			82c26acfc8
			...
			feature/ht
		
	
	| Author | SHA1 | Date | |
|---|---|---|---|
| aaebeaf023 | |||
| f4718c6de3 | |||
| 53de21eef9 | |||
| d443c89c87 | |||
| 9a2df32d57 | |||
| be0f783af8 | |||
| 1089800682 | |||
| a6a6f51f0b | |||
| 21e1f791ad | |||
| be6f5791fa | |||
| d907dc7f54 | |||
| 75e81ce236 | |||
| 82a70efdb8 | |||
| 978c3db06e | |||
| 0e88664ff7 | |||
| ac818f304d | |||
| ad60449073 | |||
| b45b3589fa | |||
| 1fb7e8fcea | |||
| 5f9d0beafb | |||
| 4c0d1c75aa | |||
| 2f3abf2f76 | |||
| 62768bf81e | |||
| f6be8ec006 | |||
| a8f56b6e27 | |||
| 76ea0db25d | |||
| ec1b820c18 | |||
| 64329cf0f6 | |||
| 9de0aed84d | |||
| bb4e2766d1 | |||
| 0996d15bd4 | |||
| 6305efa7c2 | |||
| de79adc50d | |||
| 0473aa5344 | |||
| a45fcd28db | |||
| 0f15032210 | |||
| efc11d87a5 | |||
| 4a19e27926 | |||
| c15cdb0955 | |||
| 6609d12582 | |||
| b5341700aa | |||
| 0b5062d21c | |||
| fbca690b3b | |||
| 235a7e6e24 | |||
| 62d21e1156 | |||
| 9c51d6eade | |||
| 2878dca6b5 | |||
| c28e8fd00c | |||
| b3cc9d2346 | |||
| 933f08494c | |||
| 21f8eab432 | |||
| 6ddb8da07f | |||
| edf456c59f | |||
| 42efced1eb | |||
| c376e34b2b | |||
| f579ec6e48 | |||
| fd20e66f1f | |||
| 5d69b79232 | |||
| 2edd68d1bd | |||
| 7ffa7667b6 | |||
| 93d89e07ca | |||
| 17dcba4b90 | |||
| 39d2518fdd | |||
| a365110054 | |||
| d2efb23ff7 | |||
| 04b7a09b19 | |||
| 72b11beac5 | |||
| e87b7d5fd0 | |||
| 5a2b96ef3e | |||
| c6b99cd155 | |||
| b1306c3a47 | |||
| 0d6bf924ed | |||
| 86de536c8f | |||
| 051dd5e2d3 | |||
| e3942be776 | |||
| 6ee484a771 | |||
| 60808c8649 | |||
| 0432803d82 | |||
| 4f5d9214ed | |||
| d42d2ce533 | |||
| 236d12d7f5 | |||
| e1b6cab890 | |||
| 8361f88718 | |||
| 2ec7ea4b41 | |||
| b24965d321 | |||
| 244bf6d2f2 | |||
| 1a4465a371 | |||
| fa82a50824 | |||
| 6dc17857da | |||
| 11a30caae8 | |||
| ac1a26a10c | |||
| 7a199e122d | |||
| d8c3d2e19c | |||
| 375755999a | |||
| 9996fd4833 | |||
| 149b3136d2 | |||
| ac8f8b0539 | |||
| b2cbf90d0b | |||
| 373145478e | |||
| 55b0cea94f | |||
| 5b17599aa2 | |||
| 4cfb15c7cd | |||
| 63da7f8d57 | |||
| fb4012fbd1 | |||
| 24449f1c0f | |||
| fd303c8343 | |||
| 346b177a87 | |||
| d4ec131fa7 | |||
| 48370a4555 | |||
| 36b076774e | |||
| 482a4ec253 | |||
| 2fb28364c5 | |||
| 8460f4ab7f | |||
| 3fd51cc68c | |||
| 551822916c | |||
| 37db31fb4b | |||
| e2da306eee | |||
| 41051f8f34 | |||
| 2a7449fa1e | |||
|   | a6c48ceaac | ||
| 1e30b68507 | |||
|   | ed793471bb | ||
| 58fb815f32 | |||
| 3cc8bd0854 | |||
| a27850f841 | |||
| fb330cddea | |||
| b76c5bf0d6 | |||
| 001c6349f7 | |||
| ee6a11dae6 | |||
| 2e27b025cc | |||
| f0a004be9d | |||
| 3422c7cd5c | |||
| ad79a28705 | |||
| 9fdbc3ff38 | |||
| 602bc6e06a | |||
| 6cb76fc256 | |||
| fbcd389580 | |||
| b25b7848c6 | |||
| 6c986d38d8 | |||
| a1ebd83d2a | |||
| 8aed551813 | |||
| 1e6a0086e9 | |||
| 119d4a8b43 | |||
| 9841b16122 | |||
| fbda1424f3 | |||
| fe2d5cb2f9 | |||
| 3ff59ba45d | |||
| db5765b342 | |||
| 075e04249a | |||
| 207f778ee6 | |||
| f4f90c5e65 | |||
| bc4ea30815 | |||
| e921201f7b | |||
| e6aa6e5842 | |||
| 4418fa7e4f | |||
| adaa7e1c04 | |||
| 0eb1db0e7e | |||
| e48597b2b7 | |||
| 458c773e19 | |||
| b3f40f9b15 | |||
| 6419ad471e | |||
| 759061b569 | |||
| 2115e9ceae | |||
| 2bea95c1a7 | |||
| 7001b693ae | |||
| e6f11081eb | |||
| 09db0cd35d | |||
| 980c8031c3 | |||
| b86d7a517d | |||
| b7478965ab | |||
| bf4a6deb86 | |||
| ffe730219d | |||
| 60c926c921 | |||
| 9371a09b71 | |||
| 4c3a7386b0 | 
| @@ -1,4 +1,3 @@ | ||||
| --- | ||||
| Language:        Cpp | ||||
| # BasedOnStyle:  LLVM | ||||
| # should be in line with IndentWidth | ||||
| @@ -13,8 +12,8 @@ AllowAllParametersOfDeclarationOnNextLine: true | ||||
| AllowShortBlocksOnASingleLine: false | ||||
| AllowShortCaseLabelsOnASingleLine: false | ||||
| AllowShortFunctionsOnASingleLine: All | ||||
| AllowShortIfStatementsOnASingleLine: true | ||||
| AllowShortLoopsOnASingleLine: true | ||||
| AllowShortIfStatementsOnASingleLine: false | ||||
| AllowShortLoopsOnASingleLine: false | ||||
| AlwaysBreakAfterDefinitionReturnType: None | ||||
| AlwaysBreakAfterReturnType: None | ||||
| AlwaysBreakBeforeMultilineStrings: false | ||||
| @@ -39,8 +38,8 @@ BreakBeforeTernaryOperators: true | ||||
| BreakConstructorInitializersBeforeComma: true | ||||
| BreakAfterJavaFieldAnnotations: false | ||||
| BreakStringLiterals: true | ||||
| ColumnLimit:     120 | ||||
| CommentPragmas:  '^ IWYU pragma:' | ||||
| ColumnLimit:     140 | ||||
| CommentPragmas:  '^( IWYU pragma:| @suppress)' | ||||
| ConstructorInitializerAllOnOneLineOrOnePerLine: false | ||||
| ConstructorInitializerIndentWidth: 0 | ||||
| ContinuationIndentWidth: 4 | ||||
| @@ -76,13 +75,13 @@ PenaltyBreakFirstLessLess: 120 | ||||
| PenaltyBreakString: 1000 | ||||
| PenaltyExcessCharacter: 1000000 | ||||
| PenaltyReturnTypeOnItsOwnLine: 60 | ||||
| PointerAlignment: Right | ||||
| PointerAlignment: Left | ||||
| ReflowComments:  true | ||||
| SortIncludes:    true | ||||
| SpaceAfterCStyleCast: false | ||||
| SpaceAfterTemplateKeyword: true | ||||
| SpaceBeforeAssignmentOperators: true | ||||
| SpaceBeforeParens: ControlStatements | ||||
| SpaceBeforeParens: Never | ||||
| SpaceInEmptyParentheses: false | ||||
| SpacesBeforeTrailingComments: 1 | ||||
| SpacesInAngles:  false | ||||
|   | ||||
							
								
								
									
										2
									
								
								.gitignore
									
									
									
									
										vendored
									
									
								
							
							
						
						
									
										2
									
								
								.gitignore
									
									
									
									
										vendored
									
									
								
							| @@ -1,5 +1,6 @@ | ||||
| .DS_Store | ||||
| /*.il | ||||
| /.settings | ||||
| /avr-instr.html | ||||
| /blink.S | ||||
| /flash.* | ||||
| @@ -14,7 +15,6 @@ | ||||
| /*.ods | ||||
| /build*/ | ||||
| /*.logs | ||||
| language.settings.xml | ||||
| /*.gtkw | ||||
| /Debug wo LLVM/ | ||||
| /*.txdb | ||||
|   | ||||
							
								
								
									
										236
									
								
								CMakeLists.txt
									
									
									
									
									
								
							
							
						
						
									
										236
									
								
								CMakeLists.txt
									
									
									
									
									
								
							| @@ -1,8 +1,9 @@ | ||||
| cmake_minimum_required(VERSION 3.12) | ||||
| cmake_minimum_required(VERSION 3.18) | ||||
| list(APPEND CMAKE_MODULE_PATH ${CMAKE_CURRENT_SOURCE_DIR}/cmake) | ||||
| ############################################################################### | ||||
|  | ||||
| # ############################################################################## | ||||
| # | ||||
| ############################################################################### | ||||
| # ############################################################################## | ||||
| project(dbt-rise-tgc VERSION 1.0.0) | ||||
|  | ||||
| include(GNUInstallDirs) | ||||
| @@ -16,20 +17,30 @@ add_subdirectory(softfloat) | ||||
|  | ||||
| set(LIB_SOURCES | ||||
|     src/iss/plugin/instruction_count.cpp | ||||
| 	src/iss/arch/tgc5c.cpp | ||||
| 	src/vm/interp/vm_tgc5c.cpp | ||||
| 	src/vm/fp_functions.cpp | ||||
|     src/iss/arch/tgc5c.cpp | ||||
|     src/vm/interp/vm_tgc5c.cpp | ||||
|     src/vm/fp_functions.cpp | ||||
|     src/iss/debugger/csr_names.cpp | ||||
|     src/iss/semihosting/semihosting.cpp | ||||
| ) | ||||
|  | ||||
| if(WITH_TCC) | ||||
| 	list(APPEND LIB_SOURCES | ||||
| 	   src/vm/tcc/vm_tgc5c.cpp | ||||
|     list(APPEND LIB_SOURCES | ||||
|         src/vm/tcc/vm_tgc5c.cpp | ||||
|     ) | ||||
| endif() | ||||
|  | ||||
| if(WITH_LLVM) | ||||
| 	list(APPEND LIB_SOURCES | ||||
| 		src/vm/llvm/vm_tgc5c.cpp | ||||
| 		src/vm/llvm/fp_impl.cpp | ||||
| 	) | ||||
|     list(APPEND LIB_SOURCES | ||||
|         src/vm/llvm/vm_tgc5c.cpp | ||||
|         src/vm/llvm/fp_impl.cpp | ||||
|     ) | ||||
| endif() | ||||
|  | ||||
| if(WITH_ASMJIT) | ||||
|     list(APPEND LIB_SOURCES | ||||
|         src/vm/asmjit/vm_tgc5c.cpp | ||||
|     ) | ||||
| endif() | ||||
|  | ||||
| # library files | ||||
| @@ -37,29 +48,37 @@ FILE(GLOB GEN_ISS_SOURCES ${CMAKE_CURRENT_SOURCE_DIR}/src-gen/iss/arch/*.cpp) | ||||
| FILE(GLOB GEN_VM_SOURCES ${CMAKE_CURRENT_SOURCE_DIR}/src-gen/vm/interp/vm_*.cpp) | ||||
| FILE(GLOB GEN_YAML_SOURCES ${CMAKE_CURRENT_SOURCE_DIR}/contrib/instr/*.yaml) | ||||
| list(APPEND LIB_SOURCES ${GEN_ISS_SOURCES} ${GEN_VM_SOURCES}) | ||||
|  | ||||
| foreach(FILEPATH ${GEN_ISS_SOURCES}) | ||||
|     get_filename_component(CORE ${FILEPATH} NAME_WE) | ||||
|     string(TOUPPER ${CORE} CORE) | ||||
|     list(APPEND LIB_DEFINES CORE_${CORE}) | ||||
| endforeach() | ||||
|  | ||||
| message(STATUS "Core defines are ${LIB_DEFINES}") | ||||
|  | ||||
| if(WITH_LLVM) | ||||
| 	FILE(GLOB LLVM_GEN_SOURCES ${CMAKE_CURRENT_SOURCE_DIR}/src-gen/vm/llvm/vm_*.cpp) | ||||
| 	list(APPEND LIB_SOURCES ${LLVM_GEN_SOURCES}) | ||||
|     FILE(GLOB LLVM_GEN_SOURCES ${CMAKE_CURRENT_SOURCE_DIR}/src-gen/vm/llvm/vm_*.cpp) | ||||
|     list(APPEND LIB_SOURCES ${LLVM_GEN_SOURCES}) | ||||
| endif() | ||||
|  | ||||
| if(WITH_TCC) | ||||
| 	FILE(GLOB TCC_GEN_SOURCES ${CMAKE_CURRENT_SOURCE_DIR}/src-gen/vm/tcc/vm_*.cpp) | ||||
| 	list(APPEND LIB_SOURCES ${TCC_GEN_SOURCES}) | ||||
|     FILE(GLOB TCC_GEN_SOURCES ${CMAKE_CURRENT_SOURCE_DIR}/src-gen/vm/tcc/vm_*.cpp) | ||||
|     list(APPEND LIB_SOURCES ${TCC_GEN_SOURCES}) | ||||
| endif() | ||||
|  | ||||
| if(WITH_ASMJIT) | ||||
|     FILE(GLOB TCC_GEN_SOURCES ${CMAKE_CURRENT_SOURCE_DIR}/src-gen/vm/asmjit/vm_*.cpp) | ||||
|     list(APPEND LIB_SOURCES ${TCC_GEN_SOURCES}) | ||||
| endif() | ||||
|  | ||||
| if(TARGET yaml-cpp::yaml-cpp) | ||||
|     list(APPEND LIB_SOURCES | ||||
|     	src/iss/plugin/cycle_estimate.cpp | ||||
| 	    src/iss/plugin/instruction_count.cpp | ||||
|         src/iss/plugin/cycle_estimate.cpp | ||||
|         src/iss/plugin/instruction_count.cpp | ||||
|     ) | ||||
| endif() | ||||
|  | ||||
| # Define the library | ||||
| add_library(${PROJECT_NAME} SHARED ${LIB_SOURCES}) | ||||
|  | ||||
| @@ -68,60 +87,57 @@ if("${CMAKE_CXX_COMPILER_ID}" STREQUAL "GNU") | ||||
| elseif("${CMAKE_CXX_COMPILER_ID}" STREQUAL "MSVC") | ||||
|     target_compile_options(${PROJECT_NAME} PRIVATE /wd4293) | ||||
| endif() | ||||
|  | ||||
| target_include_directories(${PROJECT_NAME} PUBLIC src) | ||||
| target_include_directories(${PROJECT_NAME} PUBLIC src-gen) | ||||
|  | ||||
| target_force_link_libraries(${PROJECT_NAME} PRIVATE dbt-rise-core) | ||||
|  | ||||
| # only re-export the include paths | ||||
| get_target_property(DBT_CORE_INCL dbt-rise-core INTERFACE_INCLUDE_DIRECTORIES) | ||||
| target_include_directories(${PROJECT_NAME} INTERFACE ${DBT_CORE_INCL}) | ||||
| get_target_property(DBT_CORE_DEFS dbt-rise-core INTERFACE_COMPILE_DEFINITIONS) | ||||
| if(NOT (DBT_CORE_DEFS STREQUAL DBT_CORE_DEFS-NOTFOUND)) | ||||
| 	target_compile_definitions(${PROJECT_NAME} INTERFACE ${DBT_CORE_DEFS}) | ||||
|  | ||||
| if(NOT(DBT_CORE_DEFS STREQUAL DBT_CORE_DEFS-NOTFOUND)) | ||||
|     target_compile_definitions(${PROJECT_NAME} INTERFACE ${DBT_CORE_DEFS}) | ||||
| endif() | ||||
|  | ||||
| target_link_libraries(${PROJECT_NAME} PUBLIC elfio::elfio softfloat scc-util Boost::coroutine) | ||||
| if(TARGET yaml-cpp::yaml-cpp) | ||||
| 	target_compile_definitions(${PROJECT_NAME} PUBLIC WITH_PLUGINS) | ||||
| 	target_link_libraries(${PROJECT_NAME} PUBLIC yaml-cpp::yaml-cpp) | ||||
| endif() | ||||
|  | ||||
| if(WITH_LLVM) | ||||
|     find_package(LLVM) | ||||
| 	target_compile_definitions(${PROJECT_NAME} PUBLIC ${LLVM_DEFINITIONS}) | ||||
| 	target_include_directories(${PROJECT_NAME} PUBLIC ${LLVM_INCLUDE_DIRS}) | ||||
| 	if(BUILD_SHARED_LIBS) | ||||
| 		target_link_libraries( ${PROJECT_NAME} PUBLIC ${LLVM_LIBRARIES}) | ||||
| 	endif() | ||||
| if(TARGET yaml-cpp::yaml-cpp) | ||||
|     target_compile_definitions(${PROJECT_NAME} PUBLIC WITH_PLUGINS) | ||||
|     target_link_libraries(${PROJECT_NAME} PUBLIC yaml-cpp::yaml-cpp) | ||||
| endif() | ||||
|  | ||||
| set_target_properties(${PROJECT_NAME} PROPERTIES | ||||
|   VERSION ${PROJECT_VERSION} | ||||
|   FRAMEWORK FALSE | ||||
|     VERSION ${PROJECT_VERSION} | ||||
|     FRAMEWORK FALSE | ||||
| ) | ||||
| install(TARGETS ${PROJECT_NAME} COMPONENT ${PROJECT_NAME} | ||||
|   EXPORT ${PROJECT_NAME}Targets            # for downstream dependencies | ||||
|   ARCHIVE DESTINATION ${CMAKE_INSTALL_LIBDIR}  # static lib | ||||
|   RUNTIME DESTINATION ${CMAKE_INSTALL_BINDIR}  # binaries | ||||
|   LIBRARY DESTINATION ${CMAKE_INSTALL_LIBDIR}  # shared lib | ||||
|   FRAMEWORK DESTINATION ${CMAKE_INSTALL_LIBDIR} # for mac | ||||
|   PUBLIC_HEADER DESTINATION ${CMAKE_INSTALL_INCLUDEDIR}/${PROJECT_NAME} # headers for mac (note the different component -> different package) | ||||
|   INCLUDES DESTINATION ${CMAKE_INSTALL_INCLUDEDIR}             # headers | ||||
|     EXPORT ${PROJECT_NAME}Targets # for downstream dependencies | ||||
|     ARCHIVE DESTINATION ${CMAKE_INSTALL_LIBDIR} # static lib | ||||
|     RUNTIME DESTINATION ${CMAKE_INSTALL_BINDIR} # binaries | ||||
|     LIBRARY DESTINATION ${CMAKE_INSTALL_LIBDIR} # shared lib | ||||
|     FRAMEWORK DESTINATION ${CMAKE_INSTALL_LIBDIR} # for mac | ||||
|     PUBLIC_HEADER DESTINATION ${CMAKE_INSTALL_INCLUDEDIR}/${PROJECT_NAME} # headers for mac (note the different component -> different package) | ||||
|     INCLUDES DESTINATION ${CMAKE_INSTALL_INCLUDEDIR} # headers | ||||
| ) | ||||
| install(DIRECTORY ${CMAKE_CURRENT_SOURCE_DIR}/incl/iss COMPONENT ${PROJECT_NAME} | ||||
|         DESTINATION ${CMAKE_INSTALL_INCLUDEDIR} # target directory | ||||
|         FILES_MATCHING # install only matched files | ||||
|         PATTERN "*.h" # select header files | ||||
|         ) | ||||
|     DESTINATION ${CMAKE_INSTALL_INCLUDEDIR} # target directory | ||||
|     FILES_MATCHING # install only matched files | ||||
|     PATTERN "*.h" # select header files | ||||
| ) | ||||
| install(FILES ${GEN_YAML_SOURCES} DESTINATION share/tgc-vp) | ||||
| ############################################################################### | ||||
|  | ||||
| # ############################################################################## | ||||
| # | ||||
| ############################################################################### | ||||
| # ############################################################################## | ||||
| set(CMAKE_INSTALL_RPATH $ORIGIN/../${CMAKE_INSTALL_LIBDIR}) | ||||
| project(tgc-sim) | ||||
| find_package(Boost COMPONENTS program_options thread REQUIRED) | ||||
|  | ||||
| add_executable(${PROJECT_NAME} src/main.cpp) | ||||
|  | ||||
| if(TARGET ${CORE_NAME}_cpp) | ||||
|     list(APPEND TGC_SOURCES ${${CORE_NAME}_OUTPUT_FILES}) | ||||
| else() | ||||
| @@ -133,21 +149,20 @@ else() | ||||
| endif() | ||||
|  | ||||
| foreach(F IN LISTS TGC_SOURCES) | ||||
|     if (${F} MATCHES ".*/arch/([^/]*)\.cpp") | ||||
|         string(REGEX REPLACE  ".*/([^/]*)\.cpp"  "\\1" CORE_NAME_LC ${F}) | ||||
|     if(${F} MATCHES ".*/arch/([^/]*)\.cpp") | ||||
|         string(REGEX REPLACE ".*/([^/]*)\.cpp" "\\1" CORE_NAME_LC ${F}) | ||||
|         string(TOUPPER ${CORE_NAME_LC} CORE_NAME) | ||||
|         target_compile_definitions(${PROJECT_NAME} PRIVATE CORE_${CORE_NAME}) | ||||
|     endif() | ||||
| endforeach() | ||||
|  | ||||
| #if(WITH_LLVM) | ||||
| #    target_compile_definitions(${PROJECT_NAME} PRIVATE WITH_LLVM) | ||||
| #    #target_link_libraries(${PROJECT_NAME} PUBLIC ${llvm_libs}) | ||||
| #endif() | ||||
| #if(WITH_TCC) | ||||
| #    target_compile_definitions(${PROJECT_NAME} PRIVATE WITH_TCC) | ||||
| #endif() | ||||
|  | ||||
| # if(WITH_LLVM) | ||||
| # target_compile_definitions(${PROJECT_NAME} PRIVATE WITH_LLVM) | ||||
| # #target_link_libraries(${PROJECT_NAME} PUBLIC ${llvm_libs}) | ||||
| # endif() | ||||
| # if(WITH_TCC) | ||||
| # target_compile_definitions(${PROJECT_NAME} PRIVATE WITH_TCC) | ||||
| # endif() | ||||
| target_link_libraries(${PROJECT_NAME} PUBLIC dbt-rise-tgc fmt::fmt) | ||||
|  | ||||
| if(TARGET Boost::program_options) | ||||
| @@ -155,74 +170,91 @@ if(TARGET Boost::program_options) | ||||
| else() | ||||
|     target_link_libraries(${PROJECT_NAME} PUBLIC ${BOOST_program_options_LIBRARY}) | ||||
| endif() | ||||
|  | ||||
| target_link_libraries(${PROJECT_NAME} PUBLIC ${CMAKE_DL_LIBS}) | ||||
| if (Tcmalloc_FOUND) | ||||
|  | ||||
| if(Tcmalloc_FOUND) | ||||
|     target_link_libraries(${PROJECT_NAME} PUBLIC ${Tcmalloc_LIBRARIES}) | ||||
| endif(Tcmalloc_FOUND) | ||||
|  | ||||
| install(TARGETS tgc-sim | ||||
|   EXPORT ${PROJECT_NAME}Targets            # for downstream dependencies | ||||
|   ARCHIVE DESTINATION ${CMAKE_INSTALL_LIBDIR}  # static lib | ||||
|   RUNTIME DESTINATION ${CMAKE_INSTALL_BINDIR}  # binaries | ||||
|   LIBRARY DESTINATION ${CMAKE_INSTALL_LIBDIR}  # shared lib | ||||
|   FRAMEWORK DESTINATION ${CMAKE_INSTALL_LIBDIR} # for mac | ||||
|   PUBLIC_HEADER DESTINATION ${CMAKE_INSTALL_INCLUDEDIR}/${PROJECT_NAME}  # headers for mac (note the different component -> different package) | ||||
|   INCLUDES DESTINATION ${CMAKE_INSTALL_INCLUDEDIR}             # headers | ||||
|     EXPORT ${PROJECT_NAME}Targets # for downstream dependencies | ||||
|     ARCHIVE DESTINATION ${CMAKE_INSTALL_LIBDIR} # static lib | ||||
|     RUNTIME DESTINATION ${CMAKE_INSTALL_BINDIR} # binaries | ||||
|     LIBRARY DESTINATION ${CMAKE_INSTALL_LIBDIR} # shared lib | ||||
|     FRAMEWORK DESTINATION ${CMAKE_INSTALL_LIBDIR} # for mac | ||||
|     PUBLIC_HEADER DESTINATION ${CMAKE_INSTALL_INCLUDEDIR}/${PROJECT_NAME} # headers for mac (note the different component -> different package) | ||||
|     INCLUDES DESTINATION ${CMAKE_INSTALL_INCLUDEDIR} # headers | ||||
| ) | ||||
|  | ||||
| if(BUILD_TESTING) | ||||
|   	# ... CMake code to create tests ... | ||||
| 	add_test(NAME tgc-sim-interp | ||||
| 	         COMMAND tgc-sim -f ${CMAKE_BINARY_DIR}/../../Firmwares/hello-world/hello --backend interp) | ||||
| 	if(WITH_TCC) | ||||
| 	add_test(NAME tgc-sim-tcc | ||||
| 	         COMMAND tgc-sim -f ${CMAKE_BINARY_DIR}/../../Firmwares/hello-world/hello --backend tcc) | ||||
| 	endif() | ||||
| 	if(WITH_LLVM) | ||||
| 	add_test(NAME tgc-sim-llvm | ||||
| 	         COMMAND tgc-sim -f ${CMAKE_BINARY_DIR}/../../Firmwares/hello-world/hello --backend llvm) | ||||
| 	endif() | ||||
|     # ... CMake code to create tests ... | ||||
|     add_test(NAME tgc-sim-interp | ||||
|         COMMAND tgc-sim -f ${CMAKE_BINARY_DIR}/../../Firmwares/hello-world/hello --backend interp) | ||||
|  | ||||
|     if(WITH_TCC) | ||||
|         add_test(NAME tgc-sim-tcc | ||||
|             COMMAND tgc-sim -f ${CMAKE_BINARY_DIR}/../../Firmwares/hello-world/hello --backend tcc) | ||||
|     endif() | ||||
|  | ||||
|     if(WITH_LLVM) | ||||
|         add_test(NAME tgc-sim-llvm | ||||
|             COMMAND tgc-sim -f ${CMAKE_BINARY_DIR}/../../Firmwares/hello-world/hello --backend llvm) | ||||
|     endif() | ||||
|  | ||||
|     if(WITH_ASMJIT) | ||||
|         add_test(NAME tgc-sim-asmjit | ||||
|             COMMAND tgc-sim -f ${CMAKE_BINARY_DIR}/../../Firmwares/hello-world/hello --backend asmjit) | ||||
|     endif() | ||||
| endif() | ||||
| ############################################################################### | ||||
|  | ||||
| # ############################################################################## | ||||
| # | ||||
| ############################################################################### | ||||
| # ############################################################################## | ||||
| if(TARGET scc-sysc) | ||||
| 	project(dbt-rise-tgc_sc VERSION 1.0.0) | ||||
| 	set(LIB_SOURCES  | ||||
|     	src/sysc/core_complex.cpp | ||||
|     	src/sysc/register_tgc_c.cpp | ||||
| 	) | ||||
| 	FILE(GLOB GEN_SC_SOURCES ${CMAKE_CURRENT_SOURCE_DIR}/src-gen/sysc/register_*.cpp) | ||||
| 	list(APPEND LIB_SOURCES ${GEN_SC_SOURCES}) | ||||
|     project(dbt-rise-tgc_sc VERSION 1.0.0) | ||||
|     set(LIB_SOURCES | ||||
|         src/sysc/core_complex.cpp | ||||
|         src/sysc/register_tgc_c.cpp | ||||
|     ) | ||||
|     FILE(GLOB GEN_SC_SOURCES ${CMAKE_CURRENT_SOURCE_DIR}/src-gen/sysc/register_*.cpp) | ||||
|     list(APPEND LIB_SOURCES ${GEN_SC_SOURCES}) | ||||
|     add_library(${PROJECT_NAME} ${LIB_SOURCES}) | ||||
|     target_compile_definitions(${PROJECT_NAME} PUBLIC WITH_SYSTEMC) | ||||
|     target_compile_definitions(${PROJECT_NAME} PRIVATE CORE_${CORE_NAME}) | ||||
|  | ||||
|     foreach(F IN LISTS TGC_SOURCES) | ||||
|         if (${F} MATCHES ".*/arch/([^/]*)\.cpp") | ||||
|             string(REGEX REPLACE  ".*/([^/]*)\.cpp"  "\\1" CORE_NAME_LC ${F}) | ||||
|         if(${F} MATCHES ".*/arch/([^/]*)\.cpp") | ||||
|             string(REGEX REPLACE ".*/([^/]*)\.cpp" "\\1" CORE_NAME_LC ${F}) | ||||
|             string(TOUPPER ${CORE_NAME_LC} CORE_NAME) | ||||
|             target_compile_definitions(${PROJECT_NAME} PRIVATE CORE_${CORE_NAME}) | ||||
|         endif() | ||||
|     endforeach() | ||||
|     target_link_libraries(${PROJECT_NAME} PUBLIC dbt-rise-tgc scc-sysc) | ||||
| #    if(WITH_LLVM) | ||||
| #        target_link_libraries(${PROJECT_NAME} PUBLIC ${llvm_libs}) | ||||
| #    endif() | ||||
|  | ||||
| 	set(LIB_HEADERS ${CMAKE_CURRENT_SOURCE_DIR}/src/sysc/core_complex.h) | ||||
|     target_link_libraries(${PROJECT_NAME} PUBLIC dbt-rise-tgc scc-sysc) | ||||
|  | ||||
|     # if(WITH_LLVM) | ||||
|     # target_link_libraries(${PROJECT_NAME} PUBLIC ${llvm_libs}) | ||||
|     # endif() | ||||
|     set(LIB_HEADERS ${CMAKE_CURRENT_SOURCE_DIR}/src/sysc/core_complex.h) | ||||
|     set_target_properties(${PROJECT_NAME} PROPERTIES | ||||
|       VERSION ${PROJECT_VERSION} | ||||
|       FRAMEWORK FALSE | ||||
|       PUBLIC_HEADER "${LIB_HEADERS}" # specify the public headers | ||||
|         VERSION ${PROJECT_VERSION} | ||||
|         FRAMEWORK FALSE | ||||
|         PUBLIC_HEADER "${LIB_HEADERS}" # specify the public headers | ||||
|     ) | ||||
|     install(TARGETS ${PROJECT_NAME} COMPONENT ${PROJECT_NAME} | ||||
| 	  EXPORT ${PROJECT_NAME}Targets            # for downstream dependencies | ||||
| 	  ARCHIVE DESTINATION ${CMAKE_INSTALL_LIBDIR}  # static lib | ||||
| 	  RUNTIME DESTINATION ${CMAKE_INSTALL_BINDIR}  # binaries | ||||
| 	  LIBRARY DESTINATION ${CMAKE_INSTALL_LIBDIR}  # shared lib | ||||
| 	  FRAMEWORK DESTINATION ${CMAKE_INSTALL_LIBDIR} # for mac | ||||
| 	  PUBLIC_HEADER DESTINATION ${CMAKE_INSTALL_INCLUDEDIR}/sysc   # headers for mac (note the different component -> different package) | ||||
| 	  INCLUDES DESTINATION ${CMAKE_INSTALL_INCLUDEDIR}             # headers | ||||
| 	)     | ||||
|         EXPORT ${PROJECT_NAME}Targets # for downstream dependencies | ||||
|         ARCHIVE DESTINATION ${CMAKE_INSTALL_LIBDIR} # static lib | ||||
|         RUNTIME DESTINATION ${CMAKE_INSTALL_BINDIR} # binaries | ||||
|         LIBRARY DESTINATION ${CMAKE_INSTALL_LIBDIR} # shared lib | ||||
|         FRAMEWORK DESTINATION ${CMAKE_INSTALL_LIBDIR} # for mac | ||||
|         PUBLIC_HEADER DESTINATION ${CMAKE_INSTALL_INCLUDEDIR}/sysc # headers for mac (note the different component -> different package) | ||||
|         INCLUDES DESTINATION ${CMAKE_INSTALL_INCLUDEDIR} # headers | ||||
|     ) | ||||
| endif() | ||||
|  | ||||
| project(elfio-test) | ||||
| find_package(Boost COMPONENTS program_options thread REQUIRED) | ||||
|  | ||||
| add_executable(${PROJECT_NAME} src/elfio.cpp) | ||||
| target_link_libraries(${PROJECT_NAME} PUBLIC elfio::elfio) | ||||
|   | ||||
							
								
								
									
										1
									
								
								contrib/instr/.gitignore
									
									
									
									
										vendored
									
									
										Normal file
									
								
							
							
						
						
									
										1
									
								
								contrib/instr/.gitignore
									
									
									
									
										vendored
									
									
										Normal file
									
								
							| @@ -0,0 +1 @@ | ||||
| /*.yaml | ||||
| @@ -1,5 +1,5 @@ | ||||
|  | ||||
| RV32I:  | ||||
| RVI:  | ||||
|   LUI: | ||||
|     index: 0 | ||||
|     encoding: 0b00000000000000000000000000110111 | ||||
| @@ -349,7 +349,7 @@ Zifencei: | ||||
|     size:   32 | ||||
|     branch:   false | ||||
|     delay:   1 | ||||
| RV32M:  | ||||
| RVM:  | ||||
|   MUL: | ||||
|     index: 49 | ||||
|     encoding: 0b00000010000000000000000000110011 | ||||
|   | ||||
							
								
								
									
										650
									
								
								contrib/instr/TGC5C_slow.yaml
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										650
									
								
								contrib/instr/TGC5C_slow.yaml
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,650 @@ | ||||
| RV32I: | ||||
|   ADD: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 51 | ||||
|     index: 27 | ||||
|     mask: 4261441663 | ||||
|     size: 32 | ||||
|   ADDI: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 19 | ||||
|     index: 18 | ||||
|     mask: 28799 | ||||
|     size: 32 | ||||
|   AND: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 28723 | ||||
|     index: 36 | ||||
|     mask: 4261441663 | ||||
|     size: 32 | ||||
|   ANDI: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 28691 | ||||
|     index: 23 | ||||
|     mask: 28799 | ||||
|     size: 32 | ||||
|   AUIPC: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 23 | ||||
|     index: 1 | ||||
|     mask: 127 | ||||
|     size: 32 | ||||
|   BEQ: | ||||
|     branch: true | ||||
|     delay: | ||||
|     - 1 | ||||
|     - 2 | ||||
|     encoding: 99 | ||||
|     index: 4 | ||||
|     mask: 28799 | ||||
|     size: 32 | ||||
|   BGE: | ||||
|     branch: true | ||||
|     delay: | ||||
|     - 1 | ||||
|     - 2 | ||||
|     encoding: 20579 | ||||
|     index: 7 | ||||
|     mask: 28799 | ||||
|     size: 32 | ||||
|   BGEU: | ||||
|     branch: true | ||||
|     delay: | ||||
|     - 1 | ||||
|     - 2 | ||||
|     encoding: 28771 | ||||
|     index: 9 | ||||
|     mask: 28799 | ||||
|     size: 32 | ||||
|   BLT: | ||||
|     branch: true | ||||
|     delay: | ||||
|     - 1 | ||||
|     - 2 | ||||
|     encoding: 16483 | ||||
|     index: 6 | ||||
|     mask: 28799 | ||||
|     size: 32 | ||||
|   BLTU: | ||||
|     branch: true | ||||
|     delay: | ||||
|     - 1 | ||||
|     - 2 | ||||
|     encoding: 24675 | ||||
|     index: 8 | ||||
|     mask: 28799 | ||||
|     size: 32 | ||||
|   BNE: | ||||
|     branch: true | ||||
|     delay: | ||||
|     - 1 | ||||
|     - 2 | ||||
|     encoding: 4195 | ||||
|     index: 5 | ||||
|     mask: 28799 | ||||
|     size: 32 | ||||
|   EBREAK: | ||||
|     attributes: | ||||
|     - - name:no_cont | ||||
|     branch: false | ||||
|     delay: 3 | ||||
|     encoding: 1048691 | ||||
|     index: 39 | ||||
|     mask: 4294967295 | ||||
|     size: 32 | ||||
|   ECALL: | ||||
|     attributes: | ||||
|     - - name:no_cont | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 115 | ||||
|     index: 38 | ||||
|     mask: 4294967295 | ||||
|     size: 32 | ||||
|   FENCE: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 15 | ||||
|     index: 37 | ||||
|     mask: 28799 | ||||
|     size: 32 | ||||
|   JAL: | ||||
|     branch: true | ||||
|     delay: 2 | ||||
|     encoding: 111 | ||||
|     index: 2 | ||||
|     mask: 127 | ||||
|     size: 32 | ||||
|   JALR: | ||||
|     branch: true | ||||
|     delay: 2 | ||||
|     encoding: 103 | ||||
|     index: 3 | ||||
|     mask: 28799 | ||||
|     size: 32 | ||||
|   LB: | ||||
|     branch: false | ||||
|     delay: 2 | ||||
|     encoding: 3 | ||||
|     index: 10 | ||||
|     mask: 28799 | ||||
|     size: 32 | ||||
|   LBU: | ||||
|     branch: false | ||||
|     delay: 2 | ||||
|     encoding: 16387 | ||||
|     index: 13 | ||||
|     mask: 28799 | ||||
|     size: 32 | ||||
|   LH: | ||||
|     branch: false | ||||
|     delay: 2 | ||||
|     encoding: 4099 | ||||
|     index: 11 | ||||
|     mask: 28799 | ||||
|     size: 32 | ||||
|   LHU: | ||||
|     branch: false | ||||
|     delay: 2 | ||||
|     encoding: 20483 | ||||
|     index: 14 | ||||
|     mask: 28799 | ||||
|     size: 32 | ||||
|   LUI: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 55 | ||||
|     index: 0 | ||||
|     mask: 127 | ||||
|     size: 32 | ||||
|   LW: | ||||
|     branch: false | ||||
|     delay: 2 | ||||
|     encoding: 8195 | ||||
|     index: 12 | ||||
|     mask: 28799 | ||||
|     size: 32 | ||||
|   MRET: | ||||
|     attributes: | ||||
|     - - name:no_cont | ||||
|     branch: false | ||||
|     delay: 2 | ||||
|     encoding: 807403635 | ||||
|     index: 40 | ||||
|     mask: 4294967295 | ||||
|     size: 32 | ||||
|   OR: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 24627 | ||||
|     index: 35 | ||||
|     mask: 4261441663 | ||||
|     size: 32 | ||||
|   ORI: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 24595 | ||||
|     index: 22 | ||||
|     mask: 28799 | ||||
|     size: 32 | ||||
|   SB: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 35 | ||||
|     index: 15 | ||||
|     mask: 28799 | ||||
|     size: 32 | ||||
|   SH: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 4131 | ||||
|     index: 16 | ||||
|     mask: 28799 | ||||
|     size: 32 | ||||
|   SLL: | ||||
|     branch: false | ||||
|     delay: X_24:20 | ||||
|     encoding: 4147 | ||||
|     index: 29 | ||||
|     mask: 4261441663 | ||||
|     size: 32 | ||||
|   SLLI: | ||||
|     branch: false | ||||
|     delay: u_24:20 | ||||
|     encoding: 4115 | ||||
|     index: 24 | ||||
|     mask: 4261441663 | ||||
|     size: 32 | ||||
|   SLT: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 8243 | ||||
|     index: 30 | ||||
|     mask: 4261441663 | ||||
|     size: 32 | ||||
|   SLTI: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 8211 | ||||
|     index: 19 | ||||
|     mask: 28799 | ||||
|     size: 32 | ||||
|   SLTIU: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 12307 | ||||
|     index: 20 | ||||
|     mask: 28799 | ||||
|     size: 32 | ||||
|   SLTU: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 12339 | ||||
|     index: 31 | ||||
|     mask: 4261441663 | ||||
|     size: 32 | ||||
|   SRA: | ||||
|     branch: false | ||||
|     delay: X_24:20 | ||||
|     encoding: 1073762355 | ||||
|     index: 34 | ||||
|     mask: 4261441663 | ||||
|     size: 32 | ||||
|   SRAI: | ||||
|     branch: false | ||||
|     delay: u_24:20 | ||||
|     encoding: 1073762323 | ||||
|     index: 26 | ||||
|     mask: 4261441663 | ||||
|     size: 32 | ||||
|   SRL: | ||||
|     branch: false | ||||
|     delay: X_24:20 | ||||
|     encoding: 20531 | ||||
|     index: 33 | ||||
|     mask: 4261441663 | ||||
|     size: 32 | ||||
|   SRLI: | ||||
|     branch: false | ||||
|     delay: u_24:20 | ||||
|     encoding: 20499 | ||||
|     index: 25 | ||||
|     mask: 4261441663 | ||||
|     size: 32 | ||||
|   SUB: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 1073741875 | ||||
|     index: 28 | ||||
|     mask: 4261441663 | ||||
|     size: 32 | ||||
|   SW: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 8227 | ||||
|     index: 17 | ||||
|     mask: 28799 | ||||
|     size: 32 | ||||
|   WFI: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 273678451 | ||||
|     index: 41 | ||||
|     mask: 4294967295 | ||||
|     size: 32 | ||||
|   XOR: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 16435 | ||||
|     index: 32 | ||||
|     mask: 4261441663 | ||||
|     size: 32 | ||||
|   XORI: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 16403 | ||||
|     index: 21 | ||||
|     mask: 28799 | ||||
|     size: 32 | ||||
| RV32M: | ||||
|   DIV: | ||||
|     branch: false | ||||
|     delay: 33 | ||||
|     encoding: 33570867 | ||||
|     index: 53 | ||||
|     mask: 4261441663 | ||||
|     size: 32 | ||||
|   DIVU: | ||||
|     branch: false | ||||
|     delay: 33 | ||||
|     encoding: 33574963 | ||||
|     index: 54 | ||||
|     mask: 4261441663 | ||||
|     size: 32 | ||||
|   MUL: | ||||
|     branch: false | ||||
|     delay: 32 | ||||
|     encoding: 33554483 | ||||
|     index: 49 | ||||
|     mask: 4261441663 | ||||
|     size: 32 | ||||
|   MULH: | ||||
|     branch: false | ||||
|     delay: 32 | ||||
|     encoding: 33558579 | ||||
|     index: 50 | ||||
|     mask: 4261441663 | ||||
|     size: 32 | ||||
|   MULHSU: | ||||
|     branch: false | ||||
|     delay: 32 | ||||
|     encoding: 33562675 | ||||
|     index: 51 | ||||
|     mask: 4261441663 | ||||
|     size: 32 | ||||
|   MULHU: | ||||
|     branch: false | ||||
|     delay: 32 | ||||
|     encoding: 33566771 | ||||
|     index: 52 | ||||
|     mask: 4261441663 | ||||
|     size: 32 | ||||
|   REM: | ||||
|     branch: false | ||||
|     delay: 33 | ||||
|     encoding: 33579059 | ||||
|     index: 55 | ||||
|     mask: 4261441663 | ||||
|     size: 32 | ||||
|   REMU: | ||||
|     branch: false | ||||
|     delay: 33 | ||||
|     encoding: 33583155 | ||||
|     index: 56 | ||||
|     mask: 4261441663 | ||||
|     size: 32 | ||||
| Zca: | ||||
|   C__ADD: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 36866 | ||||
|     index: 82 | ||||
|     mask: 61443 | ||||
|     size: 16 | ||||
|   C__ADDI: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 1 | ||||
|     index: 60 | ||||
|     mask: 57347 | ||||
|     size: 16 | ||||
|   C__ADDI16SP: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 24833 | ||||
|     index: 65 | ||||
|     mask: 61315 | ||||
|     size: 16 | ||||
|   C__ADDI4SPN: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 0 | ||||
|     index: 57 | ||||
|     mask: 57347 | ||||
|     size: 16 | ||||
|   C__AND: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 35937 | ||||
|     index: 73 | ||||
|     mask: 64611 | ||||
|     size: 16 | ||||
|   C__ANDI: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 34817 | ||||
|     index: 69 | ||||
|     mask: 60419 | ||||
|     size: 16 | ||||
|   C__BEQZ: | ||||
|     branch: true | ||||
|     delay: | ||||
|     - 1 | ||||
|     - 2 | ||||
|     encoding: 49153 | ||||
|     index: 75 | ||||
|     mask: 57347 | ||||
|     size: 16 | ||||
|   C__BNEZ: | ||||
|     branch: true | ||||
|     delay: | ||||
|     - 1 | ||||
|     - 2 | ||||
|     encoding: 57345 | ||||
|     index: 76 | ||||
|     mask: 57347 | ||||
|     size: 16 | ||||
|   C__EBREAK: | ||||
|     branch: false | ||||
|     delay: 3 | ||||
|     encoding: 36866 | ||||
|     index: 84 | ||||
|     mask: 65535 | ||||
|     size: 16 | ||||
|   C__J: | ||||
|     branch: true | ||||
|     delay: 1 | ||||
|     encoding: 40961 | ||||
|     index: 74 | ||||
|     mask: 57347 | ||||
|     size: 16 | ||||
|   C__JAL: | ||||
|     attributes: | ||||
|     - - name:enable | ||||
|       - value:1 | ||||
|     branch: true | ||||
|     delay: 1 | ||||
|     encoding: 8193 | ||||
|     index: 62 | ||||
|     mask: 57347 | ||||
|     size: 16 | ||||
|   C__JALR: | ||||
|     branch: true | ||||
|     delay: 1 | ||||
|     encoding: 36866 | ||||
|     index: 83 | ||||
|     mask: 61567 | ||||
|     size: 16 | ||||
|   C__JR: | ||||
|     branch: true | ||||
|     delay: 1 | ||||
|     encoding: 32770 | ||||
|     index: 80 | ||||
|     mask: 61567 | ||||
|     size: 16 | ||||
|   C__LI: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 16385 | ||||
|     index: 63 | ||||
|     mask: 57347 | ||||
|     size: 16 | ||||
|   C__LUI: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 24577 | ||||
|     index: 64 | ||||
|     mask: 57347 | ||||
|     size: 16 | ||||
|   C__LW: | ||||
|     branch: false | ||||
|     delay: 2 | ||||
|     encoding: 16384 | ||||
|     index: 58 | ||||
|     mask: 57347 | ||||
|     size: 16 | ||||
|   C__LWSP: | ||||
|     branch: false | ||||
|     delay: 2 | ||||
|     encoding: 16386 | ||||
|     index: 78 | ||||
|     mask: 57347 | ||||
|     size: 16 | ||||
|   C__MV: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 32770 | ||||
|     index: 79 | ||||
|     mask: 61443 | ||||
|     size: 16 | ||||
|   C__NOP: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 1 | ||||
|     index: 61 | ||||
|     mask: 61315 | ||||
|     size: 16 | ||||
|   C__OR: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 35905 | ||||
|     index: 72 | ||||
|     mask: 64611 | ||||
|     size: 16 | ||||
|   C__SLLI: | ||||
|     attributes: | ||||
|     - - name:enable | ||||
|       - value:1 | ||||
|     branch: false | ||||
|     delay: u_12:12*16+u_6:2 | ||||
|     encoding: 2 | ||||
|     index: 77 | ||||
|     mask: 61443 | ||||
|     size: 16 | ||||
|   C__SRAI: | ||||
|     attributes: | ||||
|     - - name:enable | ||||
|       - value:1 | ||||
|     branch: false | ||||
|     delay: u_12:12*16+u_6:2 | ||||
|     encoding: 33793 | ||||
|     index: 68 | ||||
|     mask: 64515 | ||||
|     size: 16 | ||||
|   C__SRLI: | ||||
|     attributes: | ||||
|     - - name:enable | ||||
|       - value:1 | ||||
|     branch: false | ||||
|     delay: u_12:12*16+u_6:2 | ||||
|     encoding: 32769 | ||||
|     index: 67 | ||||
|     mask: 64515 | ||||
|     size: 16 | ||||
|   C__SUB: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 35841 | ||||
|     index: 70 | ||||
|     mask: 64611 | ||||
|     size: 16 | ||||
|   C__SW: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 49152 | ||||
|     index: 59 | ||||
|     mask: 57347 | ||||
|     size: 16 | ||||
|   C__SWSP: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 49154 | ||||
|     index: 85 | ||||
|     mask: 57347 | ||||
|     size: 16 | ||||
|   C__XOR: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 35873 | ||||
|     index: 71 | ||||
|     mask: 64611 | ||||
|     size: 16 | ||||
|   DII: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 0 | ||||
|     index: 86 | ||||
|     mask: 65535 | ||||
|     size: 16 | ||||
|   __reserved_clui: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 24577 | ||||
|     index: 66 | ||||
|     mask: 61567 | ||||
|     size: 16 | ||||
|   __reserved_cmv: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 32770 | ||||
|     index: 81 | ||||
|     mask: 65535 | ||||
|     size: 16 | ||||
| Zicsr: | ||||
|   CSRRC: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 12403 | ||||
|     index: 44 | ||||
|     mask: 28799 | ||||
|     size: 32 | ||||
|   CSRRCI: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 28787 | ||||
|     index: 47 | ||||
|     mask: 28799 | ||||
|     size: 32 | ||||
|   CSRRS: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 8307 | ||||
|     index: 43 | ||||
|     mask: 28799 | ||||
|     size: 32 | ||||
|   CSRRSI: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 24691 | ||||
|     index: 46 | ||||
|     mask: 28799 | ||||
|     size: 32 | ||||
|   CSRRW: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 4211 | ||||
|     index: 42 | ||||
|     mask: 28799 | ||||
|     size: 32 | ||||
|   CSRRWI: | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 20595 | ||||
|     index: 45 | ||||
|     mask: 28799 | ||||
|     size: 32 | ||||
| Zifencei: | ||||
|   FENCE_I: | ||||
|     attributes: | ||||
|     - - name:flush | ||||
|     branch: false | ||||
|     delay: 1 | ||||
|     encoding: 4111 | ||||
|     index: 48 | ||||
|     mask: 28799 | ||||
|     size: 32 | ||||
| @@ -1,5 +1,5 @@ | ||||
| /******************************************************************************* | ||||
|  * Copyright (C) 2017 - 2020 MINRES Technologies GmbH | ||||
|  * Copyright (C) 2024 MINRES Technologies GmbH | ||||
|  * All rights reserved. | ||||
|  * | ||||
|  * Redistribution and use in source and binary forms, with or without | ||||
| @@ -37,6 +37,7 @@ def getRegisterSizes(){ | ||||
|     return regs | ||||
| } | ||||
| %> | ||||
| // clang-format off | ||||
| #include "${coreDef.name.toLowerCase()}.h" | ||||
| #include "util/ities.h" | ||||
| #include <util/logging.h> | ||||
| @@ -46,10 +47,10 @@ def getRegisterSizes(){ | ||||
|  | ||||
| using namespace iss::arch; | ||||
|  | ||||
| constexpr std::array<const char*, ${registers.size}>    iss::arch::traits<iss::arch::${coreDef.name.toLowerCase()}>::reg_names; | ||||
| constexpr std::array<const char*, ${registers.size}>    iss::arch::traits<iss::arch::${coreDef.name.toLowerCase()}>::reg_aliases; | ||||
| constexpr std::array<const uint32_t, ${getRegisterSizes().size}> iss::arch::traits<iss::arch::${coreDef.name.toLowerCase()}>::reg_bit_widths; | ||||
| constexpr std::array<const uint32_t, ${getRegisterSizes().size}> iss::arch::traits<iss::arch::${coreDef.name.toLowerCase()}>::reg_byte_offsets; | ||||
| constexpr std::array<const char*, ${registers.size()}>    iss::arch::traits<iss::arch::${coreDef.name.toLowerCase()}>::reg_names; | ||||
| constexpr std::array<const char*, ${registers.size()}>    iss::arch::traits<iss::arch::${coreDef.name.toLowerCase()}>::reg_aliases; | ||||
| constexpr std::array<const uint32_t, ${getRegisterSizes().size()}> iss::arch::traits<iss::arch::${coreDef.name.toLowerCase()}>::reg_bit_widths; | ||||
| constexpr std::array<const uint32_t, ${getRegisterSizes().size()}> iss::arch::traits<iss::arch::${coreDef.name.toLowerCase()}>::reg_byte_offsets; | ||||
|  | ||||
| ${coreDef.name.toLowerCase()}::${coreDef.name.toLowerCase()}()  = default; | ||||
|  | ||||
| @@ -73,4 +74,4 @@ uint8_t *${coreDef.name.toLowerCase()}::get_regs_base_ptr() { | ||||
| ${coreDef.name.toLowerCase()}::phys_addr_t ${coreDef.name.toLowerCase()}::virt2phys(const iss::addr_t &addr) { | ||||
|     return phys_addr_t(addr.access, addr.space, addr.val&traits<${coreDef.name.toLowerCase()}>::addr_mask); | ||||
| } | ||||
|  | ||||
| // clang-format on | ||||
|   | ||||
| @@ -1,5 +1,5 @@ | ||||
| /******************************************************************************* | ||||
|  * Copyright (C) 2017 - 2021 MINRES Technologies GmbH | ||||
|  * Copyright (C) 2024 MINRES Technologies GmbH | ||||
|  * All rights reserved. | ||||
|  * | ||||
|  * Redistribution and use in source and binary forms, with or without | ||||
| @@ -60,7 +60,7 @@ def getCString(def val){ | ||||
| %> | ||||
| #ifndef _${coreDef.name.toUpperCase()}_H_ | ||||
| #define _${coreDef.name.toUpperCase()}_H_ | ||||
|  | ||||
| // clang-format off | ||||
| #include <array> | ||||
| #include <iss/arch/traits.h> | ||||
| #include <iss/arch_if.h> | ||||
| @@ -75,10 +75,10 @@ template <> struct traits<${coreDef.name.toLowerCase()}> { | ||||
|  | ||||
|     constexpr static char const* const core_type = "${coreDef.name}"; | ||||
|      | ||||
|     static constexpr std::array<const char*, ${registers.size}> reg_names{ | ||||
|     static constexpr std::array<const char*, ${registers.size()}> reg_names{ | ||||
|         {"${registers.collect{it.name.toLowerCase()}.join('", "')}"}}; | ||||
|   | ||||
|     static constexpr std::array<const char*, ${registers.size}> reg_aliases{ | ||||
|     static constexpr std::array<const char*, ${registers.size()}> reg_aliases{ | ||||
|         {"${registers.collect{it.alias.toLowerCase()}.join('", "')}"}}; | ||||
|  | ||||
|     enum constants {${constants.collect{c -> c.name+"="+getCString(c.value)}.join(', ')}}; | ||||
| @@ -99,17 +99,17 @@ template <> struct traits<${coreDef.name.toLowerCase()}> { | ||||
|  | ||||
|     using phys_addr_t = iss::typed_addr_t<iss::address_type::PHYSICAL>; | ||||
|  | ||||
|     static constexpr std::array<const uint32_t, ${getRegisterSizes().size}> reg_bit_widths{ | ||||
|     static constexpr std::array<const uint32_t, ${getRegisterSizes().size()}> reg_bit_widths{ | ||||
|         {${getRegisterSizes().join(',')}}}; | ||||
|  | ||||
|     static constexpr std::array<const uint32_t, ${getRegisterOffsets().size}> reg_byte_offsets{ | ||||
|     static constexpr std::array<const uint32_t, ${getRegisterOffsets().size()}> reg_byte_offsets{ | ||||
|         {${getRegisterOffsets().join(',')}}}; | ||||
|  | ||||
|     static const uint64_t addr_mask = (reg_t(1) << (XLEN - 1)) | ((reg_t(1) << (XLEN - 1)) - 1); | ||||
|  | ||||
|     enum sreg_flag_e { FLAGS }; | ||||
|  | ||||
|     enum mem_type_e { ${spaces.collect{it.name}.join(', ')} }; | ||||
|     enum mem_type_e { ${spaces.collect{it.name}.join(', ')}, IMEM = MEM }; | ||||
|      | ||||
|     enum class opcode_e {<%instructions.eachWithIndex{instr, index -> %> | ||||
|         ${instr.instruction.name} = ${index},<%}%> | ||||
| @@ -131,8 +131,6 @@ struct ${coreDef.name.toLowerCase()}: public arch_if { | ||||
|  | ||||
|     uint8_t* get_regs_base_ptr() override; | ||||
|  | ||||
|     inline uint64_t get_icount() { return reg.icount; } | ||||
|  | ||||
|     inline bool should_stop() { return interrupt_sim; } | ||||
|  | ||||
|     inline uint64_t stop_code() { return interrupt_sim; } | ||||
| @@ -141,8 +139,6 @@ struct ${coreDef.name.toLowerCase()}: public arch_if { | ||||
|  | ||||
|     virtual iss::sync_type needed_sync() const { return iss::NO_SYNC; } | ||||
|  | ||||
|     inline uint32_t get_last_branch() { return reg.last_branch; } | ||||
|  | ||||
|  | ||||
| #pragma pack(push, 1) | ||||
|     struct ${coreDef.name}_regs {<% | ||||
| @@ -174,3 +170,4 @@ if(fcsr != null) {%> | ||||
| } | ||||
| }             | ||||
| #endif /* _${coreDef.name.toUpperCase()}_H_ */ | ||||
| // clang-format on | ||||
|   | ||||
| @@ -1,5 +1,5 @@ | ||||
| /******************************************************************************* | ||||
|  * Copyright (C) 2023 MINRES Technologies GmbH | ||||
|  * Copyright (C) 2024 MINRES Technologies GmbH | ||||
|  * All rights reserved. | ||||
|  * | ||||
|  * Redistribution and use in source and binary forms, with or without | ||||
| @@ -29,46 +29,103 @@ | ||||
|  * POSSIBILITY OF SUCH DAMAGE. | ||||
|  * | ||||
|  *******************************************************************************/ | ||||
|  | ||||
| #include "iss_factory.h" | ||||
| // clang-format off | ||||
| #include <sysc/iss_factory.h> | ||||
| #include <iss/arch/${coreDef.name.toLowerCase()}.h> | ||||
| #include <iss/arch/riscv_hart_m_p.h> | ||||
| #include <iss/arch/riscv_hart_mu_p.h> | ||||
| #include "sc_core_adapter.h" | ||||
| #include "core_complex.h" | ||||
| #include <sysc/sc_core_adapter.h> | ||||
| #include <sysc/core_complex.h> | ||||
| #include <array> | ||||
|  | ||||
| <% | ||||
| def array_count = coreDef.name.toLowerCase()=="tgc5d" || coreDef.name.toLowerCase()=="tgc5e"? 3 : 2; | ||||
| %> | ||||
| namespace iss { | ||||
| namespace interp { | ||||
| using namespace sysc; | ||||
| volatile std::array<bool, 2> ${coreDef.name.toLowerCase()}_init = { | ||||
| volatile std::array<bool, ${array_count}> ${coreDef.name.toLowerCase()}_init = { | ||||
|         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|m_p|interp", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||
|             auto* cc = reinterpret_cast<sysc::tgfs::core_complex*>(data); | ||||
|             auto* cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||
|             auto* cpu = new sc_core_adapter<arch::riscv_hart_m_p<arch::${coreDef.name.toLowerCase()}>>(cc); | ||||
|             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; | ||||
|         }), | ||||
|         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p|interp", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||
|             auto* cc = reinterpret_cast<sysc::tgfs::core_complex*>(data); | ||||
|             auto* cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||
|             auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::${coreDef.name.toLowerCase()}>>(cc); | ||||
|             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; | ||||
|         }) | ||||
|         })<%if(coreDef.name.toLowerCase()=="tgc5d" || coreDef.name.toLowerCase()=="tgc5e") {%>, | ||||
|         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p_clic_pmp|interp", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||
|             auto* cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||
|             auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::${coreDef.name.toLowerCase()}, (iss::arch::features_e)(iss::arch::FEAT_PMP | iss::arch::FEAT_EXT_N | iss::arch::FEAT_CLIC)>>(cc); | ||||
|             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; | ||||
|         })<%}%> | ||||
| }; | ||||
| } | ||||
| #if defined(WITH_LLVM) | ||||
| namespace llvm { | ||||
| using namespace sysc; | ||||
| volatile std::array<bool, ${array_count}> ${coreDef.name.toLowerCase()}_init = { | ||||
|         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|m_p|llvm", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||
|             auto* cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||
|             auto* cpu = new sc_core_adapter<arch::riscv_hart_m_p<arch::${coreDef.name.toLowerCase()}>>(cc); | ||||
|             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; | ||||
|         }), | ||||
|         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p|llvm", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||
|             auto* cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||
|             auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::${coreDef.name.toLowerCase()}>>(cc); | ||||
|             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; | ||||
|         })<%if(coreDef.name.toLowerCase()=="tgc5d" || coreDef.name.toLowerCase()=="tgc5e") {%>, | ||||
|         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p_clic_pmp|llvm", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||
|             auto* cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||
|             auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::${coreDef.name.toLowerCase()}, (iss::arch::features_e)(iss::arch::FEAT_PMP | iss::arch::FEAT_EXT_N | iss::arch::FEAT_CLIC)>>(cc); | ||||
|             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; | ||||
|         })<%}%> | ||||
| }; | ||||
| } | ||||
| #endif | ||||
| #if defined(WITH_TCC) | ||||
| namespace tcc { | ||||
| using namespace sysc; | ||||
| volatile std::array<bool, 2> ${coreDef.name.toLowerCase()}_init = { | ||||
| volatile std::array<bool, ${array_count}> ${coreDef.name.toLowerCase()}_init = { | ||||
|         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|m_p|tcc", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||
|             auto* cc = reinterpret_cast<sysc::tgfs::core_complex*>(data); | ||||
|             auto* cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||
|             auto* cpu = new sc_core_adapter<arch::riscv_hart_m_p<arch::${coreDef.name.toLowerCase()}>>(cc); | ||||
|             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; | ||||
|         }), | ||||
|         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p|tcc", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||
|             auto* cc = reinterpret_cast<sysc::tgfs::core_complex*>(data); | ||||
|             auto* cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||
|             auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::${coreDef.name.toLowerCase()}>>(cc); | ||||
|             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; | ||||
|         }) | ||||
|         })<%if(coreDef.name.toLowerCase()=="tgc5d" || coreDef.name.toLowerCase()=="tgc5e") {%>, | ||||
|         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p_clic_pmp|tcc", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||
|             auto* cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||
|             auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::${coreDef.name.toLowerCase()}, (iss::arch::features_e)(iss::arch::FEAT_PMP | iss::arch::FEAT_EXT_N | iss::arch::FEAT_CLIC)>>(cc); | ||||
|             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; | ||||
|         })<%}%> | ||||
| }; | ||||
| } | ||||
| #endif | ||||
| #if defined(WITH_ASMJIT) | ||||
| namespace asmjit { | ||||
| using namespace sysc; | ||||
| volatile std::array<bool, ${array_count}> ${coreDef.name.toLowerCase()}_init = { | ||||
|         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|m_p|asmjit", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||
|             auto* cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||
|             auto* cpu = new sc_core_adapter<arch::riscv_hart_m_p<arch::${coreDef.name.toLowerCase()}>>(cc); | ||||
|             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; | ||||
|         }), | ||||
|         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p|asmjit", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||
|             auto* cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||
|             auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::${coreDef.name.toLowerCase()}>>(cc); | ||||
|             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; | ||||
|         })<%if(coreDef.name.toLowerCase()=="tgc5d" || coreDef.name.toLowerCase()=="tgc5e") {%>, | ||||
|         iss_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p_clic_pmp|asmjit", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||
|             auto* cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||
|             auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::${coreDef.name.toLowerCase()}, (iss::arch::features_e)(iss::arch::FEAT_PMP | iss::arch::FEAT_EXT_N | iss::arch::FEAT_CLIC)>>(cc); | ||||
|             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::${coreDef.name.toLowerCase()}*>(cpu), gdb_port)}}; | ||||
|         })<%}%> | ||||
| }; | ||||
| } | ||||
| #endif | ||||
| } | ||||
| // clang-format on | ||||
							
								
								
									
										370
									
								
								gen_input/templates/asmjit/CORENAME.cpp.gtl
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										370
									
								
								gen_input/templates/asmjit/CORENAME.cpp.gtl
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,370 @@ | ||||
| /******************************************************************************* | ||||
|  * Copyright (C) 2017-2024 MINRES Technologies GmbH | ||||
|  * All rights reserved. | ||||
|  * | ||||
|  * Redistribution and use in source and binary forms, with or without | ||||
|  * modification, are permitted provided that the following conditions are met: | ||||
|  * | ||||
|  * 1. Redistributions of source code must retain the above copyright notice, | ||||
|  *    this list of conditions and the following disclaimer. | ||||
|  * | ||||
|  * 2. Redistributions in binary form must reproduce the above copyright notice, | ||||
|  *    this list of conditions and the following disclaimer in the documentation | ||||
|  *    and/or other materials provided with the distribution. | ||||
|  * | ||||
|  * 3. Neither the name of the copyright holder nor the names of its contributors | ||||
|  *    may be used to endorse or promote products derived from this software | ||||
|  *    without specific prior written permission. | ||||
|  * | ||||
|  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" | ||||
|  * AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | ||||
|  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE | ||||
|  * ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE | ||||
|  * LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR | ||||
|  * CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF | ||||
|  * SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS | ||||
|  * INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN | ||||
|  * CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) | ||||
|  * ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE | ||||
|  * POSSIBILITY OF SUCH DAMAGE. | ||||
|  * | ||||
|  *******************************************************************************/ | ||||
| // clang-format off | ||||
| #include <iss/arch/${coreDef.name.toLowerCase()}.h> | ||||
| #include <iss/debugger/gdb_session.h> | ||||
| #include <iss/debugger/server.h> | ||||
| #include <iss/iss.h> | ||||
| #include <iss/asmjit/vm_base.h> | ||||
| #include <asmjit/asmjit.h> | ||||
| #include <util/logging.h> | ||||
| #include <iss/instruction_decoder.h> | ||||
| <%def fcsr = registers.find {it.name=='FCSR'} | ||||
| if(fcsr != null) {%> | ||||
| #include <vm/fp_functions.h><%}%> | ||||
| #ifndef FMT_HEADER_ONLY | ||||
| #define FMT_HEADER_ONLY | ||||
| #endif | ||||
| #include <fmt/format.h> | ||||
|  | ||||
| #include <array> | ||||
| #include <iss/debugger/riscv_target_adapter.h> | ||||
|  | ||||
| namespace iss { | ||||
| namespace asmjit { | ||||
|  | ||||
|  | ||||
| namespace ${coreDef.name.toLowerCase()} { | ||||
| using namespace ::asmjit; | ||||
| using namespace iss::arch; | ||||
| using namespace iss::debugger; | ||||
|  | ||||
| template <typename ARCH> class vm_impl : public iss::asmjit::vm_base<ARCH> { | ||||
| public: | ||||
|     using traits = arch::traits<ARCH>; | ||||
|     using super = typename iss::asmjit::vm_base<ARCH>; | ||||
|     using virt_addr_t = typename super::virt_addr_t; | ||||
|     using phys_addr_t = typename super::phys_addr_t; | ||||
|     using code_word_t = typename super::code_word_t; | ||||
|     using mem_type_e = typename super::mem_type_e; | ||||
|     using addr_t = typename super::addr_t; | ||||
|  | ||||
|     vm_impl(); | ||||
|  | ||||
|     vm_impl(ARCH &core, unsigned core_id = 0, unsigned cluster_id = 0); | ||||
|  | ||||
|     void enableDebug(bool enable) { super::sync_exec = super::ALL_SYNC; } | ||||
|  | ||||
|     target_adapter_if *accquire_target_adapter(server_if *srv) override { | ||||
|         debugger_if::dbg_enabled = true; | ||||
|         if (vm_base<ARCH>::tgt_adapter == nullptr) | ||||
|             vm_base<ARCH>::tgt_adapter = new riscv_target_adapter<ARCH>(srv, this->get_arch()); | ||||
|         return vm_base<ARCH>::tgt_adapter; | ||||
|     } | ||||
|  | ||||
| protected: | ||||
|     using super::get_ptr_for; | ||||
|     using super::get_reg_for; | ||||
|     using super::get_reg_for_Gp; | ||||
|     using super::load_reg_from_mem; | ||||
|     using super::load_reg_from_mem_Gp; | ||||
|     using super::write_reg_to_mem; | ||||
|     using super::gen_read_mem; | ||||
|     using super::gen_write_mem; | ||||
|     using super::gen_leave; | ||||
|     using super::gen_sync; | ||||
|     | ||||
|     using this_class = vm_impl<ARCH>; | ||||
|     using compile_func = continuation_e (this_class::*)(virt_addr_t&, code_word_t, jit_holder&); | ||||
|  | ||||
|     continuation_e gen_single_inst_behavior(virt_addr_t&, jit_holder&) override; | ||||
|     enum globals_e {TVAL = 0, GLOBALS_SIZE}; | ||||
|     void gen_block_prologue(jit_holder& jh) override; | ||||
|     void gen_block_epilogue(jit_holder& jh) override; | ||||
|     inline const char *name(size_t index){return traits::reg_aliases.at(index);} | ||||
| <%if(fcsr != null) {%> | ||||
|     inline const char *fname(size_t index){return index < 32?name(index+traits::F0):"illegal";}    | ||||
| <%}%> | ||||
|     void gen_instr_prologue(jit_holder& jh); | ||||
|     void gen_instr_epilogue(jit_holder& jh); | ||||
|     inline void gen_raise(jit_holder& jh, uint16_t trap_id, uint16_t cause); | ||||
|     template <typename T, typename = typename std::enable_if<std::is_integral<T>::value>::type> void gen_set_tval(jit_holder& jh, T new_tval) ; | ||||
|     void gen_set_tval(jit_holder& jh, x86_reg_t _new_tval) ; | ||||
|  | ||||
|     template<unsigned W, typename U, typename S = typename std::make_signed<U>::type> | ||||
|     inline S sext(U from) { | ||||
|         auto mask = (1ULL<<W) - 1; | ||||
|         auto sign_mask = 1ULL<<(W-1); | ||||
|         return (from & mask) | ((from & sign_mask) ? ~mask : 0); | ||||
|     } | ||||
| <%functions.each{ it.eachLine { %> | ||||
|     ${it}<%}%> | ||||
| <%}%> | ||||
| private: | ||||
|     /**************************************************************************** | ||||
|      * start opcode definitions | ||||
|      ****************************************************************************/ | ||||
|     struct instruction_descriptor { | ||||
|         uint32_t length; | ||||
|         uint32_t value; | ||||
|         uint32_t mask; | ||||
|         compile_func op; | ||||
|     }; | ||||
|  | ||||
|     const std::array<instruction_descriptor, ${instructions.size()}> instr_descr = {{ | ||||
|          /* entries are: size, valid value, valid mask, function ptr */<%instructions.each{instr -> %> | ||||
|         /* instruction ${instr.instruction.name}, encoding '${instr.encoding}' */ | ||||
|         {${instr.length}, ${instr.encoding}, ${instr.mask}, &this_class::__${generator.functionName(instr.name)}},<%}%> | ||||
|     }}; | ||||
|  | ||||
|     //needs to be declared after instr_descr | ||||
|     decoder instr_decoder; | ||||
|  | ||||
|     /* instruction definitions */<%instructions.eachWithIndex{instr, idx -> %> | ||||
|     /* instruction ${idx}: ${instr.name} */ | ||||
|     continuation_e __${generator.functionName(instr.name)}(virt_addr_t& pc, code_word_t instr, jit_holder& jh){ | ||||
|         uint64_t PC = pc.val; | ||||
|         <%instr.fields.eachLine{%>${it} | ||||
|         <%}%>if(this->disass_enabled){ | ||||
|             /* generate disass */ | ||||
|             <%instr.disass.eachLine{%> | ||||
|             ${it}<%}%> | ||||
|             InvokeNode* call_print_disass; | ||||
|             char* mnemonic_ptr = strdup(mnemonic.c_str()); | ||||
|             jh.disass_collection.push_back(mnemonic_ptr); | ||||
|             jh.cc.invoke(&call_print_disass, &print_disass, FuncSignature::build<void, void *, uint64_t, char *>()); | ||||
|             call_print_disass->setArg(0, jh.arch_if_ptr); | ||||
|             call_print_disass->setArg(1, pc.val); | ||||
|             call_print_disass->setArg(2, mnemonic_ptr); | ||||
|  | ||||
|         } | ||||
|         x86::Compiler& cc = jh.cc; | ||||
|         cc.comment(fmt::format("${instr.name}_{:#x}:",pc.val).c_str()); | ||||
|         gen_sync(jh, PRE_SYNC, ${idx}); | ||||
|         mov(cc, jh.pc, pc.val); | ||||
|         gen_set_tval(jh, instr); | ||||
|         pc = pc+${instr.length/8}; | ||||
|         mov(cc, jh.next_pc, pc.val); | ||||
|  | ||||
|         gen_instr_prologue(jh); | ||||
|         cc.comment("//behavior:"); | ||||
|         /*generate behavior*/ | ||||
|         <%instr.behavior.eachLine{%>${it} | ||||
|         <%}%> | ||||
|         gen_sync(jh, POST_SYNC, ${idx}); | ||||
|         gen_instr_epilogue(jh); | ||||
|     	return returnValue;         | ||||
|     } | ||||
|     <%}%> | ||||
|     /**************************************************************************** | ||||
|      * end opcode definitions | ||||
|      ****************************************************************************/ | ||||
|     continuation_e illegal_instruction(virt_addr_t &pc, code_word_t instr, jit_holder& jh ) { | ||||
|         x86::Compiler& cc = jh.cc; | ||||
|         if(this->disass_enabled){           | ||||
|             auto mnemonic = std::string("illegal_instruction"); | ||||
|             InvokeNode* call_print_disass; | ||||
|             char* mnemonic_ptr = strdup(mnemonic.c_str()); | ||||
|             jh.disass_collection.push_back(mnemonic_ptr); | ||||
|             jh.cc.invoke(&call_print_disass, &print_disass, FuncSignature::build<void, void *, uint64_t, char *>()); | ||||
|             call_print_disass->setArg(0, jh.arch_if_ptr); | ||||
|             call_print_disass->setArg(1, pc.val); | ||||
|             call_print_disass->setArg(2, mnemonic_ptr); | ||||
|         } | ||||
|         cc.comment(fmt::format("illegal_instruction{:#x}:",pc.val).c_str()); | ||||
|         gen_sync(jh, PRE_SYNC, instr_descr.size()); | ||||
|         mov(cc, jh.pc, pc.val); | ||||
|         gen_set_tval(jh, instr); | ||||
|         pc = pc + ((instr & 3) == 3 ? 4 : 2); | ||||
|         mov(cc, jh.next_pc, pc.val); | ||||
|         gen_instr_prologue(jh); | ||||
|         cc.comment("//behavior:"); | ||||
|         gen_raise(jh, 0, 2); | ||||
|         gen_sync(jh, POST_SYNC, instr_descr.size()); | ||||
|         gen_instr_epilogue(jh); | ||||
|         return ILLEGAL_INSTR; | ||||
|     } | ||||
| }; | ||||
|  | ||||
| template <typename ARCH> vm_impl<ARCH>::vm_impl() { this(new ARCH()); } | ||||
|  | ||||
| template <typename ARCH> | ||||
| vm_impl<ARCH>::vm_impl(ARCH &core, unsigned core_id, unsigned cluster_id) | ||||
| : vm_base<ARCH>(core, core_id, cluster_id) | ||||
| , instr_decoder([this]() { | ||||
|         std::vector<generic_instruction_descriptor> g_instr_descr; | ||||
|         g_instr_descr.reserve(instr_descr.size()); | ||||
|         for (uint32_t i = 0; i < instr_descr.size(); ++i) { | ||||
|             generic_instruction_descriptor new_instr_descr {instr_descr[i].value, instr_descr[i].mask, i}; | ||||
|             g_instr_descr.push_back(new_instr_descr); | ||||
|         } | ||||
|         return std::move(g_instr_descr); | ||||
|     }()) {} | ||||
|  | ||||
| template <typename ARCH> | ||||
| continuation_e vm_impl<ARCH>::gen_single_inst_behavior(virt_addr_t &pc, jit_holder& jh) { | ||||
|     enum {TRAP_ID=1<<16}; | ||||
|     code_word_t instr = 0; | ||||
|     phys_addr_t paddr(pc); | ||||
|     auto *const data = (uint8_t *)&instr; | ||||
|     if(this->core.has_mmu()) | ||||
|         paddr = this->core.virt2phys(pc); | ||||
|     auto res = this->core.read(paddr, 4, data); | ||||
|     if (res != iss::Ok) | ||||
|         return ILLEGAL_FETCH; | ||||
|     if (instr == 0x0000006f || (instr&0xffff)==0xa001) | ||||
|         return JUMP_TO_SELF; | ||||
|     uint32_t inst_index = instr_decoder.decode_instr(instr); | ||||
|     compile_func f = nullptr; | ||||
|     if(inst_index < instr_descr.size()) | ||||
|         f = instr_descr[inst_index].op; | ||||
|     if (f == nullptr)  | ||||
|         f = &this_class::illegal_instruction; | ||||
|     return (this->*f)(pc, instr, jh); | ||||
| } | ||||
| template <typename ARCH> | ||||
| void vm_impl<ARCH>::gen_instr_prologue(jit_holder& jh) { | ||||
|     auto& cc = jh.cc; | ||||
|  | ||||
|     cc.comment("//gen_instr_prologue"); | ||||
|  | ||||
|     x86_reg_t current_trap_state = get_reg_for(cc, traits::TRAP_STATE); | ||||
|     mov(cc, current_trap_state, get_ptr_for(jh, traits::TRAP_STATE)); | ||||
|     mov(cc, get_ptr_for(jh, traits::PENDING_TRAP), current_trap_state); | ||||
|  | ||||
| } | ||||
| template <typename ARCH> | ||||
| void vm_impl<ARCH>::gen_instr_epilogue(jit_holder& jh) { | ||||
|     auto& cc = jh.cc; | ||||
|  | ||||
|     cc.comment("//gen_instr_epilogue"); | ||||
|     x86_reg_t current_trap_state = get_reg_for(cc, traits::TRAP_STATE); | ||||
|     mov(cc, current_trap_state, get_ptr_for(jh, traits::TRAP_STATE)); | ||||
|     cmp(cc, current_trap_state, 0); | ||||
|     cc.jne(jh.trap_entry); | ||||
|     cc.inc(get_ptr_for(jh, traits::ICOUNT)); | ||||
|     cc.inc(get_ptr_for(jh, traits::CYCLE)); | ||||
| } | ||||
| template <typename ARCH> | ||||
| void vm_impl<ARCH>::gen_block_prologue(jit_holder& jh){ | ||||
|     jh.pc = load_reg_from_mem_Gp(jh, traits::PC); | ||||
|     jh.next_pc = load_reg_from_mem_Gp(jh, traits::NEXT_PC); | ||||
|     jh.globals.resize(GLOBALS_SIZE); | ||||
|     jh.globals[TVAL] = get_reg_Gp(jh.cc, 64, false); | ||||
| } | ||||
| template <typename ARCH> | ||||
| void vm_impl<ARCH>::gen_block_epilogue(jit_holder& jh){ | ||||
|     x86::Compiler& cc = jh.cc; | ||||
|     cc.comment("//gen_block_epilogue"); | ||||
|     cc.ret(jh.next_pc); | ||||
|  | ||||
|     cc.bind(jh.trap_entry); | ||||
|     this->write_back(jh); | ||||
|  | ||||
|     x86::Gp current_trap_state = get_reg_for_Gp(cc, traits::TRAP_STATE); | ||||
|     mov(cc, current_trap_state, get_ptr_for(jh, traits::TRAP_STATE)); | ||||
|  | ||||
|     x86::Gp current_pc = get_reg_for_Gp(cc, traits::PC); | ||||
|     mov(cc, current_pc, get_ptr_for(jh, traits::PC)); | ||||
|  | ||||
|     cc.comment("//enter trap call;"); | ||||
|     InvokeNode* call_enter_trap; | ||||
|     cc.invoke(&call_enter_trap, &enter_trap, FuncSignature::build<uint64_t, void*, uint64_t, uint64_t, uint64_t>()); | ||||
|     call_enter_trap->setArg(0, jh.arch_if_ptr); | ||||
|     call_enter_trap->setArg(1, current_trap_state); | ||||
|     call_enter_trap->setArg(2, current_pc); | ||||
|     call_enter_trap->setArg(3, jh.globals[TVAL]); | ||||
|  | ||||
|     x86_reg_t current_next_pc = get_reg_for(cc, traits::NEXT_PC); | ||||
|     mov(cc, current_next_pc, get_ptr_for(jh, traits::NEXT_PC)); | ||||
|     mov(cc, jh.next_pc, current_next_pc); | ||||
|  | ||||
|     mov(cc, get_ptr_for(jh, traits::LAST_BRANCH), static_cast<int>(UNKNOWN_JUMP)); | ||||
|     cc.ret(jh.next_pc); | ||||
| } | ||||
| template <typename ARCH> | ||||
| inline void vm_impl<ARCH>::gen_raise(jit_holder& jh, uint16_t trap_id, uint16_t cause) { | ||||
|     auto& cc = jh.cc; | ||||
|     cc.comment("//gen_raise"); | ||||
|     auto tmp1 = get_reg_for(cc, traits::TRAP_STATE); | ||||
|     mov(cc, tmp1, 0x80ULL << 24 | (cause << 16) | trap_id); | ||||
|     mov(cc, get_ptr_for(jh, traits::TRAP_STATE), tmp1); | ||||
|     cc.jmp(jh.trap_entry); | ||||
| } | ||||
| template <typename ARCH> | ||||
| template <typename T, typename> | ||||
| void vm_impl<ARCH>::gen_set_tval(jit_holder& jh, T new_tval) { | ||||
|         mov(jh.cc, jh.globals[TVAL], new_tval); | ||||
|     } | ||||
| template <typename ARCH> | ||||
| void vm_impl<ARCH>::gen_set_tval(jit_holder& jh, x86_reg_t _new_tval) { | ||||
|     if(nonstd::holds_alternative<x86::Gp>(_new_tval)) { | ||||
|         x86::Gp new_tval = nonstd::get<x86::Gp>(_new_tval); | ||||
|         if(new_tval.size() < 8) | ||||
|             new_tval = gen_ext_Gp(jh.cc, new_tval, 64, false); | ||||
|         mov(jh.cc, jh.globals[TVAL], new_tval); | ||||
|     } else { | ||||
|         throw std::runtime_error("Variant not supported in gen_set_tval"); | ||||
|     } | ||||
| } | ||||
|  | ||||
| } // namespace tgc5c | ||||
|  | ||||
| template <> | ||||
| std::unique_ptr<vm_if> create<arch::${coreDef.name.toLowerCase()}>(arch::${coreDef.name.toLowerCase()} *core, unsigned short port, bool dump) { | ||||
|     auto ret = new ${coreDef.name.toLowerCase()}::vm_impl<arch::${coreDef.name.toLowerCase()}>(*core, dump); | ||||
|     if (port != 0) debugger::server<debugger::gdb_session>::run_server(ret, port); | ||||
|     return std::unique_ptr<vm_if>(ret); | ||||
| } | ||||
| } // namespace asmjit | ||||
| } // namespace iss | ||||
|  | ||||
| #include <iss/arch/riscv_hart_m_p.h> | ||||
| #include <iss/arch/riscv_hart_mu_p.h> | ||||
| #include <iss/factory.h> | ||||
| namespace iss { | ||||
| namespace { | ||||
| volatile std::array<bool, 2> dummy = { | ||||
|         core_factory::instance().register_creator("${coreDef.name.toLowerCase()}|m_p|asmjit", [](unsigned port, void* init_data) -> std::tuple<cpu_ptr, vm_ptr>{ | ||||
|             auto* cpu = new iss::arch::riscv_hart_m_p<iss::arch::${coreDef.name.toLowerCase()}>(); | ||||
| 		    auto vm = new asmjit::${coreDef.name.toLowerCase()}::vm_impl<arch::${coreDef.name.toLowerCase()}>(*cpu, false); | ||||
| 		    if (port != 0) debugger::server<debugger::gdb_session>::run_server(vm, port); | ||||
|             if(init_data){ | ||||
|                 auto* cb = reinterpret_cast<semihosting_cb_t<arch::traits<arch::${coreDef.name.toLowerCase()}>::reg_t>*>(init_data); | ||||
|                 cpu->set_semihosting_callback(*cb); | ||||
|             } | ||||
|             return {cpu_ptr{cpu}, vm_ptr{vm}}; | ||||
|         }), | ||||
|         core_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p|asmjit", [](unsigned port, void* init_data) -> std::tuple<cpu_ptr, vm_ptr>{ | ||||
|             auto* cpu = new iss::arch::riscv_hart_mu_p<iss::arch::${coreDef.name.toLowerCase()}>(); | ||||
| 		    auto vm = new asmjit::${coreDef.name.toLowerCase()}::vm_impl<arch::${coreDef.name.toLowerCase()}>(*cpu, false); | ||||
| 		    if (port != 0) debugger::server<debugger::gdb_session>::run_server(vm, port); | ||||
|             if(init_data){ | ||||
|                 auto* cb = reinterpret_cast<semihosting_cb_t<arch::traits<arch::${coreDef.name.toLowerCase()}>::reg_t>*>(init_data); | ||||
|                 cpu->set_semihosting_callback(*cb); | ||||
|             } | ||||
|             return {cpu_ptr{cpu}, vm_ptr{vm}}; | ||||
|         }) | ||||
| }; | ||||
| } | ||||
| } | ||||
| // clang-format on | ||||
| @@ -1,5 +1,5 @@ | ||||
| /******************************************************************************* | ||||
|  * Copyright (C) 2021 MINRES Technologies GmbH | ||||
|  * Copyright (C) 2017-2024 MINRES Technologies GmbH | ||||
|  * All rights reserved. | ||||
|  * | ||||
|  * Redistribution and use in source and binary forms, with or without | ||||
| @@ -34,17 +34,22 @@ def nativeTypeSize(int size){ | ||||
|     if(size<=8) return 8; else if(size<=16) return 16; else if(size<=32) return 32; else return 64; | ||||
| } | ||||
| %> | ||||
| // clang-format off | ||||
| #include <cstdint> | ||||
| #include <iss/arch/${coreDef.name.toLowerCase()}.h> | ||||
| #include <iss/debugger/gdb_session.h> | ||||
| #include <iss/debugger/server.h> | ||||
| #include <iss/iss.h> | ||||
| #include <iss/interp/vm_base.h> | ||||
| #include <vm/fp_functions.h> | ||||
| #include <util/logging.h> | ||||
| #include <boost/coroutine2/all.hpp> | ||||
| #include <functional> | ||||
| #include <exception> | ||||
| #include <vector> | ||||
| #include <sstream> | ||||
| #include <iss/instruction_decoder.h> | ||||
|  | ||||
|  | ||||
| #ifndef FMT_HEADER_ONLY | ||||
| #define FMT_HEADER_ONLY | ||||
| @@ -95,7 +100,12 @@ protected: | ||||
|     using compile_ret_t = virt_addr_t; | ||||
|     using compile_func = compile_ret_t (this_class::*)(virt_addr_t &pc, code_word_t instr); | ||||
|  | ||||
|     inline const char *name(size_t index){return index<traits::reg_aliases.size()?traits::reg_aliases[index]:"illegal";} | ||||
|     inline const char *name(size_t index){return traits::reg_aliases.at(index);} | ||||
| <% | ||||
| def fcsr = registers.find {it.name=='FCSR'} | ||||
| if(fcsr != null) {%> | ||||
|     inline const char *fname(size_t index){return index < 32?name(index+traits::F0):"illegal";}      | ||||
| <%}%> | ||||
|  | ||||
|     virt_addr_t execute_inst(finish_cond_e cond, virt_addr_t start, uint64_t icount_limit) override; | ||||
|  | ||||
| @@ -104,7 +114,6 @@ protected: | ||||
|     inline void raise(uint16_t trap_id, uint16_t cause){ | ||||
|         auto trap_val =  0x80ULL << 24 | (cause << 16) | trap_id; | ||||
|         this->core.reg.trap_state = trap_val; | ||||
|         this->template get_reg<uint${addrDataWidth}_t>(traits::NEXT_PC) = std::numeric_limits<uint${addrDataWidth}_t>::max(); | ||||
|     } | ||||
|  | ||||
|     inline void leave(unsigned lvl){ | ||||
| @@ -115,6 +124,13 @@ protected: | ||||
|         this->core.wait_until(type); | ||||
|     } | ||||
|  | ||||
|     inline void set_tval(uint64_t new_tval){ | ||||
|         tval = new_tval; | ||||
|     } | ||||
|  | ||||
|     uint64_t fetch_count{0}; | ||||
|     uint64_t tval{0}; | ||||
|  | ||||
|     using yield_t = boost::coroutines2::coroutine<void>::push_type; | ||||
|     using coro_t = boost::coroutines2::coroutine<void>::pull_type; | ||||
|     std::vector<coro_t> spawn_blocks; | ||||
| @@ -144,25 +160,20 @@ private: | ||||
|      * start opcode definitions | ||||
|      ****************************************************************************/ | ||||
|     struct instruction_descriptor { | ||||
|         size_t length; | ||||
|         uint32_t length; | ||||
|         uint32_t value; | ||||
|         uint32_t mask; | ||||
|         typename arch::traits<ARCH>::opcode_e op; | ||||
|     }; | ||||
|     struct decoding_tree_node{ | ||||
|         std::vector<instruction_descriptor> instrs; | ||||
|         std::vector<decoding_tree_node*> children; | ||||
|         uint32_t submask = std::numeric_limits<uint32_t>::max(); | ||||
|         uint32_t value; | ||||
|         decoding_tree_node(uint32_t value) : value(value){} | ||||
|     }; | ||||
|  | ||||
|     decoding_tree_node* root {nullptr}; | ||||
|     const std::array<instruction_descriptor, ${instructions.size}> instr_descr = {{ | ||||
|     const std::array<instruction_descriptor, ${instructions.size()}> instr_descr = {{ | ||||
|          /* entries are: size, valid value, valid mask, function ptr */<%instructions.each{instr -> %> | ||||
|         {${instr.length}, ${instr.encoding}, ${instr.mask}, arch::traits<ARCH>::opcode_e::${instr.instruction.name}},<%}%> | ||||
|     }}; | ||||
|  | ||||
|     //needs to be declared after instr_descr | ||||
|     decoder instr_decoder; | ||||
|  | ||||
|     iss::status fetch_ins(virt_addr_t pc, uint8_t * data){ | ||||
|         if(this->core.has_mmu()) { | ||||
|             auto phys_pc = this->core.virt2phys(pc); | ||||
| @@ -182,66 +193,12 @@ private: | ||||
|         } | ||||
|         return iss::Ok; | ||||
|     } | ||||
|      | ||||
|     void populate_decoding_tree(decoding_tree_node* root){ | ||||
|         //create submask | ||||
|         for(auto instr: root->instrs){ | ||||
|             root->submask &= instr.mask; | ||||
|         } | ||||
|         //put each instr according to submask&encoding into children | ||||
|         for(auto instr: root->instrs){ | ||||
|             bool foundMatch = false; | ||||
|             for(auto child: root->children){ | ||||
|                 //use value as identifying trait | ||||
|                 if(child->value == (instr.value&root->submask)){ | ||||
|                     child->instrs.push_back(instr); | ||||
|                     foundMatch = true; | ||||
|                 } | ||||
|             } | ||||
|             if(!foundMatch){ | ||||
|                 decoding_tree_node* child = new decoding_tree_node(instr.value&root->submask); | ||||
|                 child->instrs.push_back(instr); | ||||
|                 root->children.push_back(child); | ||||
|             } | ||||
|         } | ||||
|         root->instrs.clear(); | ||||
|         //call populate_decoding_tree for all children | ||||
|         if(root->children.size() >1) | ||||
|             for(auto child: root->children){ | ||||
|                 populate_decoding_tree(child);       | ||||
|             } | ||||
|         else{ | ||||
|             //sort instrs by value of the mask, this works bc we want to have the least restrictive one last | ||||
|             std::sort(root->children[0]->instrs.begin(), root->children[0]->instrs.end(), [](const instruction_descriptor& instr1, const instruction_descriptor& instr2) { | ||||
|             return instr1.mask > instr2.mask; | ||||
|             });  | ||||
|         } | ||||
|     } | ||||
|     typename arch::traits<ARCH>::opcode_e  decode_instr(decoding_tree_node* node, code_word_t word){ | ||||
|         if(!node->children.size()){ | ||||
|             if(node->instrs.size() == 1) return node->instrs[0].op; | ||||
|             for(auto instr : node->instrs){ | ||||
|                 if((instr.mask&word) == instr.value) return instr.op; | ||||
|             } | ||||
|         } | ||||
|         else{ | ||||
|             for(auto child : node->children){ | ||||
|                 if (child->value == (node->submask&word)){ | ||||
|                     return decode_instr(child, word); | ||||
|                 }   | ||||
|             }   | ||||
|         } | ||||
|         return arch::traits<ARCH>::opcode_e::MAX_OPCODE; | ||||
|     } | ||||
| }; | ||||
|  | ||||
| template <typename CODE_WORD> void debug_fn(CODE_WORD insn) { | ||||
|     volatile CODE_WORD x = insn; | ||||
|     insn = 2 * x; | ||||
| } | ||||
|  | ||||
| template <typename ARCH> vm_impl<ARCH>::vm_impl() { this(new ARCH()); } | ||||
|  | ||||
| // according to | ||||
| // https://stackoverflow.com/questions/8871204/count-number-of-1s-in-binary-representation | ||||
| #ifdef __GCC__ | ||||
| @@ -258,16 +215,23 @@ constexpr size_t bit_count(uint32_t u) { | ||||
|  | ||||
| template <typename ARCH> | ||||
| vm_impl<ARCH>::vm_impl(ARCH &core, unsigned core_id, unsigned cluster_id) | ||||
| : vm_base<ARCH>(core, core_id, cluster_id) { | ||||
|     root = new decoding_tree_node(std::numeric_limits<uint32_t>::max()); | ||||
|     for(auto instr:instr_descr){ | ||||
|         root->instrs.push_back(instr); | ||||
|     } | ||||
|     populate_decoding_tree(root); | ||||
| : vm_base<ARCH>(core, core_id, cluster_id) | ||||
| , instr_decoder([this]() { | ||||
|         std::vector<generic_instruction_descriptor> g_instr_descr; | ||||
|         g_instr_descr.reserve(instr_descr.size()); | ||||
|         for (uint32_t i = 0; i < instr_descr.size(); ++i) { | ||||
|             generic_instruction_descriptor new_instr_descr {instr_descr[i].value, instr_descr[i].mask, i}; | ||||
|             g_instr_descr.push_back(new_instr_descr); | ||||
|         } | ||||
|         return std::move(g_instr_descr); | ||||
|     }()) {} | ||||
|  | ||||
| inline bool is_icount_limit_enabled(finish_cond_e cond){ | ||||
|     return (cond & finish_cond_e::ICOUNT_LIMIT) == finish_cond_e::ICOUNT_LIMIT; | ||||
| } | ||||
|  | ||||
| inline bool is_count_limit_enabled(finish_cond_e cond){ | ||||
|     return (cond & finish_cond_e::COUNT_LIMIT) == finish_cond_e::COUNT_LIMIT; | ||||
| inline bool is_fcount_limit_enabled(finish_cond_e cond){ | ||||
|     return (cond & finish_cond_e::FCOUNT_LIMIT) == finish_cond_e::FCOUNT_LIMIT; | ||||
| } | ||||
|  | ||||
| inline bool is_jump_to_self_enabled(finish_cond_e cond){ | ||||
| @@ -275,7 +239,7 @@ inline bool is_jump_to_self_enabled(finish_cond_e cond){ | ||||
| } | ||||
|  | ||||
| template <typename ARCH> | ||||
| typename vm_base<ARCH>::virt_addr_t vm_impl<ARCH>::execute_inst(finish_cond_e cond, virt_addr_t start, uint64_t icount_limit){ | ||||
| typename vm_base<ARCH>::virt_addr_t vm_impl<ARCH>::execute_inst(finish_cond_e cond, virt_addr_t start, uint64_t count_limit){ | ||||
|     auto pc=start; | ||||
|     auto* PC = reinterpret_cast<uint${addrDataWidth}_t*>(this->regs_base_ptr+arch::traits<ARCH>::reg_byte_offsets[arch::traits<ARCH>::PC]); | ||||
|     auto* NEXT_PC = reinterpret_cast<uint${addrDataWidth}_t*>(this->regs_base_ptr+arch::traits<ARCH>::reg_byte_offsets[arch::traits<ARCH>::NEXT_PC]); | ||||
| @@ -288,16 +252,26 @@ typename vm_base<ARCH>::virt_addr_t vm_impl<ARCH>::execute_inst(finish_cond_e co | ||||
|     auto *const data = reinterpret_cast<uint8_t*>(&instr); | ||||
|  | ||||
|     while(!this->core.should_stop() && | ||||
|             !(is_count_limit_enabled(cond) && icount >= icount_limit)){ | ||||
|             !(is_icount_limit_enabled(cond) && icount >= count_limit) && | ||||
|             !(is_fcount_limit_enabled(cond) && fetch_count >= count_limit)){ | ||||
|         if(this->debugging_enabled()) | ||||
|             this->tgt_adapter->check_continue(*PC); | ||||
|         pc.val=*PC; | ||||
|         if(fetch_ins(pc, data)!=iss::Ok){ | ||||
|             this->do_sync(POST_SYNC, std::numeric_limits<unsigned>::max()); | ||||
|             pc.val = super::core.enter_trap(std::numeric_limits<uint64_t>::max(), pc.val, 0); | ||||
|             if(this->sync_exec && PRE_SYNC) this->do_sync(PRE_SYNC, std::numeric_limits<unsigned>::max()); | ||||
|             process_spawn_blocks(); | ||||
|             if(this->sync_exec && POST_SYNC) this->do_sync(PRE_SYNC, std::numeric_limits<unsigned>::max()); | ||||
|             pc.val = super::core.enter_trap(arch::traits<ARCH>::RV_CAUSE_FETCH_ACCESS<<16, pc.val, 0); | ||||
|         } else { | ||||
|             if (is_jump_to_self_enabled(cond) && | ||||
|                     (instr == 0x0000006f || (instr&0xffff)==0xa001)) throw simulation_stopped(0); // 'J 0' or 'C.J 0' | ||||
|             auto inst_id = decode_instr(root, instr); | ||||
|             uint32_t inst_index = instr_decoder.decode_instr(instr); | ||||
|             opcode_e inst_id = arch::traits<ARCH>::opcode_e::MAX_OPCODE;; | ||||
|             if(inst_index <instr_descr.size()) | ||||
|                 inst_id = instr_descr[inst_index].op; | ||||
|  | ||||
|             // pre execution stuff | ||||
|              this->core.reg.last_branch = 0; | ||||
|             this->core.reg.last_branch = 0; | ||||
|             if(this->sync_exec && PRE_SYNC) this->do_sync(PRE_SYNC, static_cast<unsigned>(inst_id)); | ||||
|             try{ | ||||
|                 switch(inst_id){<%instructions.eachWithIndex{instr, idx -> %> | ||||
| @@ -306,6 +280,7 @@ typename vm_base<ARCH>::virt_addr_t vm_impl<ARCH>::execute_inst(finish_cond_e co | ||||
|                     <%}%>if(this->disass_enabled){ | ||||
|                         /* generate console output when executing the command */<%instr.disass.eachLine{%> | ||||
|                         ${it}<%}%> | ||||
|                         this->core.disass_output(pc.val, mnemonic); | ||||
|                     } | ||||
|                     // used registers<%instr.usedVariables.each{ k,v-> | ||||
|                     if(v.isArray) {%> | ||||
| @@ -330,16 +305,18 @@ typename vm_base<ARCH>::virt_addr_t vm_impl<ARCH>::execute_inst(finish_cond_e co | ||||
|             //    this->core.reg.trap_state =  this->core.reg.pending_trap; | ||||
|             // trap check | ||||
|             if(trap_state!=0){ | ||||
|                 super::core.enter_trap(trap_state, pc.val, instr); | ||||
|                 //In case of Instruction address misaligned (cause = 0 and trapid = 0) need the targeted addr (in tval) | ||||
|                 auto mcause = (trap_state>>16) & 0xff;  | ||||
|                 super::core.enter_trap(trap_state, pc.val, mcause ? instr:tval); | ||||
|             } else { | ||||
|                 icount++; | ||||
|                 instret++; | ||||
|             } | ||||
|             cycle++; | ||||
|             pc.val=*NEXT_PC; | ||||
|             this->core.reg.PC = this->core.reg.NEXT_PC; | ||||
|             *PC = *NEXT_PC; | ||||
|             this->core.reg.trap_state =  this->core.reg.pending_trap; | ||||
|         } | ||||
|         fetch_count++; | ||||
|         cycle++; | ||||
|     } | ||||
|     return pc; | ||||
| } | ||||
| @@ -355,24 +332,33 @@ std::unique_ptr<vm_if> create<arch::${coreDef.name.toLowerCase()}>(arch::${coreD | ||||
| } // namespace interp | ||||
| } // namespace iss | ||||
|  | ||||
| #include <iss/factory.h> | ||||
| #include <iss/arch/riscv_hart_m_p.h> | ||||
| #include <iss/arch/riscv_hart_mu_p.h> | ||||
| #include <iss/factory.h> | ||||
| namespace iss { | ||||
| namespace { | ||||
| volatile std::array<bool, 2> dummy = { | ||||
|         core_factory::instance().register_creator("${coreDef.name.toLowerCase()}|m_p|interp", [](unsigned port, void*) -> std::tuple<cpu_ptr, vm_ptr>{ | ||||
|         core_factory::instance().register_creator("${coreDef.name.toLowerCase()}|m_p|interp", [](unsigned port, void* init_data) -> std::tuple<cpu_ptr, vm_ptr>{ | ||||
|             auto* cpu = new iss::arch::riscv_hart_m_p<iss::arch::${coreDef.name.toLowerCase()}>(); | ||||
| 		    auto vm = new interp::${coreDef.name.toLowerCase()}::vm_impl<arch::${coreDef.name.toLowerCase()}>(*cpu, false); | ||||
| 		    if (port != 0) debugger::server<debugger::gdb_session>::run_server(vm, port); | ||||
|             if(init_data){ | ||||
|                 auto* cb = reinterpret_cast<semihosting_cb_t<arch::traits<arch::${coreDef.name.toLowerCase()}>::reg_t>*>(init_data); | ||||
|                 cpu->set_semihosting_callback(*cb); | ||||
|             } | ||||
|             return {cpu_ptr{cpu}, vm_ptr{vm}}; | ||||
|         }), | ||||
|         core_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p|interp", [](unsigned port, void*) -> std::tuple<cpu_ptr, vm_ptr>{ | ||||
|         core_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p|interp", [](unsigned port, void* init_data) -> std::tuple<cpu_ptr, vm_ptr>{ | ||||
|             auto* cpu = new iss::arch::riscv_hart_mu_p<iss::arch::${coreDef.name.toLowerCase()}>(); | ||||
| 		    auto vm = new interp::${coreDef.name.toLowerCase()}::vm_impl<arch::${coreDef.name.toLowerCase()}>(*cpu, false); | ||||
| 		    if (port != 0) debugger::server<debugger::gdb_session>::run_server(vm, port); | ||||
|             if(init_data){ | ||||
|                 auto* cb = reinterpret_cast<semihosting_cb_t<arch::traits<arch::${coreDef.name.toLowerCase()}>::reg_t>*>(init_data); | ||||
|                 cpu->set_semihosting_callback(*cb); | ||||
|             } | ||||
|             return {cpu_ptr{cpu}, vm_ptr{vm}}; | ||||
|         }) | ||||
| }; | ||||
| } | ||||
| } | ||||
| // clang-format on | ||||
| @@ -1,5 +1,5 @@ | ||||
| /******************************************************************************* | ||||
|  * Copyright (C) 2017, 2018 MINRES Technologies GmbH | ||||
|  * Copyright (C) 2017-2024 MINRES Technologies GmbH | ||||
|  * All rights reserved. | ||||
|  * | ||||
|  * Redistribution and use in source and binary forms, with or without | ||||
| @@ -29,14 +29,17 @@ | ||||
|  * POSSIBILITY OF SUCH DAMAGE. | ||||
|  * | ||||
|  *******************************************************************************/ | ||||
|  | ||||
| // clang-format off | ||||
| #include <iss/arch/${coreDef.name.toLowerCase()}.h> | ||||
| #include <iss/debugger/gdb_session.h> | ||||
| #include <iss/debugger/server.h> | ||||
| #include <iss/iss.h> | ||||
| #include <iss/llvm/vm_base.h> | ||||
| #include <util/logging.h> | ||||
|  | ||||
| #include <iss/instruction_decoder.h> | ||||
| <%def fcsr = registers.find {it.name=='FCSR'} | ||||
| if(fcsr != null) {%> | ||||
| #include <vm/fp_functions.h><%}%> | ||||
| #ifndef FMT_HEADER_ONLY | ||||
| #define FMT_HEADER_ONLY | ||||
| #endif | ||||
| @@ -82,7 +85,9 @@ protected: | ||||
|     using vm_base<ARCH>::get_reg_ptr; | ||||
|  | ||||
|     inline const char *name(size_t index){return traits::reg_aliases.at(index);} | ||||
|  | ||||
| <%if(fcsr != null) {%> | ||||
|     inline const char *fname(size_t index){return index < 32?name(index+traits::F0):"illegal";}    | ||||
| <%}%> | ||||
|     template <typename T> inline ConstantInt *size(T type) { | ||||
|         return ConstantInt::get(getContext(), APInt(32, type->getType()->getScalarSizeInBits())); | ||||
|     } | ||||
| @@ -96,19 +101,17 @@ protected: | ||||
|         return super::gen_cond_assign(cond, this->gen_ext(trueVal, size), this->gen_ext(falseVal, size)); | ||||
|     } | ||||
|  | ||||
|     std::tuple<continuation_e, BasicBlock *> gen_single_inst_behavior(virt_addr_t &, unsigned int &, BasicBlock *) override; | ||||
|     std::tuple<continuation_e, BasicBlock *> gen_single_inst_behavior(virt_addr_t &, BasicBlock *) override; | ||||
|  | ||||
|     void gen_leave_behavior(BasicBlock *leave_blk) override; | ||||
|  | ||||
|     void gen_raise_trap(uint16_t trap_id, uint16_t cause); | ||||
|  | ||||
|     void gen_leave_trap(unsigned lvl); | ||||
|  | ||||
|     void gen_wait(unsigned type); | ||||
|  | ||||
|     void set_tval(uint64_t new_tval); | ||||
|     void set_tval(Value* new_tval); | ||||
|     void gen_trap_behavior(BasicBlock *) override; | ||||
|  | ||||
|     void gen_trap_check(BasicBlock *bb); | ||||
|     void gen_instr_prologue(); | ||||
|     void gen_instr_epilogue(BasicBlock *bb); | ||||
|  | ||||
|     inline Value *gen_reg_load(unsigned i, unsigned level = 0) { | ||||
|         return this->builder.CreateLoad(this->get_typeptr(i), get_reg_ptr(i), false); | ||||
| @@ -132,51 +135,58 @@ protected: | ||||
|         auto sign_mask = 1ULL<<(W-1); | ||||
|         return (from & mask) | ((from & sign_mask) ? ~mask : 0); | ||||
|     } | ||||
|  | ||||
| <%functions.each{ it.eachLine { %> | ||||
|     ${it}<%}%> | ||||
| <%}%> | ||||
| private: | ||||
|     /**************************************************************************** | ||||
|      * start opcode definitions | ||||
|      ****************************************************************************/ | ||||
|     struct instruction_descriptor { | ||||
|         size_t length; | ||||
|         uint32_t length; | ||||
|         uint32_t value; | ||||
|         uint32_t mask; | ||||
|         compile_func op; | ||||
|     }; | ||||
|     struct decoding_tree_node{ | ||||
|         std::vector<instruction_descriptor> instrs; | ||||
|         std::vector<decoding_tree_node*> children; | ||||
|         uint32_t submask = std::numeric_limits<uint32_t>::max(); | ||||
|         uint32_t value; | ||||
|         decoding_tree_node(uint32_t value) : value(value){} | ||||
|     }; | ||||
|  | ||||
|     decoding_tree_node* root {nullptr}; | ||||
|  | ||||
|     const std::array<instruction_descriptor, ${instructions.size}> instr_descr = {{ | ||||
|     const std::array<instruction_descriptor, ${instructions.size()}> instr_descr = {{ | ||||
|          /* entries are: size, valid value, valid mask, function ptr */<%instructions.each{instr -> %> | ||||
|         /* instruction ${instr.instruction.name}, encoding '${instr.encoding}' */ | ||||
|         {${instr.length}, ${instr.encoding}, ${instr.mask}, &this_class::__${generator.functionName(instr.name)}},<%}%> | ||||
|     }}; | ||||
|  | ||||
|     //needs to be declared after instr_descr | ||||
|     decoder instr_decoder; | ||||
|  | ||||
|     /* instruction definitions */<%instructions.eachWithIndex{instr, idx -> %> | ||||
|     /* instruction ${idx}: ${instr.name} */ | ||||
|     std::tuple<continuation_e, BasicBlock*> __${generator.functionName(instr.name)}(virt_addr_t& pc, code_word_t instr, BasicBlock* bb){ | ||||
|         bb->setName(fmt::format("${instr.name}_0x{:X}",pc.val)); | ||||
|         this->gen_sync(PRE_SYNC,${idx}); | ||||
|         uint64_t PC = pc.val; | ||||
|         <%instr.fields.eachLine{%>${it} | ||||
|         <%}%>if(this->disass_enabled){ | ||||
|             /* generate console output when executing the command */<%instr.disass.eachLine{%> | ||||
|             ${it}<%}%> | ||||
|             std::vector<Value*> args { | ||||
|                 this->core_ptr, | ||||
|                 this->gen_const(64, pc.val), | ||||
|                 this->builder.CreateGlobalStringPtr(mnemonic), | ||||
|             }; | ||||
|             this->builder.CreateCall(this->mod->getFunction("print_disass"), args); | ||||
|         } | ||||
|         auto cur_pc_val = this->gen_const(32,pc.val); | ||||
|         bb->setName(fmt::format("${instr.name}_0x{:X}",pc.val)); | ||||
|         this->gen_sync(PRE_SYNC,${idx}); | ||||
|          | ||||
|         this->gen_set_pc(pc, traits::PC); | ||||
|         this->set_tval(instr); | ||||
|         pc=pc+ ${instr.length/8}; | ||||
|         this->gen_set_pc(pc, traits::NEXT_PC); | ||||
|          | ||||
|         this->gen_instr_prologue(); | ||||
|         /*generate behavior*/ | ||||
|         <%instr.behavior.eachLine{%>${it} | ||||
|         <%}%> | ||||
|         this->gen_trap_check(bb); | ||||
|     	this->gen_sync(POST_SYNC, ${idx}); | ||||
|         this->gen_sync(POST_SYNC, ${idx}); | ||||
|         this->gen_instr_epilogue(bb); | ||||
|         this->builder.CreateBr(bb); | ||||
|     	return returnValue;         | ||||
|     } | ||||
| @@ -184,8 +194,17 @@ private: | ||||
|     /**************************************************************************** | ||||
|      * end opcode definitions | ||||
|      ****************************************************************************/ | ||||
|     std::tuple<continuation_e, BasicBlock *> illegal_intruction(virt_addr_t &pc, code_word_t instr, BasicBlock *bb) { | ||||
| 		this->gen_sync(iss::PRE_SYNC, instr_descr.size()); | ||||
|     std::tuple<continuation_e, BasicBlock *> illegal_instruction(virt_addr_t &pc, code_word_t instr, BasicBlock *bb) { | ||||
|         if(this->disass_enabled){ | ||||
|             auto mnemonic = std::string("illegal_instruction"); | ||||
|             std::vector<Value*> args { | ||||
|                 this->core_ptr, | ||||
|                 this->gen_const(64, pc.val), | ||||
|                 this->builder.CreateGlobalStringPtr(mnemonic), | ||||
|             }; | ||||
|             this->builder.CreateCall(this->mod->getFunction("print_disass"), args); | ||||
|         } | ||||
|         this->gen_sync(iss::PRE_SYNC, instr_descr.size()); | ||||
|         this->builder.CreateStore(this->builder.CreateLoad(this->get_typeptr(traits::NEXT_PC), get_reg_ptr(traits::NEXT_PC), true), | ||||
|                                    get_reg_ptr(traits::PC), true); | ||||
|         this->builder.CreateStore( | ||||
| @@ -193,62 +212,13 @@ private: | ||||
|                                      this->gen_const(64U, 1)), | ||||
|             get_reg_ptr(traits::ICOUNT), true); | ||||
|         pc = pc + ((instr & 3) == 3 ? 4 : 2); | ||||
|         this->set_tval(instr); | ||||
|         this->gen_raise_trap(0, 2);     // illegal instruction trap | ||||
| 		this->gen_sync(iss::POST_SYNC, instr_descr.size()); | ||||
|         this->gen_trap_check(this->leave_blk); | ||||
|         return std::make_tuple(BRANCH, nullptr); | ||||
|     }     | ||||
|     //decoding functionality | ||||
|  | ||||
|     void populate_decoding_tree(decoding_tree_node* root){ | ||||
|         //create submask | ||||
|         for(auto instr: root->instrs){ | ||||
|             root->submask &= instr.mask; | ||||
|         } | ||||
|         //put each instr according to submask&encoding into children | ||||
|         for(auto instr: root->instrs){ | ||||
|             bool foundMatch = false; | ||||
|             for(auto child: root->children){ | ||||
|                 //use value as identifying trait | ||||
|                 if(child->value == (instr.value&root->submask)){ | ||||
|                     child->instrs.push_back(instr); | ||||
|                     foundMatch = true; | ||||
|                 } | ||||
|             } | ||||
|             if(!foundMatch){ | ||||
|                 decoding_tree_node* child = new decoding_tree_node(instr.value&root->submask); | ||||
|                 child->instrs.push_back(instr); | ||||
|                 root->children.push_back(child); | ||||
|             } | ||||
|         } | ||||
|         root->instrs.clear(); | ||||
|         //call populate_decoding_tree for all children | ||||
|         if(root->children.size() >1) | ||||
|             for(auto child: root->children){ | ||||
|                 populate_decoding_tree(child);       | ||||
|             } | ||||
|         else{ | ||||
|             //sort instrs by value of the mask, this works bc we want to have the least restrictive one last | ||||
|             std::sort(root->children[0]->instrs.begin(), root->children[0]->instrs.end(), [](const instruction_descriptor& instr1, const instruction_descriptor& instr2) { | ||||
|             return instr1.mask > instr2.mask; | ||||
|             });  | ||||
|         } | ||||
|     } | ||||
|     compile_func decode_instr(decoding_tree_node* node, code_word_t word){ | ||||
|         if(!node->children.size()){ | ||||
|             if(node->instrs.size() == 1) return node->instrs[0].op; | ||||
|             for(auto instr : node->instrs){ | ||||
|                 if((instr.mask&word) == instr.value) return instr.op; | ||||
|             } | ||||
|         } | ||||
|         else{ | ||||
|             for(auto child : node->children){ | ||||
|                 if (child->value == (node->submask&word)){ | ||||
|                     return decode_instr(child, word); | ||||
|                 }   | ||||
|             }   | ||||
|         } | ||||
|         return nullptr; | ||||
|         bb = this->leave_blk; | ||||
|         this->gen_instr_epilogue(bb); | ||||
|         this->builder.CreateBr(bb); | ||||
|         return std::make_tuple(ILLEGAL_INSTR, nullptr); | ||||
|     }     | ||||
| }; | ||||
|  | ||||
| @@ -261,17 +231,20 @@ template <typename ARCH> vm_impl<ARCH>::vm_impl() { this(new ARCH()); } | ||||
|  | ||||
| template <typename ARCH> | ||||
| vm_impl<ARCH>::vm_impl(ARCH &core, unsigned core_id, unsigned cluster_id) | ||||
| : vm_base<ARCH>(core, core_id, cluster_id) { | ||||
|     root = new decoding_tree_node(std::numeric_limits<uint32_t>::max()); | ||||
|     for(auto instr:instr_descr){ | ||||
|         root->instrs.push_back(instr); | ||||
|     } | ||||
|     populate_decoding_tree(root); | ||||
| } | ||||
| : vm_base<ARCH>(core, core_id, cluster_id) | ||||
| , instr_decoder([this]() { | ||||
|         std::vector<generic_instruction_descriptor> g_instr_descr; | ||||
|         g_instr_descr.reserve(instr_descr.size()); | ||||
|         for (uint32_t i = 0; i < instr_descr.size(); ++i) { | ||||
|             generic_instruction_descriptor new_instr_descr {instr_descr[i].value, instr_descr[i].mask, i}; | ||||
|             g_instr_descr.push_back(new_instr_descr); | ||||
|         } | ||||
|         return std::move(g_instr_descr); | ||||
|     }()) {} | ||||
|  | ||||
| template <typename ARCH> | ||||
| std::tuple<continuation_e, BasicBlock *> | ||||
| vm_impl<ARCH>::gen_single_inst_behavior(virt_addr_t &pc, unsigned int &inst_cnt, BasicBlock *this_block) { | ||||
| vm_impl<ARCH>::gen_single_inst_behavior(virt_addr_t &pc, BasicBlock *this_block) { | ||||
|     // we fetch at max 4 byte, alignment is 2 | ||||
|     enum {TRAP_ID=1<<16}; | ||||
|     code_word_t instr = 0; | ||||
| @@ -280,65 +253,83 @@ vm_impl<ARCH>::gen_single_inst_behavior(virt_addr_t &pc, unsigned int &inst_cnt, | ||||
|     auto *const data = (uint8_t *)&instr; | ||||
|     if(this->core.has_mmu()) | ||||
|         paddr = this->core.virt2phys(pc); | ||||
|     //TODO: re-add page handling | ||||
| //    if ((pc.val & upper_bits) != ((pc.val + 2) & upper_bits)) { // we may cross a page boundary | ||||
| //        auto res = this->core.read(paddr, 2, data); | ||||
| //        if (res != iss::Ok) throw trap_access(TRAP_ID, pc.val); | ||||
| //        if ((instr & 0x3) == 0x3) { // this is a 32bit instruction | ||||
| //            res = this->core.read(this->core.v2p(pc + 2), 2, data + 2); | ||||
| //        } | ||||
| //    } else { | ||||
|         auto res = this->core.read(paddr, 4, data); | ||||
|         if (res != iss::Ok) throw trap_access(TRAP_ID, pc.val); | ||||
| //    } | ||||
|     if (instr == 0x0000006f || (instr&0xffff)==0xa001) throw simulation_stopped(0); // 'J 0' or 'C.J 0' | ||||
|     // curr pc on stack | ||||
|     ++inst_cnt; | ||||
|     auto f = decode_instr(root, instr); | ||||
|     auto res = this->core.read(paddr, 4, data); | ||||
|     if (res != iss::Ok)  | ||||
|         return std::make_tuple(ILLEGAL_FETCH, nullptr); | ||||
|     if (instr == 0x0000006f || (instr&0xffff)==0xa001){ | ||||
|         this->builder.CreateBr(this->leave_blk); | ||||
|         return std::make_tuple(JUMP_TO_SELF, nullptr); | ||||
|         } | ||||
|     uint32_t inst_index = instr_decoder.decode_instr(instr); | ||||
|     compile_func f = nullptr; | ||||
|     if(inst_index < instr_descr.size()) | ||||
|         f = instr_descr[inst_index].op; | ||||
|     if (f == nullptr) { | ||||
|         f = &this_class::illegal_intruction; | ||||
|         f = &this_class::illegal_instruction; | ||||
|     } | ||||
|     return (this->*f)(pc, instr, this_block); | ||||
| } | ||||
|  | ||||
| template <typename ARCH> void vm_impl<ARCH>::gen_leave_behavior(BasicBlock *leave_blk) { | ||||
| template <typename ARCH> | ||||
| void vm_impl<ARCH>::gen_leave_behavior(BasicBlock *leave_blk) { | ||||
|     this->builder.SetInsertPoint(leave_blk); | ||||
|     this->builder.CreateRet(this->builder.CreateLoad(this->get_typeptr(traits::NEXT_PC),get_reg_ptr(traits::NEXT_PC), false)); | ||||
| } | ||||
|  | ||||
| template <typename ARCH> void vm_impl<ARCH>::gen_raise_trap(uint16_t trap_id, uint16_t cause) { | ||||
| template <typename ARCH> | ||||
| void vm_impl<ARCH>::gen_raise_trap(uint16_t trap_id, uint16_t cause) { | ||||
|     auto *TRAP_val = this->gen_const(32, 0x80 << 24 | (cause << 16) | trap_id); | ||||
|     this->builder.CreateStore(TRAP_val, get_reg_ptr(traits::TRAP_STATE), true); | ||||
|     this->builder.CreateStore(this->gen_const(32U, std::numeric_limits<uint32_t>::max()), get_reg_ptr(traits::LAST_BRANCH), false); | ||||
|     this->builder.CreateBr(this->trap_blk); | ||||
| } | ||||
|  | ||||
| template <typename ARCH> void vm_impl<ARCH>::gen_leave_trap(unsigned lvl) { | ||||
| template <typename ARCH> | ||||
| void vm_impl<ARCH>::gen_leave_trap(unsigned lvl) { | ||||
|     std::vector<Value *> args{ this->core_ptr, ConstantInt::get(getContext(), APInt(64, lvl)) }; | ||||
|     this->builder.CreateCall(this->mod->getFunction("leave_trap"), args); | ||||
|     auto *PC_val = this->gen_read_mem(traits::CSR, (lvl << 8) + 0x41, traits::XLEN / 8); | ||||
|     this->builder.CreateStore(PC_val, get_reg_ptr(traits::NEXT_PC), false); | ||||
|     this->builder.CreateStore(this->gen_const(32U, std::numeric_limits<uint32_t>::max()), get_reg_ptr(traits::LAST_BRANCH), false); | ||||
|     this->builder.CreateStore(this->gen_const(32U, static_cast<int>(UNKNOWN_JUMP)), get_reg_ptr(traits::LAST_BRANCH), false); | ||||
| } | ||||
|  | ||||
| template <typename ARCH> void vm_impl<ARCH>::gen_wait(unsigned type) { | ||||
| template <typename ARCH> | ||||
| void vm_impl<ARCH>::gen_wait(unsigned type) { | ||||
|     std::vector<Value *> args{ this->core_ptr, ConstantInt::get(getContext(), APInt(64, type)) }; | ||||
|     this->builder.CreateCall(this->mod->getFunction("wait"), args); | ||||
| } | ||||
|  | ||||
| template <typename ARCH> void vm_impl<ARCH>::gen_trap_behavior(BasicBlock *trap_blk) { | ||||
| template <typename ARCH> | ||||
| inline void vm_impl<ARCH>::set_tval(uint64_t tval) { | ||||
|     auto tmp_tval = this->gen_const(64, tval); | ||||
|     this->set_tval(tmp_tval); | ||||
| } | ||||
| template <typename ARCH> | ||||
| inline void vm_impl<ARCH>::set_tval(Value* new_tval) { | ||||
|     this->builder.CreateStore(this->gen_ext(new_tval, 64, false), this->tval); | ||||
| } | ||||
| template <typename ARCH>  | ||||
| void vm_impl<ARCH>::gen_trap_behavior(BasicBlock *trap_blk) { | ||||
|     this->builder.SetInsertPoint(trap_blk); | ||||
|     this->gen_sync(POST_SYNC, -1); //TODO get right InstrId | ||||
|     auto *trap_state_val = this->builder.CreateLoad(this->get_typeptr(traits::TRAP_STATE), get_reg_ptr(traits::TRAP_STATE), true); | ||||
|     this->builder.CreateStore(this->gen_const(32U, std::numeric_limits<uint32_t>::max()), | ||||
|                               get_reg_ptr(traits::LAST_BRANCH), false); | ||||
|     std::vector<Value *> args{this->core_ptr, this->adj_to64(trap_state_val), | ||||
|                               this->adj_to64(this->builder.CreateLoad(this->get_typeptr(traits::PC), get_reg_ptr(traits::PC), false))}; | ||||
|     auto *cur_pc_val = this->builder.CreateLoad(this->get_typeptr(traits::PC), get_reg_ptr(traits::PC), true); | ||||
|     std::vector<Value *> args{this->core_ptr, | ||||
|                                 this->adj_to64(trap_state_val), | ||||
|                                 this->adj_to64(cur_pc_val), | ||||
|                               this->adj_to64(this->builder.CreateLoad(this->get_type(64),this->tval))}; | ||||
|     this->builder.CreateCall(this->mod->getFunction("enter_trap"), args); | ||||
|     this->builder.CreateStore(this->gen_const(32U, static_cast<int>(UNKNOWN_JUMP)), get_reg_ptr(traits::LAST_BRANCH), false); | ||||
|  | ||||
|     auto *trap_addr_val = this->builder.CreateLoad(this->get_typeptr(traits::NEXT_PC), get_reg_ptr(traits::NEXT_PC), false); | ||||
|     this->builder.CreateRet(trap_addr_val); | ||||
| } | ||||
| template <typename ARCH> | ||||
| void vm_impl<ARCH>::gen_instr_prologue() { | ||||
|     auto* trap_val = | ||||
|         this->builder.CreateLoad(this->get_typeptr(arch::traits<ARCH>::PENDING_TRAP), get_reg_ptr(arch::traits<ARCH>::PENDING_TRAP)); | ||||
|     this->builder.CreateStore(trap_val, get_reg_ptr(arch::traits<ARCH>::TRAP_STATE), false); | ||||
| } | ||||
|              | ||||
| template <typename ARCH> inline void vm_impl<ARCH>::gen_trap_check(BasicBlock *bb) { | ||||
|  | ||||
| template <typename ARCH> | ||||
| void vm_impl<ARCH>::gen_instr_epilogue(BasicBlock *bb) { | ||||
|     auto* target_bb = BasicBlock::Create(this->mod->getContext(), "", this->func, bb); | ||||
|     auto *v = this->builder.CreateLoad(this->get_typeptr(traits::TRAP_STATE), get_reg_ptr(traits::TRAP_STATE), true); | ||||
|     this->gen_cond_branch(this->builder.CreateICmp( | ||||
| @@ -346,6 +337,14 @@ template <typename ARCH> inline void vm_impl<ARCH>::gen_trap_check(BasicBlock *b | ||||
|                               ConstantInt::get(getContext(), APInt(v->getType()->getIntegerBitWidth(), 0))), | ||||
|                           target_bb, this->trap_blk, 1); | ||||
|     this->builder.SetInsertPoint(target_bb); | ||||
|     // update icount | ||||
|     auto* icount_val = this->builder.CreateAdd( | ||||
|         this->builder.CreateLoad(this->get_typeptr(arch::traits<ARCH>::ICOUNT), get_reg_ptr(arch::traits<ARCH>::ICOUNT)), this->gen_const(64U, 1)); | ||||
|     this->builder.CreateStore(icount_val, get_reg_ptr(arch::traits<ARCH>::ICOUNT), false); | ||||
|     //increment cyclecount | ||||
|     auto* cycle_val = this->builder.CreateAdd( | ||||
|         this->builder.CreateLoad(this->get_typeptr(arch::traits<ARCH>::CYCLE), get_reg_ptr(arch::traits<ARCH>::CYCLE)), this->gen_const(64U, 1)); | ||||
|     this->builder.CreateStore(cycle_val, get_reg_ptr(arch::traits<ARCH>::CYCLE), false); | ||||
| } | ||||
|  | ||||
| } // namespace ${coreDef.name.toLowerCase()} | ||||
| @@ -359,24 +358,33 @@ std::unique_ptr<vm_if> create<arch::${coreDef.name.toLowerCase()}>(arch::${coreD | ||||
| } // namespace llvm | ||||
| } // namespace iss | ||||
|  | ||||
| #include <iss/factory.h> | ||||
| #include <iss/arch/riscv_hart_m_p.h> | ||||
| #include <iss/arch/riscv_hart_mu_p.h> | ||||
| #include <iss/factory.h> | ||||
| namespace iss { | ||||
| namespace { | ||||
| volatile std::array<bool, 2> dummy = { | ||||
|         core_factory::instance().register_creator("${coreDef.name.toLowerCase()}|m_p|llvm", [](unsigned port, void*) -> std::tuple<cpu_ptr, vm_ptr>{ | ||||
|         core_factory::instance().register_creator("${coreDef.name.toLowerCase()}|m_p|llvm", [](unsigned port, void* init_data) -> std::tuple<cpu_ptr, vm_ptr>{ | ||||
|             auto* cpu = new iss::arch::riscv_hart_m_p<iss::arch::${coreDef.name.toLowerCase()}>(); | ||||
|             auto* vm = new llvm::${coreDef.name.toLowerCase()}::vm_impl<arch::${coreDef.name.toLowerCase()}>(*cpu, false); | ||||
|             if (port != 0) debugger::server<debugger::gdb_session>::run_server(vm, port); | ||||
| 		    auto vm = new llvm::${coreDef.name.toLowerCase()}::vm_impl<arch::${coreDef.name.toLowerCase()}>(*cpu, false); | ||||
| 		    if (port != 0) debugger::server<debugger::gdb_session>::run_server(vm, port); | ||||
|             if(init_data){ | ||||
|                 auto* cb = reinterpret_cast<std::function<void(arch_if*, arch::traits<arch::${coreDef.name.toLowerCase()}>::reg_t*, arch::traits<arch::${coreDef.name.toLowerCase()}>::reg_t*)>*>(init_data); | ||||
|                 cpu->set_semihosting_callback(*cb); | ||||
|             } | ||||
|             return {cpu_ptr{cpu}, vm_ptr{vm}}; | ||||
|         }), | ||||
|         core_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p|llvm", [](unsigned port, void*) -> std::tuple<cpu_ptr, vm_ptr>{ | ||||
|         core_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p|llvm", [](unsigned port, void* init_data) -> std::tuple<cpu_ptr, vm_ptr>{ | ||||
|             auto* cpu = new iss::arch::riscv_hart_mu_p<iss::arch::${coreDef.name.toLowerCase()}>(); | ||||
|             auto* vm = new llvm::${coreDef.name.toLowerCase()}::vm_impl<arch::${coreDef.name.toLowerCase()}>(*cpu, false); | ||||
|             if (port != 0) debugger::server<debugger::gdb_session>::run_server(vm, port); | ||||
| 		    auto vm = new llvm::${coreDef.name.toLowerCase()}::vm_impl<arch::${coreDef.name.toLowerCase()}>(*cpu, false); | ||||
| 		    if (port != 0) debugger::server<debugger::gdb_session>::run_server(vm, port); | ||||
|             if(init_data){ | ||||
|                 auto* cb = reinterpret_cast<std::function<void(arch_if*, arch::traits<arch::${coreDef.name.toLowerCase()}>::reg_t*, arch::traits<arch::${coreDef.name.toLowerCase()}>::reg_t*)>*>(init_data); | ||||
|                 cpu->set_semihosting_callback(*cb); | ||||
|             } | ||||
|             return {cpu_ptr{cpu}, vm_ptr{vm}}; | ||||
|         }) | ||||
| }; | ||||
| } | ||||
| } | ||||
| // clang-format on | ||||
|   | ||||
| @@ -1,5 +1,5 @@ | ||||
| /******************************************************************************* | ||||
|  * Copyright (C) 2020 MINRES Technologies GmbH | ||||
|  * Copyright (C) 2020-2024 MINRES Technologies GmbH | ||||
|  * All rights reserved. | ||||
|  * | ||||
|  * Redistribution and use in source and binary forms, with or without | ||||
| @@ -29,7 +29,7 @@ | ||||
|  * POSSIBILITY OF SUCH DAMAGE. | ||||
|  * | ||||
|  *******************************************************************************/ | ||||
|  | ||||
| // clang-format off | ||||
| #include <iss/arch/${coreDef.name.toLowerCase()}.h> | ||||
| #include <iss/debugger/gdb_session.h> | ||||
| #include <iss/debugger/server.h> | ||||
| @@ -37,7 +37,10 @@ | ||||
| #include <iss/tcc/vm_base.h> | ||||
| #include <util/logging.h> | ||||
| #include <sstream> | ||||
|  | ||||
| #include <iss/instruction_decoder.h> | ||||
| <%def fcsr = registers.find {it.name=='FCSR'} | ||||
| if(fcsr != null) {%> | ||||
| #include <vm/fp_functions.h><%}%> | ||||
| #ifndef FMT_HEADER_ONLY | ||||
| #define FMT_HEADER_ONLY | ||||
| #endif | ||||
| @@ -80,16 +83,21 @@ protected: | ||||
|     using vm_base<ARCH>::get_reg_ptr; | ||||
|  | ||||
|     using this_class = vm_impl<ARCH>; | ||||
|     using compile_ret_t = std::tuple<continuation_e>; | ||||
|     using compile_ret_t = continuation_e; | ||||
|     using compile_func = compile_ret_t (this_class::*)(virt_addr_t &pc, code_word_t instr, tu_builder&); | ||||
|  | ||||
|     inline const char *name(size_t index){return traits::reg_aliases.at(index);} | ||||
| <% | ||||
| if(fcsr != null) {%> | ||||
|     inline const char *fname(size_t index){return index < 32?name(index+traits::F0):"illegal";}    | ||||
| <%}%> | ||||
|     void add_prologue(tu_builder& tu) override; | ||||
|  | ||||
|     void setup_module(std::string m) override { | ||||
|         super::setup_module(m); | ||||
|     } | ||||
|  | ||||
|     compile_ret_t gen_single_inst_behavior(virt_addr_t &, unsigned int &, tu_builder&) override; | ||||
|     compile_ret_t gen_single_inst_behavior(virt_addr_t &, tu_builder&) override; | ||||
|  | ||||
|     void gen_trap_behavior(tu_builder& tu) override; | ||||
|  | ||||
| @@ -97,7 +105,9 @@ protected: | ||||
|  | ||||
|     void gen_leave_trap(tu_builder& tu, unsigned lvl); | ||||
|  | ||||
|     void gen_wait(tu_builder& tu, unsigned type); | ||||
|     inline void gen_set_tval(tu_builder& tu, uint64_t new_tval); | ||||
|  | ||||
|     inline void gen_set_tval(tu_builder& tu, value new_tval); | ||||
|  | ||||
|     inline void gen_trap_check(tu_builder& tu) { | ||||
|         tu("if(*trap_state!=0) goto trap_entry;"); | ||||
| @@ -128,32 +138,29 @@ protected: | ||||
|         return (from & mask) | ((from & sign_mask) ? ~mask : 0); | ||||
|     } | ||||
|  | ||||
| <%functions.each{ it.eachLine { %> | ||||
|     ${it}<%}%> | ||||
| <%}%> | ||||
| private: | ||||
|     /**************************************************************************** | ||||
|      * start opcode definitions | ||||
|      ****************************************************************************/ | ||||
|     struct instruction_descriptor { | ||||
|         size_t length; | ||||
|         uint32_t length; | ||||
|         uint32_t value; | ||||
|         uint32_t mask; | ||||
|         compile_func op; | ||||
|     }; | ||||
|     struct decoding_tree_node{ | ||||
|         std::vector<instruction_descriptor> instrs; | ||||
|         std::vector<decoding_tree_node*> children; | ||||
|         uint32_t submask = std::numeric_limits<uint32_t>::max(); | ||||
|         uint32_t value; | ||||
|         decoding_tree_node(uint32_t value) : value(value){} | ||||
|     }; | ||||
|  | ||||
|     decoding_tree_node* root {nullptr}; | ||||
|  | ||||
|     const std::array<instruction_descriptor, ${instructions.size}> instr_descr = {{ | ||||
|     const std::array<instruction_descriptor, ${instructions.size()}> instr_descr = {{ | ||||
|          /* entries are: size, valid value, valid mask, function ptr */<%instructions.each{instr -> %> | ||||
|         /* instruction ${instr.instruction.name}, encoding '${instr.encoding}' */ | ||||
|         {${instr.length}, ${instr.encoding}, ${instr.mask}, &this_class::__${generator.functionName(instr.name)}},<%}%> | ||||
|     }}; | ||||
|  | ||||
|     //needs to be declared after instr_descr | ||||
|     decoder instr_decoder; | ||||
|  | ||||
|     /* instruction definitions */<%instructions.eachWithIndex{instr, idx -> %> | ||||
|     /* instruction ${idx}: ${instr.name} */ | ||||
|     compile_ret_t __${generator.functionName(instr.name)}(virt_addr_t& pc, code_word_t instr, tu_builder& tu){ | ||||
| @@ -164,82 +171,37 @@ private: | ||||
|         <%}%>if(this->disass_enabled){ | ||||
|             /* generate console output when executing the command */<%instr.disass.eachLine{%> | ||||
|             ${it}<%}%> | ||||
|             tu("print_disass(core_ptr, {:#x}, \"{}\");", pc.val, mnemonic); | ||||
|         } | ||||
|         auto cur_pc_val = tu.constant(pc.val, traits::reg_bit_widths[traits::PC]); | ||||
|         pc=pc+ ${instr.length/8}; | ||||
|         gen_set_pc(tu, pc, traits::NEXT_PC); | ||||
|         tu("(*cycle)++;"); | ||||
|         tu.open_scope(); | ||||
|         this->gen_set_tval(tu, instr); | ||||
|         <%instr.behavior.eachLine{%>${it} | ||||
|         <%}%> | ||||
|         tu.close_scope(); | ||||
|         gen_trap_check(tu);         | ||||
|         vm_base<ARCH>::gen_sync(tu, POST_SYNC,${idx}); | ||||
|         gen_trap_check(tu);         | ||||
|         return returnValue; | ||||
|     } | ||||
|     <%}%> | ||||
|     /**************************************************************************** | ||||
|      * end opcode definitions | ||||
|      ****************************************************************************/ | ||||
|     compile_ret_t illegal_intruction(virt_addr_t &pc, code_word_t instr, tu_builder& tu) { | ||||
|     compile_ret_t illegal_instruction(virt_addr_t &pc, code_word_t instr, tu_builder& tu) { | ||||
|         vm_impl::gen_sync(tu, iss::PRE_SYNC, instr_descr.size()); | ||||
|         if(this->disass_enabled){ | ||||
|             /* generate console output when executing the command */ | ||||
|             tu("print_disass(core_ptr, {:#x}, \"{}\");", pc.val, std::string("illegal_instruction")); | ||||
|         } | ||||
|         pc = pc + ((instr & 3) == 3 ? 4 : 2); | ||||
|         gen_raise_trap(tu, 0, 2);     // illegal instruction trap | ||||
|         gen_raise_trap(tu, 0, static_cast<int32_t>(traits:: RV_CAUSE_ILLEGAL_INSTRUCTION)); | ||||
|         this->gen_set_tval(tu, instr); | ||||
|         vm_impl::gen_sync(tu, iss::POST_SYNC, instr_descr.size()); | ||||
|         vm_impl::gen_trap_check(tu); | ||||
|         return BRANCH; | ||||
|     } | ||||
|      | ||||
|     //decoding functionality | ||||
|  | ||||
|     void populate_decoding_tree(decoding_tree_node* root){ | ||||
|         //create submask | ||||
|         for(auto instr: root->instrs){ | ||||
|             root->submask &= instr.mask; | ||||
|         } | ||||
|         //put each instr according to submask&encoding into children | ||||
|         for(auto instr: root->instrs){ | ||||
|             bool foundMatch = false; | ||||
|             for(auto child: root->children){ | ||||
|                 //use value as identifying trait | ||||
|                 if(child->value == (instr.value&root->submask)){ | ||||
|                     child->instrs.push_back(instr); | ||||
|                     foundMatch = true; | ||||
|                 } | ||||
|             } | ||||
|             if(!foundMatch){ | ||||
|                 decoding_tree_node* child = new decoding_tree_node(instr.value&root->submask); | ||||
|                 child->instrs.push_back(instr); | ||||
|                 root->children.push_back(child); | ||||
|             } | ||||
|         } | ||||
|         root->instrs.clear(); | ||||
|         //call populate_decoding_tree for all children | ||||
|         if(root->children.size() >1) | ||||
|             for(auto child: root->children){ | ||||
|                 populate_decoding_tree(child);       | ||||
|             } | ||||
|         else{ | ||||
|             //sort instrs by value of the mask, this works bc we want to have the least restrictive one last | ||||
|             std::sort(root->children[0]->instrs.begin(), root->children[0]->instrs.end(), [](const instruction_descriptor& instr1, const instruction_descriptor& instr2) { | ||||
|             return instr1.mask > instr2.mask; | ||||
|             });  | ||||
|         } | ||||
|     } | ||||
|     compile_func decode_instr(decoding_tree_node* node, code_word_t word){ | ||||
|         if(!node->children.size()){ | ||||
|             if(node->instrs.size() == 1) return node->instrs[0].op; | ||||
|             for(auto instr : node->instrs){ | ||||
|                 if((instr.mask&word) == instr.value) return instr.op; | ||||
|             } | ||||
|         } | ||||
|         else{ | ||||
|             for(auto child : node->children){ | ||||
|                 if (child->value == (node->submask&word)){ | ||||
|                     return decode_instr(child, word); | ||||
|                 }   | ||||
|             }   | ||||
|         } | ||||
|         return nullptr; | ||||
|         return ILLEGAL_INSTR; | ||||
|     } | ||||
| }; | ||||
|  | ||||
| @@ -252,65 +214,100 @@ template <typename ARCH> vm_impl<ARCH>::vm_impl() { this(new ARCH()); } | ||||
|  | ||||
| template <typename ARCH> | ||||
| vm_impl<ARCH>::vm_impl(ARCH &core, unsigned core_id, unsigned cluster_id) | ||||
| : vm_base<ARCH>(core, core_id, cluster_id) { | ||||
|     root = new decoding_tree_node(std::numeric_limits<uint32_t>::max()); | ||||
|     for(auto instr:instr_descr){ | ||||
|         root->instrs.push_back(instr); | ||||
|     } | ||||
|     populate_decoding_tree(root); | ||||
| } | ||||
| : vm_base<ARCH>(core, core_id, cluster_id) | ||||
| , instr_decoder([this]() { | ||||
|         std::vector<generic_instruction_descriptor> g_instr_descr; | ||||
|         g_instr_descr.reserve(instr_descr.size()); | ||||
|         for (uint32_t i = 0; i < instr_descr.size(); ++i) { | ||||
|             generic_instruction_descriptor new_instr_descr {instr_descr[i].value, instr_descr[i].mask, i}; | ||||
|             g_instr_descr.push_back(new_instr_descr); | ||||
|         } | ||||
|         return std::move(g_instr_descr); | ||||
|     }()) {} | ||||
|  | ||||
| template <typename ARCH> | ||||
| std::tuple<continuation_e> | ||||
| vm_impl<ARCH>::gen_single_inst_behavior(virt_addr_t &pc, unsigned int &inst_cnt, tu_builder& tu) { | ||||
| continuation_e | ||||
| vm_impl<ARCH>::gen_single_inst_behavior(virt_addr_t &pc, tu_builder& tu) { | ||||
|     // we fetch at max 4 byte, alignment is 2 | ||||
|     enum {TRAP_ID=1<<16}; | ||||
|     code_word_t instr = 0; | ||||
|     phys_addr_t paddr(pc); | ||||
|     if(this->core.has_mmu()) | ||||
|         paddr = this->core.virt2phys(pc); | ||||
|     //TODO: re-add page handling | ||||
| //    if ((pc.val & upper_bits) != ((pc.val + 2) & upper_bits)) { // we may cross a page boundary | ||||
| //        auto res = this->core.read(paddr, 2, data); | ||||
| //        if (res != iss::Ok) throw trap_access(TRAP_ID, pc.val); | ||||
| //        if ((insn & 0x3) == 0x3) { // this is a 32bit instruction | ||||
| //            res = this->core.read(this->core.v2p(pc + 2), 2, data + 2); | ||||
| //        } | ||||
| //    } else { | ||||
|         auto res = this->core.read(paddr, 4, reinterpret_cast<uint8_t*>(&instr)); | ||||
|         if (res != iss::Ok) throw trap_access(TRAP_ID, pc.val); | ||||
| //    } | ||||
|     if (instr == 0x0000006f || (instr&0xffff)==0xa001) throw simulation_stopped(0); // 'J 0' or 'C.J 0' | ||||
|     // curr pc on stack | ||||
|     ++inst_cnt; | ||||
|     auto f = decode_instr(root, instr); | ||||
|     auto res = this->core.read(paddr, 4, reinterpret_cast<uint8_t*>(&instr)); | ||||
|     if (res != iss::Ok) | ||||
|         return ILLEGAL_FETCH; | ||||
|     if (instr == 0x0000006f || (instr&0xffff)==0xa001)  | ||||
|         return JUMP_TO_SELF; | ||||
|     uint32_t inst_index = instr_decoder.decode_instr(instr); | ||||
|     compile_func f = nullptr; | ||||
|     if(inst_index < instr_descr.size()) | ||||
|         f = instr_descr[inst_index].op; | ||||
|     if (f == nullptr) { | ||||
|         f = &this_class::illegal_intruction; | ||||
|         f = &this_class::illegal_instruction; | ||||
|     } | ||||
|     return (this->*f)(pc, instr, tu); | ||||
| } | ||||
|  | ||||
| template <typename ARCH> void vm_impl<ARCH>::gen_raise_trap(tu_builder& tu, uint16_t trap_id, uint16_t cause) { | ||||
|     tu("  *trap_state = {:#x};", 0x80 << 24 | (cause << 16) | trap_id); | ||||
|     tu.store(traits::LAST_BRANCH, tu.constant(std::numeric_limits<uint32_t>::max(), 32)); | ||||
| } | ||||
|  | ||||
| template <typename ARCH> void vm_impl<ARCH>::gen_leave_trap(tu_builder& tu, unsigned lvl) { | ||||
|     tu("leave_trap(core_ptr, {});", lvl); | ||||
|     tu.store(traits::NEXT_PC, tu.read_mem(traits::CSR, (lvl << 8) + 0x41, traits::XLEN)); | ||||
|     tu.store(traits::LAST_BRANCH, tu.constant(std::numeric_limits<uint32_t>::max(), 32)); | ||||
|     tu.store(traits::LAST_BRANCH, tu.constant(static_cast<int>(UNKNOWN_JUMP), 32)); | ||||
| } | ||||
|  | ||||
| template <typename ARCH> void vm_impl<ARCH>::gen_wait(tu_builder& tu, unsigned type) { | ||||
| template <typename ARCH> void vm_impl<ARCH>::gen_set_tval(tu_builder& tu, uint64_t new_tval) { | ||||
|     tu(fmt::format("tval = {};", new_tval)); | ||||
| } | ||||
| template <typename ARCH> void vm_impl<ARCH>::gen_set_tval(tu_builder& tu, value new_tval) { | ||||
|     tu(fmt::format("tval = {};", new_tval.str)); | ||||
| } | ||||
|  | ||||
| template <typename ARCH> void vm_impl<ARCH>::gen_trap_behavior(tu_builder& tu) { | ||||
|     tu("trap_entry:"); | ||||
|     this->gen_sync(tu, POST_SYNC, -1);     | ||||
|     tu("enter_trap(core_ptr, *trap_state, *pc, 0);"); | ||||
|     tu.store(traits::LAST_BRANCH, tu.constant(std::numeric_limits<uint32_t>::max(),32)); | ||||
|     tu("enter_trap(core_ptr, *trap_state, *pc, tval);"); | ||||
|     tu.store(traits::LAST_BRANCH, tu.constant(static_cast<int>(UNKNOWN_JUMP),32)); | ||||
|     tu("return *next_pc;"); | ||||
| } | ||||
| template <typename ARCH> void vm_impl<ARCH>::add_prologue(tu_builder& tu){ | ||||
|     std::ostringstream os; | ||||
|     os << tu.add_reg_ptr("trap_state", arch::traits<ARCH>::TRAP_STATE, this->regs_base_ptr); | ||||
|     os << tu.add_reg_ptr("pending_trap", arch::traits<ARCH>::PENDING_TRAP, this->regs_base_ptr); | ||||
|     os << tu.add_reg_ptr("cycle", arch::traits<ARCH>::CYCLE, this->regs_base_ptr); | ||||
| <%if(fcsr != null) {%> | ||||
|     os << "uint32_t (*fget_flags)()=" << (uintptr_t)&fget_flags << ";\\n"; | ||||
|     os << "uint32_t (*fadd_s)(uint32_t v1, uint32_t v2, uint8_t mode)=" << (uintptr_t)&fadd_s << ";\\n"; | ||||
|     os << "uint32_t (*fsub_s)(uint32_t v1, uint32_t v2, uint8_t mode)=" << (uintptr_t)&fsub_s << ";\\n"; | ||||
|     os << "uint32_t (*fmul_s)(uint32_t v1, uint32_t v2, uint8_t mode)=" << (uintptr_t)&fmul_s << ";\\n"; | ||||
|     os << "uint32_t (*fdiv_s)(uint32_t v1, uint32_t v2, uint8_t mode)=" << (uintptr_t)&fdiv_s << ";\\n"; | ||||
|     os << "uint32_t (*fsqrt_s)(uint32_t v1, uint8_t mode)=" << (uintptr_t)&fsqrt_s << ";\\n"; | ||||
|     os << "uint32_t (*fcmp_s)(uint32_t v1, uint32_t v2, uint32_t op)=" << (uintptr_t)&fcmp_s << ";\\n"; | ||||
|     os << "uint32_t (*fcvt_s)(uint32_t v1, uint32_t op, uint8_t mode)=" << (uintptr_t)&fcvt_s << ";\\n"; | ||||
|     os << "uint32_t (*fmadd_s)(uint32_t v1, uint32_t v2, uint32_t v3, uint32_t op, uint8_t mode)=" << (uintptr_t)&fmadd_s << ";\\n"; | ||||
|     os << "uint32_t (*fsel_s)(uint32_t v1, uint32_t v2, uint32_t op)=" << (uintptr_t)&fsel_s << ";\\n"; | ||||
|     os << "uint32_t (*fclass_s)( uint32_t v1 )=" << (uintptr_t)&fclass_s << ";\\n"; | ||||
|     os << "uint32_t (*fconv_d2f)(uint64_t v1, uint8_t mode)=" << (uintptr_t)&fconv_d2f << ";\\n"; | ||||
|     os << "uint64_t (*fconv_f2d)(uint32_t v1, uint8_t mode)=" << (uintptr_t)&fconv_f2d << ";\\n"; | ||||
|     os << "uint64_t (*fadd_d)(uint64_t v1, uint64_t v2, uint8_t mode)=" << (uintptr_t)&fadd_d << ";\\n"; | ||||
|     os << "uint64_t (*fsub_d)(uint64_t v1, uint64_t v2, uint8_t mode)=" << (uintptr_t)&fsub_d << ";\\n"; | ||||
|     os << "uint64_t (*fmul_d)(uint64_t v1, uint64_t v2, uint8_t mode)=" << (uintptr_t)&fmul_d << ";\\n"; | ||||
|     os << "uint64_t (*fdiv_d)(uint64_t v1, uint64_t v2, uint8_t mode)=" << (uintptr_t)&fdiv_d << ";\\n"; | ||||
|     os << "uint64_t (*fsqrt_d)(uint64_t v1, uint8_t mode)=" << (uintptr_t)&fsqrt_d << ";\\n"; | ||||
|     os << "uint64_t (*fcmp_d)(uint64_t v1, uint64_t v2, uint32_t op)=" << (uintptr_t)&fcmp_d << ";\\n"; | ||||
|     os << "uint64_t (*fcvt_d)(uint64_t v1, uint32_t op, uint8_t mode)=" << (uintptr_t)&fcvt_d << ";\\n"; | ||||
|     os << "uint64_t (*fmadd_d)(uint64_t v1, uint64_t v2, uint64_t v3, uint32_t op, uint8_t mode)=" << (uintptr_t)&fmadd_d << ";\\n"; | ||||
|     os << "uint64_t (*fsel_d)(uint64_t v1, uint64_t v2, uint32_t op)=" << (uintptr_t)&fsel_d << ";\\n"; | ||||
|     os << "uint64_t (*fclass_d)(uint64_t v1  )=" << (uintptr_t)&fclass_d << ";\\n"; | ||||
|     os << "uint64_t (*fcvt_32_64)(uint32_t v1, uint32_t op, uint8_t mode)=" << (uintptr_t)&fcvt_32_64 << ";\\n"; | ||||
|     os << "uint32_t (*fcvt_64_32)(uint64_t v1, uint32_t op, uint8_t mode)=" << (uintptr_t)&fcvt_64_32 << ";\\n"; | ||||
|     os << "uint32_t (*unbox_s)(uint64_t v)=" << (uintptr_t)&unbox_s << ";\\n"; | ||||
|     <%}%> | ||||
|     tu.add_prologue(os.str()); | ||||
| } | ||||
|  | ||||
| } // namespace ${coreDef.name.toLowerCase()} | ||||
|  | ||||
| @@ -323,24 +320,33 @@ std::unique_ptr<vm_if> create<arch::${coreDef.name.toLowerCase()}>(arch::${coreD | ||||
| } // namesapce tcc | ||||
| } // namespace iss | ||||
|  | ||||
| #include <iss/factory.h> | ||||
| #include <iss/arch/riscv_hart_m_p.h> | ||||
| #include <iss/arch/riscv_hart_mu_p.h> | ||||
| #include <iss/factory.h> | ||||
| namespace iss { | ||||
| namespace { | ||||
| volatile std::array<bool, 2> dummy = { | ||||
|         core_factory::instance().register_creator("${coreDef.name.toLowerCase()}|m_p|tcc", [](unsigned port, void*) -> std::tuple<cpu_ptr, vm_ptr>{ | ||||
|         core_factory::instance().register_creator("${coreDef.name.toLowerCase()}|m_p|tcc", [](unsigned port, void* init_data) -> std::tuple<cpu_ptr, vm_ptr>{ | ||||
|             auto* cpu = new iss::arch::riscv_hart_m_p<iss::arch::${coreDef.name.toLowerCase()}>(); | ||||
| 		    auto vm = new tcc::${coreDef.name.toLowerCase()}::vm_impl<arch::${coreDef.name.toLowerCase()}>(*cpu, false); | ||||
| 		    if (port != 0) debugger::server<debugger::gdb_session>::run_server(vm, port); | ||||
|             if(init_data){ | ||||
|                 auto* cb = reinterpret_cast<semihosting_cb_t<arch::traits<arch::${coreDef.name.toLowerCase()}>::reg_t>*>(init_data); | ||||
|                 cpu->set_semihosting_callback(*cb); | ||||
|             } | ||||
|             return {cpu_ptr{cpu}, vm_ptr{vm}}; | ||||
|         }), | ||||
|         core_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p|tcc", [](unsigned port, void*) -> std::tuple<cpu_ptr, vm_ptr>{ | ||||
|         core_factory::instance().register_creator("${coreDef.name.toLowerCase()}|mu_p|tcc", [](unsigned port, void* init_data) -> std::tuple<cpu_ptr, vm_ptr>{ | ||||
|             auto* cpu = new iss::arch::riscv_hart_mu_p<iss::arch::${coreDef.name.toLowerCase()}>(); | ||||
| 		    auto vm = new tcc::${coreDef.name.toLowerCase()}::vm_impl<arch::${coreDef.name.toLowerCase()}>(*cpu, false); | ||||
| 		    if (port != 0) debugger::server<debugger::gdb_session>::run_server(vm, port); | ||||
|             if(init_data){ | ||||
|                 auto* cb = reinterpret_cast<semihosting_cb_t<arch::traits<arch::${coreDef.name.toLowerCase()}>::reg_t>*>(init_data); | ||||
|                 cpu->set_semihosting_callback(*cb); | ||||
|             } | ||||
|             return {cpu_ptr{cpu}, vm_ptr{vm}}; | ||||
|         }) | ||||
| }; | ||||
| } | ||||
| } | ||||
| // clang-format on | ||||
							
								
								
									
										2
									
								
								softfloat/.gitignore
									
									
									
									
										vendored
									
									
										Normal file
									
								
							
							
						
						
									
										2
									
								
								softfloat/.gitignore
									
									
									
									
										vendored
									
									
										Normal file
									
								
							| @@ -0,0 +1,2 @@ | ||||
| build/*/*.o | ||||
| build/*/*.a | ||||
| @@ -327,7 +327,7 @@ set(OTHERS | ||||
|  | ||||
| set(LIB_SOURCES ${PRIMITIVES} ${SPECIALIZE} ${OTHERS}) | ||||
|  | ||||
| add_library(softfloat ${LIB_SOURCES}) | ||||
| add_library(softfloat STATIC ${LIB_SOURCES}) | ||||
| set_property(TARGET softfloat PROPERTY C_STANDARD 99) | ||||
| target_compile_definitions(softfloat PRIVATE  | ||||
| 	SOFTFLOAT_ROUND_ODD  | ||||
| @@ -347,7 +347,7 @@ set_target_properties(softfloat PROPERTIES | ||||
|  | ||||
| install(TARGETS softfloat | ||||
|   EXPORT ${PROJECT_NAME}Targets            # for downstream dependencies | ||||
|   ARCHIVE DESTINATION ${CMAKE_INSTALL_LIBDIR} COMPONENT libs   # static lib | ||||
|   ARCHIVE DESTINATION ${CMAKE_INSTALL_LIBDIR}/static COMPONENT libs   # static lib | ||||
|   LIBRARY DESTINATION ${CMAKE_INSTALL_LIBDIR} COMPONENT libs   # shared lib | ||||
|   FRAMEWORK DESTINATION ${CMAKE_INSTALL_LIBDIR} COMPONENT libs # for mac | ||||
|   PUBLIC_HEADER DESTINATION ${CMAKE_INSTALL_INCLUDEDIR} COMPONENT devel   # headers for mac (note the different component -> different package) | ||||
|   | ||||
							
								
								
									
										24
									
								
								softfloat/README.md
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										24
									
								
								softfloat/README.md
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,24 @@ | ||||
|  | ||||
| Package Overview for Berkeley SoftFloat Release 3e | ||||
| ================================================== | ||||
|  | ||||
| John R. Hauser<br> | ||||
| 2018 January 20 | ||||
|  | ||||
|  | ||||
| Berkeley SoftFloat is a software implementation of binary floating-point | ||||
| that conforms to the IEEE Standard for Floating-Point Arithmetic.  SoftFloat | ||||
| is distributed in the form of C source code.  Building the SoftFloat sources | ||||
| generates a library file (typically `softfloat.a` or `libsoftfloat.a`) | ||||
| containing the floating-point subroutines. | ||||
|  | ||||
|  | ||||
| The SoftFloat package is documented in the following files in the `doc` | ||||
| subdirectory: | ||||
|  | ||||
| * [SoftFloat.html](http://www.jhauser.us/arithmetic/SoftFloat-3/doc/SoftFloat.html) Documentation for using the SoftFloat functions. | ||||
| * [SoftFloat-source.html](http://www.jhauser.us/arithmetic/SoftFloat-3/doc/SoftFloat-source.html) Documentation for building SoftFloat. | ||||
| * [SoftFloat-history.html](http://www.jhauser.us/arithmetic/SoftFloat-3/doc/SoftFloat-history.html) History of the major changes to SoftFloat. | ||||
|  | ||||
| Other files in the package comprise the source code for SoftFloat. | ||||
|  | ||||
							
								
								
									
										399
									
								
								softfloat/build/Linux-RISCV64-GCC/Makefile
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										399
									
								
								softfloat/build/Linux-RISCV64-GCC/Makefile
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,399 @@ | ||||
|  | ||||
| #============================================================================= | ||||
| # | ||||
| # This Makefile is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| # Package, Release 3e, by John R. Hauser. | ||||
| # | ||||
| # Copyright 2011, 2012, 2013, 2014, 2015, 2016, 2017 The Regents of the | ||||
| # University of California.  All rights reserved. | ||||
| # | ||||
| # Redistribution and use in source and binary forms, with or without | ||||
| # modification, are permitted provided that the following conditions are met: | ||||
| # | ||||
| #  1. Redistributions of source code must retain the above copyright notice, | ||||
| #     this list of conditions, and the following disclaimer. | ||||
| # | ||||
| #  2. Redistributions in binary form must reproduce the above copyright | ||||
| #     notice, this list of conditions, and the following disclaimer in the | ||||
| #     documentation and/or other materials provided with the distribution. | ||||
| # | ||||
| #  3. Neither the name of the University nor the names of its contributors | ||||
| #     may be used to endorse or promote products derived from this software | ||||
| #     without specific prior written permission. | ||||
| # | ||||
| # THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY | ||||
| # EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | ||||
| # WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE | ||||
| # DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY | ||||
| # DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | ||||
| # (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | ||||
| # LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND | ||||
| # ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | ||||
| # (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF | ||||
| # THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| # | ||||
| #============================================================================= | ||||
|  | ||||
| SOURCE_DIR ?= ../../source | ||||
| SPECIALIZE_TYPE ?= RISCV | ||||
| MARCH ?= rv64gcv_zfh_zfhmin | ||||
| MABI ?= lp64d | ||||
|  | ||||
| SOFTFLOAT_OPTS ?= \ | ||||
|   -DSOFTFLOAT_ROUND_ODD -DINLINE_LEVEL=5 -DSOFTFLOAT_FAST_DIV32TO16 \ | ||||
|   -DSOFTFLOAT_FAST_DIV64TO32 | ||||
|  | ||||
| DELETE = rm -f | ||||
| C_INCLUDES = -I. -I$(SOURCE_DIR)/$(SPECIALIZE_TYPE) -I$(SOURCE_DIR)/include | ||||
| COMPILE_C = \ | ||||
|   riscv64-unknown-linux-gnu-gcc -c -march=$(MARCH) -mabi=$(MABI) -Werror-implicit-function-declaration -DSOFTFLOAT_FAST_INT64 \ | ||||
|     $(SOFTFLOAT_OPTS) $(C_INCLUDES) -O2 -o $@ | ||||
| MAKELIB = ar crs $@ | ||||
|  | ||||
| OBJ = .o | ||||
| LIB = .a | ||||
|  | ||||
| OTHER_HEADERS = $(SOURCE_DIR)/include/opts-GCC.h | ||||
|  | ||||
| .PHONY: all | ||||
| all: softfloat$(LIB) | ||||
|  | ||||
| OBJS_PRIMITIVES = \ | ||||
|   s_eq128$(OBJ) \ | ||||
|   s_le128$(OBJ) \ | ||||
|   s_lt128$(OBJ) \ | ||||
|   s_shortShiftLeft128$(OBJ) \ | ||||
|   s_shortShiftRight128$(OBJ) \ | ||||
|   s_shortShiftRightJam64$(OBJ) \ | ||||
|   s_shortShiftRightJam64Extra$(OBJ) \ | ||||
|   s_shortShiftRightJam128$(OBJ) \ | ||||
|   s_shortShiftRightJam128Extra$(OBJ) \ | ||||
|   s_shiftRightJam32$(OBJ) \ | ||||
|   s_shiftRightJam64$(OBJ) \ | ||||
|   s_shiftRightJam64Extra$(OBJ) \ | ||||
|   s_shiftRightJam128$(OBJ) \ | ||||
|   s_shiftRightJam128Extra$(OBJ) \ | ||||
|   s_shiftRightJam256M$(OBJ) \ | ||||
|   s_countLeadingZeros8$(OBJ) \ | ||||
|   s_countLeadingZeros16$(OBJ) \ | ||||
|   s_countLeadingZeros32$(OBJ) \ | ||||
|   s_countLeadingZeros64$(OBJ) \ | ||||
|   s_add128$(OBJ) \ | ||||
|   s_add256M$(OBJ) \ | ||||
|   s_sub128$(OBJ) \ | ||||
|   s_sub256M$(OBJ) \ | ||||
|   s_mul64ByShifted32To128$(OBJ) \ | ||||
|   s_mul64To128$(OBJ) \ | ||||
|   s_mul128By32$(OBJ) \ | ||||
|   s_mul128To256M$(OBJ) \ | ||||
|   s_approxRecip_1Ks$(OBJ) \ | ||||
|   s_approxRecip32_1$(OBJ) \ | ||||
|   s_approxRecipSqrt_1Ks$(OBJ) \ | ||||
|   s_approxRecipSqrt32_1$(OBJ) \ | ||||
|  | ||||
| OBJS_SPECIALIZE = \ | ||||
|   softfloat_raiseFlags$(OBJ) \ | ||||
|   s_f16UIToCommonNaN$(OBJ) \ | ||||
|   s_commonNaNToF16UI$(OBJ) \ | ||||
|   s_propagateNaNF16UI$(OBJ) \ | ||||
|   s_bf16UIToCommonNaN$(OBJ) \ | ||||
|   s_commonNaNToBF16UI$(OBJ) \ | ||||
|   s_f32UIToCommonNaN$(OBJ) \ | ||||
|   s_commonNaNToF32UI$(OBJ) \ | ||||
|   s_propagateNaNF32UI$(OBJ) \ | ||||
|   s_f64UIToCommonNaN$(OBJ) \ | ||||
|   s_commonNaNToF64UI$(OBJ) \ | ||||
|   s_propagateNaNF64UI$(OBJ) \ | ||||
|   extF80M_isSignalingNaN$(OBJ) \ | ||||
|   s_extF80UIToCommonNaN$(OBJ) \ | ||||
|   s_commonNaNToExtF80UI$(OBJ) \ | ||||
|   s_propagateNaNExtF80UI$(OBJ) \ | ||||
|   f128M_isSignalingNaN$(OBJ) \ | ||||
|   s_f128UIToCommonNaN$(OBJ) \ | ||||
|   s_commonNaNToF128UI$(OBJ) \ | ||||
|   s_propagateNaNF128UI$(OBJ) \ | ||||
|  | ||||
| OBJS_OTHERS = \ | ||||
|   s_roundToUI32$(OBJ) \ | ||||
|   s_roundToUI64$(OBJ) \ | ||||
|   s_roundToI32$(OBJ) \ | ||||
|   s_roundToI64$(OBJ) \ | ||||
|   s_normSubnormalBF16Sig$(OBJ) \ | ||||
|   s_roundPackToBF16$(OBJ) \ | ||||
|   s_normSubnormalF16Sig$(OBJ) \ | ||||
|   s_roundPackToF16$(OBJ) \ | ||||
|   s_normRoundPackToF16$(OBJ) \ | ||||
|   s_addMagsF16$(OBJ) \ | ||||
|   s_subMagsF16$(OBJ) \ | ||||
|   s_mulAddF16$(OBJ) \ | ||||
|   s_normSubnormalF32Sig$(OBJ) \ | ||||
|   s_roundPackToF32$(OBJ) \ | ||||
|   s_normRoundPackToF32$(OBJ) \ | ||||
|   s_addMagsF32$(OBJ) \ | ||||
|   s_subMagsF32$(OBJ) \ | ||||
|   s_mulAddF32$(OBJ) \ | ||||
|   s_normSubnormalF64Sig$(OBJ) \ | ||||
|   s_roundPackToF64$(OBJ) \ | ||||
|   s_normRoundPackToF64$(OBJ) \ | ||||
|   s_addMagsF64$(OBJ) \ | ||||
|   s_subMagsF64$(OBJ) \ | ||||
|   s_mulAddF64$(OBJ) \ | ||||
|   s_normSubnormalExtF80Sig$(OBJ) \ | ||||
|   s_roundPackToExtF80$(OBJ) \ | ||||
|   s_normRoundPackToExtF80$(OBJ) \ | ||||
|   s_addMagsExtF80$(OBJ) \ | ||||
|   s_subMagsExtF80$(OBJ) \ | ||||
|   s_normSubnormalF128Sig$(OBJ) \ | ||||
|   s_roundPackToF128$(OBJ) \ | ||||
|   s_normRoundPackToF128$(OBJ) \ | ||||
|   s_addMagsF128$(OBJ) \ | ||||
|   s_subMagsF128$(OBJ) \ | ||||
|   s_mulAddF128$(OBJ) \ | ||||
|   softfloat_state$(OBJ) \ | ||||
|   ui32_to_f16$(OBJ) \ | ||||
|   ui32_to_f32$(OBJ) \ | ||||
|   ui32_to_f64$(OBJ) \ | ||||
|   ui32_to_extF80$(OBJ) \ | ||||
|   ui32_to_extF80M$(OBJ) \ | ||||
|   ui32_to_f128$(OBJ) \ | ||||
|   ui32_to_f128M$(OBJ) \ | ||||
|   ui64_to_f16$(OBJ) \ | ||||
|   ui64_to_f32$(OBJ) \ | ||||
|   ui64_to_f64$(OBJ) \ | ||||
|   ui64_to_extF80$(OBJ) \ | ||||
|   ui64_to_extF80M$(OBJ) \ | ||||
|   ui64_to_f128$(OBJ) \ | ||||
|   ui64_to_f128M$(OBJ) \ | ||||
|   i32_to_f16$(OBJ) \ | ||||
|   i32_to_f32$(OBJ) \ | ||||
|   i32_to_f64$(OBJ) \ | ||||
|   i32_to_extF80$(OBJ) \ | ||||
|   i32_to_extF80M$(OBJ) \ | ||||
|   i32_to_f128$(OBJ) \ | ||||
|   i32_to_f128M$(OBJ) \ | ||||
|   i64_to_f16$(OBJ) \ | ||||
|   i64_to_f32$(OBJ) \ | ||||
|   i64_to_f64$(OBJ) \ | ||||
|   i64_to_extF80$(OBJ) \ | ||||
|   i64_to_extF80M$(OBJ) \ | ||||
|   i64_to_f128$(OBJ) \ | ||||
|   i64_to_f128M$(OBJ) \ | ||||
|   bf16_isSignalingNaN$(OBJ) \ | ||||
|   bf16_to_f32$(OBJ) \ | ||||
|   f16_to_ui32$(OBJ) \ | ||||
|   f16_to_ui64$(OBJ) \ | ||||
|   f16_to_i32$(OBJ) \ | ||||
|   f16_to_i64$(OBJ) \ | ||||
|   f16_to_ui32_r_minMag$(OBJ) \ | ||||
|   f16_to_ui64_r_minMag$(OBJ) \ | ||||
|   f16_to_i32_r_minMag$(OBJ) \ | ||||
|   f16_to_i64_r_minMag$(OBJ) \ | ||||
|   f16_to_f32$(OBJ) \ | ||||
|   f16_to_f64$(OBJ) \ | ||||
|   f16_to_extF80$(OBJ) \ | ||||
|   f16_to_extF80M$(OBJ) \ | ||||
|   f16_to_f128$(OBJ) \ | ||||
|   f16_to_f128M$(OBJ) \ | ||||
|   f16_roundToInt$(OBJ) \ | ||||
|   f16_add$(OBJ) \ | ||||
|   f16_sub$(OBJ) \ | ||||
|   f16_mul$(OBJ) \ | ||||
|   f16_mulAdd$(OBJ) \ | ||||
|   f16_div$(OBJ) \ | ||||
|   f16_rem$(OBJ) \ | ||||
|   f16_sqrt$(OBJ) \ | ||||
|   f16_eq$(OBJ) \ | ||||
|   f16_le$(OBJ) \ | ||||
|   f16_lt$(OBJ) \ | ||||
|   f16_eq_signaling$(OBJ) \ | ||||
|   f16_le_quiet$(OBJ) \ | ||||
|   f16_lt_quiet$(OBJ) \ | ||||
|   f16_isSignalingNaN$(OBJ) \ | ||||
|   f32_to_ui32$(OBJ) \ | ||||
|   f32_to_ui64$(OBJ) \ | ||||
|   f32_to_i32$(OBJ) \ | ||||
|   f32_to_i64$(OBJ) \ | ||||
|   f32_to_ui32_r_minMag$(OBJ) \ | ||||
|   f32_to_ui64_r_minMag$(OBJ) \ | ||||
|   f32_to_i32_r_minMag$(OBJ) \ | ||||
|   f32_to_i64_r_minMag$(OBJ) \ | ||||
|   f32_to_bf16$(OBJ) \ | ||||
|   f32_to_f16$(OBJ) \ | ||||
|   f32_to_f64$(OBJ) \ | ||||
|   f32_to_extF80$(OBJ) \ | ||||
|   f32_to_extF80M$(OBJ) \ | ||||
|   f32_to_f128$(OBJ) \ | ||||
|   f32_to_f128M$(OBJ) \ | ||||
|   f32_roundToInt$(OBJ) \ | ||||
|   f32_add$(OBJ) \ | ||||
|   f32_sub$(OBJ) \ | ||||
|   f32_mul$(OBJ) \ | ||||
|   f32_mulAdd$(OBJ) \ | ||||
|   f32_div$(OBJ) \ | ||||
|   f32_rem$(OBJ) \ | ||||
|   f32_sqrt$(OBJ) \ | ||||
|   f32_eq$(OBJ) \ | ||||
|   f32_le$(OBJ) \ | ||||
|   f32_lt$(OBJ) \ | ||||
|   f32_eq_signaling$(OBJ) \ | ||||
|   f32_le_quiet$(OBJ) \ | ||||
|   f32_lt_quiet$(OBJ) \ | ||||
|   f32_isSignalingNaN$(OBJ) \ | ||||
|   f64_to_ui32$(OBJ) \ | ||||
|   f64_to_ui64$(OBJ) \ | ||||
|   f64_to_i32$(OBJ) \ | ||||
|   f64_to_i64$(OBJ) \ | ||||
|   f64_to_ui32_r_minMag$(OBJ) \ | ||||
|   f64_to_ui64_r_minMag$(OBJ) \ | ||||
|   f64_to_i32_r_minMag$(OBJ) \ | ||||
|   f64_to_i64_r_minMag$(OBJ) \ | ||||
|   f64_to_f16$(OBJ) \ | ||||
|   f64_to_f32$(OBJ) \ | ||||
|   f64_to_extF80$(OBJ) \ | ||||
|   f64_to_extF80M$(OBJ) \ | ||||
|   f64_to_f128$(OBJ) \ | ||||
|   f64_to_f128M$(OBJ) \ | ||||
|   f64_roundToInt$(OBJ) \ | ||||
|   f64_add$(OBJ) \ | ||||
|   f64_sub$(OBJ) \ | ||||
|   f64_mul$(OBJ) \ | ||||
|   f64_mulAdd$(OBJ) \ | ||||
|   f64_div$(OBJ) \ | ||||
|   f64_rem$(OBJ) \ | ||||
|   f64_sqrt$(OBJ) \ | ||||
|   f64_eq$(OBJ) \ | ||||
|   f64_le$(OBJ) \ | ||||
|   f64_lt$(OBJ) \ | ||||
|   f64_eq_signaling$(OBJ) \ | ||||
|   f64_le_quiet$(OBJ) \ | ||||
|   f64_lt_quiet$(OBJ) \ | ||||
|   f64_isSignalingNaN$(OBJ) \ | ||||
|   extF80_to_ui32$(OBJ) \ | ||||
|   extF80_to_ui64$(OBJ) \ | ||||
|   extF80_to_i32$(OBJ) \ | ||||
|   extF80_to_i64$(OBJ) \ | ||||
|   extF80_to_ui32_r_minMag$(OBJ) \ | ||||
|   extF80_to_ui64_r_minMag$(OBJ) \ | ||||
|   extF80_to_i32_r_minMag$(OBJ) \ | ||||
|   extF80_to_i64_r_minMag$(OBJ) \ | ||||
|   extF80_to_f16$(OBJ) \ | ||||
|   extF80_to_f32$(OBJ) \ | ||||
|   extF80_to_f64$(OBJ) \ | ||||
|   extF80_to_f128$(OBJ) \ | ||||
|   extF80_roundToInt$(OBJ) \ | ||||
|   extF80_add$(OBJ) \ | ||||
|   extF80_sub$(OBJ) \ | ||||
|   extF80_mul$(OBJ) \ | ||||
|   extF80_div$(OBJ) \ | ||||
|   extF80_rem$(OBJ) \ | ||||
|   extF80_sqrt$(OBJ) \ | ||||
|   extF80_eq$(OBJ) \ | ||||
|   extF80_le$(OBJ) \ | ||||
|   extF80_lt$(OBJ) \ | ||||
|   extF80_eq_signaling$(OBJ) \ | ||||
|   extF80_le_quiet$(OBJ) \ | ||||
|   extF80_lt_quiet$(OBJ) \ | ||||
|   extF80_isSignalingNaN$(OBJ) \ | ||||
|   extF80M_to_ui32$(OBJ) \ | ||||
|   extF80M_to_ui64$(OBJ) \ | ||||
|   extF80M_to_i32$(OBJ) \ | ||||
|   extF80M_to_i64$(OBJ) \ | ||||
|   extF80M_to_ui32_r_minMag$(OBJ) \ | ||||
|   extF80M_to_ui64_r_minMag$(OBJ) \ | ||||
|   extF80M_to_i32_r_minMag$(OBJ) \ | ||||
|   extF80M_to_i64_r_minMag$(OBJ) \ | ||||
|   extF80M_to_f16$(OBJ) \ | ||||
|   extF80M_to_f32$(OBJ) \ | ||||
|   extF80M_to_f64$(OBJ) \ | ||||
|   extF80M_to_f128M$(OBJ) \ | ||||
|   extF80M_roundToInt$(OBJ) \ | ||||
|   extF80M_add$(OBJ) \ | ||||
|   extF80M_sub$(OBJ) \ | ||||
|   extF80M_mul$(OBJ) \ | ||||
|   extF80M_div$(OBJ) \ | ||||
|   extF80M_rem$(OBJ) \ | ||||
|   extF80M_sqrt$(OBJ) \ | ||||
|   extF80M_eq$(OBJ) \ | ||||
|   extF80M_le$(OBJ) \ | ||||
|   extF80M_lt$(OBJ) \ | ||||
|   extF80M_eq_signaling$(OBJ) \ | ||||
|   extF80M_le_quiet$(OBJ) \ | ||||
|   extF80M_lt_quiet$(OBJ) \ | ||||
|   f128_to_ui32$(OBJ) \ | ||||
|   f128_to_ui64$(OBJ) \ | ||||
|   f128_to_i32$(OBJ) \ | ||||
|   f128_to_i64$(OBJ) \ | ||||
|   f128_to_ui32_r_minMag$(OBJ) \ | ||||
|   f128_to_ui64_r_minMag$(OBJ) \ | ||||
|   f128_to_i32_r_minMag$(OBJ) \ | ||||
|   f128_to_i64_r_minMag$(OBJ) \ | ||||
|   f128_to_f16$(OBJ) \ | ||||
|   f128_to_f32$(OBJ) \ | ||||
|   f128_to_extF80$(OBJ) \ | ||||
|   f128_to_f64$(OBJ) \ | ||||
|   f128_roundToInt$(OBJ) \ | ||||
|   f128_add$(OBJ) \ | ||||
|   f128_sub$(OBJ) \ | ||||
|   f128_mul$(OBJ) \ | ||||
|   f128_mulAdd$(OBJ) \ | ||||
|   f128_div$(OBJ) \ | ||||
|   f128_rem$(OBJ) \ | ||||
|   f128_sqrt$(OBJ) \ | ||||
|   f128_eq$(OBJ) \ | ||||
|   f128_le$(OBJ) \ | ||||
|   f128_lt$(OBJ) \ | ||||
|   f128_eq_signaling$(OBJ) \ | ||||
|   f128_le_quiet$(OBJ) \ | ||||
|   f128_lt_quiet$(OBJ) \ | ||||
|   f128_isSignalingNaN$(OBJ) \ | ||||
|   f128M_to_ui32$(OBJ) \ | ||||
|   f128M_to_ui64$(OBJ) \ | ||||
|   f128M_to_i32$(OBJ) \ | ||||
|   f128M_to_i64$(OBJ) \ | ||||
|   f128M_to_ui32_r_minMag$(OBJ) \ | ||||
|   f128M_to_ui64_r_minMag$(OBJ) \ | ||||
|   f128M_to_i32_r_minMag$(OBJ) \ | ||||
|   f128M_to_i64_r_minMag$(OBJ) \ | ||||
|   f128M_to_f16$(OBJ) \ | ||||
|   f128M_to_f32$(OBJ) \ | ||||
|   f128M_to_extF80M$(OBJ) \ | ||||
|   f128M_to_f64$(OBJ) \ | ||||
|   f128M_roundToInt$(OBJ) \ | ||||
|   f128M_add$(OBJ) \ | ||||
|   f128M_sub$(OBJ) \ | ||||
|   f128M_mul$(OBJ) \ | ||||
|   f128M_mulAdd$(OBJ) \ | ||||
|   f128M_div$(OBJ) \ | ||||
|   f128M_rem$(OBJ) \ | ||||
|   f128M_sqrt$(OBJ) \ | ||||
|   f128M_eq$(OBJ) \ | ||||
|   f128M_le$(OBJ) \ | ||||
|   f128M_lt$(OBJ) \ | ||||
|   f128M_eq_signaling$(OBJ) \ | ||||
|   f128M_le_quiet$(OBJ) \ | ||||
|   f128M_lt_quiet$(OBJ) \ | ||||
|  | ||||
| OBJS_ALL = $(OBJS_PRIMITIVES) $(OBJS_SPECIALIZE) $(OBJS_OTHERS) | ||||
|  | ||||
| $(OBJS_ALL): \ | ||||
|   $(OTHER_HEADERS) platform.h $(SOURCE_DIR)/include/primitiveTypes.h \ | ||||
|   $(SOURCE_DIR)/include/primitives.h | ||||
| $(OBJS_SPECIALIZE) $(OBJS_OTHERS): \ | ||||
|   $(SOURCE_DIR)/include/softfloat_types.h $(SOURCE_DIR)/include/internals.h \ | ||||
|   $(SOURCE_DIR)/$(SPECIALIZE_TYPE)/specialize.h \ | ||||
|   $(SOURCE_DIR)/include/softfloat.h | ||||
|  | ||||
| $(OBJS_PRIMITIVES) $(OBJS_OTHERS): %$(OBJ): $(SOURCE_DIR)/%.c | ||||
| 	$(COMPILE_C) $(SOURCE_DIR)/$*.c | ||||
|  | ||||
| $(OBJS_SPECIALIZE): %$(OBJ): $(SOURCE_DIR)/$(SPECIALIZE_TYPE)/%.c | ||||
| 	$(COMPILE_C) $(SOURCE_DIR)/$(SPECIALIZE_TYPE)/$*.c | ||||
|  | ||||
| softfloat$(LIB): $(OBJS_ALL) | ||||
| 	$(DELETE) $@ | ||||
| 	$(MAKELIB) $^ | ||||
|  | ||||
| .PHONY: clean | ||||
| clean: | ||||
| 	$(DELETE) $(OBJS_ALL) softfloat$(LIB) | ||||
|  | ||||
							
								
								
									
										54
									
								
								softfloat/build/Linux-RISCV64-GCC/platform.h
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										54
									
								
								softfloat/build/Linux-RISCV64-GCC/platform.h
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,54 @@ | ||||
|  | ||||
| /*============================================================================ | ||||
|  | ||||
| This C header file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| Package, Release 3e, by John R. Hauser. | ||||
|  | ||||
| Copyright 2011, 2012, 2013, 2014, 2015, 2016, 2017 The Regents of the | ||||
| University of California.  All rights reserved. | ||||
|  | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| modification, are permitted provided that the following conditions are met: | ||||
|  | ||||
|  1. Redistributions of source code must retain the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer. | ||||
|  | ||||
|  2. Redistributions in binary form must reproduce the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer in the documentation | ||||
|     and/or other materials provided with the distribution. | ||||
|  | ||||
|  3. Neither the name of the University nor the names of its contributors may | ||||
|     be used to endorse or promote products derived from this software without | ||||
|     specific prior written permission. | ||||
|  | ||||
| THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY | ||||
| EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | ||||
| WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE | ||||
| DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY | ||||
| DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | ||||
| (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | ||||
| LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND | ||||
| ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | ||||
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| =============================================================================*/ | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define LITTLEENDIAN 1 | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #ifdef __GNUC_STDC_INLINE__ | ||||
| #define INLINE inline | ||||
| #else | ||||
| #define INLINE extern inline | ||||
| #endif | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define SOFTFLOAT_BUILTIN_CLZ 1 | ||||
| #define SOFTFLOAT_INTRINSIC_INT128 1 | ||||
| #include "opts-GCC.h" | ||||
|  | ||||
| @@ -94,6 +94,8 @@ OBJS_SPECIALIZE = \ | ||||
|   s_f16UIToCommonNaN$(OBJ) \ | ||||
|   s_commonNaNToF16UI$(OBJ) \ | ||||
|   s_propagateNaNF16UI$(OBJ) \ | ||||
|   s_bf16UIToCommonNaN$(OBJ) \ | ||||
|   s_commonNaNToBF16UI$(OBJ) \ | ||||
|   s_f32UIToCommonNaN$(OBJ) \ | ||||
|   s_commonNaNToF32UI$(OBJ) \ | ||||
|   s_propagateNaNF32UI$(OBJ) \ | ||||
| @@ -114,6 +116,8 @@ OBJS_OTHERS = \ | ||||
|   s_roundToUI64$(OBJ) \ | ||||
|   s_roundToI32$(OBJ) \ | ||||
|   s_roundToI64$(OBJ) \ | ||||
|   s_normSubnormalBF16Sig$(OBJ) \ | ||||
|   s_roundPackToBF16$(OBJ) \ | ||||
|   s_normSubnormalF16Sig$(OBJ) \ | ||||
|   s_roundPackToF16$(OBJ) \ | ||||
|   s_normRoundPackToF16$(OBJ) \ | ||||
| @@ -172,6 +176,8 @@ OBJS_OTHERS = \ | ||||
|   i64_to_extF80M$(OBJ) \ | ||||
|   i64_to_f128$(OBJ) \ | ||||
|   i64_to_f128M$(OBJ) \ | ||||
|   bf16_isSignalingNaN$(OBJ) \ | ||||
|   bf16_to_f32$(OBJ) \ | ||||
|   f16_to_ui32$(OBJ) \ | ||||
|   f16_to_ui64$(OBJ) \ | ||||
|   f16_to_i32$(OBJ) \ | ||||
| @@ -209,6 +215,7 @@ OBJS_OTHERS = \ | ||||
|   f32_to_ui64_r_minMag$(OBJ) \ | ||||
|   f32_to_i32_r_minMag$(OBJ) \ | ||||
|   f32_to_i64_r_minMag$(OBJ) \ | ||||
|   f32_to_bf16$(OBJ) \ | ||||
|   f32_to_f16$(OBJ) \ | ||||
|   f32_to_f64$(OBJ) \ | ||||
|   f32_to_extF80$(OBJ) \ | ||||
|   | ||||
| @@ -35,11 +35,11 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| =============================================================================*/ | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| *----------------------------------------------------------------------------*/ | ||||
|  *----------------------------------------------------------------------------*/ | ||||
| #define LITTLEENDIAN 1 | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| *----------------------------------------------------------------------------*/ | ||||
|  *----------------------------------------------------------------------------*/ | ||||
| #ifdef __GNUC_STDC_INLINE__ | ||||
| //#define INLINE inline | ||||
| #define INLINE static | ||||
| @@ -48,10 +48,9 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| #endif | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| *----------------------------------------------------------------------------*/ | ||||
|  *----------------------------------------------------------------------------*/ | ||||
| #ifdef __GNUC__ | ||||
| #define SOFTFLOAT_BUILTIN_CLZ 1 | ||||
| #define SOFTFLOAT_INTRINSIC_INT128 1 | ||||
| #endif | ||||
| #include "opts-GCC.h" | ||||
|  | ||||
|   | ||||
| @@ -115,6 +115,8 @@ OBJS_OTHERS = \ | ||||
|   s_roundToUI64$(OBJ) \ | ||||
|   s_roundToI32$(OBJ) \ | ||||
|   s_roundToI64$(OBJ) \ | ||||
|   s_normSubnormalBF16Sig$(OBJ) \ | ||||
|   s_roundPackToBF16$(OBJ) \ | ||||
|   s_normSubnormalF16Sig$(OBJ) \ | ||||
|   s_roundPackToF16$(OBJ) \ | ||||
|   s_normRoundPackToF16$(OBJ) \ | ||||
| @@ -173,6 +175,8 @@ OBJS_OTHERS = \ | ||||
|   i64_to_extF80M$(OBJ) \ | ||||
|   i64_to_f128$(OBJ) \ | ||||
|   i64_to_f128M$(OBJ) \ | ||||
|   bf16_isSignalingNaN$(OBJ) \ | ||||
|   bf16_to_f32$(OBJ) \ | ||||
|   f16_to_ui32$(OBJ) \ | ||||
|   f16_to_ui64$(OBJ) \ | ||||
|   f16_to_i32$(OBJ) \ | ||||
| @@ -210,6 +214,7 @@ OBJS_OTHERS = \ | ||||
|   f32_to_ui64_r_minMag$(OBJ) \ | ||||
|   f32_to_i32_r_minMag$(OBJ) \ | ||||
|   f32_to_i64_r_minMag$(OBJ) \ | ||||
|   f32_to_bf16$(OBJ) \ | ||||
|   f32_to_f16$(OBJ) \ | ||||
|   f32_to_f64$(OBJ) \ | ||||
|   f32_to_extF80$(OBJ) \ | ||||
|   | ||||
| @@ -508,7 +508,7 @@ significant extra cost. | ||||
| On computers where the word size is <NOBR>64 bits</NOBR> or larger, both | ||||
| function versions (<CODE>f128M_add</CODE> and <CODE>f128_add</CODE>) are | ||||
| provided, because the cost of passing by value is then more reasonable. | ||||
| Applications that must be portable accross both classes of computers must use | ||||
| Applications that must be portable across both classes of computers must use | ||||
| the pointer-based functions, as these are always implemented. | ||||
| However, if it is known that SoftFloat includes the by-value functions for all | ||||
| platforms of interest, programmers can use whichever version they prefer. | ||||
|   | ||||
							
								
								
									
										59
									
								
								softfloat/source/8086-SSE/s_bf16UIToCommonNaN.c
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										59
									
								
								softfloat/source/8086-SSE/s_bf16UIToCommonNaN.c
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,59 @@ | ||||
|  | ||||
| /*============================================================================ | ||||
|  | ||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| Package, Release 3e, by John R. Hauser. | ||||
|  | ||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | ||||
| All rights reserved. | ||||
|  | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| modification, are permitted provided that the following conditions are met: | ||||
|  | ||||
|  1. Redistributions of source code must retain the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer. | ||||
|  | ||||
|  2. Redistributions in binary form must reproduce the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer in the documentation | ||||
|     and/or other materials provided with the distribution. | ||||
|  | ||||
|  3. Neither the name of the University nor the names of its contributors may | ||||
|     be used to endorse or promote products derived from this software without | ||||
|     specific prior written permission. | ||||
|  | ||||
| THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY | ||||
| EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | ||||
| WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE | ||||
| DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY | ||||
| DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | ||||
| (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | ||||
| LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND | ||||
| ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | ||||
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| =============================================================================*/ | ||||
|  | ||||
| #include <stdint.h> | ||||
| #include "platform.h" | ||||
| #include "specialize.h" | ||||
| #include "softfloat.h" | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming `uiA' has the bit pattern of a BF16 NaN, converts | ||||
| | this NaN to the common NaN form, and stores the resulting common NaN at the | ||||
| | location pointed to by `zPtr'.  If the NaN is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void softfloat_bf16UIToCommonNaN( uint_fast16_t uiA, struct commonNaN *zPtr ) | ||||
| { | ||||
|  | ||||
|     if ( softfloat_isSigNaNBF16UI( uiA ) ) { | ||||
|         softfloat_raiseFlags( softfloat_flag_invalid ); | ||||
|     } | ||||
|     zPtr->sign = uiA>>15; | ||||
|     zPtr->v64  = (uint_fast64_t) uiA<<56; | ||||
|     zPtr->v0   = 0; | ||||
|  | ||||
| } | ||||
|  | ||||
							
								
								
									
										51
									
								
								softfloat/source/8086-SSE/s_commonNaNToBF16UI.c
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										51
									
								
								softfloat/source/8086-SSE/s_commonNaNToBF16UI.c
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,51 @@ | ||||
|  | ||||
| /*============================================================================ | ||||
|  | ||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| Package, Release 3e, by John R. Hauser. | ||||
|  | ||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | ||||
| All rights reserved. | ||||
|  | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| modification, are permitted provided that the following conditions are met: | ||||
|  | ||||
|  1. Redistributions of source code must retain the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer. | ||||
|  | ||||
|  2. Redistributions in binary form must reproduce the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer in the documentation | ||||
|     and/or other materials provided with the distribution. | ||||
|  | ||||
|  3. Neither the name of the University nor the names of its contributors may | ||||
|     be used to endorse or promote products derived from this software without | ||||
|     specific prior written permission. | ||||
|  | ||||
| THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY | ||||
| EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | ||||
| WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE | ||||
| DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY | ||||
| DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | ||||
| (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | ||||
| LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND | ||||
| ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | ||||
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| =============================================================================*/ | ||||
|  | ||||
| #include <stdint.h> | ||||
| #include "platform.h" | ||||
| #include "specialize.h" | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by `aPtr' into a BF16 NaN, and  | ||||
| | returns the bit pattern of this value as an unsigned integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast16_t softfloat_commonNaNToBF16UI( const struct commonNaN *aPtr ) | ||||
| { | ||||
|  | ||||
|     return (uint_fast16_t) aPtr->sign<<15 | 0x7FC0 | aPtr->v64>>56; | ||||
|  | ||||
| } | ||||
|  | ||||
| @@ -37,10 +37,10 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| #ifndef specialize_h | ||||
| #define specialize_h 1 | ||||
|  | ||||
| #include <stdbool.h> | ||||
| #include <stdint.h> | ||||
| #include "primitiveTypes.h" | ||||
| #include "softfloat.h" | ||||
| #include <stdbool.h> | ||||
| #include <stdint.h> | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Default value for 'softfloat_detectTininess'. | ||||
| @@ -53,21 +53,21 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define ui32_fromPosOverflow 0xFFFFFFFF | ||||
| #define ui32_fromNegOverflow 0xFFFFFFFF | ||||
| #define ui32_fromNaN         0xFFFFFFFF | ||||
| #define i32_fromPosOverflow  (-0x7FFFFFFF - 1) | ||||
| #define i32_fromNegOverflow  (-0x7FFFFFFF - 1) | ||||
| #define i32_fromNaN          (-0x7FFFFFFF - 1) | ||||
| #define ui32_fromNaN 0xFFFFFFFF | ||||
| #define i32_fromPosOverflow (-0x7FFFFFFF - 1) | ||||
| #define i32_fromNegOverflow (-0x7FFFFFFF - 1) | ||||
| #define i32_fromNaN (-0x7FFFFFFF - 1) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The values to return on conversions to 64-bit integer formats that raise an | ||||
| | invalid exception. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define ui64_fromPosOverflow UINT64_C( 0xFFFFFFFFFFFFFFFF ) | ||||
| #define ui64_fromNegOverflow UINT64_C( 0xFFFFFFFFFFFFFFFF ) | ||||
| #define ui64_fromNaN         UINT64_C( 0xFFFFFFFFFFFFFFFF ) | ||||
| #define i64_fromPosOverflow  (-INT64_C( 0x7FFFFFFFFFFFFFFF ) - 1) | ||||
| #define i64_fromNegOverflow  (-INT64_C( 0x7FFFFFFFFFFFFFFF ) - 1) | ||||
| #define i64_fromNaN          (-INT64_C( 0x7FFFFFFFFFFFFFFF ) - 1) | ||||
| #define ui64_fromPosOverflow UINT64_C(0xFFFFFFFFFFFFFFFF) | ||||
| #define ui64_fromNegOverflow UINT64_C(0xFFFFFFFFFFFFFFFF) | ||||
| #define ui64_fromNaN UINT64_C(0xFFFFFFFFFFFFFFFF) | ||||
| #define i64_fromPosOverflow (-INT64_C(0x7FFFFFFFFFFFFFFF) - 1) | ||||
| #define i64_fromNegOverflow (-INT64_C(0x7FFFFFFFFFFFFFFF) - 1) | ||||
| #define i64_fromNaN (-INT64_C(0x7FFFFFFFFFFFFFFF) - 1) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | "Common NaN" structure, used to transfer NaN representations from one format | ||||
| @@ -92,7 +92,7 @@ struct commonNaN { | ||||
| | 16-bit floating-point signaling NaN. | ||||
| | Note:  This macro evaluates its argument more than once. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_isSigNaNF16UI( uiA ) ((((uiA) & 0x7E00) == 0x7C00) && ((uiA) & 0x01FF)) | ||||
| #define softfloat_isSigNaNF16UI(uiA) ((((uiA)&0x7E00) == 0x7C00) && ((uiA)&0x01FF)) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming 'uiA' has the bit pattern of a 16-bit floating-point NaN, converts | ||||
| @@ -100,13 +100,13 @@ struct commonNaN { | ||||
| | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void softfloat_f16UIToCommonNaN( uint_fast16_t uiA, struct commonNaN *zPtr ); | ||||
| void softfloat_f16UIToCommonNaN(uint_fast16_t uiA, struct commonNaN* zPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into a 16-bit floating-point | ||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast16_t softfloat_commonNaNToF16UI( const struct commonNaN *aPtr ); | ||||
| uint_fast16_t softfloat_commonNaNToF16UI(const struct commonNaN* aPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Interpreting 'uiA' and 'uiB' as the bit patterns of two 16-bit floating- | ||||
| @@ -114,8 +114,28 @@ uint_fast16_t softfloat_commonNaNToF16UI( const struct commonNaN *aPtr ); | ||||
| | the combined NaN result.  If either 'uiA' or 'uiB' has the pattern of a | ||||
| | signaling NaN, the invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast16_t | ||||
|  softfloat_propagateNaNF16UI( uint_fast16_t uiA, uint_fast16_t uiB ); | ||||
| uint_fast16_t softfloat_propagateNaNF16UI(uint_fast16_t uiA, uint_fast16_t uiB); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Returns true when 16-bit unsigned integer 'uiA' has the bit pattern of a | ||||
| | 16-bit brain floating-point (BF16) signaling NaN. | ||||
| | Note:  This macro evaluates its argument more than once. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_isSigNaNBF16UI(uiA) ((((uiA)&0x7FC0) == 0x7F80) && ((uiA)&0x003F)) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming 'uiA' has the bit pattern of a 16-bit BF16 floating-point NaN, converts | ||||
| | this NaN to the common NaN form, and stores the resulting common NaN at the | ||||
| | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void softfloat_bf16UIToCommonNaN(uint_fast16_t uiA, struct commonNaN* zPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into a 16-bit floating-point | ||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast16_t softfloat_commonNaNToBF16UI(const struct commonNaN* aPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The bit pattern for a default generated 32-bit floating-point NaN. | ||||
| @@ -127,7 +147,7 @@ uint_fast16_t | ||||
| | 32-bit floating-point signaling NaN. | ||||
| | Note:  This macro evaluates its argument more than once. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_isSigNaNF32UI( uiA ) ((((uiA) & 0x7FC00000) == 0x7F800000) && ((uiA) & 0x003FFFFF)) | ||||
| #define softfloat_isSigNaNF32UI(uiA) ((((uiA)&0x7FC00000) == 0x7F800000) && ((uiA)&0x003FFFFF)) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming 'uiA' has the bit pattern of a 32-bit floating-point NaN, converts | ||||
| @@ -135,13 +155,13 @@ uint_fast16_t | ||||
| | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void softfloat_f32UIToCommonNaN( uint_fast32_t uiA, struct commonNaN *zPtr ); | ||||
| void softfloat_f32UIToCommonNaN(uint_fast32_t uiA, struct commonNaN* zPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into a 32-bit floating-point | ||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast32_t softfloat_commonNaNToF32UI( const struct commonNaN *aPtr ); | ||||
| uint_fast32_t softfloat_commonNaNToF32UI(const struct commonNaN* aPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Interpreting 'uiA' and 'uiB' as the bit patterns of two 32-bit floating- | ||||
| @@ -149,20 +169,20 @@ uint_fast32_t softfloat_commonNaNToF32UI( const struct commonNaN *aPtr ); | ||||
| | the combined NaN result.  If either 'uiA' or 'uiB' has the pattern of a | ||||
| | signaling NaN, the invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast32_t | ||||
|  softfloat_propagateNaNF32UI( uint_fast32_t uiA, uint_fast32_t uiB ); | ||||
| uint_fast32_t softfloat_propagateNaNF32UI(uint_fast32_t uiA, uint_fast32_t uiB); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The bit pattern for a default generated 64-bit floating-point NaN. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define defaultNaNF64UI UINT64_C( 0xFFF8000000000000 ) | ||||
| #define defaultNaNF64UI UINT64_C(0xFFF8000000000000) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Returns true when 64-bit unsigned integer 'uiA' has the bit pattern of a | ||||
| | 64-bit floating-point signaling NaN. | ||||
| | Note:  This macro evaluates its argument more than once. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_isSigNaNF64UI( uiA ) ((((uiA) & UINT64_C( 0x7FF8000000000000 )) == UINT64_C( 0x7FF0000000000000 )) && ((uiA) & UINT64_C( 0x0007FFFFFFFFFFFF ))) | ||||
| #define softfloat_isSigNaNF64UI(uiA)                                                                                                       \ | ||||
|     ((((uiA)&UINT64_C(0x7FF8000000000000)) == UINT64_C(0x7FF0000000000000)) && ((uiA)&UINT64_C(0x0007FFFFFFFFFFFF))) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming 'uiA' has the bit pattern of a 64-bit floating-point NaN, converts | ||||
| @@ -170,13 +190,13 @@ uint_fast32_t | ||||
| | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void softfloat_f64UIToCommonNaN( uint_fast64_t uiA, struct commonNaN *zPtr ); | ||||
| void softfloat_f64UIToCommonNaN(uint_fast64_t uiA, struct commonNaN* zPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into a 64-bit floating-point | ||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast64_t softfloat_commonNaNToF64UI( const struct commonNaN *aPtr ); | ||||
| uint_fast64_t softfloat_commonNaNToF64UI(const struct commonNaN* aPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Interpreting 'uiA' and 'uiB' as the bit patterns of two 64-bit floating- | ||||
| @@ -184,14 +204,13 @@ uint_fast64_t softfloat_commonNaNToF64UI( const struct commonNaN *aPtr ); | ||||
| | the combined NaN result.  If either 'uiA' or 'uiB' has the pattern of a | ||||
| | signaling NaN, the invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast64_t | ||||
|  softfloat_propagateNaNF64UI( uint_fast64_t uiA, uint_fast64_t uiB ); | ||||
| uint_fast64_t softfloat_propagateNaNF64UI(uint_fast64_t uiA, uint_fast64_t uiB); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The bit pattern for a default generated 80-bit extended floating-point NaN. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define defaultNaNExtF80UI64 0xFFFF | ||||
| #define defaultNaNExtF80UI0  UINT64_C( 0xC000000000000000 ) | ||||
| #define defaultNaNExtF80UI0 UINT64_C(0xC000000000000000) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Returns true when the 80-bit unsigned integer formed from concatenating | ||||
| @@ -199,7 +218,8 @@ uint_fast64_t | ||||
| | floating-point signaling NaN. | ||||
| | Note:  This macro evaluates its arguments more than once. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_isSigNaNExtF80UI( uiA64, uiA0 ) ((((uiA64) & 0x7FFF) == 0x7FFF) && ! ((uiA0) & UINT64_C( 0x4000000000000000 )) && ((uiA0) & UINT64_C( 0x3FFFFFFFFFFFFFFF ))) | ||||
| #define softfloat_isSigNaNExtF80UI(uiA64, uiA0)                                                                                            \ | ||||
|     ((((uiA64)&0x7FFF) == 0x7FFF) && !((uiA0)&UINT64_C(0x4000000000000000)) && ((uiA0)&UINT64_C(0x3FFFFFFFFFFFFFFF))) | ||||
|  | ||||
| #ifdef SOFTFLOAT_FAST_INT64 | ||||
|  | ||||
| @@ -215,16 +235,14 @@ uint_fast64_t | ||||
| | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_extF80UIToCommonNaN( | ||||
|      uint_fast16_t uiA64, uint_fast64_t uiA0, struct commonNaN *zPtr ); | ||||
| void softfloat_extF80UIToCommonNaN(uint_fast16_t uiA64, uint_fast64_t uiA0, struct commonNaN* zPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into an 80-bit extended | ||||
| | floating-point NaN, and returns the bit pattern of this value as an unsigned | ||||
| | integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| struct uint128 softfloat_commonNaNToExtF80UI( const struct commonNaN *aPtr ); | ||||
| struct uint128 softfloat_commonNaNToExtF80UI(const struct commonNaN* aPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Interpreting the unsigned integer formed from concatenating 'uiA64' and | ||||
| @@ -235,19 +253,13 @@ struct uint128 softfloat_commonNaNToExtF80UI( const struct commonNaN *aPtr ); | ||||
| | result.  If either original floating-point value is a signaling NaN, the | ||||
| | invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| struct uint128 | ||||
|  softfloat_propagateNaNExtF80UI( | ||||
|      uint_fast16_t uiA64, | ||||
|      uint_fast64_t uiA0, | ||||
|      uint_fast16_t uiB64, | ||||
|      uint_fast64_t uiB0 | ||||
|  ); | ||||
| struct uint128 softfloat_propagateNaNExtF80UI(uint_fast16_t uiA64, uint_fast64_t uiA0, uint_fast16_t uiB64, uint_fast64_t uiB0); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The bit pattern for a default generated 128-bit floating-point NaN. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define defaultNaNF128UI64 UINT64_C( 0xFFFF800000000000 ) | ||||
| #define defaultNaNF128UI0  UINT64_C( 0 ) | ||||
| #define defaultNaNF128UI64 UINT64_C(0xFFFF800000000000) | ||||
| #define defaultNaNF128UI0 UINT64_C(0) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Returns true when the 128-bit unsigned integer formed from concatenating | ||||
| @@ -255,7 +267,8 @@ struct uint128 | ||||
| | point signaling NaN. | ||||
| | Note:  This macro evaluates its arguments more than once. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_isSigNaNF128UI( uiA64, uiA0 ) ((((uiA64) & UINT64_C( 0x7FFF800000000000 )) == UINT64_C( 0x7FFF000000000000 )) && ((uiA0) || ((uiA64) & UINT64_C( 0x00007FFFFFFFFFFF )))) | ||||
| #define softfloat_isSigNaNF128UI(uiA64, uiA0)                                                                                              \ | ||||
|     ((((uiA64)&UINT64_C(0x7FFF800000000000)) == UINT64_C(0x7FFF000000000000)) && ((uiA0) || ((uiA64)&UINT64_C(0x00007FFFFFFFFFFF)))) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming the unsigned integer formed from concatenating 'uiA64' and 'uiA0' | ||||
| @@ -264,15 +277,13 @@ struct uint128 | ||||
| | pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid exception | ||||
| | is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_f128UIToCommonNaN( | ||||
|      uint_fast64_t uiA64, uint_fast64_t uiA0, struct commonNaN *zPtr ); | ||||
| void softfloat_f128UIToCommonNaN(uint_fast64_t uiA64, uint_fast64_t uiA0, struct commonNaN* zPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into a 128-bit floating-point | ||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| struct uint128 softfloat_commonNaNToF128UI( const struct commonNaN * ); | ||||
| struct uint128 softfloat_commonNaNToF128UI(const struct commonNaN*); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Interpreting the unsigned integer formed from concatenating 'uiA64' and | ||||
| @@ -283,13 +294,7 @@ struct uint128 softfloat_commonNaNToF128UI( const struct commonNaN * ); | ||||
| | If either original floating-point value is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| struct uint128 | ||||
|  softfloat_propagateNaNF128UI( | ||||
|      uint_fast64_t uiA64, | ||||
|      uint_fast64_t uiA0, | ||||
|      uint_fast64_t uiB64, | ||||
|      uint_fast64_t uiB0 | ||||
|  ); | ||||
| struct uint128 softfloat_propagateNaNF128UI(uint_fast64_t uiA64, uint_fast64_t uiA0, uint_fast64_t uiB64, uint_fast64_t uiB0); | ||||
|  | ||||
| #else | ||||
|  | ||||
| @@ -304,18 +309,14 @@ struct uint128 | ||||
| | common NaN at the location pointed to by 'zPtr'.  If the NaN is a signaling | ||||
| | NaN, the invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_extF80MToCommonNaN( | ||||
|      const struct extFloat80M *aSPtr, struct commonNaN *zPtr ); | ||||
| void softfloat_extF80MToCommonNaN(const struct extFloat80M* aSPtr, struct commonNaN* zPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into an 80-bit extended | ||||
| | floating-point NaN, and stores this NaN at the location pointed to by | ||||
| | 'zSPtr'. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_commonNaNToExtF80M( | ||||
|      const struct commonNaN *aPtr, struct extFloat80M *zSPtr ); | ||||
| void softfloat_commonNaNToExtF80M(const struct commonNaN* aPtr, struct extFloat80M* zSPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming at least one of the two 80-bit extended floating-point values | ||||
| @@ -323,12 +324,7 @@ void | ||||
| | at the location pointed to by 'zSPtr'.  If either original floating-point | ||||
| | value is a signaling NaN, the invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_propagateNaNExtF80M( | ||||
|      const struct extFloat80M *aSPtr, | ||||
|      const struct extFloat80M *bSPtr, | ||||
|      struct extFloat80M *zSPtr | ||||
|  ); | ||||
| void softfloat_propagateNaNExtF80M(const struct extFloat80M* aSPtr, const struct extFloat80M* bSPtr, struct extFloat80M* zSPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The bit pattern for a default generated 128-bit floating-point NaN. | ||||
| @@ -336,7 +332,7 @@ void | ||||
| #define defaultNaNF128UI96 0xFFFF8000 | ||||
| #define defaultNaNF128UI64 0 | ||||
| #define defaultNaNF128UI32 0 | ||||
| #define defaultNaNF128UI0  0 | ||||
| #define defaultNaNF128UI0 0 | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming the 128-bit floating-point value pointed to by 'aWPtr' is a NaN, | ||||
| @@ -346,8 +342,7 @@ void | ||||
| | four 32-bit elements that concatenate in the platform's normal endian order | ||||
| | to form a 128-bit floating-point value. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_f128MToCommonNaN( const uint32_t *aWPtr, struct commonNaN *zPtr ); | ||||
| void softfloat_f128MToCommonNaN(const uint32_t* aWPtr, struct commonNaN* zPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into a 128-bit floating-point | ||||
| @@ -355,8 +350,7 @@ void | ||||
| | 'zWPtr' points to an array of four 32-bit elements that concatenate in the | ||||
| | platform's normal endian order to form a 128-bit floating-point value. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_commonNaNToF128M( const struct commonNaN *aPtr, uint32_t *zWPtr ); | ||||
| void softfloat_commonNaNToF128M(const struct commonNaN* aPtr, uint32_t* zWPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming at least one of the two 128-bit floating-point values pointed to by | ||||
| @@ -366,11 +360,8 @@ void | ||||
| | and 'zWPtr' points to an array of four 32-bit elements that concatenate in | ||||
| | the platform's normal endian order to form a 128-bit floating-point value. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_propagateNaNF128M( | ||||
|      const uint32_t *aWPtr, const uint32_t *bWPtr, uint32_t *zWPtr ); | ||||
| void softfloat_propagateNaNF128M(const uint32_t* aWPtr, const uint32_t* bWPtr, uint32_t* zWPtr); | ||||
|  | ||||
| #endif | ||||
|  | ||||
| #endif | ||||
|  | ||||
|   | ||||
| @@ -37,10 +37,10 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| #ifndef specialize_h | ||||
| #define specialize_h 1 | ||||
|  | ||||
| #include <stdbool.h> | ||||
| #include <stdint.h> | ||||
| #include "primitiveTypes.h" | ||||
| #include "softfloat.h" | ||||
| #include <stdbool.h> | ||||
| #include <stdint.h> | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Default value for 'softfloat_detectTininess'. | ||||
| @@ -53,21 +53,21 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define ui32_fromPosOverflow 0xFFFFFFFF | ||||
| #define ui32_fromNegOverflow 0xFFFFFFFF | ||||
| #define ui32_fromNaN         0xFFFFFFFF | ||||
| #define i32_fromPosOverflow  (-0x7FFFFFFF - 1) | ||||
| #define i32_fromNegOverflow  (-0x7FFFFFFF - 1) | ||||
| #define i32_fromNaN          (-0x7FFFFFFF - 1) | ||||
| #define ui32_fromNaN 0xFFFFFFFF | ||||
| #define i32_fromPosOverflow (-0x7FFFFFFF - 1) | ||||
| #define i32_fromNegOverflow (-0x7FFFFFFF - 1) | ||||
| #define i32_fromNaN (-0x7FFFFFFF - 1) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The values to return on conversions to 64-bit integer formats that raise an | ||||
| | invalid exception. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define ui64_fromPosOverflow UINT64_C( 0xFFFFFFFFFFFFFFFF ) | ||||
| #define ui64_fromNegOverflow UINT64_C( 0xFFFFFFFFFFFFFFFF ) | ||||
| #define ui64_fromNaN         UINT64_C( 0xFFFFFFFFFFFFFFFF ) | ||||
| #define i64_fromPosOverflow  (-INT64_C( 0x7FFFFFFFFFFFFFFF ) - 1) | ||||
| #define i64_fromNegOverflow  (-INT64_C( 0x7FFFFFFFFFFFFFFF ) - 1) | ||||
| #define i64_fromNaN          (-INT64_C( 0x7FFFFFFFFFFFFFFF ) - 1) | ||||
| #define ui64_fromPosOverflow UINT64_C(0xFFFFFFFFFFFFFFFF) | ||||
| #define ui64_fromNegOverflow UINT64_C(0xFFFFFFFFFFFFFFFF) | ||||
| #define ui64_fromNaN UINT64_C(0xFFFFFFFFFFFFFFFF) | ||||
| #define i64_fromPosOverflow (-INT64_C(0x7FFFFFFFFFFFFFFF) - 1) | ||||
| #define i64_fromNegOverflow (-INT64_C(0x7FFFFFFFFFFFFFFF) - 1) | ||||
| #define i64_fromNaN (-INT64_C(0x7FFFFFFFFFFFFFFF) - 1) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | "Common NaN" structure, used to transfer NaN representations from one format | ||||
| @@ -92,7 +92,7 @@ struct commonNaN { | ||||
| | 16-bit floating-point signaling NaN. | ||||
| | Note:  This macro evaluates its argument more than once. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_isSigNaNF16UI( uiA ) ((((uiA) & 0x7E00) == 0x7C00) && ((uiA) & 0x01FF)) | ||||
| #define softfloat_isSigNaNF16UI(uiA) ((((uiA)&0x7E00) == 0x7C00) && ((uiA)&0x01FF)) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming 'uiA' has the bit pattern of a 16-bit floating-point NaN, converts | ||||
| @@ -100,13 +100,13 @@ struct commonNaN { | ||||
| | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void softfloat_f16UIToCommonNaN( uint_fast16_t uiA, struct commonNaN *zPtr ); | ||||
| void softfloat_f16UIToCommonNaN(uint_fast16_t uiA, struct commonNaN* zPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into a 16-bit floating-point | ||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast16_t softfloat_commonNaNToF16UI( const struct commonNaN *aPtr ); | ||||
| uint_fast16_t softfloat_commonNaNToF16UI(const struct commonNaN* aPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Interpreting 'uiA' and 'uiB' as the bit patterns of two 16-bit floating- | ||||
| @@ -114,8 +114,7 @@ uint_fast16_t softfloat_commonNaNToF16UI( const struct commonNaN *aPtr ); | ||||
| | the combined NaN result.  If either 'uiA' or 'uiB' has the pattern of a | ||||
| | signaling NaN, the invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast16_t | ||||
|  softfloat_propagateNaNF16UI( uint_fast16_t uiA, uint_fast16_t uiB ); | ||||
| uint_fast16_t softfloat_propagateNaNF16UI(uint_fast16_t uiA, uint_fast16_t uiB); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The bit pattern for a default generated 32-bit floating-point NaN. | ||||
| @@ -127,7 +126,7 @@ uint_fast16_t | ||||
| | 32-bit floating-point signaling NaN. | ||||
| | Note:  This macro evaluates its argument more than once. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_isSigNaNF32UI( uiA ) ((((uiA) & 0x7FC00000) == 0x7F800000) && ((uiA) & 0x003FFFFF)) | ||||
| #define softfloat_isSigNaNF32UI(uiA) ((((uiA)&0x7FC00000) == 0x7F800000) && ((uiA)&0x003FFFFF)) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming 'uiA' has the bit pattern of a 32-bit floating-point NaN, converts | ||||
| @@ -135,13 +134,13 @@ uint_fast16_t | ||||
| | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void softfloat_f32UIToCommonNaN( uint_fast32_t uiA, struct commonNaN *zPtr ); | ||||
| void softfloat_f32UIToCommonNaN(uint_fast32_t uiA, struct commonNaN* zPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into a 32-bit floating-point | ||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast32_t softfloat_commonNaNToF32UI( const struct commonNaN *aPtr ); | ||||
| uint_fast32_t softfloat_commonNaNToF32UI(const struct commonNaN* aPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Interpreting 'uiA' and 'uiB' as the bit patterns of two 32-bit floating- | ||||
| @@ -149,20 +148,20 @@ uint_fast32_t softfloat_commonNaNToF32UI( const struct commonNaN *aPtr ); | ||||
| | the combined NaN result.  If either 'uiA' or 'uiB' has the pattern of a | ||||
| | signaling NaN, the invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast32_t | ||||
|  softfloat_propagateNaNF32UI( uint_fast32_t uiA, uint_fast32_t uiB ); | ||||
| uint_fast32_t softfloat_propagateNaNF32UI(uint_fast32_t uiA, uint_fast32_t uiB); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The bit pattern for a default generated 64-bit floating-point NaN. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define defaultNaNF64UI UINT64_C( 0xFFF8000000000000 ) | ||||
| #define defaultNaNF64UI UINT64_C(0xFFF8000000000000) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Returns true when 64-bit unsigned integer 'uiA' has the bit pattern of a | ||||
| | 64-bit floating-point signaling NaN. | ||||
| | Note:  This macro evaluates its argument more than once. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_isSigNaNF64UI( uiA ) ((((uiA) & UINT64_C( 0x7FF8000000000000 )) == UINT64_C( 0x7FF0000000000000 )) && ((uiA) & UINT64_C( 0x0007FFFFFFFFFFFF ))) | ||||
| #define softfloat_isSigNaNF64UI(uiA)                                                                                                       \ | ||||
|     ((((uiA)&UINT64_C(0x7FF8000000000000)) == UINT64_C(0x7FF0000000000000)) && ((uiA)&UINT64_C(0x0007FFFFFFFFFFFF))) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming 'uiA' has the bit pattern of a 64-bit floating-point NaN, converts | ||||
| @@ -170,13 +169,13 @@ uint_fast32_t | ||||
| | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void softfloat_f64UIToCommonNaN( uint_fast64_t uiA, struct commonNaN *zPtr ); | ||||
| void softfloat_f64UIToCommonNaN(uint_fast64_t uiA, struct commonNaN* zPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into a 64-bit floating-point | ||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast64_t softfloat_commonNaNToF64UI( const struct commonNaN *aPtr ); | ||||
| uint_fast64_t softfloat_commonNaNToF64UI(const struct commonNaN* aPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Interpreting 'uiA' and 'uiB' as the bit patterns of two 64-bit floating- | ||||
| @@ -184,14 +183,13 @@ uint_fast64_t softfloat_commonNaNToF64UI( const struct commonNaN *aPtr ); | ||||
| | the combined NaN result.  If either 'uiA' or 'uiB' has the pattern of a | ||||
| | signaling NaN, the invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast64_t | ||||
|  softfloat_propagateNaNF64UI( uint_fast64_t uiA, uint_fast64_t uiB ); | ||||
| uint_fast64_t softfloat_propagateNaNF64UI(uint_fast64_t uiA, uint_fast64_t uiB); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The bit pattern for a default generated 80-bit extended floating-point NaN. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define defaultNaNExtF80UI64 0xFFFF | ||||
| #define defaultNaNExtF80UI0  UINT64_C( 0xC000000000000000 ) | ||||
| #define defaultNaNExtF80UI0 UINT64_C(0xC000000000000000) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Returns true when the 80-bit unsigned integer formed from concatenating | ||||
| @@ -199,7 +197,8 @@ uint_fast64_t | ||||
| | floating-point signaling NaN. | ||||
| | Note:  This macro evaluates its arguments more than once. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_isSigNaNExtF80UI( uiA64, uiA0 ) ((((uiA64) & 0x7FFF) == 0x7FFF) && ! ((uiA0) & UINT64_C( 0x4000000000000000 )) && ((uiA0) & UINT64_C( 0x3FFFFFFFFFFFFFFF ))) | ||||
| #define softfloat_isSigNaNExtF80UI(uiA64, uiA0)                                                                                            \ | ||||
|     ((((uiA64)&0x7FFF) == 0x7FFF) && !((uiA0)&UINT64_C(0x4000000000000000)) && ((uiA0)&UINT64_C(0x3FFFFFFFFFFFFFFF))) | ||||
|  | ||||
| #ifdef SOFTFLOAT_FAST_INT64 | ||||
|  | ||||
| @@ -215,16 +214,14 @@ uint_fast64_t | ||||
| | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_extF80UIToCommonNaN( | ||||
|      uint_fast16_t uiA64, uint_fast64_t uiA0, struct commonNaN *zPtr ); | ||||
| void softfloat_extF80UIToCommonNaN(uint_fast16_t uiA64, uint_fast64_t uiA0, struct commonNaN* zPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into an 80-bit extended | ||||
| | floating-point NaN, and returns the bit pattern of this value as an unsigned | ||||
| | integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| struct uint128 softfloat_commonNaNToExtF80UI( const struct commonNaN *aPtr ); | ||||
| struct uint128 softfloat_commonNaNToExtF80UI(const struct commonNaN* aPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Interpreting the unsigned integer formed from concatenating 'uiA64' and | ||||
| @@ -235,19 +232,13 @@ struct uint128 softfloat_commonNaNToExtF80UI( const struct commonNaN *aPtr ); | ||||
| | result.  If either original floating-point value is a signaling NaN, the | ||||
| | invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| struct uint128 | ||||
|  softfloat_propagateNaNExtF80UI( | ||||
|      uint_fast16_t uiA64, | ||||
|      uint_fast64_t uiA0, | ||||
|      uint_fast16_t uiB64, | ||||
|      uint_fast64_t uiB0 | ||||
|  ); | ||||
| struct uint128 softfloat_propagateNaNExtF80UI(uint_fast16_t uiA64, uint_fast64_t uiA0, uint_fast16_t uiB64, uint_fast64_t uiB0); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The bit pattern for a default generated 128-bit floating-point NaN. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define defaultNaNF128UI64 UINT64_C( 0xFFFF800000000000 ) | ||||
| #define defaultNaNF128UI0  UINT64_C( 0 ) | ||||
| #define defaultNaNF128UI64 UINT64_C(0xFFFF800000000000) | ||||
| #define defaultNaNF128UI0 UINT64_C(0) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Returns true when the 128-bit unsigned integer formed from concatenating | ||||
| @@ -255,7 +246,8 @@ struct uint128 | ||||
| | point signaling NaN. | ||||
| | Note:  This macro evaluates its arguments more than once. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_isSigNaNF128UI( uiA64, uiA0 ) ((((uiA64) & UINT64_C( 0x7FFF800000000000 )) == UINT64_C( 0x7FFF000000000000 )) && ((uiA0) || ((uiA64) & UINT64_C( 0x00007FFFFFFFFFFF )))) | ||||
| #define softfloat_isSigNaNF128UI(uiA64, uiA0)                                                                                              \ | ||||
|     ((((uiA64)&UINT64_C(0x7FFF800000000000)) == UINT64_C(0x7FFF000000000000)) && ((uiA0) || ((uiA64)&UINT64_C(0x00007FFFFFFFFFFF)))) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming the unsigned integer formed from concatenating 'uiA64' and 'uiA0' | ||||
| @@ -264,15 +256,13 @@ struct uint128 | ||||
| | pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid exception | ||||
| | is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_f128UIToCommonNaN( | ||||
|      uint_fast64_t uiA64, uint_fast64_t uiA0, struct commonNaN *zPtr ); | ||||
| void softfloat_f128UIToCommonNaN(uint_fast64_t uiA64, uint_fast64_t uiA0, struct commonNaN* zPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into a 128-bit floating-point | ||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| struct uint128 softfloat_commonNaNToF128UI( const struct commonNaN * ); | ||||
| struct uint128 softfloat_commonNaNToF128UI(const struct commonNaN*); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Interpreting the unsigned integer formed from concatenating 'uiA64' and | ||||
| @@ -283,13 +273,7 @@ struct uint128 softfloat_commonNaNToF128UI( const struct commonNaN * ); | ||||
| | If either original floating-point value is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| struct uint128 | ||||
|  softfloat_propagateNaNF128UI( | ||||
|      uint_fast64_t uiA64, | ||||
|      uint_fast64_t uiA0, | ||||
|      uint_fast64_t uiB64, | ||||
|      uint_fast64_t uiB0 | ||||
|  ); | ||||
| struct uint128 softfloat_propagateNaNF128UI(uint_fast64_t uiA64, uint_fast64_t uiA0, uint_fast64_t uiB64, uint_fast64_t uiB0); | ||||
|  | ||||
| #else | ||||
|  | ||||
| @@ -304,18 +288,14 @@ struct uint128 | ||||
| | common NaN at the location pointed to by 'zPtr'.  If the NaN is a signaling | ||||
| | NaN, the invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_extF80MToCommonNaN( | ||||
|      const struct extFloat80M *aSPtr, struct commonNaN *zPtr ); | ||||
| void softfloat_extF80MToCommonNaN(const struct extFloat80M* aSPtr, struct commonNaN* zPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into an 80-bit extended | ||||
| | floating-point NaN, and stores this NaN at the location pointed to by | ||||
| | 'zSPtr'. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_commonNaNToExtF80M( | ||||
|      const struct commonNaN *aPtr, struct extFloat80M *zSPtr ); | ||||
| void softfloat_commonNaNToExtF80M(const struct commonNaN* aPtr, struct extFloat80M* zSPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming at least one of the two 80-bit extended floating-point values | ||||
| @@ -323,12 +303,7 @@ void | ||||
| | at the location pointed to by 'zSPtr'.  If either original floating-point | ||||
| | value is a signaling NaN, the invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_propagateNaNExtF80M( | ||||
|      const struct extFloat80M *aSPtr, | ||||
|      const struct extFloat80M *bSPtr, | ||||
|      struct extFloat80M *zSPtr | ||||
|  ); | ||||
| void softfloat_propagateNaNExtF80M(const struct extFloat80M* aSPtr, const struct extFloat80M* bSPtr, struct extFloat80M* zSPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The bit pattern for a default generated 128-bit floating-point NaN. | ||||
| @@ -336,7 +311,7 @@ void | ||||
| #define defaultNaNF128UI96 0xFFFF8000 | ||||
| #define defaultNaNF128UI64 0 | ||||
| #define defaultNaNF128UI32 0 | ||||
| #define defaultNaNF128UI0  0 | ||||
| #define defaultNaNF128UI0 0 | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming the 128-bit floating-point value pointed to by 'aWPtr' is a NaN, | ||||
| @@ -346,8 +321,7 @@ void | ||||
| | four 32-bit elements that concatenate in the platform's normal endian order | ||||
| | to form a 128-bit floating-point value. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_f128MToCommonNaN( const uint32_t *aWPtr, struct commonNaN *zPtr ); | ||||
| void softfloat_f128MToCommonNaN(const uint32_t* aWPtr, struct commonNaN* zPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into a 128-bit floating-point | ||||
| @@ -355,8 +329,7 @@ void | ||||
| | 'zWPtr' points to an array of four 32-bit elements that concatenate in the | ||||
| | platform's normal endian order to form a 128-bit floating-point value. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_commonNaNToF128M( const struct commonNaN *aPtr, uint32_t *zWPtr ); | ||||
| void softfloat_commonNaNToF128M(const struct commonNaN* aPtr, uint32_t* zWPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming at least one of the two 128-bit floating-point values pointed to by | ||||
| @@ -366,11 +339,8 @@ void | ||||
| | and 'zWPtr' points to an array of four 32-bit elements that concatenate in | ||||
| | the platform's normal endian order to form a 128-bit floating-point value. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_propagateNaNF128M( | ||||
|      const uint32_t *aWPtr, const uint32_t *bWPtr, uint32_t *zWPtr ); | ||||
| void softfloat_propagateNaNF128M(const uint32_t* aWPtr, const uint32_t* bWPtr, uint32_t* zWPtr); | ||||
|  | ||||
| #endif | ||||
|  | ||||
| #endif | ||||
|  | ||||
|   | ||||
| @@ -37,10 +37,10 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| #ifndef specialize_h | ||||
| #define specialize_h 1 | ||||
|  | ||||
| #include <stdbool.h> | ||||
| #include <stdint.h> | ||||
| #include "primitiveTypes.h" | ||||
| #include "softfloat.h" | ||||
| #include <stdbool.h> | ||||
| #include <stdint.h> | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Default value for 'softfloat_detectTininess'. | ||||
| @@ -53,27 +53,29 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define ui32_fromPosOverflow 0xFFFFFFFF | ||||
| #define ui32_fromNegOverflow 0 | ||||
| #define ui32_fromNaN         0 | ||||
| #define i32_fromPosOverflow  0x7FFFFFFF | ||||
| #define i32_fromNegOverflow  (-0x7FFFFFFF - 1) | ||||
| #define i32_fromNaN          0 | ||||
| #define ui32_fromNaN 0 | ||||
| #define i32_fromPosOverflow 0x7FFFFFFF | ||||
| #define i32_fromNegOverflow (-0x7FFFFFFF - 1) | ||||
| #define i32_fromNaN 0 | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The values to return on conversions to 64-bit integer formats that raise an | ||||
| | invalid exception. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define ui64_fromPosOverflow UINT64_C( 0xFFFFFFFFFFFFFFFF ) | ||||
| #define ui64_fromPosOverflow UINT64_C(0xFFFFFFFFFFFFFFFF) | ||||
| #define ui64_fromNegOverflow 0 | ||||
| #define ui64_fromNaN         0 | ||||
| #define i64_fromPosOverflow  INT64_C( 0x7FFFFFFFFFFFFFFF ) | ||||
| #define i64_fromNegOverflow  (-INT64_C( 0x7FFFFFFFFFFFFFFF ) - 1) | ||||
| #define i64_fromNaN          0 | ||||
| #define ui64_fromNaN 0 | ||||
| #define i64_fromPosOverflow INT64_C(0x7FFFFFFFFFFFFFFF) | ||||
| #define i64_fromNegOverflow (-INT64_C(0x7FFFFFFFFFFFFFFF) - 1) | ||||
| #define i64_fromNaN 0 | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | "Common NaN" structure, used to transfer NaN representations from one format | ||||
| | to another. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| struct commonNaN { char _unused; }; | ||||
| struct commonNaN { | ||||
|     char _unused; | ||||
| }; | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The bit pattern for a default generated 16-bit floating-point NaN. | ||||
| @@ -85,7 +87,7 @@ struct commonNaN { char _unused; }; | ||||
| | 16-bit floating-point signaling NaN. | ||||
| | Note:  This macro evaluates its argument more than once. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_isSigNaNF16UI( uiA ) ((((uiA) & 0x7E00) == 0x7C00) && ((uiA) & 0x01FF)) | ||||
| #define softfloat_isSigNaNF16UI(uiA) ((((uiA)&0x7E00) == 0x7C00) && ((uiA)&0x01FF)) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming 'uiA' has the bit pattern of a 16-bit floating-point NaN, converts | ||||
| @@ -93,13 +95,15 @@ struct commonNaN { char _unused; }; | ||||
| | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_f16UIToCommonNaN( uiA, zPtr ) if ( ! ((uiA) & 0x0200) ) softfloat_raiseFlags( softfloat_flag_invalid ) | ||||
| #define softfloat_f16UIToCommonNaN(uiA, zPtr)                                                                                              \ | ||||
|     if(!((uiA)&0x0200))                                                                                                                    \ | ||||
|     softfloat_raiseFlags(softfloat_flag_invalid) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into a 16-bit floating-point | ||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_commonNaNToF16UI( aPtr ) ((uint_fast16_t) defaultNaNF16UI) | ||||
| #define softfloat_commonNaNToF16UI(aPtr) ((uint_fast16_t)defaultNaNF16UI) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Interpreting 'uiA' and 'uiB' as the bit patterns of two 16-bit floating- | ||||
| @@ -107,8 +111,7 @@ struct commonNaN { char _unused; }; | ||||
| | the combined NaN result.  If either 'uiA' or 'uiB' has the pattern of a | ||||
| | signaling NaN, the invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast16_t | ||||
|  softfloat_propagateNaNF16UI( uint_fast16_t uiA, uint_fast16_t uiB ); | ||||
| uint_fast16_t softfloat_propagateNaNF16UI(uint_fast16_t uiA, uint_fast16_t uiB); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The bit pattern for a default generated 32-bit floating-point NaN. | ||||
| @@ -120,7 +123,7 @@ uint_fast16_t | ||||
| | 32-bit floating-point signaling NaN. | ||||
| | Note:  This macro evaluates its argument more than once. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_isSigNaNF32UI( uiA ) ((((uiA) & 0x7FC00000) == 0x7F800000) && ((uiA) & 0x003FFFFF)) | ||||
| #define softfloat_isSigNaNF32UI(uiA) ((((uiA)&0x7FC00000) == 0x7F800000) && ((uiA)&0x003FFFFF)) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming 'uiA' has the bit pattern of a 32-bit floating-point NaN, converts | ||||
| @@ -128,13 +131,15 @@ uint_fast16_t | ||||
| | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_f32UIToCommonNaN( uiA, zPtr ) if ( ! ((uiA) & 0x00400000) ) softfloat_raiseFlags( softfloat_flag_invalid ) | ||||
| #define softfloat_f32UIToCommonNaN(uiA, zPtr)                                                                                              \ | ||||
|     if(!((uiA)&0x00400000))                                                                                                                \ | ||||
|     softfloat_raiseFlags(softfloat_flag_invalid) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into a 32-bit floating-point | ||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_commonNaNToF32UI( aPtr ) ((uint_fast32_t) defaultNaNF32UI) | ||||
| #define softfloat_commonNaNToF32UI(aPtr) ((uint_fast32_t)defaultNaNF32UI) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Interpreting 'uiA' and 'uiB' as the bit patterns of two 32-bit floating- | ||||
| @@ -142,20 +147,20 @@ uint_fast16_t | ||||
| | the combined NaN result.  If either 'uiA' or 'uiB' has the pattern of a | ||||
| | signaling NaN, the invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast32_t | ||||
|  softfloat_propagateNaNF32UI( uint_fast32_t uiA, uint_fast32_t uiB ); | ||||
| uint_fast32_t softfloat_propagateNaNF32UI(uint_fast32_t uiA, uint_fast32_t uiB); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The bit pattern for a default generated 64-bit floating-point NaN. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define defaultNaNF64UI UINT64_C( 0x7FF8000000000000 ) | ||||
| #define defaultNaNF64UI UINT64_C(0x7FF8000000000000) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Returns true when 64-bit unsigned integer 'uiA' has the bit pattern of a | ||||
| | 64-bit floating-point signaling NaN. | ||||
| | Note:  This macro evaluates its argument more than once. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_isSigNaNF64UI( uiA ) ((((uiA) & UINT64_C( 0x7FF8000000000000 )) == UINT64_C( 0x7FF0000000000000 )) && ((uiA) & UINT64_C( 0x0007FFFFFFFFFFFF ))) | ||||
| #define softfloat_isSigNaNF64UI(uiA)                                                                                                       \ | ||||
|     ((((uiA)&UINT64_C(0x7FF8000000000000)) == UINT64_C(0x7FF0000000000000)) && ((uiA)&UINT64_C(0x0007FFFFFFFFFFFF))) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming 'uiA' has the bit pattern of a 64-bit floating-point NaN, converts | ||||
| @@ -163,13 +168,15 @@ uint_fast32_t | ||||
| | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_f64UIToCommonNaN( uiA, zPtr ) if ( ! ((uiA) & UINT64_C( 0x0008000000000000 )) ) softfloat_raiseFlags( softfloat_flag_invalid ) | ||||
| #define softfloat_f64UIToCommonNaN(uiA, zPtr)                                                                                              \ | ||||
|     if(!((uiA)&UINT64_C(0x0008000000000000)))                                                                                              \ | ||||
|     softfloat_raiseFlags(softfloat_flag_invalid) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into a 64-bit floating-point | ||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_commonNaNToF64UI( aPtr ) ((uint_fast64_t) defaultNaNF64UI) | ||||
| #define softfloat_commonNaNToF64UI(aPtr) ((uint_fast64_t)defaultNaNF64UI) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Interpreting 'uiA' and 'uiB' as the bit patterns of two 64-bit floating- | ||||
| @@ -177,14 +184,13 @@ uint_fast32_t | ||||
| | the combined NaN result.  If either 'uiA' or 'uiB' has the pattern of a | ||||
| | signaling NaN, the invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast64_t | ||||
|  softfloat_propagateNaNF64UI( uint_fast64_t uiA, uint_fast64_t uiB ); | ||||
| uint_fast64_t softfloat_propagateNaNF64UI(uint_fast64_t uiA, uint_fast64_t uiB); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The bit pattern for a default generated 80-bit extended floating-point NaN. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define defaultNaNExtF80UI64 0x7FFF | ||||
| #define defaultNaNExtF80UI0  UINT64_C( 0xC000000000000000 ) | ||||
| #define defaultNaNExtF80UI0 UINT64_C(0xC000000000000000) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Returns true when the 80-bit unsigned integer formed from concatenating | ||||
| @@ -192,7 +198,8 @@ uint_fast64_t | ||||
| | floating-point signaling NaN. | ||||
| | Note:  This macro evaluates its arguments more than once. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_isSigNaNExtF80UI( uiA64, uiA0 ) ((((uiA64) & 0x7FFF) == 0x7FFF) && ! ((uiA0) & UINT64_C( 0x4000000000000000 )) && ((uiA0) & UINT64_C( 0x3FFFFFFFFFFFFFFF ))) | ||||
| #define softfloat_isSigNaNExtF80UI(uiA64, uiA0)                                                                                            \ | ||||
|     ((((uiA64)&0x7FFF) == 0x7FFF) && !((uiA0)&UINT64_C(0x4000000000000000)) && ((uiA0)&UINT64_C(0x3FFFFFFFFFFFFFFF))) | ||||
|  | ||||
| #ifdef SOFTFLOAT_FAST_INT64 | ||||
|  | ||||
| @@ -208,24 +215,25 @@ uint_fast64_t | ||||
| | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_extF80UIToCommonNaN( uiA64, uiA0, zPtr ) if ( ! ((uiA0) & UINT64_C( 0x4000000000000000 )) ) softfloat_raiseFlags( softfloat_flag_invalid ) | ||||
| #define softfloat_extF80UIToCommonNaN(uiA64, uiA0, zPtr)                                                                                   \ | ||||
|     if(!((uiA0)&UINT64_C(0x4000000000000000)))                                                                                             \ | ||||
|     softfloat_raiseFlags(softfloat_flag_invalid) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into an 80-bit extended | ||||
| | floating-point NaN, and returns the bit pattern of this value as an unsigned | ||||
| | integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #if defined INLINE && ! defined softfloat_commonNaNToExtF80UI | ||||
| #if defined INLINE && !defined softfloat_commonNaNToExtF80UI | ||||
| INLINE | ||||
| struct uint128 softfloat_commonNaNToExtF80UI( const struct commonNaN *aPtr ) | ||||
| { | ||||
| struct uint128 softfloat_commonNaNToExtF80UI(const struct commonNaN* aPtr) { | ||||
|     struct uint128 uiZ; | ||||
|     uiZ.v64 = defaultNaNExtF80UI64; | ||||
|     uiZ.v0  = defaultNaNExtF80UI0; | ||||
|     uiZ.v0 = defaultNaNExtF80UI0; | ||||
|     return uiZ; | ||||
| } | ||||
| #else | ||||
| struct uint128 softfloat_commonNaNToExtF80UI( const struct commonNaN *aPtr ); | ||||
| struct uint128 softfloat_commonNaNToExtF80UI(const struct commonNaN* aPtr); | ||||
| #endif | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| @@ -237,19 +245,13 @@ struct uint128 softfloat_commonNaNToExtF80UI( const struct commonNaN *aPtr ); | ||||
| | result.  If either original floating-point value is a signaling NaN, the | ||||
| | invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| struct uint128 | ||||
|  softfloat_propagateNaNExtF80UI( | ||||
|      uint_fast16_t uiA64, | ||||
|      uint_fast64_t uiA0, | ||||
|      uint_fast16_t uiB64, | ||||
|      uint_fast64_t uiB0 | ||||
|  ); | ||||
| struct uint128 softfloat_propagateNaNExtF80UI(uint_fast16_t uiA64, uint_fast64_t uiA0, uint_fast16_t uiB64, uint_fast64_t uiB0); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The bit pattern for a default generated 128-bit floating-point NaN. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define defaultNaNF128UI64 UINT64_C( 0x7FFF800000000000 ) | ||||
| #define defaultNaNF128UI0  UINT64_C( 0 ) | ||||
| #define defaultNaNF128UI64 UINT64_C(0x7FFF800000000000) | ||||
| #define defaultNaNF128UI0 UINT64_C(0) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Returns true when the 128-bit unsigned integer formed from concatenating | ||||
| @@ -257,7 +259,8 @@ struct uint128 | ||||
| | point signaling NaN. | ||||
| | Note:  This macro evaluates its arguments more than once. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_isSigNaNF128UI( uiA64, uiA0 ) ((((uiA64) & UINT64_C( 0x7FFF800000000000 )) == UINT64_C( 0x7FFF000000000000 )) && ((uiA0) || ((uiA64) & UINT64_C( 0x00007FFFFFFFFFFF )))) | ||||
| #define softfloat_isSigNaNF128UI(uiA64, uiA0)                                                                                              \ | ||||
|     ((((uiA64)&UINT64_C(0x7FFF800000000000)) == UINT64_C(0x7FFF000000000000)) && ((uiA0) || ((uiA64)&UINT64_C(0x00007FFFFFFFFFFF)))) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming the unsigned integer formed from concatenating 'uiA64' and 'uiA0' | ||||
| @@ -266,23 +269,24 @@ struct uint128 | ||||
| | pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid exception | ||||
| | is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_f128UIToCommonNaN( uiA64, uiA0, zPtr ) if ( ! ((uiA64) & UINT64_C( 0x0000800000000000 )) ) softfloat_raiseFlags( softfloat_flag_invalid ) | ||||
| #define softfloat_f128UIToCommonNaN(uiA64, uiA0, zPtr)                                                                                     \ | ||||
|     if(!((uiA64)&UINT64_C(0x0000800000000000)))                                                                                            \ | ||||
|     softfloat_raiseFlags(softfloat_flag_invalid) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into a 128-bit floating-point | ||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #if defined INLINE && ! defined softfloat_commonNaNToF128UI | ||||
| #if defined INLINE && !defined softfloat_commonNaNToF128UI | ||||
| INLINE | ||||
| struct uint128 softfloat_commonNaNToF128UI( const struct commonNaN *aPtr ) | ||||
| { | ||||
| struct uint128 softfloat_commonNaNToF128UI(const struct commonNaN* aPtr) { | ||||
|     struct uint128 uiZ; | ||||
|     uiZ.v64 = defaultNaNF128UI64; | ||||
|     uiZ.v0  = defaultNaNF128UI0; | ||||
|     uiZ.v0 = defaultNaNF128UI0; | ||||
|     return uiZ; | ||||
| } | ||||
| #else | ||||
| struct uint128 softfloat_commonNaNToF128UI( const struct commonNaN * ); | ||||
| struct uint128 softfloat_commonNaNToF128UI(const struct commonNaN*); | ||||
| #endif | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| @@ -294,13 +298,7 @@ struct uint128 softfloat_commonNaNToF128UI( const struct commonNaN * ); | ||||
| | If either original floating-point value is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| struct uint128 | ||||
|  softfloat_propagateNaNF128UI( | ||||
|      uint_fast64_t uiA64, | ||||
|      uint_fast64_t uiA0, | ||||
|      uint_fast64_t uiB64, | ||||
|      uint_fast64_t uiB0 | ||||
|  ); | ||||
| struct uint128 softfloat_propagateNaNF128UI(uint_fast64_t uiA64, uint_fast64_t uiA0, uint_fast64_t uiB64, uint_fast64_t uiB0); | ||||
|  | ||||
| #else | ||||
|  | ||||
| @@ -315,26 +313,23 @@ struct uint128 | ||||
| | common NaN at the location pointed to by 'zPtr'.  If the NaN is a signaling | ||||
| | NaN, the invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_extF80MToCommonNaN( aSPtr, zPtr ) if ( ! ((aSPtr)->signif & UINT64_C( 0x4000000000000000 )) ) softfloat_raiseFlags( softfloat_flag_invalid ) | ||||
| #define softfloat_extF80MToCommonNaN(aSPtr, zPtr)                                                                                          \ | ||||
|     if(!((aSPtr)->signif & UINT64_C(0x4000000000000000)))                                                                                  \ | ||||
|     softfloat_raiseFlags(softfloat_flag_invalid) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into an 80-bit extended | ||||
| | floating-point NaN, and stores this NaN at the location pointed to by | ||||
| | 'zSPtr'. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #if defined INLINE && ! defined softfloat_commonNaNToExtF80M | ||||
| #if defined INLINE && !defined softfloat_commonNaNToExtF80M | ||||
| INLINE | ||||
| void | ||||
|  softfloat_commonNaNToExtF80M( | ||||
|      const struct commonNaN *aPtr, struct extFloat80M *zSPtr ) | ||||
| { | ||||
| void softfloat_commonNaNToExtF80M(const struct commonNaN* aPtr, struct extFloat80M* zSPtr) { | ||||
|     zSPtr->signExp = defaultNaNExtF80UI64; | ||||
|     zSPtr->signif  = defaultNaNExtF80UI0; | ||||
|     zSPtr->signif = defaultNaNExtF80UI0; | ||||
| } | ||||
| #else | ||||
| void | ||||
|  softfloat_commonNaNToExtF80M( | ||||
|      const struct commonNaN *aPtr, struct extFloat80M *zSPtr ); | ||||
| void softfloat_commonNaNToExtF80M(const struct commonNaN* aPtr, struct extFloat80M* zSPtr); | ||||
| #endif | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| @@ -343,12 +338,7 @@ void | ||||
| | at the location pointed to by 'zSPtr'.  If either original floating-point | ||||
| | value is a signaling NaN, the invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_propagateNaNExtF80M( | ||||
|      const struct extFloat80M *aSPtr, | ||||
|      const struct extFloat80M *bSPtr, | ||||
|      struct extFloat80M *zSPtr | ||||
|  ); | ||||
| void softfloat_propagateNaNExtF80M(const struct extFloat80M* aSPtr, const struct extFloat80M* bSPtr, struct extFloat80M* zSPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The bit pattern for a default generated 128-bit floating-point NaN. | ||||
| @@ -356,7 +346,7 @@ void | ||||
| #define defaultNaNF128UI96 0x7FFF8000 | ||||
| #define defaultNaNF128UI64 0 | ||||
| #define defaultNaNF128UI32 0 | ||||
| #define defaultNaNF128UI0  0 | ||||
| #define defaultNaNF128UI0 0 | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming the 128-bit floating-point value pointed to by 'aWPtr' is a NaN, | ||||
| @@ -366,7 +356,9 @@ void | ||||
| | four 32-bit elements that concatenate in the platform's normal endian order | ||||
| | to form a 128-bit floating-point value. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_f128MToCommonNaN( aWPtr, zPtr ) if ( ! ((aWPtr)[indexWordHi( 4 )] & UINT64_C( 0x0000800000000000 )) ) softfloat_raiseFlags( softfloat_flag_invalid ) | ||||
| #define softfloat_f128MToCommonNaN(aWPtr, zPtr)                                                                                            \ | ||||
|     if(!((aWPtr)[indexWordHi(4)] & UINT64_C(0x0000800000000000)))                                                                          \ | ||||
|     softfloat_raiseFlags(softfloat_flag_invalid) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into a 128-bit floating-point | ||||
| @@ -374,19 +366,16 @@ void | ||||
| | 'zWPtr' points to an array of four 32-bit elements that concatenate in the | ||||
| | platform's normal endian order to form a 128-bit floating-point value. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #if defined INLINE && ! defined softfloat_commonNaNToF128M | ||||
| #if defined INLINE && !defined softfloat_commonNaNToF128M | ||||
| INLINE | ||||
| void | ||||
|  softfloat_commonNaNToF128M( const struct commonNaN *aPtr, uint32_t *zWPtr ) | ||||
| { | ||||
|     zWPtr[indexWord( 4, 3 )] = defaultNaNF128UI96; | ||||
|     zWPtr[indexWord( 4, 2 )] = defaultNaNF128UI64; | ||||
|     zWPtr[indexWord( 4, 1 )] = defaultNaNF128UI32; | ||||
|     zWPtr[indexWord( 4, 0 )] = defaultNaNF128UI0; | ||||
| void softfloat_commonNaNToF128M(const struct commonNaN* aPtr, uint32_t* zWPtr) { | ||||
|     zWPtr[indexWord(4, 3)] = defaultNaNF128UI96; | ||||
|     zWPtr[indexWord(4, 2)] = defaultNaNF128UI64; | ||||
|     zWPtr[indexWord(4, 1)] = defaultNaNF128UI32; | ||||
|     zWPtr[indexWord(4, 0)] = defaultNaNF128UI0; | ||||
| } | ||||
| #else | ||||
| void | ||||
|  softfloat_commonNaNToF128M( const struct commonNaN *aPtr, uint32_t *zWPtr ); | ||||
| void softfloat_commonNaNToF128M(const struct commonNaN* aPtr, uint32_t* zWPtr); | ||||
| #endif | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| @@ -397,11 +386,8 @@ void | ||||
| | and 'zWPtr' points to an array of four 32-bit elements that concatenate in | ||||
| | the platform's normal endian order to form a 128-bit floating-point value. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_propagateNaNF128M( | ||||
|      const uint32_t *aWPtr, const uint32_t *bWPtr, uint32_t *zWPtr ); | ||||
| void softfloat_propagateNaNF128M(const uint32_t* aWPtr, const uint32_t* bWPtr, uint32_t* zWPtr); | ||||
|  | ||||
| #endif | ||||
|  | ||||
| #endif | ||||
|  | ||||
|   | ||||
| @@ -37,10 +37,10 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| #ifndef specialize_h | ||||
| #define specialize_h 1 | ||||
|  | ||||
| #include <stdbool.h> | ||||
| #include <stdint.h> | ||||
| #include "primitiveTypes.h" | ||||
| #include "softfloat.h" | ||||
| #include <stdbool.h> | ||||
| #include <stdint.h> | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Default value for 'softfloat_detectTininess'. | ||||
| @@ -53,21 +53,21 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define ui32_fromPosOverflow 0xFFFFFFFF | ||||
| #define ui32_fromNegOverflow 0 | ||||
| #define ui32_fromNaN         0 | ||||
| #define i32_fromPosOverflow  0x7FFFFFFF | ||||
| #define i32_fromNegOverflow  (-0x7FFFFFFF - 1) | ||||
| #define i32_fromNaN          0 | ||||
| #define ui32_fromNaN 0 | ||||
| #define i32_fromPosOverflow 0x7FFFFFFF | ||||
| #define i32_fromNegOverflow (-0x7FFFFFFF - 1) | ||||
| #define i32_fromNaN 0 | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The values to return on conversions to 64-bit integer formats that raise an | ||||
| | invalid exception. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define ui64_fromPosOverflow UINT64_C( 0xFFFFFFFFFFFFFFFF ) | ||||
| #define ui64_fromPosOverflow UINT64_C(0xFFFFFFFFFFFFFFFF) | ||||
| #define ui64_fromNegOverflow 0 | ||||
| #define ui64_fromNaN         0 | ||||
| #define i64_fromPosOverflow  INT64_C( 0x7FFFFFFFFFFFFFFF ) | ||||
| #define i64_fromNegOverflow  (-INT64_C( 0x7FFFFFFFFFFFFFFF ) - 1) | ||||
| #define i64_fromNaN          0 | ||||
| #define ui64_fromNaN 0 | ||||
| #define i64_fromPosOverflow INT64_C(0x7FFFFFFFFFFFFFFF) | ||||
| #define i64_fromNegOverflow (-INT64_C(0x7FFFFFFFFFFFFFFF) - 1) | ||||
| #define i64_fromNaN 0 | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | "Common NaN" structure, used to transfer NaN representations from one format | ||||
| @@ -92,7 +92,7 @@ struct commonNaN { | ||||
| | 16-bit floating-point signaling NaN. | ||||
| | Note:  This macro evaluates its argument more than once. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_isSigNaNF16UI( uiA ) ((((uiA) & 0x7E00) == 0x7C00) && ((uiA) & 0x01FF)) | ||||
| #define softfloat_isSigNaNF16UI(uiA) ((((uiA)&0x7E00) == 0x7C00) && ((uiA)&0x01FF)) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming 'uiA' has the bit pattern of a 16-bit floating-point NaN, converts | ||||
| @@ -100,13 +100,13 @@ struct commonNaN { | ||||
| | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void softfloat_f16UIToCommonNaN( uint_fast16_t uiA, struct commonNaN *zPtr ); | ||||
| void softfloat_f16UIToCommonNaN(uint_fast16_t uiA, struct commonNaN* zPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into a 16-bit floating-point | ||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast16_t softfloat_commonNaNToF16UI( const struct commonNaN *aPtr ); | ||||
| uint_fast16_t softfloat_commonNaNToF16UI(const struct commonNaN* aPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Interpreting 'uiA' and 'uiB' as the bit patterns of two 16-bit floating- | ||||
| @@ -114,8 +114,7 @@ uint_fast16_t softfloat_commonNaNToF16UI( const struct commonNaN *aPtr ); | ||||
| | the combined NaN result.  If either 'uiA' or 'uiB' has the pattern of a | ||||
| | signaling NaN, the invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast16_t | ||||
|  softfloat_propagateNaNF16UI( uint_fast16_t uiA, uint_fast16_t uiB ); | ||||
| uint_fast16_t softfloat_propagateNaNF16UI(uint_fast16_t uiA, uint_fast16_t uiB); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The bit pattern for a default generated 32-bit floating-point NaN. | ||||
| @@ -127,7 +126,7 @@ uint_fast16_t | ||||
| | 32-bit floating-point signaling NaN. | ||||
| | Note:  This macro evaluates its argument more than once. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_isSigNaNF32UI( uiA ) ((((uiA) & 0x7FC00000) == 0x7F800000) && ((uiA) & 0x003FFFFF)) | ||||
| #define softfloat_isSigNaNF32UI(uiA) ((((uiA)&0x7FC00000) == 0x7F800000) && ((uiA)&0x003FFFFF)) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming 'uiA' has the bit pattern of a 32-bit floating-point NaN, converts | ||||
| @@ -135,13 +134,13 @@ uint_fast16_t | ||||
| | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void softfloat_f32UIToCommonNaN( uint_fast32_t uiA, struct commonNaN *zPtr ); | ||||
| void softfloat_f32UIToCommonNaN(uint_fast32_t uiA, struct commonNaN* zPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into a 32-bit floating-point | ||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast32_t softfloat_commonNaNToF32UI( const struct commonNaN *aPtr ); | ||||
| uint_fast32_t softfloat_commonNaNToF32UI(const struct commonNaN* aPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Interpreting 'uiA' and 'uiB' as the bit patterns of two 32-bit floating- | ||||
| @@ -149,20 +148,20 @@ uint_fast32_t softfloat_commonNaNToF32UI( const struct commonNaN *aPtr ); | ||||
| | the combined NaN result.  If either 'uiA' or 'uiB' has the pattern of a | ||||
| | signaling NaN, the invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast32_t | ||||
|  softfloat_propagateNaNF32UI( uint_fast32_t uiA, uint_fast32_t uiB ); | ||||
| uint_fast32_t softfloat_propagateNaNF32UI(uint_fast32_t uiA, uint_fast32_t uiB); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The bit pattern for a default generated 64-bit floating-point NaN. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define defaultNaNF64UI UINT64_C( 0x7FF8000000000000 ) | ||||
| #define defaultNaNF64UI UINT64_C(0x7FF8000000000000) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Returns true when 64-bit unsigned integer 'uiA' has the bit pattern of a | ||||
| | 64-bit floating-point signaling NaN. | ||||
| | Note:  This macro evaluates its argument more than once. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_isSigNaNF64UI( uiA ) ((((uiA) & UINT64_C( 0x7FF8000000000000 )) == UINT64_C( 0x7FF0000000000000 )) && ((uiA) & UINT64_C( 0x0007FFFFFFFFFFFF ))) | ||||
| #define softfloat_isSigNaNF64UI(uiA)                                                                                                       \ | ||||
|     ((((uiA)&UINT64_C(0x7FF8000000000000)) == UINT64_C(0x7FF0000000000000)) && ((uiA)&UINT64_C(0x0007FFFFFFFFFFFF))) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming 'uiA' has the bit pattern of a 64-bit floating-point NaN, converts | ||||
| @@ -170,13 +169,13 @@ uint_fast32_t | ||||
| | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void softfloat_f64UIToCommonNaN( uint_fast64_t uiA, struct commonNaN *zPtr ); | ||||
| void softfloat_f64UIToCommonNaN(uint_fast64_t uiA, struct commonNaN* zPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into a 64-bit floating-point | ||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast64_t softfloat_commonNaNToF64UI( const struct commonNaN *aPtr ); | ||||
| uint_fast64_t softfloat_commonNaNToF64UI(const struct commonNaN* aPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Interpreting 'uiA' and 'uiB' as the bit patterns of two 64-bit floating- | ||||
| @@ -184,14 +183,13 @@ uint_fast64_t softfloat_commonNaNToF64UI( const struct commonNaN *aPtr ); | ||||
| | the combined NaN result.  If either 'uiA' or 'uiB' has the pattern of a | ||||
| | signaling NaN, the invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast64_t | ||||
|  softfloat_propagateNaNF64UI( uint_fast64_t uiA, uint_fast64_t uiB ); | ||||
| uint_fast64_t softfloat_propagateNaNF64UI(uint_fast64_t uiA, uint_fast64_t uiB); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The bit pattern for a default generated 80-bit extended floating-point NaN. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define defaultNaNExtF80UI64 0x7FFF | ||||
| #define defaultNaNExtF80UI0  UINT64_C( 0xC000000000000000 ) | ||||
| #define defaultNaNExtF80UI0 UINT64_C(0xC000000000000000) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Returns true when the 80-bit unsigned integer formed from concatenating | ||||
| @@ -199,7 +197,8 @@ uint_fast64_t | ||||
| | floating-point signaling NaN. | ||||
| | Note:  This macro evaluates its arguments more than once. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_isSigNaNExtF80UI( uiA64, uiA0 ) ((((uiA64) & 0x7FFF) == 0x7FFF) && ! ((uiA0) & UINT64_C( 0x4000000000000000 )) && ((uiA0) & UINT64_C( 0x3FFFFFFFFFFFFFFF ))) | ||||
| #define softfloat_isSigNaNExtF80UI(uiA64, uiA0)                                                                                            \ | ||||
|     ((((uiA64)&0x7FFF) == 0x7FFF) && !((uiA0)&UINT64_C(0x4000000000000000)) && ((uiA0)&UINT64_C(0x3FFFFFFFFFFFFFFF))) | ||||
|  | ||||
| #ifdef SOFTFLOAT_FAST_INT64 | ||||
|  | ||||
| @@ -215,16 +214,14 @@ uint_fast64_t | ||||
| | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_extF80UIToCommonNaN( | ||||
|      uint_fast16_t uiA64, uint_fast64_t uiA0, struct commonNaN *zPtr ); | ||||
| void softfloat_extF80UIToCommonNaN(uint_fast16_t uiA64, uint_fast64_t uiA0, struct commonNaN* zPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into an 80-bit extended | ||||
| | floating-point NaN, and returns the bit pattern of this value as an unsigned | ||||
| | integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| struct uint128 softfloat_commonNaNToExtF80UI( const struct commonNaN *aPtr ); | ||||
| struct uint128 softfloat_commonNaNToExtF80UI(const struct commonNaN* aPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Interpreting the unsigned integer formed from concatenating 'uiA64' and | ||||
| @@ -235,19 +232,13 @@ struct uint128 softfloat_commonNaNToExtF80UI( const struct commonNaN *aPtr ); | ||||
| | result.  If either original floating-point value is a signaling NaN, the | ||||
| | invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| struct uint128 | ||||
|  softfloat_propagateNaNExtF80UI( | ||||
|      uint_fast16_t uiA64, | ||||
|      uint_fast64_t uiA0, | ||||
|      uint_fast16_t uiB64, | ||||
|      uint_fast64_t uiB0 | ||||
|  ); | ||||
| struct uint128 softfloat_propagateNaNExtF80UI(uint_fast16_t uiA64, uint_fast64_t uiA0, uint_fast16_t uiB64, uint_fast64_t uiB0); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The bit pattern for a default generated 128-bit floating-point NaN. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define defaultNaNF128UI64 UINT64_C( 0x7FFF800000000000 ) | ||||
| #define defaultNaNF128UI0  UINT64_C( 0 ) | ||||
| #define defaultNaNF128UI64 UINT64_C(0x7FFF800000000000) | ||||
| #define defaultNaNF128UI0 UINT64_C(0) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Returns true when the 128-bit unsigned integer formed from concatenating | ||||
| @@ -255,7 +246,8 @@ struct uint128 | ||||
| | point signaling NaN. | ||||
| | Note:  This macro evaluates its arguments more than once. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_isSigNaNF128UI( uiA64, uiA0 ) ((((uiA64) & UINT64_C( 0x7FFF800000000000 )) == UINT64_C( 0x7FFF000000000000 )) && ((uiA0) || ((uiA64) & UINT64_C( 0x00007FFFFFFFFFFF )))) | ||||
| #define softfloat_isSigNaNF128UI(uiA64, uiA0)                                                                                              \ | ||||
|     ((((uiA64)&UINT64_C(0x7FFF800000000000)) == UINT64_C(0x7FFF000000000000)) && ((uiA0) || ((uiA64)&UINT64_C(0x00007FFFFFFFFFFF)))) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming the unsigned integer formed from concatenating 'uiA64' and 'uiA0' | ||||
| @@ -264,15 +256,13 @@ struct uint128 | ||||
| | pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid exception | ||||
| | is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_f128UIToCommonNaN( | ||||
|      uint_fast64_t uiA64, uint_fast64_t uiA0, struct commonNaN *zPtr ); | ||||
| void softfloat_f128UIToCommonNaN(uint_fast64_t uiA64, uint_fast64_t uiA0, struct commonNaN* zPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into a 128-bit floating-point | ||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| struct uint128 softfloat_commonNaNToF128UI( const struct commonNaN * ); | ||||
| struct uint128 softfloat_commonNaNToF128UI(const struct commonNaN*); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Interpreting the unsigned integer formed from concatenating 'uiA64' and | ||||
| @@ -283,13 +273,7 @@ struct uint128 softfloat_commonNaNToF128UI( const struct commonNaN * ); | ||||
| | If either original floating-point value is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| struct uint128 | ||||
|  softfloat_propagateNaNF128UI( | ||||
|      uint_fast64_t uiA64, | ||||
|      uint_fast64_t uiA0, | ||||
|      uint_fast64_t uiB64, | ||||
|      uint_fast64_t uiB0 | ||||
|  ); | ||||
| struct uint128 softfloat_propagateNaNF128UI(uint_fast64_t uiA64, uint_fast64_t uiA0, uint_fast64_t uiB64, uint_fast64_t uiB0); | ||||
|  | ||||
| #else | ||||
|  | ||||
| @@ -304,18 +288,14 @@ struct uint128 | ||||
| | common NaN at the location pointed to by 'zPtr'.  If the NaN is a signaling | ||||
| | NaN, the invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_extF80MToCommonNaN( | ||||
|      const struct extFloat80M *aSPtr, struct commonNaN *zPtr ); | ||||
| void softfloat_extF80MToCommonNaN(const struct extFloat80M* aSPtr, struct commonNaN* zPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into an 80-bit extended | ||||
| | floating-point NaN, and stores this NaN at the location pointed to by | ||||
| | 'zSPtr'. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_commonNaNToExtF80M( | ||||
|      const struct commonNaN *aPtr, struct extFloat80M *zSPtr ); | ||||
| void softfloat_commonNaNToExtF80M(const struct commonNaN* aPtr, struct extFloat80M* zSPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming at least one of the two 80-bit extended floating-point values | ||||
| @@ -323,12 +303,7 @@ void | ||||
| | at the location pointed to by 'zSPtr'.  If either original floating-point | ||||
| | value is a signaling NaN, the invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_propagateNaNExtF80M( | ||||
|      const struct extFloat80M *aSPtr, | ||||
|      const struct extFloat80M *bSPtr, | ||||
|      struct extFloat80M *zSPtr | ||||
|  ); | ||||
| void softfloat_propagateNaNExtF80M(const struct extFloat80M* aSPtr, const struct extFloat80M* bSPtr, struct extFloat80M* zSPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The bit pattern for a default generated 128-bit floating-point NaN. | ||||
| @@ -336,7 +311,7 @@ void | ||||
| #define defaultNaNF128UI96 0x7FFF8000 | ||||
| #define defaultNaNF128UI64 0 | ||||
| #define defaultNaNF128UI32 0 | ||||
| #define defaultNaNF128UI0  0 | ||||
| #define defaultNaNF128UI0 0 | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming the 128-bit floating-point value pointed to by 'aWPtr' is a NaN, | ||||
| @@ -346,8 +321,7 @@ void | ||||
| | four 32-bit elements that concatenate in the platform's normal endian order | ||||
| | to form a 128-bit floating-point value. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_f128MToCommonNaN( const uint32_t *aWPtr, struct commonNaN *zPtr ); | ||||
| void softfloat_f128MToCommonNaN(const uint32_t* aWPtr, struct commonNaN* zPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into a 128-bit floating-point | ||||
| @@ -355,8 +329,7 @@ void | ||||
| | 'zWPtr' points to an array of four 32-bit elements that concatenate in the | ||||
| | platform's normal endian order to form a 128-bit floating-point value. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_commonNaNToF128M( const struct commonNaN *aPtr, uint32_t *zWPtr ); | ||||
| void softfloat_commonNaNToF128M(const struct commonNaN* aPtr, uint32_t* zWPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming at least one of the two 128-bit floating-point values pointed to by | ||||
| @@ -366,11 +339,8 @@ void | ||||
| | and 'zWPtr' points to an array of four 32-bit elements that concatenate in | ||||
| | the platform's normal endian order to form a 128-bit floating-point value. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_propagateNaNF128M( | ||||
|      const uint32_t *aWPtr, const uint32_t *bWPtr, uint32_t *zWPtr ); | ||||
| void softfloat_propagateNaNF128M(const uint32_t* aWPtr, const uint32_t* bWPtr, uint32_t* zWPtr); | ||||
|  | ||||
| #endif | ||||
|  | ||||
| #endif | ||||
|  | ||||
|   | ||||
							
								
								
									
										5
									
								
								softfloat/source/RISCV/s_bf16UIToCommonNaN.c
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										5
									
								
								softfloat/source/RISCV/s_bf16UIToCommonNaN.c
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,5 @@ | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | This file intentionally contains no code. | ||||
| *----------------------------------------------------------------------------*/ | ||||
|  | ||||
							
								
								
									
										5
									
								
								softfloat/source/RISCV/s_commonNaNToBF16UI.c
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										5
									
								
								softfloat/source/RISCV/s_commonNaNToBF16UI.c
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,5 @@ | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | This file intentionally contains no code. | ||||
| *----------------------------------------------------------------------------*/ | ||||
|  | ||||
| @@ -4,8 +4,8 @@ | ||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| Package, Release 3e, by John R. Hauser. | ||||
|  | ||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | ||||
| All rights reserved. | ||||
| Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of | ||||
| California.  All rights reserved. | ||||
|  | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| modification, are permitted provided that the following conditions are met: | ||||
| @@ -34,9 +34,10 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| =============================================================================*/ | ||||
|  | ||||
| #include <stdint.h> | ||||
| #include "platform.h" | ||||
| #include "internals.h" | ||||
| #include "softfloat_types.h" | ||||
|  | ||||
| #define softfloat_commonNaNToExtF80M softfloat_commonNaNToExtF80M | ||||
| #include "specialize.h" | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| @@ -49,8 +50,8 @@ void | ||||
|      const struct commonNaN *aPtr, struct extFloat80M *zSPtr ) | ||||
| { | ||||
|  | ||||
|     zSPtr->signExp = packToExtF80UI64( aPtr->sign, 0x7FFF ); | ||||
|     zSPtr->signif = UINT64_C( 0xC000000000000000 ) | aPtr->v64>>1; | ||||
|     zSPtr->signExp = defaultNaNExtF80UI64; | ||||
|     zSPtr->signif  = defaultNaNExtF80UI0; | ||||
|  | ||||
| } | ||||
|  | ||||
|   | ||||
| @@ -4,8 +4,8 @@ | ||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| Package, Release 3e, by John R. Hauser. | ||||
|  | ||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | ||||
| All rights reserved. | ||||
| Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of | ||||
| California.  All rights reserved. | ||||
|  | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| modification, are permitted provided that the following conditions are met: | ||||
| @@ -34,9 +34,10 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| =============================================================================*/ | ||||
|  | ||||
| #include <stdint.h> | ||||
| #include "platform.h" | ||||
| #include "primitives.h" | ||||
| #include "primitiveTypes.h" | ||||
|  | ||||
| #define softfloat_commonNaNToExtF80UI softfloat_commonNaNToExtF80UI | ||||
| #include "specialize.h" | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| @@ -48,8 +49,8 @@ struct uint128 softfloat_commonNaNToExtF80UI( const struct commonNaN *aPtr ) | ||||
| { | ||||
|     struct uint128 uiZ; | ||||
|  | ||||
|     uiZ.v64 = (uint_fast16_t) aPtr->sign<<15 | 0x7FFF; | ||||
|     uiZ.v0 = UINT64_C( 0xC000000000000000 ) | aPtr->v64>>1; | ||||
|     uiZ.v64 = defaultNaNExtF80UI64; | ||||
|     uiZ.v0  = defaultNaNExtF80UI0; | ||||
|     return uiZ; | ||||
|  | ||||
| } | ||||
|   | ||||
| @@ -4,8 +4,8 @@ | ||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| Package, Release 3e, by John R. Hauser. | ||||
|  | ||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | ||||
| All rights reserved. | ||||
| Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of | ||||
| California.  All rights reserved. | ||||
|  | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| modification, are permitted provided that the following conditions are met: | ||||
| @@ -36,7 +36,9 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| #include <stdint.h> | ||||
| #include "platform.h" | ||||
| #include "primitives.h" | ||||
| #include "primitiveTypes.h" | ||||
|  | ||||
| #define softfloat_commonNaNToF128M softfloat_commonNaNToF128M | ||||
| #include "specialize.h" | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| @@ -49,8 +51,10 @@ void | ||||
|  softfloat_commonNaNToF128M( const struct commonNaN *aPtr, uint32_t *zWPtr ) | ||||
| { | ||||
|  | ||||
|     softfloat_shortShiftRight128M( (const uint32_t *) &aPtr->v0, 16, zWPtr ); | ||||
|     zWPtr[indexWordHi( 4 )] |= (uint32_t) aPtr->sign<<31 | 0x7FFF8000; | ||||
|     zWPtr[indexWord( 4, 3 )] = defaultNaNF128UI96; | ||||
|     zWPtr[indexWord( 4, 2 )] = defaultNaNF128UI64; | ||||
|     zWPtr[indexWord( 4, 1 )] = defaultNaNF128UI32; | ||||
|     zWPtr[indexWord( 4, 0 )] = defaultNaNF128UI0; | ||||
|  | ||||
| } | ||||
|  | ||||
|   | ||||
| @@ -4,8 +4,8 @@ | ||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| Package, Release 3e, by John R. Hauser. | ||||
|  | ||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | ||||
| All rights reserved. | ||||
| Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of | ||||
| California.  All rights reserved. | ||||
|  | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| modification, are permitted provided that the following conditions are met: | ||||
| @@ -34,9 +34,10 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| =============================================================================*/ | ||||
|  | ||||
| #include <stdint.h> | ||||
| #include "platform.h" | ||||
| #include "primitives.h" | ||||
| #include "primitiveTypes.h" | ||||
|  | ||||
| #define softfloat_commonNaNToF128UI softfloat_commonNaNToF128UI | ||||
| #include "specialize.h" | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| @@ -47,8 +48,8 @@ struct uint128 softfloat_commonNaNToF128UI( const struct commonNaN *aPtr ) | ||||
| { | ||||
|     struct uint128 uiZ; | ||||
|  | ||||
|     uiZ = softfloat_shortShiftRight128( aPtr->v64, aPtr->v0, 16 ); | ||||
|     uiZ.v64 |= (uint_fast64_t) aPtr->sign<<63 | UINT64_C( 0x7FFF800000000000 ); | ||||
|     uiZ.v64 = defaultNaNF128UI64; | ||||
|     uiZ.v0  = defaultNaNF128UI0; | ||||
|     return uiZ; | ||||
|  | ||||
| } | ||||
|   | ||||
| @@ -1,51 +1,5 @@ | ||||
|  | ||||
| /*============================================================================ | ||||
|  | ||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| Package, Release 3e, by John R. Hauser. | ||||
|  | ||||
| Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of | ||||
| California.  All rights reserved. | ||||
|  | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| modification, are permitted provided that the following conditions are met: | ||||
|  | ||||
|  1. Redistributions of source code must retain the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer. | ||||
|  | ||||
|  2. Redistributions in binary form must reproduce the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer in the documentation | ||||
|     and/or other materials provided with the distribution. | ||||
|  | ||||
|  3. Neither the name of the University nor the names of its contributors may | ||||
|     be used to endorse or promote products derived from this software without | ||||
|     specific prior written permission. | ||||
|  | ||||
| THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY | ||||
| EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | ||||
| WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE | ||||
| DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY | ||||
| DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | ||||
| (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | ||||
| LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND | ||||
| ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | ||||
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| =============================================================================*/ | ||||
|  | ||||
| #include <stdint.h> | ||||
| #include "platform.h" | ||||
| #include "specialize.h" | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by `aPtr' into a 16-bit floating-point | ||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||
| | This file intentionally contains no code. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast16_t softfloat_commonNaNToF16UI( const struct commonNaN *aPtr ) | ||||
| { | ||||
|  | ||||
|     return (uint_fast16_t) aPtr->sign<<15 | 0x7E00 | aPtr->v64>>54; | ||||
|  | ||||
| } | ||||
|  | ||||
|   | ||||
| @@ -1,51 +1,5 @@ | ||||
|  | ||||
| /*============================================================================ | ||||
|  | ||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| Package, Release 3e, by John R. Hauser. | ||||
|  | ||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | ||||
| All rights reserved. | ||||
|  | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| modification, are permitted provided that the following conditions are met: | ||||
|  | ||||
|  1. Redistributions of source code must retain the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer. | ||||
|  | ||||
|  2. Redistributions in binary form must reproduce the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer in the documentation | ||||
|     and/or other materials provided with the distribution. | ||||
|  | ||||
|  3. Neither the name of the University nor the names of its contributors may | ||||
|     be used to endorse or promote products derived from this software without | ||||
|     specific prior written permission. | ||||
|  | ||||
| THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY | ||||
| EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | ||||
| WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE | ||||
| DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY | ||||
| DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | ||||
| (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | ||||
| LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND | ||||
| ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | ||||
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| =============================================================================*/ | ||||
|  | ||||
| #include <stdint.h> | ||||
| #include "platform.h" | ||||
| #include "specialize.h" | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by `aPtr' into a 32-bit floating-point | ||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||
| | This file intentionally contains no code. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast32_t softfloat_commonNaNToF32UI( const struct commonNaN *aPtr ) | ||||
| { | ||||
|  | ||||
|     return (uint_fast32_t) aPtr->sign<<31 | 0x7FC00000 | aPtr->v64>>41; | ||||
|  | ||||
| } | ||||
|  | ||||
|   | ||||
| @@ -1,53 +1,5 @@ | ||||
|  | ||||
| /*============================================================================ | ||||
|  | ||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| Package, Release 3e, by John R. Hauser. | ||||
|  | ||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | ||||
| All rights reserved. | ||||
|  | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| modification, are permitted provided that the following conditions are met: | ||||
|  | ||||
|  1. Redistributions of source code must retain the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer. | ||||
|  | ||||
|  2. Redistributions in binary form must reproduce the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer in the documentation | ||||
|     and/or other materials provided with the distribution. | ||||
|  | ||||
|  3. Neither the name of the University nor the names of its contributors may | ||||
|     be used to endorse or promote products derived from this software without | ||||
|     specific prior written permission. | ||||
|  | ||||
| THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY | ||||
| EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | ||||
| WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE | ||||
| DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY | ||||
| DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | ||||
| (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | ||||
| LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND | ||||
| ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | ||||
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| =============================================================================*/ | ||||
|  | ||||
| #include <stdint.h> | ||||
| #include "platform.h" | ||||
| #include "specialize.h" | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by `aPtr' into a 64-bit floating-point | ||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||
| | This file intentionally contains no code. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast64_t softfloat_commonNaNToF64UI( const struct commonNaN *aPtr ) | ||||
| { | ||||
|  | ||||
|     return | ||||
|         (uint_fast64_t) aPtr->sign<<63 | UINT64_C( 0x7FF8000000000000 ) | ||||
|             | aPtr->v64>>12; | ||||
|  | ||||
| } | ||||
|  | ||||
|   | ||||
| @@ -1,62 +1,5 @@ | ||||
|  | ||||
| /*============================================================================ | ||||
|  | ||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| Package, Release 3e, by John R. Hauser. | ||||
|  | ||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | ||||
| All rights reserved. | ||||
|  | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| modification, are permitted provided that the following conditions are met: | ||||
|  | ||||
|  1. Redistributions of source code must retain the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer. | ||||
|  | ||||
|  2. Redistributions in binary form must reproduce the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer in the documentation | ||||
|     and/or other materials provided with the distribution. | ||||
|  | ||||
|  3. Neither the name of the University nor the names of its contributors may | ||||
|     be used to endorse or promote products derived from this software without | ||||
|     specific prior written permission. | ||||
|  | ||||
| THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY | ||||
| EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | ||||
| WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE | ||||
| DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY | ||||
| DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | ||||
| (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | ||||
| LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND | ||||
| ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | ||||
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| =============================================================================*/ | ||||
|  | ||||
| #include <stdint.h> | ||||
| #include "platform.h" | ||||
| #include "internals.h" | ||||
| #include "specialize.h" | ||||
| #include "softfloat.h" | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming the 80-bit extended floating-point value pointed to by `aSPtr' is | ||||
| | a NaN, converts this NaN to the common NaN form, and stores the resulting | ||||
| | common NaN at the location pointed to by `zPtr'.  If the NaN is a signaling | ||||
| | NaN, the invalid exception is raised. | ||||
| | This file intentionally contains no code. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_extF80MToCommonNaN( | ||||
|      const struct extFloat80M *aSPtr, struct commonNaN *zPtr ) | ||||
| { | ||||
|  | ||||
|     if ( extF80M_isSignalingNaN( (const extFloat80_t *) aSPtr ) ) { | ||||
|         softfloat_raiseFlags( softfloat_flag_invalid ); | ||||
|     } | ||||
|     zPtr->sign = signExtF80UI64( aSPtr->signExp ); | ||||
|     zPtr->v64 = aSPtr->signif<<1; | ||||
|     zPtr->v0  = 0; | ||||
|  | ||||
| } | ||||
|  | ||||
|   | ||||
| @@ -1,62 +1,5 @@ | ||||
|  | ||||
| /*============================================================================ | ||||
|  | ||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| Package, Release 3e, by John R. Hauser. | ||||
|  | ||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | ||||
| All rights reserved. | ||||
|  | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| modification, are permitted provided that the following conditions are met: | ||||
|  | ||||
|  1. Redistributions of source code must retain the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer. | ||||
|  | ||||
|  2. Redistributions in binary form must reproduce the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer in the documentation | ||||
|     and/or other materials provided with the distribution. | ||||
|  | ||||
|  3. Neither the name of the University nor the names of its contributors may | ||||
|     be used to endorse or promote products derived from this software without | ||||
|     specific prior written permission. | ||||
|  | ||||
| THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY | ||||
| EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | ||||
| WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE | ||||
| DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY | ||||
| DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | ||||
| (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | ||||
| LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND | ||||
| ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | ||||
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| =============================================================================*/ | ||||
|  | ||||
| #include <stdint.h> | ||||
| #include "platform.h" | ||||
| #include "specialize.h" | ||||
| #include "softfloat.h" | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming the unsigned integer formed from concatenating `uiA64' and `uiA0' | ||||
| | has the bit pattern of an 80-bit extended floating-point NaN, converts | ||||
| | this NaN to the common NaN form, and stores the resulting common NaN at the | ||||
| | location pointed to by `zPtr'.  If the NaN is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| | This file intentionally contains no code. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_extF80UIToCommonNaN( | ||||
|      uint_fast16_t uiA64, uint_fast64_t uiA0, struct commonNaN *zPtr ) | ||||
| { | ||||
|  | ||||
|     if ( softfloat_isSigNaNExtF80UI( uiA64, uiA0 ) ) { | ||||
|         softfloat_raiseFlags( softfloat_flag_invalid ); | ||||
|     } | ||||
|     zPtr->sign = uiA64>>15; | ||||
|     zPtr->v64  = uiA0<<1; | ||||
|     zPtr->v0   = 0; | ||||
|  | ||||
| } | ||||
|  | ||||
|   | ||||
| @@ -1,62 +1,5 @@ | ||||
|  | ||||
| /*============================================================================ | ||||
|  | ||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| Package, Release 3e, by John R. Hauser. | ||||
|  | ||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | ||||
| All rights reserved. | ||||
|  | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| modification, are permitted provided that the following conditions are met: | ||||
|  | ||||
|  1. Redistributions of source code must retain the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer. | ||||
|  | ||||
|  2. Redistributions in binary form must reproduce the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer in the documentation | ||||
|     and/or other materials provided with the distribution. | ||||
|  | ||||
|  3. Neither the name of the University nor the names of its contributors may | ||||
|     be used to endorse or promote products derived from this software without | ||||
|     specific prior written permission. | ||||
|  | ||||
| THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY | ||||
| EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | ||||
| WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE | ||||
| DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY | ||||
| DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | ||||
| (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | ||||
| LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND | ||||
| ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | ||||
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| =============================================================================*/ | ||||
|  | ||||
| #include <stdint.h> | ||||
| #include "platform.h" | ||||
| #include "primitives.h" | ||||
| #include "specialize.h" | ||||
| #include "softfloat.h" | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming the 128-bit floating-point value pointed to by `aWPtr' is a NaN, | ||||
| | converts this NaN to the common NaN form, and stores the resulting common | ||||
| | NaN at the location pointed to by `zPtr'.  If the NaN is a signaling NaN, | ||||
| | the invalid exception is raised.  Argument `aWPtr' points to an array of | ||||
| | four 32-bit elements that concatenate in the platform's normal endian order | ||||
| | to form a 128-bit floating-point value. | ||||
| | This file intentionally contains no code. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_f128MToCommonNaN( const uint32_t *aWPtr, struct commonNaN *zPtr ) | ||||
| { | ||||
|  | ||||
|     if ( f128M_isSignalingNaN( (const float128_t *) aWPtr ) ) { | ||||
|         softfloat_raiseFlags( softfloat_flag_invalid ); | ||||
|     } | ||||
|     zPtr->sign = aWPtr[indexWordHi( 4 )]>>31; | ||||
|     softfloat_shortShiftLeft128M( aWPtr, 16, (uint32_t *) &zPtr->v0 ); | ||||
|  | ||||
| } | ||||
|  | ||||
|   | ||||
| @@ -1,65 +1,5 @@ | ||||
|  | ||||
| /*============================================================================ | ||||
|  | ||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| Package, Release 3e, by John R. Hauser. | ||||
|  | ||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | ||||
| All rights reserved. | ||||
|  | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| modification, are permitted provided that the following conditions are met: | ||||
|  | ||||
|  1. Redistributions of source code must retain the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer. | ||||
|  | ||||
|  2. Redistributions in binary form must reproduce the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer in the documentation | ||||
|     and/or other materials provided with the distribution. | ||||
|  | ||||
|  3. Neither the name of the University nor the names of its contributors may | ||||
|     be used to endorse or promote products derived from this software without | ||||
|     specific prior written permission. | ||||
|  | ||||
| THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY | ||||
| EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | ||||
| WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE | ||||
| DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY | ||||
| DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | ||||
| (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | ||||
| LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND | ||||
| ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | ||||
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| =============================================================================*/ | ||||
|  | ||||
| #include <stdint.h> | ||||
| #include "platform.h" | ||||
| #include "primitives.h" | ||||
| #include "specialize.h" | ||||
| #include "softfloat.h" | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming the unsigned integer formed from concatenating `uiA64' and `uiA0' | ||||
| | has the bit pattern of a 128-bit floating-point NaN, converts this NaN to | ||||
| | the common NaN form, and stores the resulting common NaN at the location | ||||
| | pointed to by `zPtr'.  If the NaN is a signaling NaN, the invalid exception | ||||
| | is raised. | ||||
| | This file intentionally contains no code. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_f128UIToCommonNaN( | ||||
|      uint_fast64_t uiA64, uint_fast64_t uiA0, struct commonNaN *zPtr ) | ||||
| { | ||||
|     struct uint128 NaNSig; | ||||
|  | ||||
|     if ( softfloat_isSigNaNF128UI( uiA64, uiA0 ) ) { | ||||
|         softfloat_raiseFlags( softfloat_flag_invalid ); | ||||
|     } | ||||
|     NaNSig = softfloat_shortShiftLeft128( uiA64, uiA0, 16 ); | ||||
|     zPtr->sign = uiA64>>63; | ||||
|     zPtr->v64  = NaNSig.v64; | ||||
|     zPtr->v0   = NaNSig.v0; | ||||
|  | ||||
| } | ||||
|  | ||||
|   | ||||
| @@ -1,59 +1,5 @@ | ||||
|  | ||||
| /*============================================================================ | ||||
|  | ||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| Package, Release 3e, by John R. Hauser. | ||||
|  | ||||
| Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of | ||||
| California.  All rights reserved. | ||||
|  | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| modification, are permitted provided that the following conditions are met: | ||||
|  | ||||
|  1. Redistributions of source code must retain the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer. | ||||
|  | ||||
|  2. Redistributions in binary form must reproduce the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer in the documentation | ||||
|     and/or other materials provided with the distribution. | ||||
|  | ||||
|  3. Neither the name of the University nor the names of its contributors may | ||||
|     be used to endorse or promote products derived from this software without | ||||
|     specific prior written permission. | ||||
|  | ||||
| THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY | ||||
| EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | ||||
| WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE | ||||
| DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY | ||||
| DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | ||||
| (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | ||||
| LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND | ||||
| ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | ||||
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| =============================================================================*/ | ||||
|  | ||||
| #include <stdint.h> | ||||
| #include "platform.h" | ||||
| #include "specialize.h" | ||||
| #include "softfloat.h" | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming `uiA' has the bit pattern of a 16-bit floating-point NaN, converts | ||||
| | this NaN to the common NaN form, and stores the resulting common NaN at the | ||||
| | location pointed to by `zPtr'.  If the NaN is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| | This file intentionally contains no code. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void softfloat_f16UIToCommonNaN( uint_fast16_t uiA, struct commonNaN *zPtr ) | ||||
| { | ||||
|  | ||||
|     if ( softfloat_isSigNaNF16UI( uiA ) ) { | ||||
|         softfloat_raiseFlags( softfloat_flag_invalid ); | ||||
|     } | ||||
|     zPtr->sign = uiA>>15; | ||||
|     zPtr->v64  = (uint_fast64_t) uiA<<54; | ||||
|     zPtr->v0   = 0; | ||||
|  | ||||
| } | ||||
|  | ||||
|   | ||||
| @@ -1,59 +1,5 @@ | ||||
|  | ||||
| /*============================================================================ | ||||
|  | ||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| Package, Release 3e, by John R. Hauser. | ||||
|  | ||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | ||||
| All rights reserved. | ||||
|  | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| modification, are permitted provided that the following conditions are met: | ||||
|  | ||||
|  1. Redistributions of source code must retain the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer. | ||||
|  | ||||
|  2. Redistributions in binary form must reproduce the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer in the documentation | ||||
|     and/or other materials provided with the distribution. | ||||
|  | ||||
|  3. Neither the name of the University nor the names of its contributors may | ||||
|     be used to endorse or promote products derived from this software without | ||||
|     specific prior written permission. | ||||
|  | ||||
| THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY | ||||
| EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | ||||
| WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE | ||||
| DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY | ||||
| DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | ||||
| (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | ||||
| LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND | ||||
| ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | ||||
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| =============================================================================*/ | ||||
|  | ||||
| #include <stdint.h> | ||||
| #include "platform.h" | ||||
| #include "specialize.h" | ||||
| #include "softfloat.h" | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming `uiA' has the bit pattern of a 32-bit floating-point NaN, converts | ||||
| | this NaN to the common NaN form, and stores the resulting common NaN at the | ||||
| | location pointed to by `zPtr'.  If the NaN is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| | This file intentionally contains no code. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void softfloat_f32UIToCommonNaN( uint_fast32_t uiA, struct commonNaN *zPtr ) | ||||
| { | ||||
|  | ||||
|     if ( softfloat_isSigNaNF32UI( uiA ) ) { | ||||
|         softfloat_raiseFlags( softfloat_flag_invalid ); | ||||
|     } | ||||
|     zPtr->sign = uiA>>31; | ||||
|     zPtr->v64  = (uint_fast64_t) uiA<<41; | ||||
|     zPtr->v0   = 0; | ||||
|  | ||||
| } | ||||
|  | ||||
|   | ||||
| @@ -1,59 +1,5 @@ | ||||
|  | ||||
| /*============================================================================ | ||||
|  | ||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| Package, Release 3e, by John R. Hauser. | ||||
|  | ||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | ||||
| All rights reserved. | ||||
|  | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| modification, are permitted provided that the following conditions are met: | ||||
|  | ||||
|  1. Redistributions of source code must retain the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer. | ||||
|  | ||||
|  2. Redistributions in binary form must reproduce the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer in the documentation | ||||
|     and/or other materials provided with the distribution. | ||||
|  | ||||
|  3. Neither the name of the University nor the names of its contributors may | ||||
|     be used to endorse or promote products derived from this software without | ||||
|     specific prior written permission. | ||||
|  | ||||
| THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY | ||||
| EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | ||||
| WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE | ||||
| DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY | ||||
| DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | ||||
| (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | ||||
| LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND | ||||
| ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | ||||
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| =============================================================================*/ | ||||
|  | ||||
| #include <stdint.h> | ||||
| #include "platform.h" | ||||
| #include "specialize.h" | ||||
| #include "softfloat.h" | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming `uiA' has the bit pattern of a 64-bit floating-point NaN, converts | ||||
| | this NaN to the common NaN form, and stores the resulting common NaN at the | ||||
| | location pointed to by `zPtr'.  If the NaN is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| | This file intentionally contains no code. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void softfloat_f64UIToCommonNaN( uint_fast64_t uiA, struct commonNaN *zPtr ) | ||||
| { | ||||
|  | ||||
|     if ( softfloat_isSigNaNF64UI( uiA ) ) { | ||||
|         softfloat_raiseFlags( softfloat_flag_invalid ); | ||||
|     } | ||||
|     zPtr->sign = uiA>>63; | ||||
|     zPtr->v64  = uiA<<12; | ||||
|     zPtr->v0   = 0; | ||||
|  | ||||
| } | ||||
|  | ||||
|   | ||||
| @@ -4,8 +4,8 @@ | ||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| Package, Release 3e, by John R. Hauser. | ||||
|  | ||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | ||||
| All rights reserved. | ||||
| Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of | ||||
| California.  All rights reserved. | ||||
|  | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| modification, are permitted provided that the following conditions are met: | ||||
| @@ -34,10 +34,9 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| =============================================================================*/ | ||||
|  | ||||
| #include <stdbool.h> | ||||
| #include <stdint.h> | ||||
| #include "platform.h" | ||||
| #include "internals.h" | ||||
| #include "primitiveTypes.h" | ||||
| #include "specialize.h" | ||||
| #include "softfloat.h" | ||||
|  | ||||
| @@ -54,54 +53,22 @@ void | ||||
|      struct extFloat80M *zSPtr | ||||
|  ) | ||||
| { | ||||
|     bool isSigNaNA; | ||||
|     const struct extFloat80M *sPtr; | ||||
|     bool isSigNaNB; | ||||
|     uint_fast16_t uiB64; | ||||
|     uint64_t uiB0; | ||||
|     uint_fast16_t uiA64; | ||||
|     uint64_t uiA0; | ||||
|     uint_fast16_t uiMagA64, uiMagB64; | ||||
|     uint_fast16_t ui64; | ||||
|     uint_fast64_t ui0; | ||||
|  | ||||
|     isSigNaNA = extF80M_isSignalingNaN( (const extFloat80_t *) aSPtr ); | ||||
|     sPtr = aSPtr; | ||||
|     if ( ! bSPtr ) { | ||||
|         if ( isSigNaNA ) softfloat_raiseFlags( softfloat_flag_invalid ); | ||||
|         goto copy; | ||||
|     } | ||||
|     isSigNaNB = extF80M_isSignalingNaN( (const extFloat80_t *) bSPtr ); | ||||
|     if ( isSigNaNA | isSigNaNB ) { | ||||
|     ui64 = aSPtr->signExp; | ||||
|     ui0  = aSPtr->signif; | ||||
|     if ( | ||||
|         softfloat_isSigNaNExtF80UI( ui64, ui0 ) | ||||
|             || (bSPtr | ||||
|                     && (ui64 = bSPtr->signExp, | ||||
|                         ui0  = bSPtr->signif, | ||||
|                         softfloat_isSigNaNExtF80UI( ui64, ui0 ))) | ||||
|     ) { | ||||
|         softfloat_raiseFlags( softfloat_flag_invalid ); | ||||
|         if ( isSigNaNA ) { | ||||
|             uiB64 = bSPtr->signExp; | ||||
|             if ( isSigNaNB ) goto returnLargerUIMag; | ||||
|             uiB0 = bSPtr->signif; | ||||
|             if ( isNaNExtF80UI( uiB64, uiB0 ) ) goto copyB; | ||||
|             goto copy; | ||||
|         } else { | ||||
|             uiA64 = aSPtr->signExp; | ||||
|             uiA0 = aSPtr->signif; | ||||
|             if ( isNaNExtF80UI( uiA64, uiA0 ) ) goto copy; | ||||
|             goto copyB; | ||||
|         } | ||||
|     } | ||||
|     uiB64 = bSPtr->signExp; | ||||
|  returnLargerUIMag: | ||||
|     uiA64 = aSPtr->signExp; | ||||
|     uiMagA64 = uiA64 & 0x7FFF; | ||||
|     uiMagB64 = uiB64 & 0x7FFF; | ||||
|     if ( uiMagA64 < uiMagB64 ) goto copyB; | ||||
|     if ( uiMagB64 < uiMagA64 ) goto copy; | ||||
|     uiA0 = aSPtr->signif; | ||||
|     uiB0 = bSPtr->signif; | ||||
|     if ( uiA0 < uiB0 ) goto copyB; | ||||
|     if ( uiB0 < uiA0 ) goto copy; | ||||
|     if ( uiA64 < uiB64 ) goto copy; | ||||
|  copyB: | ||||
|     sPtr = bSPtr; | ||||
|  copy: | ||||
|     zSPtr->signExp = sPtr->signExp; | ||||
|     zSPtr->signif = sPtr->signif | UINT64_C( 0xC000000000000000 ); | ||||
|     zSPtr->signExp = defaultNaNExtF80UI64; | ||||
|     zSPtr->signif  = defaultNaNExtF80UI0; | ||||
|  | ||||
| } | ||||
|  | ||||
|   | ||||
| @@ -4,7 +4,7 @@ | ||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| Package, Release 3e, by John R. Hauser. | ||||
|  | ||||
| Copyright 2011, 2012, 2013, 2014, 2018 The Regents of the University of | ||||
| Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of | ||||
| California.  All rights reserved. | ||||
|  | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| @@ -34,17 +34,16 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| =============================================================================*/ | ||||
|  | ||||
| #include <stdbool.h> | ||||
| #include <stdint.h> | ||||
| #include "platform.h" | ||||
| #include "internals.h" | ||||
| #include "primitiveTypes.h" | ||||
| #include "specialize.h" | ||||
| #include "softfloat.h" | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Interpreting the unsigned integer formed from concatenating 'uiA64' and | ||||
| | 'uiA0' as an 80-bit extended floating-point value, and likewise interpreting | ||||
| | the unsigned integer formed from concatenating 'uiB64' and 'uiB0' as another | ||||
| | Interpreting the unsigned integer formed from concatenating `uiA64' and | ||||
| | `uiA0' as an 80-bit extended floating-point value, and likewise interpreting | ||||
| | the unsigned integer formed from concatenating `uiB64' and `uiB0' as another | ||||
| | 80-bit extended floating-point value, and assuming at least on of these | ||||
| | floating-point values is a NaN, returns the bit pattern of the combined NaN | ||||
| | result.  If either original floating-point value is a signaling NaN, the | ||||
| @@ -58,48 +57,16 @@ struct uint128 | ||||
|      uint_fast64_t uiB0 | ||||
|  ) | ||||
| { | ||||
|     bool isSigNaNA, isSigNaNB; | ||||
|     uint_fast64_t uiNonsigA0, uiNonsigB0; | ||||
|     uint_fast16_t uiMagA64, uiMagB64; | ||||
|     struct uint128 uiZ; | ||||
|  | ||||
|     /*------------------------------------------------------------------------ | ||||
|     *------------------------------------------------------------------------*/ | ||||
|     isSigNaNA = softfloat_isSigNaNExtF80UI( uiA64, uiA0 ); | ||||
|     isSigNaNB = softfloat_isSigNaNExtF80UI( uiB64, uiB0 ); | ||||
|     /*------------------------------------------------------------------------ | ||||
|     | Make NaNs non-signaling. | ||||
|     *------------------------------------------------------------------------*/ | ||||
|     uiNonsigA0 = uiA0 | UINT64_C( 0xC000000000000000 ); | ||||
|     uiNonsigB0 = uiB0 | UINT64_C( 0xC000000000000000 ); | ||||
|     /*------------------------------------------------------------------------ | ||||
|     *------------------------------------------------------------------------*/ | ||||
|     if ( isSigNaNA | isSigNaNB ) { | ||||
|     if ( | ||||
|            softfloat_isSigNaNExtF80UI( uiA64, uiA0 ) | ||||
|         || softfloat_isSigNaNExtF80UI( uiB64, uiB0 ) | ||||
|     ) { | ||||
|         softfloat_raiseFlags( softfloat_flag_invalid ); | ||||
|         if ( isSigNaNA ) { | ||||
|             if ( isSigNaNB ) goto returnLargerMag; | ||||
|             if ( isNaNExtF80UI( uiB64, uiB0 ) ) goto returnB; | ||||
|             goto returnA; | ||||
|         } else { | ||||
|             if ( isNaNExtF80UI( uiA64, uiA0 ) ) goto returnA; | ||||
|             goto returnB; | ||||
|         } | ||||
|     } | ||||
|  returnLargerMag: | ||||
|     uiMagA64 = uiA64 & 0x7FFF; | ||||
|     uiMagB64 = uiB64 & 0x7FFF; | ||||
|     if ( uiMagA64 < uiMagB64 ) goto returnB; | ||||
|     if ( uiMagB64 < uiMagA64 ) goto returnA; | ||||
|     if ( uiA0 < uiB0 ) goto returnB; | ||||
|     if ( uiB0 < uiA0 ) goto returnA; | ||||
|     if ( uiA64 < uiB64 ) goto returnA; | ||||
|  returnB: | ||||
|     uiZ.v64 = uiB64; | ||||
|     uiZ.v0  = uiNonsigB0; | ||||
|     return uiZ; | ||||
|  returnA: | ||||
|     uiZ.v64 = uiA64; | ||||
|     uiZ.v0  = uiNonsigA0; | ||||
|     uiZ.v64 = defaultNaNExtF80UI64; | ||||
|     uiZ.v0  = defaultNaNExtF80UI0; | ||||
|     return uiZ; | ||||
|  | ||||
| } | ||||
|   | ||||
| @@ -4,8 +4,8 @@ | ||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| Package, Release 3e, by John R. Hauser. | ||||
|  | ||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | ||||
| All rights reserved. | ||||
| Copyright 2011, 2012, 2013, 2014, 2015, 2018 The Regents of the University of | ||||
| California.  All rights reserved. | ||||
|  | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| modification, are permitted provided that the following conditions are met: | ||||
| @@ -34,43 +34,35 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| =============================================================================*/ | ||||
|  | ||||
| #include <stdbool.h> | ||||
| #include <stdint.h> | ||||
| #include "platform.h" | ||||
| #include "internals.h" | ||||
| #include "primitiveTypes.h" | ||||
| #include "specialize.h" | ||||
| #include "softfloat.h" | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming at least one of the two 128-bit floating-point values pointed to by | ||||
| | `aWPtr' and `bWPtr' is a NaN, stores the combined NaN result at the location | ||||
| | pointed to by `zWPtr'.  If either original floating-point value is a | ||||
| | signaling NaN, the invalid exception is raised.  Each of `aWPtr', `bWPtr', | ||||
| | and `zWPtr' points to an array of four 32-bit elements that concatenate in | ||||
| | 'aWPtr' and 'bWPtr' is a NaN, stores the combined NaN result at the location | ||||
| | pointed to by 'zWPtr'.  If either original floating-point value is a | ||||
| | signaling NaN, the invalid exception is raised.  Each of 'aWPtr', 'bWPtr', | ||||
| | and 'zWPtr' points to an array of four 32-bit elements that concatenate in | ||||
| | the platform's normal endian order to form a 128-bit floating-point value. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_propagateNaNF128M( | ||||
|      const uint32_t *aWPtr, const uint32_t *bWPtr, uint32_t *zWPtr ) | ||||
| { | ||||
|     bool isSigNaNA; | ||||
|     const uint32_t *ptr; | ||||
|  | ||||
|     ptr = aWPtr; | ||||
|     isSigNaNA = f128M_isSignalingNaN( (const float128_t *) aWPtr ); | ||||
|     if ( | ||||
|         isSigNaNA | ||||
|         f128M_isSignalingNaN( (const float128_t *) aWPtr ) | ||||
|             || (bWPtr && f128M_isSignalingNaN( (const float128_t *) bWPtr )) | ||||
|     ) { | ||||
|         softfloat_raiseFlags( softfloat_flag_invalid ); | ||||
|         if ( isSigNaNA ) goto copy; | ||||
|     } | ||||
|     if ( ! softfloat_isNaNF128M( aWPtr ) ) ptr = bWPtr; | ||||
|  copy: | ||||
|     zWPtr[indexWordHi( 4 )] = ptr[indexWordHi( 4 )] | 0x00008000; | ||||
|     zWPtr[indexWord( 4, 2 )] = ptr[indexWord( 4, 2 )]; | ||||
|     zWPtr[indexWord( 4, 1 )] = ptr[indexWord( 4, 1 )]; | ||||
|     zWPtr[indexWord( 4, 0 )] = ptr[indexWord( 4, 0 )]; | ||||
|     zWPtr[indexWord( 4, 3 )] = defaultNaNF128UI96; | ||||
|     zWPtr[indexWord( 4, 2 )] = defaultNaNF128UI64; | ||||
|     zWPtr[indexWord( 4, 1 )] = defaultNaNF128UI32; | ||||
|     zWPtr[indexWord( 4, 0 )] = defaultNaNF128UI0; | ||||
|  | ||||
| } | ||||
|  | ||||
|   | ||||
| @@ -4,8 +4,8 @@ | ||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| Package, Release 3e, by John R. Hauser. | ||||
|  | ||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | ||||
| All rights reserved. | ||||
| Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of | ||||
| California.  All rights reserved. | ||||
|  | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| modification, are permitted provided that the following conditions are met: | ||||
| @@ -34,10 +34,9 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| =============================================================================*/ | ||||
|  | ||||
| #include <stdbool.h> | ||||
| #include <stdint.h> | ||||
| #include "platform.h" | ||||
| #include "internals.h" | ||||
| #include "primitiveTypes.h" | ||||
| #include "specialize.h" | ||||
| #include "softfloat.h" | ||||
|  | ||||
| @@ -58,23 +57,16 @@ struct uint128 | ||||
|      uint_fast64_t uiB0 | ||||
|  ) | ||||
| { | ||||
|     bool isSigNaNA; | ||||
|     struct uint128 uiZ; | ||||
|  | ||||
|     isSigNaNA = softfloat_isSigNaNF128UI( uiA64, uiA0 ); | ||||
|     if ( isSigNaNA || softfloat_isSigNaNF128UI( uiB64, uiB0 ) ) { | ||||
|     if ( | ||||
|            softfloat_isSigNaNF128UI( uiA64, uiA0 ) | ||||
|         || softfloat_isSigNaNF128UI( uiB64, uiB0 ) | ||||
|     ) { | ||||
|         softfloat_raiseFlags( softfloat_flag_invalid ); | ||||
|         if ( isSigNaNA ) goto returnNonsigA; | ||||
|     } | ||||
|     if ( isNaNF128UI( uiA64, uiA0 ) ) { | ||||
|  returnNonsigA: | ||||
|         uiZ.v64 = uiA64; | ||||
|         uiZ.v0  = uiA0; | ||||
|     } else { | ||||
|         uiZ.v64 = uiB64; | ||||
|         uiZ.v0  = uiB0; | ||||
|     } | ||||
|     uiZ.v64 |= UINT64_C( 0x0000800000000000 ); | ||||
|     uiZ.v64 = defaultNaNF128UI64; | ||||
|     uiZ.v0  = defaultNaNF128UI0; | ||||
|     return uiZ; | ||||
|  | ||||
| } | ||||
|   | ||||
| @@ -4,7 +4,7 @@ | ||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| Package, Release 3e, by John R. Hauser. | ||||
|  | ||||
| Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of | ||||
| Copyright 2011, 2012, 2013, 2014, 2015, 2016 The Regents of the University of | ||||
| California.  All rights reserved. | ||||
|  | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| @@ -34,10 +34,8 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| =============================================================================*/ | ||||
|  | ||||
| #include <stdbool.h> | ||||
| #include <stdint.h> | ||||
| #include "platform.h" | ||||
| #include "internals.h" | ||||
| #include "specialize.h" | ||||
| #include "softfloat.h" | ||||
|  | ||||
| @@ -50,14 +48,11 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| uint_fast16_t | ||||
|  softfloat_propagateNaNF16UI( uint_fast16_t uiA, uint_fast16_t uiB ) | ||||
| { | ||||
|     bool isSigNaNA; | ||||
|  | ||||
|     isSigNaNA = softfloat_isSigNaNF16UI( uiA ); | ||||
|     if ( isSigNaNA || softfloat_isSigNaNF16UI( uiB ) ) { | ||||
|     if ( softfloat_isSigNaNF16UI( uiA ) || softfloat_isSigNaNF16UI( uiB ) ) { | ||||
|         softfloat_raiseFlags( softfloat_flag_invalid ); | ||||
|         if ( isSigNaNA ) return uiA | 0x0200; | ||||
|     } | ||||
|     return (isNaNF16UI( uiA ) ? uiA : uiB) | 0x0200; | ||||
|     return defaultNaNF16UI; | ||||
|  | ||||
| } | ||||
|  | ||||
|   | ||||
| @@ -4,8 +4,8 @@ | ||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| Package, Release 3e, by John R. Hauser. | ||||
|  | ||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | ||||
| All rights reserved. | ||||
| Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of | ||||
| California.  All rights reserved. | ||||
|  | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| modification, are permitted provided that the following conditions are met: | ||||
| @@ -34,10 +34,8 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| =============================================================================*/ | ||||
|  | ||||
| #include <stdbool.h> | ||||
| #include <stdint.h> | ||||
| #include "platform.h" | ||||
| #include "internals.h" | ||||
| #include "specialize.h" | ||||
| #include "softfloat.h" | ||||
|  | ||||
| @@ -50,14 +48,11 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| uint_fast32_t | ||||
|  softfloat_propagateNaNF32UI( uint_fast32_t uiA, uint_fast32_t uiB ) | ||||
| { | ||||
|     bool isSigNaNA; | ||||
|  | ||||
|     isSigNaNA = softfloat_isSigNaNF32UI( uiA ); | ||||
|     if ( isSigNaNA || softfloat_isSigNaNF32UI( uiB ) ) { | ||||
|     if ( softfloat_isSigNaNF32UI( uiA ) || softfloat_isSigNaNF32UI( uiB ) ) { | ||||
|         softfloat_raiseFlags( softfloat_flag_invalid ); | ||||
|         if ( isSigNaNA ) return uiA | 0x00400000; | ||||
|     } | ||||
|     return (isNaNF32UI( uiA ) ? uiA : uiB) | 0x00400000; | ||||
|     return defaultNaNF32UI; | ||||
|  | ||||
| } | ||||
|  | ||||
|   | ||||
| @@ -4,8 +4,8 @@ | ||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| Package, Release 3e, by John R. Hauser. | ||||
|  | ||||
| Copyright 2011, 2012, 2013, 2014 The Regents of the University of California. | ||||
| All rights reserved. | ||||
| Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of | ||||
| California.  All rights reserved. | ||||
|  | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| modification, are permitted provided that the following conditions are met: | ||||
| @@ -34,10 +34,8 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| =============================================================================*/ | ||||
|  | ||||
| #include <stdbool.h> | ||||
| #include <stdint.h> | ||||
| #include "platform.h" | ||||
| #include "internals.h" | ||||
| #include "specialize.h" | ||||
| #include "softfloat.h" | ||||
|  | ||||
| @@ -50,14 +48,11 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| uint_fast64_t | ||||
|  softfloat_propagateNaNF64UI( uint_fast64_t uiA, uint_fast64_t uiB ) | ||||
| { | ||||
|     bool isSigNaNA; | ||||
|  | ||||
|     isSigNaNA = softfloat_isSigNaNF64UI( uiA ); | ||||
|     if ( isSigNaNA || softfloat_isSigNaNF64UI( uiB ) ) { | ||||
|     if ( softfloat_isSigNaNF64UI( uiA ) || softfloat_isSigNaNF64UI( uiB ) ) { | ||||
|         softfloat_raiseFlags( softfloat_flag_invalid ); | ||||
|         if ( isSigNaNA ) return uiA | UINT64_C( 0x0008000000000000 ); | ||||
|     } | ||||
|     return (isNaNF64UI( uiA ) ? uiA : uiB) | UINT64_C( 0x0008000000000000 ); | ||||
|     return defaultNaNF64UI; | ||||
|  | ||||
| } | ||||
|  | ||||
|   | ||||
| @@ -37,10 +37,10 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| #ifndef specialize_h | ||||
| #define specialize_h 1 | ||||
|  | ||||
| #include <stdbool.h> | ||||
| #include <stdint.h> | ||||
| #include "primitiveTypes.h" | ||||
| #include "softfloat.h" | ||||
| #include <stdbool.h> | ||||
| #include <stdint.h> | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Default value for 'softfloat_detectTininess'. | ||||
| @@ -51,48 +51,50 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| | The values to return on conversions to 32-bit integer formats that raise an | ||||
| | invalid exception. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define ui32_fromPosOverflow UINT32_C(0xFFFFFFFF) | ||||
| #define ui32_fromNegOverflow UINT32_C(0x0) | ||||
| #define ui32_fromNaN         UINT32_C(0xFFFFFFFF) | ||||
| #define i32_fromPosOverflow   INT64_C(0x7FFFFFFF) | ||||
| #define i32_fromNegOverflow  (-INT64_C(0x7FFFFFFF)-1) | ||||
| #define i32_fromNaN           INT64_C(0x7FFFFFFF) | ||||
| #define ui32_fromPosOverflow 0xFFFFFFFF | ||||
| #define ui32_fromNegOverflow 0 | ||||
| #define ui32_fromNaN 0xFFFFFFFF | ||||
| #define i32_fromPosOverflow 0x7FFFFFFF | ||||
| #define i32_fromNegOverflow (-0x7FFFFFFF - 1) | ||||
| #define i32_fromNaN 0x7FFFFFFF | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The values to return on conversions to 64-bit integer formats that raise an | ||||
| | invalid exception. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define ui64_fromPosOverflow UINT64_C( 0xFFFFFFFFFFFFFFFF ) | ||||
| #define ui64_fromNegOverflow UINT64_C( 0x0 ) | ||||
| #define ui64_fromNaN         UINT64_C( 0xFFFFFFFFFFFFFFFF) | ||||
| #define i64_fromPosOverflow   INT64_C( 0x7FFFFFFFFFFFFFFF) | ||||
| #define i64_fromNegOverflow  (-INT64_C( 0x7FFFFFFFFFFFFFFF)-1) | ||||
| #define i64_fromNaN           INT64_C( 0x7FFFFFFFFFFFFFFF) | ||||
| #define ui64_fromPosOverflow UINT64_C(0xFFFFFFFFFFFFFFFF) | ||||
| #define ui64_fromNegOverflow 0 | ||||
| #define ui64_fromNaN UINT64_C(0xFFFFFFFFFFFFFFFF) | ||||
| #define i64_fromPosOverflow INT64_C(0x7FFFFFFFFFFFFFFF) | ||||
| #define i64_fromNegOverflow (-INT64_C(0x7FFFFFFFFFFFFFFF) - 1) | ||||
| #define i64_fromNaN INT64_C(0x7FFFFFFFFFFFFFFF) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | "Common NaN" structure, used to transfer NaN representations from one format | ||||
| | to another. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| struct commonNaN { | ||||
|     bool sign; | ||||
| #ifdef LITTLEENDIAN | ||||
|     uint64_t v0, v64; | ||||
| #else | ||||
|     uint64_t v64, v0; | ||||
| #endif | ||||
|     char _unused; | ||||
| }; | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The bit pattern for a default generated 16-bit floating-point NaN. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define defaultNaNF16UI 0xFE00 | ||||
| #define defaultNaNF16UI 0x7E00 | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Returns true when 16-bit unsigned integer 'uiA' has the bit pattern of a | ||||
| | 16-bit floating-point signaling NaN. | ||||
| | Note:  This macro evaluates its argument more than once. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_isSigNaNF16UI( uiA ) ((((uiA) & 0x7E00) == 0x7C00) && ((uiA) & 0x01FF)) | ||||
| #define softfloat_isSigNaNF16UI(uiA) ((((uiA)&0x7E00) == 0x7C00) && ((uiA)&0x01FF)) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Returns true when 16-bit unsigned integer 'uiA' has the bit pattern of a | ||||
| | 16-bit brain floating-point (BF16) signaling NaN. | ||||
| | Note:  This macro evaluates its argument more than once. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_isSigNaNBF16UI(uiA) ((((uiA)&0x7FC0) == 0x7F80) && ((uiA)&0x003F)) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming 'uiA' has the bit pattern of a 16-bit floating-point NaN, converts | ||||
| @@ -100,13 +102,25 @@ struct commonNaN { | ||||
| | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void softfloat_f16UIToCommonNaN( uint_fast16_t uiA, struct commonNaN *zPtr ); | ||||
| #define softfloat_f16UIToCommonNaN(uiA, zPtr)                                                                                              \ | ||||
|     if(!((uiA)&0x0200))                                                                                                                    \ | ||||
|     softfloat_raiseFlags(softfloat_flag_invalid) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming 'uiA' has the bit pattern of a 16-bit BF16 floating-point NaN, converts | ||||
| | this NaN to the common NaN form, and stores the resulting common NaN at the | ||||
| | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_bf16UIToCommonNaN(uiA, zPtr)                                                                                             \ | ||||
|     if(!((uiA)&0x0040))                                                                                                                    \ | ||||
|     softfloat_raiseFlags(softfloat_flag_invalid) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into a 16-bit floating-point | ||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast16_t softfloat_commonNaNToF16UI( const struct commonNaN *aPtr ); | ||||
| #define softfloat_commonNaNToF16UI(aPtr) ((uint_fast16_t)defaultNaNF16UI) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Interpreting 'uiA' and 'uiB' as the bit patterns of two 16-bit floating- | ||||
| @@ -114,8 +128,18 @@ uint_fast16_t softfloat_commonNaNToF16UI( const struct commonNaN *aPtr ); | ||||
| | the combined NaN result.  If either 'uiA' or 'uiB' has the pattern of a | ||||
| | signaling NaN, the invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast16_t | ||||
|  softfloat_propagateNaNF16UI( uint_fast16_t uiA, uint_fast16_t uiB ); | ||||
| uint_fast16_t softfloat_propagateNaNF16UI(uint_fast16_t uiA, uint_fast16_t uiB); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The bit pattern for a default generated 16-bit BF16 floating-point NaN. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define defaultNaNBF16UI 0x7FC0 | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into a 16-bit floating-point | ||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_commonNaNToBF16UI(aPtr) ((uint_fast16_t)defaultNaNBF16UI) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The bit pattern for a default generated 32-bit floating-point NaN. | ||||
| @@ -127,7 +151,7 @@ uint_fast16_t | ||||
| | 32-bit floating-point signaling NaN. | ||||
| | Note:  This macro evaluates its argument more than once. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_isSigNaNF32UI( uiA ) ((((uiA) & 0x7FC00000) == 0x7F800000) && ((uiA) & 0x003FFFFF)) | ||||
| #define softfloat_isSigNaNF32UI(uiA) ((((uiA)&0x7FC00000) == 0x7F800000) && ((uiA)&0x003FFFFF)) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming 'uiA' has the bit pattern of a 32-bit floating-point NaN, converts | ||||
| @@ -135,13 +159,15 @@ uint_fast16_t | ||||
| | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void softfloat_f32UIToCommonNaN( uint_fast32_t uiA, struct commonNaN *zPtr ); | ||||
| #define softfloat_f32UIToCommonNaN(uiA, zPtr)                                                                                              \ | ||||
|     if(!((uiA)&0x00400000))                                                                                                                \ | ||||
|     softfloat_raiseFlags(softfloat_flag_invalid) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into a 32-bit floating-point | ||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast32_t softfloat_commonNaNToF32UI( const struct commonNaN *aPtr ); | ||||
| #define softfloat_commonNaNToF32UI(aPtr) ((uint_fast32_t)defaultNaNF32UI) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Interpreting 'uiA' and 'uiB' as the bit patterns of two 32-bit floating- | ||||
| @@ -149,20 +175,20 @@ uint_fast32_t softfloat_commonNaNToF32UI( const struct commonNaN *aPtr ); | ||||
| | the combined NaN result.  If either 'uiA' or 'uiB' has the pattern of a | ||||
| | signaling NaN, the invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast32_t | ||||
|  softfloat_propagateNaNF32UI( uint_fast32_t uiA, uint_fast32_t uiB ); | ||||
| uint_fast32_t softfloat_propagateNaNF32UI(uint_fast32_t uiA, uint_fast32_t uiB); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The bit pattern for a default generated 64-bit floating-point NaN. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define defaultNaNF64UI UINT64_C( 0x7FF8000000000000 ) | ||||
| #define defaultNaNF64UI UINT64_C(0x7FF8000000000000) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Returns true when 64-bit unsigned integer 'uiA' has the bit pattern of a | ||||
| | 64-bit floating-point signaling NaN. | ||||
| | Note:  This macro evaluates its argument more than once. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_isSigNaNF64UI( uiA ) ((((uiA) & UINT64_C( 0x7FF8000000000000 )) == UINT64_C( 0x7FF0000000000000 )) && ((uiA) & UINT64_C( 0x0007FFFFFFFFFFFF ))) | ||||
| #define softfloat_isSigNaNF64UI(uiA)                                                                                                       \ | ||||
|     ((((uiA)&UINT64_C(0x7FF8000000000000)) == UINT64_C(0x7FF0000000000000)) && ((uiA)&UINT64_C(0x0007FFFFFFFFFFFF))) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming 'uiA' has the bit pattern of a 64-bit floating-point NaN, converts | ||||
| @@ -170,13 +196,15 @@ uint_fast32_t | ||||
| | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void softfloat_f64UIToCommonNaN( uint_fast64_t uiA, struct commonNaN *zPtr ); | ||||
| #define softfloat_f64UIToCommonNaN(uiA, zPtr)                                                                                              \ | ||||
|     if(!((uiA)&UINT64_C(0x0008000000000000)))                                                                                              \ | ||||
|     softfloat_raiseFlags(softfloat_flag_invalid) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into a 64-bit floating-point | ||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast64_t softfloat_commonNaNToF64UI( const struct commonNaN *aPtr ); | ||||
| #define softfloat_commonNaNToF64UI(aPtr) ((uint_fast64_t)defaultNaNF64UI) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Interpreting 'uiA' and 'uiB' as the bit patterns of two 64-bit floating- | ||||
| @@ -184,14 +212,13 @@ uint_fast64_t softfloat_commonNaNToF64UI( const struct commonNaN *aPtr ); | ||||
| | the combined NaN result.  If either 'uiA' or 'uiB' has the pattern of a | ||||
| | signaling NaN, the invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast64_t | ||||
|  softfloat_propagateNaNF64UI( uint_fast64_t uiA, uint_fast64_t uiB ); | ||||
| uint_fast64_t softfloat_propagateNaNF64UI(uint_fast64_t uiA, uint_fast64_t uiB); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The bit pattern for a default generated 80-bit extended floating-point NaN. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define defaultNaNExtF80UI64 0xFFFF | ||||
| #define defaultNaNExtF80UI0  UINT64_C( 0xC000000000000000 ) | ||||
| #define defaultNaNExtF80UI64 0x7FFF | ||||
| #define defaultNaNExtF80UI0 UINT64_C(0xC000000000000000) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Returns true when the 80-bit unsigned integer formed from concatenating | ||||
| @@ -199,7 +226,8 @@ uint_fast64_t | ||||
| | floating-point signaling NaN. | ||||
| | Note:  This macro evaluates its arguments more than once. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_isSigNaNExtF80UI( uiA64, uiA0 ) ((((uiA64) & 0x7FFF) == 0x7FFF) && ! ((uiA0) & UINT64_C( 0x4000000000000000 )) && ((uiA0) & UINT64_C( 0x3FFFFFFFFFFFFFFF ))) | ||||
| #define softfloat_isSigNaNExtF80UI(uiA64, uiA0)                                                                                            \ | ||||
|     ((((uiA64)&0x7FFF) == 0x7FFF) && !((uiA0)&UINT64_C(0x4000000000000000)) && ((uiA0)&UINT64_C(0x3FFFFFFFFFFFFFFF))) | ||||
|  | ||||
| #ifdef SOFTFLOAT_FAST_INT64 | ||||
|  | ||||
| @@ -215,16 +243,26 @@ uint_fast64_t | ||||
| | location pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_extF80UIToCommonNaN( | ||||
|      uint_fast16_t uiA64, uint_fast64_t uiA0, struct commonNaN *zPtr ); | ||||
| #define softfloat_extF80UIToCommonNaN(uiA64, uiA0, zPtr)                                                                                   \ | ||||
|     if(!((uiA0)&UINT64_C(0x4000000000000000)))                                                                                             \ | ||||
|     softfloat_raiseFlags(softfloat_flag_invalid) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into an 80-bit extended | ||||
| | floating-point NaN, and returns the bit pattern of this value as an unsigned | ||||
| | integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| struct uint128 softfloat_commonNaNToExtF80UI( const struct commonNaN *aPtr ); | ||||
| #if defined INLINE && !defined softfloat_commonNaNToExtF80UI | ||||
| INLINE | ||||
| struct uint128 softfloat_commonNaNToExtF80UI(const struct commonNaN* aPtr) { | ||||
|     struct uint128 uiZ; | ||||
|     uiZ.v64 = defaultNaNExtF80UI64; | ||||
|     uiZ.v0 = defaultNaNExtF80UI0; | ||||
|     return uiZ; | ||||
| } | ||||
| #else | ||||
| struct uint128 softfloat_commonNaNToExtF80UI(const struct commonNaN* aPtr); | ||||
| #endif | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Interpreting the unsigned integer formed from concatenating 'uiA64' and | ||||
| @@ -235,19 +273,13 @@ struct uint128 softfloat_commonNaNToExtF80UI( const struct commonNaN *aPtr ); | ||||
| | result.  If either original floating-point value is a signaling NaN, the | ||||
| | invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| struct uint128 | ||||
|  softfloat_propagateNaNExtF80UI( | ||||
|      uint_fast16_t uiA64, | ||||
|      uint_fast64_t uiA0, | ||||
|      uint_fast16_t uiB64, | ||||
|      uint_fast64_t uiB0 | ||||
|  ); | ||||
| struct uint128 softfloat_propagateNaNExtF80UI(uint_fast16_t uiA64, uint_fast64_t uiA0, uint_fast16_t uiB64, uint_fast64_t uiB0); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The bit pattern for a default generated 128-bit floating-point NaN. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define defaultNaNF128UI64 UINT64_C( 0xFFFF800000000000 ) | ||||
| #define defaultNaNF128UI0  UINT64_C( 0 ) | ||||
| #define defaultNaNF128UI64 UINT64_C(0x7FFF800000000000) | ||||
| #define defaultNaNF128UI0 UINT64_C(0) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Returns true when the 128-bit unsigned integer formed from concatenating | ||||
| @@ -255,7 +287,8 @@ struct uint128 | ||||
| | point signaling NaN. | ||||
| | Note:  This macro evaluates its arguments more than once. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_isSigNaNF128UI( uiA64, uiA0 ) ((((uiA64) & UINT64_C( 0x7FFF800000000000 )) == UINT64_C( 0x7FFF000000000000 )) && ((uiA0) || ((uiA64) & UINT64_C( 0x00007FFFFFFFFFFF )))) | ||||
| #define softfloat_isSigNaNF128UI(uiA64, uiA0)                                                                                              \ | ||||
|     ((((uiA64)&UINT64_C(0x7FFF800000000000)) == UINT64_C(0x7FFF000000000000)) && ((uiA0) || ((uiA64)&UINT64_C(0x00007FFFFFFFFFFF)))) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming the unsigned integer formed from concatenating 'uiA64' and 'uiA0' | ||||
| @@ -264,15 +297,25 @@ struct uint128 | ||||
| | pointed to by 'zPtr'.  If the NaN is a signaling NaN, the invalid exception | ||||
| | is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_f128UIToCommonNaN( | ||||
|      uint_fast64_t uiA64, uint_fast64_t uiA0, struct commonNaN *zPtr ); | ||||
| #define softfloat_f128UIToCommonNaN(uiA64, uiA0, zPtr)                                                                                     \ | ||||
|     if(!((uiA64)&UINT64_C(0x0000800000000000)))                                                                                            \ | ||||
|     softfloat_raiseFlags(softfloat_flag_invalid) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into a 128-bit floating-point | ||||
| | NaN, and returns the bit pattern of this value as an unsigned integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| struct uint128 softfloat_commonNaNToF128UI( const struct commonNaN * ); | ||||
| #if defined INLINE && !defined softfloat_commonNaNToF128UI | ||||
| INLINE | ||||
| struct uint128 softfloat_commonNaNToF128UI(const struct commonNaN* aPtr) { | ||||
|     struct uint128 uiZ; | ||||
|     uiZ.v64 = defaultNaNF128UI64; | ||||
|     uiZ.v0 = defaultNaNF128UI0; | ||||
|     return uiZ; | ||||
| } | ||||
| #else | ||||
| struct uint128 softfloat_commonNaNToF128UI(const struct commonNaN*); | ||||
| #endif | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Interpreting the unsigned integer formed from concatenating 'uiA64' and | ||||
| @@ -283,13 +326,7 @@ struct uint128 softfloat_commonNaNToF128UI( const struct commonNaN * ); | ||||
| | If either original floating-point value is a signaling NaN, the invalid | ||||
| | exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| struct uint128 | ||||
|  softfloat_propagateNaNF128UI( | ||||
|      uint_fast64_t uiA64, | ||||
|      uint_fast64_t uiA0, | ||||
|      uint_fast64_t uiB64, | ||||
|      uint_fast64_t uiB0 | ||||
|  ); | ||||
| struct uint128 softfloat_propagateNaNF128UI(uint_fast64_t uiA64, uint_fast64_t uiA0, uint_fast64_t uiB64, uint_fast64_t uiB0); | ||||
|  | ||||
| #else | ||||
|  | ||||
| @@ -304,18 +341,24 @@ struct uint128 | ||||
| | common NaN at the location pointed to by 'zPtr'.  If the NaN is a signaling | ||||
| | NaN, the invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_extF80MToCommonNaN( | ||||
|      const struct extFloat80M *aSPtr, struct commonNaN *zPtr ); | ||||
| #define softfloat_extF80MToCommonNaN(aSPtr, zPtr)                                                                                          \ | ||||
|     if(!((aSPtr)->signif & UINT64_C(0x4000000000000000)))                                                                                  \ | ||||
|     softfloat_raiseFlags(softfloat_flag_invalid) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into an 80-bit extended | ||||
| | floating-point NaN, and stores this NaN at the location pointed to by | ||||
| | 'zSPtr'. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_commonNaNToExtF80M( | ||||
|      const struct commonNaN *aPtr, struct extFloat80M *zSPtr ); | ||||
| #if defined INLINE && !defined softfloat_commonNaNToExtF80M | ||||
| INLINE | ||||
| void softfloat_commonNaNToExtF80M(const struct commonNaN* aPtr, struct extFloat80M* zSPtr) { | ||||
|     zSPtr->signExp = defaultNaNExtF80UI64; | ||||
|     zSPtr->signif = defaultNaNExtF80UI0; | ||||
| } | ||||
| #else | ||||
| void softfloat_commonNaNToExtF80M(const struct commonNaN* aPtr, struct extFloat80M* zSPtr); | ||||
| #endif | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming at least one of the two 80-bit extended floating-point values | ||||
| @@ -323,20 +366,15 @@ void | ||||
| | at the location pointed to by 'zSPtr'.  If either original floating-point | ||||
| | value is a signaling NaN, the invalid exception is raised. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_propagateNaNExtF80M( | ||||
|      const struct extFloat80M *aSPtr, | ||||
|      const struct extFloat80M *bSPtr, | ||||
|      struct extFloat80M *zSPtr | ||||
|  ); | ||||
| void softfloat_propagateNaNExtF80M(const struct extFloat80M* aSPtr, const struct extFloat80M* bSPtr, struct extFloat80M* zSPtr); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The bit pattern for a default generated 128-bit floating-point NaN. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define defaultNaNF128UI96 0xFFFF8000 | ||||
| #define defaultNaNF128UI96 0x7FFF8000 | ||||
| #define defaultNaNF128UI64 0 | ||||
| #define defaultNaNF128UI32 0 | ||||
| #define defaultNaNF128UI0  0 | ||||
| #define defaultNaNF128UI0 0 | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming the 128-bit floating-point value pointed to by 'aWPtr' is a NaN, | ||||
| @@ -346,8 +384,9 @@ void | ||||
| | four 32-bit elements that concatenate in the platform's normal endian order | ||||
| | to form a 128-bit floating-point value. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_f128MToCommonNaN( const uint32_t *aWPtr, struct commonNaN *zPtr ); | ||||
| #define softfloat_f128MToCommonNaN(aWPtr, zPtr)                                                                                            \ | ||||
|     if(!((aWPtr)[indexWordHi(4)] & UINT64_C(0x0000800000000000)))                                                                          \ | ||||
|     softfloat_raiseFlags(softfloat_flag_invalid) | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Converts the common NaN pointed to by 'aPtr' into a 128-bit floating-point | ||||
| @@ -355,8 +394,17 @@ void | ||||
| | 'zWPtr' points to an array of four 32-bit elements that concatenate in the | ||||
| | platform's normal endian order to form a 128-bit floating-point value. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_commonNaNToF128M( const struct commonNaN *aPtr, uint32_t *zWPtr ); | ||||
| #if defined INLINE && !defined softfloat_commonNaNToF128M | ||||
| INLINE | ||||
| void softfloat_commonNaNToF128M(const struct commonNaN* aPtr, uint32_t* zWPtr) { | ||||
|     zWPtr[indexWord(4, 3)] = defaultNaNF128UI96; | ||||
|     zWPtr[indexWord(4, 2)] = defaultNaNF128UI64; | ||||
|     zWPtr[indexWord(4, 1)] = defaultNaNF128UI32; | ||||
|     zWPtr[indexWord(4, 0)] = defaultNaNF128UI0; | ||||
| } | ||||
| #else | ||||
| void softfloat_commonNaNToF128M(const struct commonNaN* aPtr, uint32_t* zWPtr); | ||||
| #endif | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Assuming at least one of the two 128-bit floating-point values pointed to by | ||||
| @@ -366,11 +414,8 @@ void | ||||
| | and 'zWPtr' points to an array of four 32-bit elements that concatenate in | ||||
| | the platform's normal endian order to form a 128-bit floating-point value. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_propagateNaNF128M( | ||||
|      const uint32_t *aWPtr, const uint32_t *bWPtr, uint32_t *zWPtr ); | ||||
| void softfloat_propagateNaNF128M(const uint32_t* aWPtr, const uint32_t* bWPtr, uint32_t* zWPtr); | ||||
|  | ||||
| #endif | ||||
|  | ||||
| #endif | ||||
|  | ||||
|   | ||||
							
								
								
									
										51
									
								
								softfloat/source/bf16_isSignalingNaN.c
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										51
									
								
								softfloat/source/bf16_isSignalingNaN.c
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,51 @@ | ||||
|  | ||||
| /*============================================================================ | ||||
|  | ||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| Package, Release 3e, by John R. Hauser. | ||||
|  | ||||
| Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of | ||||
| California.  All rights reserved. | ||||
|  | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| modification, are permitted provided that the following conditions are met: | ||||
|  | ||||
|  1. Redistributions of source code must retain the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer. | ||||
|  | ||||
|  2. Redistributions in binary form must reproduce the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer in the documentation | ||||
|     and/or other materials provided with the distribution. | ||||
|  | ||||
|  3. Neither the name of the University nor the names of its contributors may | ||||
|     be used to endorse or promote products derived from this software without | ||||
|     specific prior written permission. | ||||
|  | ||||
| THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY | ||||
| EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | ||||
| WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE | ||||
| DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY | ||||
| DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | ||||
| (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | ||||
| LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND | ||||
| ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | ||||
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| =============================================================================*/ | ||||
|  | ||||
| #include <stdbool.h> | ||||
| #include "platform.h" | ||||
| #include "internals.h" | ||||
| #include "specialize.h" | ||||
| #include "softfloat.h" | ||||
|  | ||||
| bool bf16_isSignalingNaN( bfloat16_t a ) | ||||
| { | ||||
|     union ui16_bf16 uA; | ||||
|  | ||||
|     uA.f = a; | ||||
|     return softfloat_isSigNaNBF16UI( uA.ui ); | ||||
|  | ||||
| } | ||||
|  | ||||
							
								
								
									
										90
									
								
								softfloat/source/bf16_to_f32.c
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										90
									
								
								softfloat/source/bf16_to_f32.c
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,90 @@ | ||||
|  | ||||
| /*============================================================================ | ||||
|  | ||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| Package, Release 3e, by John R. Hauser. | ||||
|  | ||||
| Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of | ||||
| California.  All rights reserved. | ||||
|  | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| modification, are permitted provided that the following conditions are met: | ||||
|  | ||||
|  1. Redistributions of source code must retain the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer. | ||||
|  | ||||
|  2. Redistributions in binary form must reproduce the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer in the documentation | ||||
|     and/or other materials provided with the distribution. | ||||
|  | ||||
|  3. Neither the name of the University nor the names of its contributors may | ||||
|     be used to endorse or promote products derived from this software without | ||||
|     specific prior written permission. | ||||
|  | ||||
| THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY | ||||
| EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | ||||
| WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE | ||||
| DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY | ||||
| DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | ||||
| (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | ||||
| LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND | ||||
| ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | ||||
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| =============================================================================*/ | ||||
|  | ||||
| #include <stdbool.h> | ||||
| #include <stdint.h> | ||||
| #include "platform.h" | ||||
| #include "internals.h" | ||||
| #include "specialize.h" | ||||
| #include "softfloat.h" | ||||
|  | ||||
| float32_t bf16_to_f32( bfloat16_t a ) | ||||
| { | ||||
|     union ui16_bf16 uA; | ||||
|     uint_fast16_t uiA; | ||||
|     bool sign; | ||||
|     int_fast16_t exp; | ||||
|     uint_fast16_t frac; | ||||
|     struct commonNaN commonNaN; | ||||
|     uint_fast32_t uiZ; | ||||
|     struct exp8_sig16 normExpSig; | ||||
|     union ui32_f32 uZ; | ||||
|  | ||||
|     /*------------------------------------------------------------------------ | ||||
|     *------------------------------------------------------------------------*/ | ||||
|     uA.f = a; | ||||
|     uiA = uA.ui; | ||||
|     sign = signBF16UI( uiA ); | ||||
|     exp  = expBF16UI( uiA ); | ||||
|     frac = fracBF16UI( uiA ); | ||||
|     /*------------------------------------------------------------------------ | ||||
|     *------------------------------------------------------------------------*/ | ||||
|     // NaN or Inf | ||||
|     if ( exp == 0xFF ) { | ||||
|         if ( frac ) { | ||||
|             softfloat_bf16UIToCommonNaN( uiA, &commonNaN ); | ||||
|             uiZ = softfloat_commonNaNToF32UI( &commonNaN ); | ||||
|         } else { | ||||
|             uiZ = packToF32UI( sign, 0xFF, 0 ); | ||||
|         } | ||||
|         goto uiZ; | ||||
|     } | ||||
|     /*------------------------------------------------------------------------ | ||||
|     *------------------------------------------------------------------------*/ | ||||
|     // packToF32UI simply packs bitfields without any numerical change | ||||
|     // which means it can be used directly for any BF16 to f32 conversions which | ||||
|     // does not require bits manipulation | ||||
|     // (that is everything where the 16-bit are just padded right with 16 zeros, including | ||||
|     //  subnormal numbers) | ||||
|     uiZ = packToF32UI( sign, exp, ((uint_fast32_t) frac) <<16 ); | ||||
|  uiZ: | ||||
|     uZ.ui = uiZ; | ||||
|     return uZ.f; | ||||
|  | ||||
| } | ||||
|  | ||||
|  | ||||
|  | ||||
							
								
								
									
										105
									
								
								softfloat/source/f32_to_bf16.c
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										105
									
								
								softfloat/source/f32_to_bf16.c
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,105 @@ | ||||
|  | ||||
| /*============================================================================ | ||||
|  | ||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| Package, Release 3e, by John R. Hauser. | ||||
|  | ||||
| Copyright 2011, 2012, 2013, 2014, 2015 The Regents of the University of | ||||
| California.  All rights reserved. | ||||
|  | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| modification, are permitted provided that the following conditions are met: | ||||
|  | ||||
|  1. Redistributions of source code must retain the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer. | ||||
|  | ||||
|  2. Redistributions in binary form must reproduce the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer in the documentation | ||||
|     and/or other materials provided with the distribution. | ||||
|  | ||||
|  3. Neither the name of the University nor the names of its contributors may | ||||
|     be used to endorse or promote products derived from this software without | ||||
|     specific prior written permission. | ||||
|  | ||||
| THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY | ||||
| EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | ||||
| WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE | ||||
| DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY | ||||
| DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | ||||
| (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | ||||
| LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND | ||||
| ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | ||||
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| =============================================================================*/ | ||||
|  | ||||
| #include <stdbool.h> | ||||
| #include <stdint.h> | ||||
| #include "platform.h" | ||||
| #include "internals.h" | ||||
| #include "specialize.h" | ||||
| #include "softfloat.h" | ||||
|  | ||||
| #include <inttypes.h> | ||||
| #include <stdio.h> | ||||
|  | ||||
| bfloat16_t f32_to_bf16( float32_t a ) | ||||
| { | ||||
|     union ui32_f32 uA; | ||||
|     uint_fast32_t uiA; | ||||
|     bool sign; | ||||
|     int_fast16_t exp; | ||||
|     uint_fast32_t frac; | ||||
|     struct commonNaN commonNaN; | ||||
|     uint_fast16_t uiZ, frac16; | ||||
|     union ui16_bf16 uZ; | ||||
|  | ||||
|     /*------------------------------------------------------------------------ | ||||
|     *------------------------------------------------------------------------*/ | ||||
|     uA.f = a; | ||||
|     uiA = uA.ui; | ||||
|     sign = signF32UI( uiA ); | ||||
|     exp  = expF32UI( uiA ); | ||||
|     frac = fracF32UI( uiA ); | ||||
|     /*------------------------------------------------------------------------ | ||||
|     *------------------------------------------------------------------------*/ | ||||
|     // infinity or NaN cases | ||||
|     if ( exp == 0xFF ) { | ||||
|         if ( frac ) { | ||||
|             // NaN case | ||||
|             softfloat_f32UIToCommonNaN( uiA, &commonNaN ); | ||||
|             uiZ = softfloat_commonNaNToBF16UI( &commonNaN ); | ||||
|         } else { | ||||
|             // infinity case | ||||
|             uiZ = packToBF16UI( sign, 0xFF, 0 ); | ||||
|         } | ||||
|         goto uiZ; | ||||
|     } | ||||
|     /*------------------------------------------------------------------------ | ||||
|     *------------------------------------------------------------------------*/ | ||||
|     // frac is a 24-bit mantissa, right shifted by 9 | ||||
|     // In the normal case, (24-9) = 15 are set  | ||||
|     frac16 = frac>>9 | ((frac & 0x1FF) != 0); | ||||
|     if ( ! (exp | frac16) ) { | ||||
|         uiZ = packToBF16UI( sign, 0, 0 ); | ||||
|         goto uiZ; | ||||
|     } | ||||
|     /*------------------------------------------------------------------------ | ||||
|     *------------------------------------------------------------------------*/ | ||||
|     // softfloat_roundPackToBF16 exponent argument (2nd argument) | ||||
|     // must correspond to the exponent of fracIn[13] bits | ||||
|     // (fracIn is the 3rd and last argument)  | ||||
|     uint_fast32_t mask = exp ? 0x4000 : 0x0; // implicit one mask added if input is a normal number | ||||
|     // exponent for the lowest normal and largest subnormal should be equal | ||||
|     // but is not in IEEE encoding so mantissa must be partially normalized | ||||
|     // (by one bit) for subnormal numbers. Such that (exp - 1) corresponds | ||||
|     // to the exponent of frac16[13] | ||||
|     frac16 = frac16 << (exp ? 0 : 1); | ||||
|     return softfloat_roundPackToBF16( sign, exp - 1, frac16 | mask ); | ||||
|  uiZ: | ||||
|     uZ.ui = uiZ; | ||||
|     return uZ.f; | ||||
|  | ||||
| } | ||||
|  | ||||
| @@ -72,6 +72,9 @@ float16_t f32_to_f16( float32_t a ) | ||||
|     } | ||||
|     /*------------------------------------------------------------------------ | ||||
|     *------------------------------------------------------------------------*/ | ||||
|     // frac is a 24-bit significand, the bottom 9 bits LSB are extracted and OR-red | ||||
|     // into a sticky flag, the top 15 MSBs are extracted, the LSB of this top slice | ||||
|     // is OR-red with the sticky  | ||||
|     frac16 = frac>>9 | ((frac & 0x1FF) != 0); | ||||
|     if ( ! (exp | frac16) ) { | ||||
|         uiZ = packToF16UI( sign, 0, 0 ); | ||||
|   | ||||
| @@ -37,242 +37,221 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| #ifndef internals_h | ||||
| #define internals_h 1 | ||||
|  | ||||
| #include <stdbool.h> | ||||
| #include <stdint.h> | ||||
| #include "primitives.h" | ||||
| #include "softfloat_types.h" | ||||
| #include <stdbool.h> | ||||
| #include <stdint.h> | ||||
|  | ||||
| union ui16_f16 { uint16_t ui; float16_t f; }; | ||||
| union ui32_f32 { uint32_t ui; float32_t f; }; | ||||
| union ui64_f64 { uint64_t ui; float64_t f; }; | ||||
|  | ||||
| #ifdef SOFTFLOAT_FAST_INT64 | ||||
| union extF80M_extF80 { struct extFloat80M fM; extFloat80_t f; }; | ||||
| union ui128_f128 { struct uint128 ui; float128_t f; }; | ||||
| #endif | ||||
|  | ||||
| enum { | ||||
|     softfloat_mulAdd_subC    = 1, | ||||
|     softfloat_mulAdd_subProd = 2 | ||||
| union ui16_f16 { | ||||
|     uint16_t ui; | ||||
|     float16_t f; | ||||
| }; | ||||
| union ui16_bf16 { | ||||
|     uint16_t ui; | ||||
|     bfloat16_t f; | ||||
| }; | ||||
| union ui32_f32 { | ||||
|     uint32_t ui; | ||||
|     float32_t f; | ||||
| }; | ||||
| union ui64_f64 { | ||||
|     uint64_t ui; | ||||
|     float64_t f; | ||||
| }; | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast32_t softfloat_roundToUI32( bool, uint_fast64_t, uint_fast8_t, bool ); | ||||
|  | ||||
| #ifdef SOFTFLOAT_FAST_INT64 | ||||
| uint_fast64_t | ||||
|  softfloat_roundToUI64( | ||||
|      bool, uint_fast64_t, uint_fast64_t, uint_fast8_t, bool ); | ||||
| #else | ||||
| uint_fast64_t softfloat_roundMToUI64( bool, uint32_t *, uint_fast8_t, bool ); | ||||
| union extF80M_extF80 { | ||||
|     struct extFloat80M fM; | ||||
|     extFloat80_t f; | ||||
| }; | ||||
| union ui128_f128 { | ||||
|     struct uint128 ui; | ||||
|     float128_t f; | ||||
| }; | ||||
| #endif | ||||
|  | ||||
| int_fast32_t softfloat_roundToI32( bool, uint_fast64_t, uint_fast8_t, bool ); | ||||
| enum { softfloat_mulAdd_subC = 1, softfloat_mulAdd_subProd = 2 }; | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
|  *----------------------------------------------------------------------------*/ | ||||
| uint_fast32_t softfloat_roundToUI32(bool, uint_fast64_t, uint_fast8_t, bool); | ||||
|  | ||||
| #ifdef SOFTFLOAT_FAST_INT64 | ||||
| int_fast64_t | ||||
|  softfloat_roundToI64( | ||||
|      bool, uint_fast64_t, uint_fast64_t, uint_fast8_t, bool ); | ||||
| uint_fast64_t softfloat_roundToUI64(bool, uint_fast64_t, uint_fast64_t, uint_fast8_t, bool); | ||||
| #else | ||||
| int_fast64_t softfloat_roundMToI64( bool, uint32_t *, uint_fast8_t, bool ); | ||||
| uint_fast64_t softfloat_roundMToUI64(bool, uint32_t*, uint_fast8_t, bool); | ||||
| #endif | ||||
|  | ||||
| int_fast32_t softfloat_roundToI32(bool, uint_fast64_t, uint_fast8_t, bool); | ||||
|  | ||||
| #ifdef SOFTFLOAT_FAST_INT64 | ||||
| int_fast64_t softfloat_roundToI64(bool, uint_fast64_t, uint_fast64_t, uint_fast8_t, bool); | ||||
| #else | ||||
| int_fast64_t softfloat_roundMToI64(bool, uint32_t*, uint_fast8_t, bool); | ||||
| #endif | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define signF16UI( a ) ((bool) ((uint16_t) (a)>>15)) | ||||
| #define expF16UI( a ) ((int_fast8_t) ((a)>>10) & 0x1F) | ||||
| #define fracF16UI( a ) ((a) & 0x03FF) | ||||
| #define packToF16UI( sign, exp, sig ) (((uint16_t) (sign)<<15) + ((uint16_t) (exp)<<10) + (sig)) | ||||
|  *----------------------------------------------------------------------------*/ | ||||
| #define signF16UI(a) ((bool)((uint16_t)(a) >> 15)) | ||||
| #define expF16UI(a) ((int_fast8_t)((a) >> 10) & 0x1F) | ||||
| #define fracF16UI(a) ((a)&0x03FF) | ||||
| #define packToF16UI(sign, exp, sig) (((uint16_t)(sign) << 15) + ((uint16_t)(exp) << 10) + (sig)) | ||||
|  | ||||
| #define isNaNF16UI( a ) (((~(a) & 0x7C00) == 0) && ((a) & 0x03FF)) | ||||
| #define isNaNF16UI(a) (((~(a)&0x7C00) == 0) && ((a)&0x03FF)) | ||||
|  | ||||
| struct exp8_sig16 { int_fast8_t exp; uint_fast16_t sig; }; | ||||
| struct exp8_sig16 softfloat_normSubnormalF16Sig( uint_fast16_t ); | ||||
| struct exp8_sig16 { | ||||
|     int_fast8_t exp; | ||||
|     uint_fast16_t sig; | ||||
| }; | ||||
| struct exp8_sig16 softfloat_normSubnormalF16Sig(uint_fast16_t); | ||||
|  | ||||
| float16_t softfloat_roundPackToF16( bool, int_fast16_t, uint_fast16_t ); | ||||
| float16_t softfloat_normRoundPackToF16( bool, int_fast16_t, uint_fast16_t ); | ||||
| float16_t softfloat_roundPackToF16(bool, int_fast16_t, uint_fast16_t); | ||||
| float16_t softfloat_normRoundPackToF16(bool, int_fast16_t, uint_fast16_t); | ||||
|  | ||||
| float16_t softfloat_addMagsF16( uint_fast16_t, uint_fast16_t ); | ||||
| float16_t softfloat_subMagsF16( uint_fast16_t, uint_fast16_t ); | ||||
| float16_t | ||||
|  softfloat_mulAddF16( | ||||
|      uint_fast16_t, uint_fast16_t, uint_fast16_t, uint_fast8_t ); | ||||
| float16_t softfloat_addMagsF16(uint_fast16_t, uint_fast16_t); | ||||
| float16_t softfloat_subMagsF16(uint_fast16_t, uint_fast16_t); | ||||
| float16_t softfloat_mulAddF16(uint_fast16_t, uint_fast16_t, uint_fast16_t, uint_fast8_t); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define signF32UI( a ) ((bool) ((uint32_t) (a)>>31)) | ||||
| #define expF32UI( a ) ((int_fast16_t) ((a)>>23) & 0xFF) | ||||
| #define fracF32UI( a ) ((a) & 0x007FFFFF) | ||||
| #define packToF32UI( sign, exp, sig ) (((uint32_t) (sign)<<31) + ((uint32_t) (exp)<<23) + (sig)) | ||||
|  *----------------------------------------------------------------------------*/ | ||||
| #define signBF16UI(a) ((bool)((uint16_t)(a) >> 15)) | ||||
| #define expBF16UI(a) ((int_fast16_t)((a) >> 7) & 0xFF) | ||||
| #define fracBF16UI(a) ((a)&0x07F) | ||||
| #define packToBF16UI(sign, exp, sig) (((uint16_t)(sign) << 15) + ((uint16_t)(exp) << 7) + (sig)) | ||||
|  | ||||
| #define isNaNF32UI( a ) (((~(a) & 0x7F800000) == 0) && ((a) & 0x007FFFFF)) | ||||
| #define isNaNBF16UI(a) (((~(a)&0x7FC0) == 0) && ((a)&0x07F)) | ||||
|  | ||||
| struct exp16_sig32 { int_fast16_t exp; uint_fast32_t sig; }; | ||||
| struct exp16_sig32 softfloat_normSubnormalF32Sig( uint_fast32_t ); | ||||
|  | ||||
| float32_t softfloat_roundPackToF32( bool, int_fast16_t, uint_fast32_t ); | ||||
| float32_t softfloat_normRoundPackToF32( bool, int_fast16_t, uint_fast32_t ); | ||||
|  | ||||
| float32_t softfloat_addMagsF32( uint_fast32_t, uint_fast32_t ); | ||||
| float32_t softfloat_subMagsF32( uint_fast32_t, uint_fast32_t ); | ||||
| float32_t | ||||
|  softfloat_mulAddF32( | ||||
|      uint_fast32_t, uint_fast32_t, uint_fast32_t, uint_fast8_t ); | ||||
| bfloat16_t softfloat_roundPackToBF16(bool, int_fast16_t, uint_fast16_t); | ||||
| struct exp8_sig16 softfloat_normSubnormalBF16Sig(uint_fast16_t); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define signF64UI( a ) ((bool) ((uint64_t) (a)>>63)) | ||||
| #define expF64UI( a ) ((int_fast16_t) ((a)>>52) & 0x7FF) | ||||
| #define fracF64UI( a ) ((a) & UINT64_C( 0x000FFFFFFFFFFFFF )) | ||||
| #define packToF64UI( sign, exp, sig ) ((uint64_t) (((uint_fast64_t) (sign)<<63) + ((uint_fast64_t) (exp)<<52) + (sig))) | ||||
|  *----------------------------------------------------------------------------*/ | ||||
| #define signF32UI(a) ((bool)((uint32_t)(a) >> 31)) | ||||
| #define expF32UI(a) ((int_fast16_t)((a) >> 23) & 0xFF) | ||||
| #define fracF32UI(a) ((a)&0x007FFFFF) | ||||
| #define packToF32UI(sign, exp, sig) (((uint32_t)(sign) << 31) + ((uint32_t)(exp) << 23) + (sig)) | ||||
|  | ||||
| #define isNaNF64UI( a ) (((~(a) & UINT64_C( 0x7FF0000000000000 )) == 0) && ((a) & UINT64_C( 0x000FFFFFFFFFFFFF ))) | ||||
| #define isNaNF32UI(a) (((~(a)&0x7F800000) == 0) && ((a)&0x007FFFFF)) | ||||
|  | ||||
| struct exp16_sig64 { int_fast16_t exp; uint_fast64_t sig; }; | ||||
| struct exp16_sig64 softfloat_normSubnormalF64Sig( uint_fast64_t ); | ||||
| struct exp16_sig32 { | ||||
|     int_fast16_t exp; | ||||
|     uint_fast32_t sig; | ||||
| }; | ||||
| struct exp16_sig32 softfloat_normSubnormalF32Sig(uint_fast32_t); | ||||
|  | ||||
| float64_t softfloat_roundPackToF64( bool, int_fast16_t, uint_fast64_t ); | ||||
| float64_t softfloat_normRoundPackToF64( bool, int_fast16_t, uint_fast64_t ); | ||||
| float32_t softfloat_roundPackToF32(bool, int_fast16_t, uint_fast32_t); | ||||
| float32_t softfloat_normRoundPackToF32(bool, int_fast16_t, uint_fast32_t); | ||||
|  | ||||
| float64_t softfloat_addMagsF64( uint_fast64_t, uint_fast64_t, bool ); | ||||
| float64_t softfloat_subMagsF64( uint_fast64_t, uint_fast64_t, bool ); | ||||
| float64_t | ||||
|  softfloat_mulAddF64( | ||||
|      uint_fast64_t, uint_fast64_t, uint_fast64_t, uint_fast8_t ); | ||||
| float32_t softfloat_addMagsF32(uint_fast32_t, uint_fast32_t); | ||||
| float32_t softfloat_subMagsF32(uint_fast32_t, uint_fast32_t); | ||||
| float32_t softfloat_mulAddF32(uint_fast32_t, uint_fast32_t, uint_fast32_t, uint_fast8_t); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define signExtF80UI64( a64 ) ((bool) ((uint16_t) (a64)>>15)) | ||||
| #define expExtF80UI64( a64 ) ((a64) & 0x7FFF) | ||||
| #define packToExtF80UI64( sign, exp ) ((uint_fast16_t) (sign)<<15 | (exp)) | ||||
|  *----------------------------------------------------------------------------*/ | ||||
| #define signF64UI(a) ((bool)((uint64_t)(a) >> 63)) | ||||
| #define expF64UI(a) ((int_fast16_t)((a) >> 52) & 0x7FF) | ||||
| #define fracF64UI(a) ((a)&UINT64_C(0x000FFFFFFFFFFFFF)) | ||||
| #define packToF64UI(sign, exp, sig) ((uint64_t)(((uint_fast64_t)(sign) << 63) + ((uint_fast64_t)(exp) << 52) + (sig))) | ||||
|  | ||||
| #define isNaNExtF80UI( a64, a0 ) ((((a64) & 0x7FFF) == 0x7FFF) && ((a0) & UINT64_C( 0x7FFFFFFFFFFFFFFF ))) | ||||
| #define isNaNF64UI(a) (((~(a)&UINT64_C(0x7FF0000000000000)) == 0) && ((a)&UINT64_C(0x000FFFFFFFFFFFFF))) | ||||
|  | ||||
| struct exp16_sig64 { | ||||
|     int_fast16_t exp; | ||||
|     uint_fast64_t sig; | ||||
| }; | ||||
| struct exp16_sig64 softfloat_normSubnormalF64Sig(uint_fast64_t); | ||||
|  | ||||
| float64_t softfloat_roundPackToF64(bool, int_fast16_t, uint_fast64_t); | ||||
| float64_t softfloat_normRoundPackToF64(bool, int_fast16_t, uint_fast64_t); | ||||
|  | ||||
| float64_t softfloat_addMagsF64(uint_fast64_t, uint_fast64_t, bool); | ||||
| float64_t softfloat_subMagsF64(uint_fast64_t, uint_fast64_t, bool); | ||||
| float64_t softfloat_mulAddF64(uint_fast64_t, uint_fast64_t, uint_fast64_t, uint_fast8_t); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
|  *----------------------------------------------------------------------------*/ | ||||
| #define signExtF80UI64(a64) ((bool)((uint16_t)(a64) >> 15)) | ||||
| #define expExtF80UI64(a64) ((a64)&0x7FFF) | ||||
| #define packToExtF80UI64(sign, exp) ((uint_fast16_t)(sign) << 15 | (exp)) | ||||
|  | ||||
| #define isNaNExtF80UI(a64, a0) ((((a64)&0x7FFF) == 0x7FFF) && ((a0)&UINT64_C(0x7FFFFFFFFFFFFFFF))) | ||||
|  | ||||
| #ifdef SOFTFLOAT_FAST_INT64 | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| *----------------------------------------------------------------------------*/ | ||||
|  *----------------------------------------------------------------------------*/ | ||||
|  | ||||
| struct exp32_sig64 { int_fast32_t exp; uint64_t sig; }; | ||||
| struct exp32_sig64 softfloat_normSubnormalExtF80Sig( uint_fast64_t ); | ||||
| struct exp32_sig64 { | ||||
|     int_fast32_t exp; | ||||
|     uint64_t sig; | ||||
| }; | ||||
| struct exp32_sig64 softfloat_normSubnormalExtF80Sig(uint_fast64_t); | ||||
|  | ||||
| extFloat80_t | ||||
|  softfloat_roundPackToExtF80( | ||||
|      bool, int_fast32_t, uint_fast64_t, uint_fast64_t, uint_fast8_t ); | ||||
| extFloat80_t | ||||
|  softfloat_normRoundPackToExtF80( | ||||
|      bool, int_fast32_t, uint_fast64_t, uint_fast64_t, uint_fast8_t ); | ||||
| extFloat80_t softfloat_roundPackToExtF80(bool, int_fast32_t, uint_fast64_t, uint_fast64_t, uint_fast8_t); | ||||
| extFloat80_t softfloat_normRoundPackToExtF80(bool, int_fast32_t, uint_fast64_t, uint_fast64_t, uint_fast8_t); | ||||
|  | ||||
| extFloat80_t | ||||
|  softfloat_addMagsExtF80( | ||||
|      uint_fast16_t, uint_fast64_t, uint_fast16_t, uint_fast64_t, bool ); | ||||
| extFloat80_t | ||||
|  softfloat_subMagsExtF80( | ||||
|      uint_fast16_t, uint_fast64_t, uint_fast16_t, uint_fast64_t, bool ); | ||||
| extFloat80_t softfloat_addMagsExtF80(uint_fast16_t, uint_fast64_t, uint_fast16_t, uint_fast64_t, bool); | ||||
| extFloat80_t softfloat_subMagsExtF80(uint_fast16_t, uint_fast64_t, uint_fast16_t, uint_fast64_t, bool); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define signF128UI64( a64 ) ((bool) ((uint64_t) (a64)>>63)) | ||||
| #define expF128UI64( a64 ) ((int_fast32_t) ((a64)>>48) & 0x7FFF) | ||||
| #define fracF128UI64( a64 ) ((a64) & UINT64_C( 0x0000FFFFFFFFFFFF )) | ||||
| #define packToF128UI64( sign, exp, sig64 ) (((uint_fast64_t) (sign)<<63) + ((uint_fast64_t) (exp)<<48) + (sig64)) | ||||
|  *----------------------------------------------------------------------------*/ | ||||
| #define signF128UI64(a64) ((bool)((uint64_t)(a64) >> 63)) | ||||
| #define expF128UI64(a64) ((int_fast32_t)((a64) >> 48) & 0x7FFF) | ||||
| #define fracF128UI64(a64) ((a64)&UINT64_C(0x0000FFFFFFFFFFFF)) | ||||
| #define packToF128UI64(sign, exp, sig64) (((uint_fast64_t)(sign) << 63) + ((uint_fast64_t)(exp) << 48) + (sig64)) | ||||
|  | ||||
| #define isNaNF128UI( a64, a0 ) (((~(a64) & UINT64_C( 0x7FFF000000000000 )) == 0) && (a0 || ((a64) & UINT64_C( 0x0000FFFFFFFFFFFF )))) | ||||
| #define isNaNF128UI(a64, a0) (((~(a64)&UINT64_C(0x7FFF000000000000)) == 0) && (a0 || ((a64)&UINT64_C(0x0000FFFFFFFFFFFF)))) | ||||
|  | ||||
| struct exp32_sig128 { int_fast32_t exp; struct uint128 sig; }; | ||||
| struct exp32_sig128 | ||||
|  softfloat_normSubnormalF128Sig( uint_fast64_t, uint_fast64_t ); | ||||
| struct exp32_sig128 { | ||||
|     int_fast32_t exp; | ||||
|     struct uint128 sig; | ||||
| }; | ||||
| struct exp32_sig128 softfloat_normSubnormalF128Sig(uint_fast64_t, uint_fast64_t); | ||||
|  | ||||
| float128_t | ||||
|  softfloat_roundPackToF128( | ||||
|      bool, int_fast32_t, uint_fast64_t, uint_fast64_t, uint_fast64_t ); | ||||
| float128_t | ||||
|  softfloat_normRoundPackToF128( | ||||
|      bool, int_fast32_t, uint_fast64_t, uint_fast64_t ); | ||||
| float128_t softfloat_roundPackToF128(bool, int_fast32_t, uint_fast64_t, uint_fast64_t, uint_fast64_t); | ||||
| float128_t softfloat_normRoundPackToF128(bool, int_fast32_t, uint_fast64_t, uint_fast64_t); | ||||
|  | ||||
| float128_t | ||||
|  softfloat_addMagsF128( | ||||
|      uint_fast64_t, uint_fast64_t, uint_fast64_t, uint_fast64_t, bool ); | ||||
| float128_t | ||||
|  softfloat_subMagsF128( | ||||
|      uint_fast64_t, uint_fast64_t, uint_fast64_t, uint_fast64_t, bool ); | ||||
| float128_t | ||||
|  softfloat_mulAddF128( | ||||
|      uint_fast64_t, | ||||
|      uint_fast64_t, | ||||
|      uint_fast64_t, | ||||
|      uint_fast64_t, | ||||
|      uint_fast64_t, | ||||
|      uint_fast64_t, | ||||
|      uint_fast8_t | ||||
|  ); | ||||
| float128_t softfloat_addMagsF128(uint_fast64_t, uint_fast64_t, uint_fast64_t, uint_fast64_t, bool); | ||||
| float128_t softfloat_subMagsF128(uint_fast64_t, uint_fast64_t, uint_fast64_t, uint_fast64_t, bool); | ||||
| float128_t softfloat_mulAddF128(uint_fast64_t, uint_fast64_t, uint_fast64_t, uint_fast64_t, uint_fast64_t, uint_fast64_t, uint_fast8_t); | ||||
|  | ||||
| #else | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| *----------------------------------------------------------------------------*/ | ||||
|  *----------------------------------------------------------------------------*/ | ||||
|  | ||||
| bool | ||||
|  softfloat_tryPropagateNaNExtF80M( | ||||
|      const struct extFloat80M *, | ||||
|      const struct extFloat80M *, | ||||
|      struct extFloat80M * | ||||
|  ); | ||||
| void softfloat_invalidExtF80M( struct extFloat80M * ); | ||||
| bool softfloat_tryPropagateNaNExtF80M(const struct extFloat80M*, const struct extFloat80M*, struct extFloat80M*); | ||||
| void softfloat_invalidExtF80M(struct extFloat80M*); | ||||
|  | ||||
| int softfloat_normExtF80SigM( uint64_t * ); | ||||
| int softfloat_normExtF80SigM(uint64_t*); | ||||
|  | ||||
| void | ||||
|  softfloat_roundPackMToExtF80M( | ||||
|      bool, int32_t, uint32_t *, uint_fast8_t, struct extFloat80M * ); | ||||
| void | ||||
|  softfloat_normRoundPackMToExtF80M( | ||||
|      bool, int32_t, uint32_t *, uint_fast8_t, struct extFloat80M * ); | ||||
| void softfloat_roundPackMToExtF80M(bool, int32_t, uint32_t*, uint_fast8_t, struct extFloat80M*); | ||||
| void softfloat_normRoundPackMToExtF80M(bool, int32_t, uint32_t*, uint_fast8_t, struct extFloat80M*); | ||||
|  | ||||
| void | ||||
|  softfloat_addExtF80M( | ||||
|      const struct extFloat80M *, | ||||
|      const struct extFloat80M *, | ||||
|      struct extFloat80M *, | ||||
|      bool | ||||
|  ); | ||||
| void softfloat_addExtF80M(const struct extFloat80M*, const struct extFloat80M*, struct extFloat80M*, bool); | ||||
|  | ||||
| int | ||||
|  softfloat_compareNonnormExtF80M( | ||||
|      const struct extFloat80M *, const struct extFloat80M * ); | ||||
| int softfloat_compareNonnormExtF80M(const struct extFloat80M*, const struct extFloat80M*); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define signF128UI96( a96 ) ((bool) ((uint32_t) (a96)>>31)) | ||||
| #define expF128UI96( a96 ) ((int32_t) ((a96)>>16) & 0x7FFF) | ||||
| #define fracF128UI96( a96 ) ((a96) & 0x0000FFFF) | ||||
| #define packToF128UI96( sign, exp, sig96 ) (((uint32_t) (sign)<<31) + ((uint32_t) (exp)<<16) + (sig96)) | ||||
|  *----------------------------------------------------------------------------*/ | ||||
| #define signF128UI96(a96) ((bool)((uint32_t)(a96) >> 31)) | ||||
| #define expF128UI96(a96) ((int32_t)((a96) >> 16) & 0x7FFF) | ||||
| #define fracF128UI96(a96) ((a96)&0x0000FFFF) | ||||
| #define packToF128UI96(sign, exp, sig96) (((uint32_t)(sign) << 31) + ((uint32_t)(exp) << 16) + (sig96)) | ||||
|  | ||||
| bool softfloat_isNaNF128M( const uint32_t * ); | ||||
| bool softfloat_isNaNF128M(const uint32_t*); | ||||
|  | ||||
| bool | ||||
|  softfloat_tryPropagateNaNF128M( | ||||
|      const uint32_t *, const uint32_t *, uint32_t * ); | ||||
| void softfloat_invalidF128M( uint32_t * ); | ||||
| bool softfloat_tryPropagateNaNF128M(const uint32_t*, const uint32_t*, uint32_t*); | ||||
| void softfloat_invalidF128M(uint32_t*); | ||||
|  | ||||
| int softfloat_shiftNormSigF128M( const uint32_t *, uint_fast8_t, uint32_t * ); | ||||
| int softfloat_shiftNormSigF128M(const uint32_t*, uint_fast8_t, uint32_t*); | ||||
|  | ||||
| void softfloat_roundPackMToF128M( bool, int32_t, uint32_t *, uint32_t * ); | ||||
| void softfloat_normRoundPackMToF128M( bool, int32_t, uint32_t *, uint32_t * ); | ||||
| void softfloat_roundPackMToF128M(bool, int32_t, uint32_t*, uint32_t*); | ||||
| void softfloat_normRoundPackMToF128M(bool, int32_t, uint32_t*, uint32_t*); | ||||
|  | ||||
| void | ||||
|  softfloat_addF128M( const uint32_t *, const uint32_t *, uint32_t *, bool ); | ||||
| void | ||||
|  softfloat_mulAddF128M( | ||||
|      const uint32_t *, | ||||
|      const uint32_t *, | ||||
|      const uint32_t *, | ||||
|      uint32_t *, | ||||
|      uint_fast8_t | ||||
|  ); | ||||
| void softfloat_addF128M(const uint32_t*, const uint32_t*, uint32_t*, bool); | ||||
| void softfloat_mulAddF128M(const uint32_t*, const uint32_t*, const uint32_t*, uint32_t*, uint_fast8_t); | ||||
|  | ||||
| #endif | ||||
|  | ||||
| #endif | ||||
|  | ||||
|   | ||||
| @@ -39,70 +39,70 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| #ifdef INLINE | ||||
|  | ||||
| #include <stdint.h> | ||||
| #include "primitiveTypes.h" | ||||
| #include <stdint.h> | ||||
|  | ||||
| #ifdef SOFTFLOAT_BUILTIN_CLZ | ||||
|  | ||||
| INLINE uint_fast8_t softfloat_countLeadingZeros16( uint16_t a ) | ||||
|     { return a ? __builtin_clz( a ) - 16 : 16; } | ||||
| INLINE uint_fast8_t softfloat_countLeadingZeros16(uint16_t a) { return a ? __builtin_clz(a) - 16 : 16; } | ||||
| #define softfloat_countLeadingZeros16 softfloat_countLeadingZeros16 | ||||
|  | ||||
| INLINE uint_fast8_t softfloat_countLeadingZeros32( uint32_t a ) | ||||
|     { return a ? __builtin_clz( a ) : 32; } | ||||
| INLINE uint_fast8_t softfloat_countLeadingZeros32(uint32_t a) { return a ? __builtin_clz(a) : 32; } | ||||
| #define softfloat_countLeadingZeros32 softfloat_countLeadingZeros32 | ||||
|  | ||||
| INLINE uint_fast8_t softfloat_countLeadingZeros64( uint64_t a ) | ||||
|     { return a ? __builtin_clzll( a ) : 64; } | ||||
| INLINE uint_fast8_t softfloat_countLeadingZeros64(uint64_t a) { return a ? __builtin_clzll(a) : 64; } | ||||
| #define softfloat_countLeadingZeros64 softfloat_countLeadingZeros64 | ||||
|  | ||||
| #endif | ||||
|  | ||||
| #ifdef SOFTFLOAT_INTRINSIC_INT128 | ||||
|  | ||||
| INLINE struct uint128 softfloat_mul64ByShifted32To128( uint64_t a, uint32_t b ) | ||||
| { | ||||
|     union { unsigned __int128 ui; struct uint128 s; } uZ; | ||||
|     uZ.ui = (unsigned __int128) a * ((uint_fast64_t) b<<32); | ||||
| INLINE struct uint128 softfloat_mul64ByShifted32To128(uint64_t a, uint32_t b) { | ||||
|     union { | ||||
|         unsigned __int128 ui; | ||||
|         struct uint128 s; | ||||
|     } uZ; | ||||
|     uZ.ui = (unsigned __int128)a * ((uint_fast64_t)b << 32); | ||||
|     return uZ.s; | ||||
| } | ||||
| #define softfloat_mul64ByShifted32To128 softfloat_mul64ByShifted32To128 | ||||
|  | ||||
| INLINE struct uint128 softfloat_mul64To128( uint64_t a, uint64_t b ) | ||||
| { | ||||
|     union { unsigned __int128 ui; struct uint128 s; } uZ; | ||||
|     uZ.ui = (unsigned __int128) a * b; | ||||
| INLINE struct uint128 softfloat_mul64To128(uint64_t a, uint64_t b) { | ||||
|     union { | ||||
|         unsigned __int128 ui; | ||||
|         struct uint128 s; | ||||
|     } uZ; | ||||
|     uZ.ui = (unsigned __int128)a * b; | ||||
|     return uZ.s; | ||||
| } | ||||
| #define softfloat_mul64To128 softfloat_mul64To128 | ||||
|  | ||||
| INLINE | ||||
| struct uint128 softfloat_mul128By32( uint64_t a64, uint64_t a0, uint32_t b ) | ||||
| { | ||||
|     union { unsigned __int128 ui; struct uint128 s; } uZ; | ||||
|     uZ.ui = ((unsigned __int128) a64<<64 | a0) * b; | ||||
| struct uint128 softfloat_mul128By32(uint64_t a64, uint64_t a0, uint32_t b) { | ||||
|     union { | ||||
|         unsigned __int128 ui; | ||||
|         struct uint128 s; | ||||
|     } uZ; | ||||
|     uZ.ui = ((unsigned __int128)a64 << 64 | a0) * b; | ||||
|     return uZ.s; | ||||
| } | ||||
| #define softfloat_mul128By32 softfloat_mul128By32 | ||||
|  | ||||
| INLINE | ||||
| void | ||||
|  softfloat_mul128To256M( | ||||
|      uint64_t a64, uint64_t a0, uint64_t b64, uint64_t b0, uint64_t *zPtr ) | ||||
| { | ||||
| void softfloat_mul128To256M(uint64_t a64, uint64_t a0, uint64_t b64, uint64_t b0, uint64_t* zPtr) { | ||||
|     unsigned __int128 z0, mid1, mid, z128; | ||||
|     z0 = (unsigned __int128) a0 * b0; | ||||
|     mid1 = (unsigned __int128) a64 * b0; | ||||
|     mid = mid1 + (unsigned __int128) a0 * b64; | ||||
|     z128 = (unsigned __int128) a64 * b64; | ||||
|     z128 += (unsigned __int128) (mid < mid1)<<64 | mid>>64; | ||||
|     z0 = (unsigned __int128)a0 * b0; | ||||
|     mid1 = (unsigned __int128)a64 * b0; | ||||
|     mid = mid1 + (unsigned __int128)a0 * b64; | ||||
|     z128 = (unsigned __int128)a64 * b64; | ||||
|     z128 += (unsigned __int128)(mid < mid1) << 64 | mid >> 64; | ||||
|     mid <<= 64; | ||||
|     z0 += mid; | ||||
|     z128 += (z0 < mid); | ||||
|     zPtr[indexWord( 4, 0 )] = z0; | ||||
|     zPtr[indexWord( 4, 1 )] = z0>>64; | ||||
|     zPtr[indexWord( 4, 2 )] = z128; | ||||
|     zPtr[indexWord( 4, 3 )] = z128>>64; | ||||
|     zPtr[indexWord(4, 0)] = z0; | ||||
|     zPtr[indexWord(4, 1)] = z0 >> 64; | ||||
|     zPtr[indexWord(4, 2)] = z128; | ||||
|     zPtr[indexWord(4, 3)] = z128 >> 64; | ||||
| } | ||||
| #define softfloat_mul128To256M softfloat_mul128To256M | ||||
|  | ||||
| @@ -111,4 +111,3 @@ void | ||||
| #endif | ||||
|  | ||||
| #endif | ||||
|  | ||||
|   | ||||
| @@ -42,13 +42,27 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| #ifdef SOFTFLOAT_FAST_INT64 | ||||
|  | ||||
| #ifdef LITTLEENDIAN | ||||
| struct uint128 { uint64_t v0, v64; }; | ||||
| struct uint64_extra { uint64_t extra, v; }; | ||||
| struct uint128_extra { uint64_t extra; struct uint128 v; }; | ||||
| struct uint128 { | ||||
|     uint64_t v0, v64; | ||||
| }; | ||||
| struct uint64_extra { | ||||
|     uint64_t extra, v; | ||||
| }; | ||||
| struct uint128_extra { | ||||
|     uint64_t extra; | ||||
|     struct uint128 v; | ||||
| }; | ||||
| #else | ||||
| struct uint128 { uint64_t v64, v0; }; | ||||
| struct uint64_extra { uint64_t v, extra; }; | ||||
| struct uint128_extra { struct uint128 v; uint64_t extra; }; | ||||
| struct uint128 { | ||||
|     uint64_t v64, v0; | ||||
| }; | ||||
| struct uint64_extra { | ||||
|     uint64_t v, extra; | ||||
| }; | ||||
| struct uint128_extra { | ||||
|     struct uint128 v; | ||||
|     uint64_t extra; | ||||
| }; | ||||
| #endif | ||||
|  | ||||
| #endif | ||||
| @@ -59,27 +73,28 @@ struct uint128_extra { struct uint128 v; uint64_t extra; }; | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #ifdef LITTLEENDIAN | ||||
| #define wordIncr 1 | ||||
| #define indexWord( total, n ) (n) | ||||
| #define indexWordHi( total ) ((total) - 1) | ||||
| #define indexWordLo( total ) 0 | ||||
| #define indexMultiword( total, m, n ) (n) | ||||
| #define indexMultiwordHi( total, n ) ((total) - (n)) | ||||
| #define indexMultiwordLo( total, n ) 0 | ||||
| #define indexMultiwordHiBut( total, n ) (n) | ||||
| #define indexMultiwordLoBut( total, n ) 0 | ||||
| #define INIT_UINTM4( v3, v2, v1, v0 ) { v0, v1, v2, v3 } | ||||
| #define indexWord(total, n) (n) | ||||
| #define indexWordHi(total) ((total)-1) | ||||
| #define indexWordLo(total) 0 | ||||
| #define indexMultiword(total, m, n) (n) | ||||
| #define indexMultiwordHi(total, n) ((total) - (n)) | ||||
| #define indexMultiwordLo(total, n) 0 | ||||
| #define indexMultiwordHiBut(total, n) (n) | ||||
| #define indexMultiwordLoBut(total, n) 0 | ||||
| #define INIT_UINTM4(v3, v2, v1, v0)                                                                                                        \ | ||||
|     { v0, v1, v2, v3 } | ||||
| #else | ||||
| #define wordIncr -1 | ||||
| #define indexWord( total, n ) ((total) - 1 - (n)) | ||||
| #define indexWordHi( total ) 0 | ||||
| #define indexWordLo( total ) ((total) - 1) | ||||
| #define indexMultiword( total, m, n ) ((total) - 1 - (m)) | ||||
| #define indexMultiwordHi( total, n ) 0 | ||||
| #define indexMultiwordLo( total, n ) ((total) - (n)) | ||||
| #define indexMultiwordHiBut( total, n ) 0 | ||||
| #define indexMultiwordLoBut( total, n ) (n) | ||||
| #define INIT_UINTM4( v3, v2, v1, v0 ) { v3, v2, v1, v0 } | ||||
| #define indexWord(total, n) ((total)-1 - (n)) | ||||
| #define indexWordHi(total) 0 | ||||
| #define indexWordLo(total) ((total)-1) | ||||
| #define indexMultiword(total, m, n) ((total)-1 - (m)) | ||||
| #define indexMultiwordHi(total, n) 0 | ||||
| #define indexMultiwordLo(total, n) ((total) - (n)) | ||||
| #define indexMultiwordHiBut(total, n) 0 | ||||
| #define indexMultiwordLoBut(total, n) (n) | ||||
| #define INIT_UINTM4(v3, v2, v1, v0)                                                                                                        \ | ||||
|     { v3, v2, v1, v0 } | ||||
| #endif | ||||
|  | ||||
| #endif | ||||
|  | ||||
|   | ||||
| @@ -37,9 +37,9 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| #ifndef primitives_h | ||||
| #define primitives_h 1 | ||||
|  | ||||
| #include "primitiveTypes.h" | ||||
| #include <stdbool.h> | ||||
| #include <stdint.h> | ||||
| #include "primitiveTypes.h" | ||||
|  | ||||
| #ifndef softfloat_shortShiftRightJam64 | ||||
| /*---------------------------------------------------------------------------- | ||||
| @@ -50,10 +50,9 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #if defined INLINE_LEVEL && (2 <= INLINE_LEVEL) | ||||
| INLINE | ||||
| uint64_t softfloat_shortShiftRightJam64( uint64_t a, uint_fast8_t dist ) | ||||
|     { return a>>dist | ((a & (((uint_fast64_t) 1<<dist) - 1)) != 0); } | ||||
| uint64_t softfloat_shortShiftRightJam64(uint64_t a, uint_fast8_t dist) { return a >> dist | ((a & (((uint_fast64_t)1 << dist) - 1)) != 0); } | ||||
| #else | ||||
| uint64_t softfloat_shortShiftRightJam64( uint64_t a, uint_fast8_t dist ); | ||||
| uint64_t softfloat_shortShiftRightJam64(uint64_t a, uint_fast8_t dist); | ||||
| #endif | ||||
| #endif | ||||
|  | ||||
| @@ -68,13 +67,11 @@ uint64_t softfloat_shortShiftRightJam64( uint64_t a, uint_fast8_t dist ); | ||||
| | is zero or nonzero. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #if defined INLINE_LEVEL && (2 <= INLINE_LEVEL) | ||||
| INLINE uint32_t softfloat_shiftRightJam32( uint32_t a, uint_fast16_t dist ) | ||||
| { | ||||
|     return | ||||
|         (dist < 31) ? a>>dist | ((uint32_t) (a<<(-dist & 31)) != 0) : (a != 0); | ||||
| INLINE uint32_t softfloat_shiftRightJam32(uint32_t a, uint_fast16_t dist) { | ||||
|     return (dist < 31) ? a >> dist | ((uint32_t)(a << (-dist & 31)) != 0) : (a != 0); | ||||
| } | ||||
| #else | ||||
| uint32_t softfloat_shiftRightJam32( uint32_t a, uint_fast16_t dist ); | ||||
| uint32_t softfloat_shiftRightJam32(uint32_t a, uint_fast16_t dist); | ||||
| #endif | ||||
| #endif | ||||
|  | ||||
| @@ -89,13 +86,11 @@ uint32_t softfloat_shiftRightJam32( uint32_t a, uint_fast16_t dist ); | ||||
| | is zero or nonzero. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #if defined INLINE_LEVEL && (3 <= INLINE_LEVEL) | ||||
| INLINE uint64_t softfloat_shiftRightJam64( uint64_t a, uint_fast32_t dist ) | ||||
| { | ||||
|     return | ||||
|         (dist < 63) ? a>>dist | ((uint64_t) (a<<(-dist & 63)) != 0) : (a != 0); | ||||
| INLINE uint64_t softfloat_shiftRightJam64(uint64_t a, uint_fast32_t dist) { | ||||
|     return (dist < 63) ? a >> dist | ((uint64_t)(a << (-dist & 63)) != 0) : (a != 0); | ||||
| } | ||||
| #else | ||||
| uint64_t softfloat_shiftRightJam64( uint64_t a, uint_fast32_t dist ); | ||||
| uint64_t softfloat_shiftRightJam64(uint64_t a, uint_fast32_t dist); | ||||
| #endif | ||||
| #endif | ||||
|  | ||||
| @@ -112,10 +107,9 @@ extern const uint_least8_t softfloat_countLeadingZeros8[256]; | ||||
| | 'a'.  If 'a' is zero, 16 is returned. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #if defined INLINE_LEVEL && (2 <= INLINE_LEVEL) | ||||
| INLINE uint_fast8_t softfloat_countLeadingZeros16( uint16_t a ) | ||||
| { | ||||
| INLINE uint_fast8_t softfloat_countLeadingZeros16(uint16_t a) { | ||||
|     uint_fast8_t count = 8; | ||||
|     if ( 0x100 <= a ) { | ||||
|     if(0x100 <= a) { | ||||
|         count = 0; | ||||
|         a >>= 8; | ||||
|     } | ||||
| @@ -123,7 +117,7 @@ INLINE uint_fast8_t softfloat_countLeadingZeros16( uint16_t a ) | ||||
|     return count; | ||||
| } | ||||
| #else | ||||
| uint_fast8_t softfloat_countLeadingZeros16( uint16_t a ); | ||||
| uint_fast8_t softfloat_countLeadingZeros16(uint16_t a); | ||||
| #endif | ||||
| #endif | ||||
|  | ||||
| @@ -133,22 +127,21 @@ uint_fast8_t softfloat_countLeadingZeros16( uint16_t a ); | ||||
| | 'a'.  If 'a' is zero, 32 is returned. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #if defined INLINE_LEVEL && (3 <= INLINE_LEVEL) | ||||
| INLINE uint_fast8_t softfloat_countLeadingZeros32( uint32_t a ) | ||||
| { | ||||
| INLINE uint_fast8_t softfloat_countLeadingZeros32(uint32_t a) { | ||||
|     uint_fast8_t count = 0; | ||||
|     if ( a < 0x10000 ) { | ||||
|     if(a < 0x10000) { | ||||
|         count = 16; | ||||
|         a <<= 16; | ||||
|     } | ||||
|     if ( a < 0x1000000 ) { | ||||
|     if(a < 0x1000000) { | ||||
|         count += 8; | ||||
|         a <<= 8; | ||||
|     } | ||||
|     count += softfloat_countLeadingZeros8[a>>24]; | ||||
|     count += softfloat_countLeadingZeros8[a >> 24]; | ||||
|     return count; | ||||
| } | ||||
| #else | ||||
| uint_fast8_t softfloat_countLeadingZeros32( uint32_t a ); | ||||
| uint_fast8_t softfloat_countLeadingZeros32(uint32_t a); | ||||
| #endif | ||||
| #endif | ||||
|  | ||||
| @@ -157,7 +150,7 @@ uint_fast8_t softfloat_countLeadingZeros32( uint32_t a ); | ||||
| | Returns the number of leading 0 bits before the most-significant 1 bit of | ||||
| | 'a'.  If 'a' is zero, 64 is returned. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast8_t softfloat_countLeadingZeros64( uint64_t a ); | ||||
| uint_fast8_t softfloat_countLeadingZeros64(uint64_t a); | ||||
| #endif | ||||
|  | ||||
| extern const uint16_t softfloat_approxRecip_1k0s[16]; | ||||
| @@ -176,9 +169,9 @@ extern const uint16_t softfloat_approxRecip_1k1s[16]; | ||||
| | (units in the last place). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #ifdef SOFTFLOAT_FAST_DIV64TO32 | ||||
| #define softfloat_approxRecip32_1( a ) ((uint32_t) (UINT64_C( 0x7FFFFFFFFFFFFFFF ) / (uint32_t) (a))) | ||||
| #define softfloat_approxRecip32_1(a) ((uint32_t)(UINT64_C(0x7FFFFFFFFFFFFFFF) / (uint32_t)(a))) | ||||
| #else | ||||
| uint32_t softfloat_approxRecip32_1( uint32_t a ); | ||||
| uint32_t softfloat_approxRecip32_1(uint32_t a); | ||||
| #endif | ||||
| #endif | ||||
|  | ||||
| @@ -204,7 +197,7 @@ extern const uint16_t softfloat_approxRecipSqrt_1k1s[16]; | ||||
| | returned is also always within the range 0.5 to 1; thus, the most- | ||||
| | significant bit of the result is always set. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint32_t softfloat_approxRecipSqrt32_1( unsigned int oddExpA, uint32_t a ); | ||||
| uint32_t softfloat_approxRecipSqrt32_1(unsigned int oddExpA, uint32_t a); | ||||
| #endif | ||||
|  | ||||
| #ifdef SOFTFLOAT_FAST_INT64 | ||||
| @@ -222,10 +215,9 @@ uint32_t softfloat_approxRecipSqrt32_1( unsigned int oddExpA, uint32_t a ); | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #if defined INLINE_LEVEL && (1 <= INLINE_LEVEL) | ||||
| INLINE | ||||
| bool softfloat_eq128( uint64_t a64, uint64_t a0, uint64_t b64, uint64_t b0 ) | ||||
|     { return (a64 == b64) && (a0 == b0); } | ||||
| bool softfloat_eq128(uint64_t a64, uint64_t a0, uint64_t b64, uint64_t b0) { return (a64 == b64) && (a0 == b0); } | ||||
| #else | ||||
| bool softfloat_eq128( uint64_t a64, uint64_t a0, uint64_t b64, uint64_t b0 ); | ||||
| bool softfloat_eq128(uint64_t a64, uint64_t a0, uint64_t b64, uint64_t b0); | ||||
| #endif | ||||
| #endif | ||||
|  | ||||
| @@ -237,10 +229,9 @@ bool softfloat_eq128( uint64_t a64, uint64_t a0, uint64_t b64, uint64_t b0 ); | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #if defined INLINE_LEVEL && (2 <= INLINE_LEVEL) | ||||
| INLINE | ||||
| bool softfloat_le128( uint64_t a64, uint64_t a0, uint64_t b64, uint64_t b0 ) | ||||
|     { return (a64 < b64) || ((a64 == b64) && (a0 <= b0)); } | ||||
| bool softfloat_le128(uint64_t a64, uint64_t a0, uint64_t b64, uint64_t b0) { return (a64 < b64) || ((a64 == b64) && (a0 <= b0)); } | ||||
| #else | ||||
| bool softfloat_le128( uint64_t a64, uint64_t a0, uint64_t b64, uint64_t b0 ); | ||||
| bool softfloat_le128(uint64_t a64, uint64_t a0, uint64_t b64, uint64_t b0); | ||||
| #endif | ||||
| #endif | ||||
|  | ||||
| @@ -252,10 +243,9 @@ bool softfloat_le128( uint64_t a64, uint64_t a0, uint64_t b64, uint64_t b0 ); | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #if defined INLINE_LEVEL && (2 <= INLINE_LEVEL) | ||||
| INLINE | ||||
| bool softfloat_lt128( uint64_t a64, uint64_t a0, uint64_t b64, uint64_t b0 ) | ||||
|     { return (a64 < b64) || ((a64 == b64) && (a0 < b0)); } | ||||
| bool softfloat_lt128(uint64_t a64, uint64_t a0, uint64_t b64, uint64_t b0) { return (a64 < b64) || ((a64 == b64) && (a0 < b0)); } | ||||
| #else | ||||
| bool softfloat_lt128( uint64_t a64, uint64_t a0, uint64_t b64, uint64_t b0 ); | ||||
| bool softfloat_lt128(uint64_t a64, uint64_t a0, uint64_t b64, uint64_t b0); | ||||
| #endif | ||||
| #endif | ||||
|  | ||||
| @@ -266,17 +256,14 @@ bool softfloat_lt128( uint64_t a64, uint64_t a0, uint64_t b64, uint64_t b0 ); | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #if defined INLINE_LEVEL && (2 <= INLINE_LEVEL) | ||||
| INLINE | ||||
| struct uint128 | ||||
|  softfloat_shortShiftLeft128( uint64_t a64, uint64_t a0, uint_fast8_t dist ) | ||||
| { | ||||
| struct uint128 softfloat_shortShiftLeft128(uint64_t a64, uint64_t a0, uint_fast8_t dist) { | ||||
|     struct uint128 z; | ||||
|     z.v64 = a64<<dist | a0>>(-dist & 63); | ||||
|     z.v0 = a0<<dist; | ||||
|     z.v64 = a64 << dist | a0 >> (-dist & 63); | ||||
|     z.v0 = a0 << dist; | ||||
|     return z; | ||||
| } | ||||
| #else | ||||
| struct uint128 | ||||
|  softfloat_shortShiftLeft128( uint64_t a64, uint64_t a0, uint_fast8_t dist ); | ||||
| struct uint128 softfloat_shortShiftLeft128(uint64_t a64, uint64_t a0, uint_fast8_t dist); | ||||
| #endif | ||||
| #endif | ||||
|  | ||||
| @@ -287,17 +274,14 @@ struct uint128 | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #if defined INLINE_LEVEL && (2 <= INLINE_LEVEL) | ||||
| INLINE | ||||
| struct uint128 | ||||
|  softfloat_shortShiftRight128( uint64_t a64, uint64_t a0, uint_fast8_t dist ) | ||||
| { | ||||
| struct uint128 softfloat_shortShiftRight128(uint64_t a64, uint64_t a0, uint_fast8_t dist) { | ||||
|     struct uint128 z; | ||||
|     z.v64 = a64>>dist; | ||||
|     z.v0 = a64<<(-dist & 63) | a0>>dist; | ||||
|     z.v64 = a64 >> dist; | ||||
|     z.v0 = a64 << (-dist & 63) | a0 >> dist; | ||||
|     return z; | ||||
| } | ||||
| #else | ||||
| struct uint128 | ||||
|  softfloat_shortShiftRight128( uint64_t a64, uint64_t a0, uint_fast8_t dist ); | ||||
| struct uint128 softfloat_shortShiftRight128(uint64_t a64, uint64_t a0, uint_fast8_t dist); | ||||
| #endif | ||||
| #endif | ||||
|  | ||||
| @@ -308,19 +292,14 @@ struct uint128 | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #if defined INLINE_LEVEL && (2 <= INLINE_LEVEL) | ||||
| INLINE | ||||
| struct uint64_extra | ||||
|  softfloat_shortShiftRightJam64Extra( | ||||
|      uint64_t a, uint64_t extra, uint_fast8_t dist ) | ||||
| { | ||||
| struct uint64_extra softfloat_shortShiftRightJam64Extra(uint64_t a, uint64_t extra, uint_fast8_t dist) { | ||||
|     struct uint64_extra z; | ||||
|     z.v = a>>dist; | ||||
|     z.extra = a<<(-dist & 63) | (extra != 0); | ||||
|     z.v = a >> dist; | ||||
|     z.extra = a << (-dist & 63) | (extra != 0); | ||||
|     return z; | ||||
| } | ||||
| #else | ||||
| struct uint64_extra | ||||
|  softfloat_shortShiftRightJam64Extra( | ||||
|      uint64_t a, uint64_t extra, uint_fast8_t dist ); | ||||
| struct uint64_extra softfloat_shortShiftRightJam64Extra(uint64_t a, uint64_t extra, uint_fast8_t dist); | ||||
| #endif | ||||
| #endif | ||||
|  | ||||
| @@ -334,22 +313,15 @@ struct uint64_extra | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #if defined INLINE_LEVEL && (3 <= INLINE_LEVEL) | ||||
| INLINE | ||||
| struct uint128 | ||||
|  softfloat_shortShiftRightJam128( | ||||
|      uint64_t a64, uint64_t a0, uint_fast8_t dist ) | ||||
| { | ||||
| struct uint128 softfloat_shortShiftRightJam128(uint64_t a64, uint64_t a0, uint_fast8_t dist) { | ||||
|     uint_fast8_t negDist = -dist; | ||||
|     struct uint128 z; | ||||
|     z.v64 = a64>>dist; | ||||
|     z.v0 = | ||||
|         a64<<(negDist & 63) | a0>>dist | ||||
|             | ((uint64_t) (a0<<(negDist & 63)) != 0); | ||||
|     z.v64 = a64 >> dist; | ||||
|     z.v0 = a64 << (negDist & 63) | a0 >> dist | ((uint64_t)(a0 << (negDist & 63)) != 0); | ||||
|     return z; | ||||
| } | ||||
| #else | ||||
| struct uint128 | ||||
|  softfloat_shortShiftRightJam128( | ||||
|      uint64_t a64, uint64_t a0, uint_fast8_t dist ); | ||||
| struct uint128 softfloat_shortShiftRightJam128(uint64_t a64, uint64_t a0, uint_fast8_t dist); | ||||
| #endif | ||||
| #endif | ||||
|  | ||||
| @@ -360,21 +332,16 @@ struct uint128 | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #if defined INLINE_LEVEL && (3 <= INLINE_LEVEL) | ||||
| INLINE | ||||
| struct uint128_extra | ||||
|  softfloat_shortShiftRightJam128Extra( | ||||
|      uint64_t a64, uint64_t a0, uint64_t extra, uint_fast8_t dist ) | ||||
| { | ||||
| struct uint128_extra softfloat_shortShiftRightJam128Extra(uint64_t a64, uint64_t a0, uint64_t extra, uint_fast8_t dist) { | ||||
|     uint_fast8_t negDist = -dist; | ||||
|     struct uint128_extra z; | ||||
|     z.v.v64 = a64>>dist; | ||||
|     z.v.v0 = a64<<(negDist & 63) | a0>>dist; | ||||
|     z.extra = a0<<(negDist & 63) | (extra != 0); | ||||
|     z.v.v64 = a64 >> dist; | ||||
|     z.v.v0 = a64 << (negDist & 63) | a0 >> dist; | ||||
|     z.extra = a0 << (negDist & 63) | (extra != 0); | ||||
|     return z; | ||||
| } | ||||
| #else | ||||
| struct uint128_extra | ||||
|  softfloat_shortShiftRightJam128Extra( | ||||
|      uint64_t a64, uint64_t a0, uint64_t extra, uint_fast8_t dist ); | ||||
| struct uint128_extra softfloat_shortShiftRightJam128Extra(uint64_t a64, uint64_t a0, uint64_t extra, uint_fast8_t dist); | ||||
| #endif | ||||
| #endif | ||||
|  | ||||
| @@ -397,14 +364,11 @@ struct uint128_extra | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #if defined INLINE_LEVEL && (4 <= INLINE_LEVEL) | ||||
| INLINE | ||||
| struct uint64_extra | ||||
|  softfloat_shiftRightJam64Extra( | ||||
|      uint64_t a, uint64_t extra, uint_fast32_t dist ) | ||||
| { | ||||
| struct uint64_extra softfloat_shiftRightJam64Extra(uint64_t a, uint64_t extra, uint_fast32_t dist) { | ||||
|     struct uint64_extra z; | ||||
|     if ( dist < 64 ) { | ||||
|         z.v = a>>dist; | ||||
|         z.extra = a<<(-dist & 63); | ||||
|     if(dist < 64) { | ||||
|         z.v = a >> dist; | ||||
|         z.extra = a << (-dist & 63); | ||||
|     } else { | ||||
|         z.v = 0; | ||||
|         z.extra = (dist == 64) ? a : (a != 0); | ||||
| @@ -413,9 +377,7 @@ struct uint64_extra | ||||
|     return z; | ||||
| } | ||||
| #else | ||||
| struct uint64_extra | ||||
|  softfloat_shiftRightJam64Extra( | ||||
|      uint64_t a, uint64_t extra, uint_fast32_t dist ); | ||||
| struct uint64_extra softfloat_shiftRightJam64Extra(uint64_t a, uint64_t extra, uint_fast32_t dist); | ||||
| #endif | ||||
| #endif | ||||
|  | ||||
| @@ -430,8 +392,7 @@ struct uint64_extra | ||||
| | greater than 128, the result will be either 0 or 1, depending on whether the | ||||
| | original 128 bits are all zeros. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| struct uint128 | ||||
|  softfloat_shiftRightJam128( uint64_t a64, uint64_t a0, uint_fast32_t dist ); | ||||
| struct uint128 softfloat_shiftRightJam128(uint64_t a64, uint64_t a0, uint_fast32_t dist); | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_shiftRightJam128Extra | ||||
| @@ -452,9 +413,7 @@ struct uint128 | ||||
| | is modified as described above and returned in the 'extra' field of the | ||||
| | result.) | ||||
| *----------------------------------------------------------------------------*/ | ||||
| struct uint128_extra | ||||
|  softfloat_shiftRightJam128Extra( | ||||
|      uint64_t a64, uint64_t a0, uint64_t extra, uint_fast32_t dist ); | ||||
| struct uint128_extra softfloat_shiftRightJam128Extra(uint64_t a64, uint64_t a0, uint64_t extra, uint_fast32_t dist); | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_shiftRightJam256M | ||||
| @@ -470,9 +429,7 @@ struct uint128_extra | ||||
| | is greater than 256, the stored result will be either 0 or 1, depending on | ||||
| | whether the original 256 bits are all zeros. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_shiftRightJam256M( | ||||
|      const uint64_t *aPtr, uint_fast32_t dist, uint64_t *zPtr ); | ||||
| void softfloat_shiftRightJam256M(const uint64_t* aPtr, uint_fast32_t dist, uint64_t* zPtr); | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_add128 | ||||
| @@ -483,17 +440,14 @@ void | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #if defined INLINE_LEVEL && (2 <= INLINE_LEVEL) | ||||
| INLINE | ||||
| struct uint128 | ||||
|  softfloat_add128( uint64_t a64, uint64_t a0, uint64_t b64, uint64_t b0 ) | ||||
| { | ||||
| struct uint128 softfloat_add128(uint64_t a64, uint64_t a0, uint64_t b64, uint64_t b0) { | ||||
|     struct uint128 z; | ||||
|     z.v0 = a0 + b0; | ||||
|     z.v64 = a64 + b64 + (z.v0 < a0); | ||||
|     return z; | ||||
| } | ||||
| #else | ||||
| struct uint128 | ||||
|  softfloat_add128( uint64_t a64, uint64_t a0, uint64_t b64, uint64_t b0 ); | ||||
| struct uint128 softfloat_add128(uint64_t a64, uint64_t a0, uint64_t b64, uint64_t b0); | ||||
| #endif | ||||
| #endif | ||||
|  | ||||
| @@ -505,9 +459,7 @@ struct uint128 | ||||
| | an array of four 64-bit elements that concatenate in the platform's normal | ||||
| | endian order to form a 256-bit integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_add256M( | ||||
|      const uint64_t *aPtr, const uint64_t *bPtr, uint64_t *zPtr ); | ||||
| void softfloat_add256M(const uint64_t* aPtr, const uint64_t* bPtr, uint64_t* zPtr); | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_sub128 | ||||
| @@ -518,9 +470,7 @@ void | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #if defined INLINE_LEVEL && (2 <= INLINE_LEVEL) | ||||
| INLINE | ||||
| struct uint128 | ||||
|  softfloat_sub128( uint64_t a64, uint64_t a0, uint64_t b64, uint64_t b0 ) | ||||
| { | ||||
| struct uint128 softfloat_sub128(uint64_t a64, uint64_t a0, uint64_t b64, uint64_t b0) { | ||||
|     struct uint128 z; | ||||
|     z.v0 = a0 - b0; | ||||
|     z.v64 = a64 - b64; | ||||
| @@ -528,8 +478,7 @@ struct uint128 | ||||
|     return z; | ||||
| } | ||||
| #else | ||||
| struct uint128 | ||||
|  softfloat_sub128( uint64_t a64, uint64_t a0, uint64_t b64, uint64_t b0 ); | ||||
| struct uint128 softfloat_sub128(uint64_t a64, uint64_t a0, uint64_t b64, uint64_t b0); | ||||
| #endif | ||||
| #endif | ||||
|  | ||||
| @@ -542,9 +491,7 @@ struct uint128 | ||||
| | 64-bit elements that concatenate in the platform's normal endian order to | ||||
| | form a 256-bit integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_sub256M( | ||||
|      const uint64_t *aPtr, const uint64_t *bPtr, uint64_t *zPtr ); | ||||
| void softfloat_sub256M(const uint64_t* aPtr, const uint64_t* bPtr, uint64_t* zPtr); | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_mul64ByShifted32To128 | ||||
| @@ -552,17 +499,16 @@ void | ||||
| | Returns the 128-bit product of 'a', 'b', and 2^32. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #if defined INLINE_LEVEL && (3 <= INLINE_LEVEL) | ||||
| INLINE struct uint128 softfloat_mul64ByShifted32To128( uint64_t a, uint32_t b ) | ||||
| { | ||||
| INLINE struct uint128 softfloat_mul64ByShifted32To128(uint64_t a, uint32_t b) { | ||||
|     uint_fast64_t mid; | ||||
|     struct uint128 z; | ||||
|     mid = (uint_fast64_t) (uint32_t) a * b; | ||||
|     z.v0 = mid<<32; | ||||
|     z.v64 = (uint_fast64_t) (uint32_t) (a>>32) * b + (mid>>32); | ||||
|     mid = (uint_fast64_t)(uint32_t)a * b; | ||||
|     z.v0 = mid << 32; | ||||
|     z.v64 = (uint_fast64_t)(uint32_t)(a >> 32) * b + (mid >> 32); | ||||
|     return z; | ||||
| } | ||||
| #else | ||||
| struct uint128 softfloat_mul64ByShifted32To128( uint64_t a, uint32_t b ); | ||||
| struct uint128 softfloat_mul64ByShifted32To128(uint64_t a, uint32_t b); | ||||
| #endif | ||||
| #endif | ||||
|  | ||||
| @@ -570,7 +516,7 @@ struct uint128 softfloat_mul64ByShifted32To128( uint64_t a, uint32_t b ); | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Returns the 128-bit product of 'a' and 'b'. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| struct uint128 softfloat_mul64To128( uint64_t a, uint64_t b ); | ||||
| struct uint128 softfloat_mul64To128(uint64_t a, uint64_t b); | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_mul128By32 | ||||
| @@ -581,19 +527,18 @@ struct uint128 softfloat_mul64To128( uint64_t a, uint64_t b ); | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #if defined INLINE_LEVEL && (4 <= INLINE_LEVEL) | ||||
| INLINE | ||||
| struct uint128 softfloat_mul128By32( uint64_t a64, uint64_t a0, uint32_t b ) | ||||
| { | ||||
| struct uint128 softfloat_mul128By32(uint64_t a64, uint64_t a0, uint32_t b) { | ||||
|     struct uint128 z; | ||||
|     uint_fast64_t mid; | ||||
|     uint_fast32_t carry; | ||||
|     z.v0 = a0 * b; | ||||
|     mid = (uint_fast64_t) (uint32_t) (a0>>32) * b; | ||||
|     carry = (uint32_t) ((uint_fast32_t) (z.v0>>32) - (uint_fast32_t) mid); | ||||
|     z.v64 = a64 * b + (uint_fast32_t) ((mid + carry)>>32); | ||||
|     mid = (uint_fast64_t)(uint32_t)(a0 >> 32) * b; | ||||
|     carry = (uint32_t)((uint_fast32_t)(z.v0 >> 32) - (uint_fast32_t)mid); | ||||
|     z.v64 = a64 * b + (uint_fast32_t)((mid + carry) >> 32); | ||||
|     return z; | ||||
| } | ||||
| #else | ||||
| struct uint128 softfloat_mul128By32( uint64_t a64, uint64_t a0, uint32_t b ); | ||||
| struct uint128 softfloat_mul128By32(uint64_t a64, uint64_t a0, uint32_t b); | ||||
| #endif | ||||
| #endif | ||||
|  | ||||
| @@ -605,9 +550,7 @@ struct uint128 softfloat_mul128By32( uint64_t a64, uint64_t a0, uint32_t b ); | ||||
| | Argument 'zPtr' points to an array of four 64-bit elements that concatenate | ||||
| | in the platform's normal endian order to form a 256-bit integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_mul128To256M( | ||||
|      uint64_t a64, uint64_t a0, uint64_t b64, uint64_t b0, uint64_t *zPtr ); | ||||
| void softfloat_mul128To256M(uint64_t a64, uint64_t a0, uint64_t b64, uint64_t b0, uint64_t* zPtr); | ||||
| #endif | ||||
|  | ||||
| #else | ||||
| @@ -626,7 +569,7 @@ void | ||||
| | Each of 'aPtr' and 'bPtr' points to an array of three 32-bit elements that | ||||
| | concatenate in the platform's normal endian order to form a 96-bit integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| int_fast8_t softfloat_compare96M( const uint32_t *aPtr, const uint32_t *bPtr ); | ||||
| int_fast8_t softfloat_compare96M(const uint32_t* aPtr, const uint32_t* bPtr); | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_compare128M | ||||
| @@ -638,8 +581,7 @@ int_fast8_t softfloat_compare96M( const uint32_t *aPtr, const uint32_t *bPtr ); | ||||
| | Each of 'aPtr' and 'bPtr' points to an array of four 32-bit elements that | ||||
| | concatenate in the platform's normal endian order to form a 128-bit integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| int_fast8_t | ||||
|  softfloat_compare128M( const uint32_t *aPtr, const uint32_t *bPtr ); | ||||
| int_fast8_t softfloat_compare128M(const uint32_t* aPtr, const uint32_t* bPtr); | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_shortShiftLeft64To96M | ||||
| @@ -652,19 +594,14 @@ int_fast8_t | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #if defined INLINE_LEVEL && (2 <= INLINE_LEVEL) | ||||
| INLINE | ||||
| void | ||||
|  softfloat_shortShiftLeft64To96M( | ||||
|      uint64_t a, uint_fast8_t dist, uint32_t *zPtr ) | ||||
| { | ||||
|     zPtr[indexWord( 3, 0 )] = (uint32_t) a<<dist; | ||||
| void softfloat_shortShiftLeft64To96M(uint64_t a, uint_fast8_t dist, uint32_t* zPtr) { | ||||
|     zPtr[indexWord(3, 0)] = (uint32_t)a << dist; | ||||
|     a >>= 32 - dist; | ||||
|     zPtr[indexWord( 3, 2 )] = a>>32; | ||||
|     zPtr[indexWord( 3, 1 )] = a; | ||||
|     zPtr[indexWord(3, 2)] = a >> 32; | ||||
|     zPtr[indexWord(3, 1)] = a; | ||||
| } | ||||
| #else | ||||
| void | ||||
|  softfloat_shortShiftLeft64To96M( | ||||
|      uint64_t a, uint_fast8_t dist, uint32_t *zPtr ); | ||||
| void softfloat_shortShiftLeft64To96M(uint64_t a, uint_fast8_t dist, uint32_t* zPtr); | ||||
| #endif | ||||
| #endif | ||||
|  | ||||
| @@ -678,13 +615,7 @@ void | ||||
| | that concatenate in the platform's normal endian order to form an N-bit | ||||
| | integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_shortShiftLeftM( | ||||
|      uint_fast8_t size_words, | ||||
|      const uint32_t *aPtr, | ||||
|      uint_fast8_t dist, | ||||
|      uint32_t *zPtr | ||||
|  ); | ||||
| void softfloat_shortShiftLeftM(uint_fast8_t size_words, const uint32_t* aPtr, uint_fast8_t dist, uint32_t* zPtr); | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_shortShiftLeft96M | ||||
| @@ -692,7 +623,7 @@ void | ||||
| | This function or macro is the same as 'softfloat_shortShiftLeftM' with | ||||
| | 'size_words' = 3 (N = 96). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_shortShiftLeft96M( aPtr, dist, zPtr ) softfloat_shortShiftLeftM( 3, aPtr, dist, zPtr ) | ||||
| #define softfloat_shortShiftLeft96M(aPtr, dist, zPtr) softfloat_shortShiftLeftM(3, aPtr, dist, zPtr) | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_shortShiftLeft128M | ||||
| @@ -700,7 +631,7 @@ void | ||||
| | This function or macro is the same as 'softfloat_shortShiftLeftM' with | ||||
| | 'size_words' = 4 (N = 128). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_shortShiftLeft128M( aPtr, dist, zPtr ) softfloat_shortShiftLeftM( 4, aPtr, dist, zPtr ) | ||||
| #define softfloat_shortShiftLeft128M(aPtr, dist, zPtr) softfloat_shortShiftLeftM(4, aPtr, dist, zPtr) | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_shortShiftLeft160M | ||||
| @@ -708,7 +639,7 @@ void | ||||
| | This function or macro is the same as 'softfloat_shortShiftLeftM' with | ||||
| | 'size_words' = 5 (N = 160). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_shortShiftLeft160M( aPtr, dist, zPtr ) softfloat_shortShiftLeftM( 5, aPtr, dist, zPtr ) | ||||
| #define softfloat_shortShiftLeft160M(aPtr, dist, zPtr) softfloat_shortShiftLeftM(5, aPtr, dist, zPtr) | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_shiftLeftM | ||||
| @@ -722,13 +653,7 @@ void | ||||
| |   The value of 'dist' can be arbitrarily large.  In particular, if 'dist' is | ||||
| | greater than N, the stored result will be 0. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_shiftLeftM( | ||||
|      uint_fast8_t size_words, | ||||
|      const uint32_t *aPtr, | ||||
|      uint32_t dist, | ||||
|      uint32_t *zPtr | ||||
|  ); | ||||
| void softfloat_shiftLeftM(uint_fast8_t size_words, const uint32_t* aPtr, uint32_t dist, uint32_t* zPtr); | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_shiftLeft96M | ||||
| @@ -736,7 +661,7 @@ void | ||||
| | This function or macro is the same as 'softfloat_shiftLeftM' with | ||||
| | 'size_words' = 3 (N = 96). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_shiftLeft96M( aPtr, dist, zPtr ) softfloat_shiftLeftM( 3, aPtr, dist, zPtr ) | ||||
| #define softfloat_shiftLeft96M(aPtr, dist, zPtr) softfloat_shiftLeftM(3, aPtr, dist, zPtr) | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_shiftLeft128M | ||||
| @@ -744,7 +669,7 @@ void | ||||
| | This function or macro is the same as 'softfloat_shiftLeftM' with | ||||
| | 'size_words' = 4 (N = 128). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_shiftLeft128M( aPtr, dist, zPtr ) softfloat_shiftLeftM( 4, aPtr, dist, zPtr ) | ||||
| #define softfloat_shiftLeft128M(aPtr, dist, zPtr) softfloat_shiftLeftM(4, aPtr, dist, zPtr) | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_shiftLeft160M | ||||
| @@ -752,7 +677,7 @@ void | ||||
| | This function or macro is the same as 'softfloat_shiftLeftM' with | ||||
| | 'size_words' = 5 (N = 160). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_shiftLeft160M( aPtr, dist, zPtr ) softfloat_shiftLeftM( 5, aPtr, dist, zPtr ) | ||||
| #define softfloat_shiftLeft160M(aPtr, dist, zPtr) softfloat_shiftLeftM(5, aPtr, dist, zPtr) | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_shortShiftRightM | ||||
| @@ -765,13 +690,7 @@ void | ||||
| | that concatenate in the platform's normal endian order to form an N-bit | ||||
| | integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_shortShiftRightM( | ||||
|      uint_fast8_t size_words, | ||||
|      const uint32_t *aPtr, | ||||
|      uint_fast8_t dist, | ||||
|      uint32_t *zPtr | ||||
|  ); | ||||
| void softfloat_shortShiftRightM(uint_fast8_t size_words, const uint32_t* aPtr, uint_fast8_t dist, uint32_t* zPtr); | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_shortShiftRight128M | ||||
| @@ -779,7 +698,7 @@ void | ||||
| | This function or macro is the same as 'softfloat_shortShiftRightM' with | ||||
| | 'size_words' = 4 (N = 128). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_shortShiftRight128M( aPtr, dist, zPtr ) softfloat_shortShiftRightM( 4, aPtr, dist, zPtr ) | ||||
| #define softfloat_shortShiftRight128M(aPtr, dist, zPtr) softfloat_shortShiftRightM(4, aPtr, dist, zPtr) | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_shortShiftRight160M | ||||
| @@ -787,7 +706,7 @@ void | ||||
| | This function or macro is the same as 'softfloat_shortShiftRightM' with | ||||
| | 'size_words' = 5 (N = 160). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_shortShiftRight160M( aPtr, dist, zPtr ) softfloat_shortShiftRightM( 5, aPtr, dist, zPtr ) | ||||
| #define softfloat_shortShiftRight160M(aPtr, dist, zPtr) softfloat_shortShiftRightM(5, aPtr, dist, zPtr) | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_shortShiftRightJamM | ||||
| @@ -801,9 +720,7 @@ void | ||||
| | to a 'size_words'-long array of 32-bit elements that concatenate in the | ||||
| | platform's normal endian order to form an N-bit integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_shortShiftRightJamM( | ||||
|      uint_fast8_t, const uint32_t *, uint_fast8_t, uint32_t * ); | ||||
| void softfloat_shortShiftRightJamM(uint_fast8_t, const uint32_t*, uint_fast8_t, uint32_t*); | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_shortShiftRightJam160M | ||||
| @@ -811,7 +728,7 @@ void | ||||
| | This function or macro is the same as 'softfloat_shortShiftRightJamM' with | ||||
| | 'size_words' = 5 (N = 160). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_shortShiftRightJam160M( aPtr, dist, zPtr ) softfloat_shortShiftRightJamM( 5, aPtr, dist, zPtr ) | ||||
| #define softfloat_shortShiftRightJam160M(aPtr, dist, zPtr) softfloat_shortShiftRightJamM(5, aPtr, dist, zPtr) | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_shiftRightM | ||||
| @@ -825,13 +742,7 @@ void | ||||
| |   The value of 'dist' can be arbitrarily large.  In particular, if 'dist' is | ||||
| | greater than N, the stored result will be 0. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_shiftRightM( | ||||
|      uint_fast8_t size_words, | ||||
|      const uint32_t *aPtr, | ||||
|      uint32_t dist, | ||||
|      uint32_t *zPtr | ||||
|  ); | ||||
| void softfloat_shiftRightM(uint_fast8_t size_words, const uint32_t* aPtr, uint32_t dist, uint32_t* zPtr); | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_shiftRight96M | ||||
| @@ -839,7 +750,7 @@ void | ||||
| | This function or macro is the same as 'softfloat_shiftRightM' with | ||||
| | 'size_words' = 3 (N = 96). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_shiftRight96M( aPtr, dist, zPtr ) softfloat_shiftRightM( 3, aPtr, dist, zPtr ) | ||||
| #define softfloat_shiftRight96M(aPtr, dist, zPtr) softfloat_shiftRightM(3, aPtr, dist, zPtr) | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_shiftRightJamM | ||||
| @@ -856,13 +767,7 @@ void | ||||
| | is greater than N, the stored result will be either 0 or 1, depending on | ||||
| | whether the original N bits are all zeros. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_shiftRightJamM( | ||||
|      uint_fast8_t size_words, | ||||
|      const uint32_t *aPtr, | ||||
|      uint32_t dist, | ||||
|      uint32_t *zPtr | ||||
|  ); | ||||
| void softfloat_shiftRightJamM(uint_fast8_t size_words, const uint32_t* aPtr, uint32_t dist, uint32_t* zPtr); | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_shiftRightJam96M | ||||
| @@ -870,7 +775,7 @@ void | ||||
| | This function or macro is the same as 'softfloat_shiftRightJamM' with | ||||
| | 'size_words' = 3 (N = 96). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_shiftRightJam96M( aPtr, dist, zPtr ) softfloat_shiftRightJamM( 3, aPtr, dist, zPtr ) | ||||
| #define softfloat_shiftRightJam96M(aPtr, dist, zPtr) softfloat_shiftRightJamM(3, aPtr, dist, zPtr) | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_shiftRightJam128M | ||||
| @@ -878,7 +783,7 @@ void | ||||
| | This function or macro is the same as 'softfloat_shiftRightJamM' with | ||||
| | 'size_words' = 4 (N = 128). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_shiftRightJam128M( aPtr, dist, zPtr ) softfloat_shiftRightJamM( 4, aPtr, dist, zPtr ) | ||||
| #define softfloat_shiftRightJam128M(aPtr, dist, zPtr) softfloat_shiftRightJamM(4, aPtr, dist, zPtr) | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_shiftRightJam160M | ||||
| @@ -886,7 +791,7 @@ void | ||||
| | This function or macro is the same as 'softfloat_shiftRightJamM' with | ||||
| | 'size_words' = 5 (N = 160). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_shiftRightJam160M( aPtr, dist, zPtr ) softfloat_shiftRightJamM( 5, aPtr, dist, zPtr ) | ||||
| #define softfloat_shiftRightJam160M(aPtr, dist, zPtr) softfloat_shiftRightJamM(5, aPtr, dist, zPtr) | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_addM | ||||
| @@ -898,13 +803,7 @@ void | ||||
| | elements that concatenate in the platform's normal endian order to form an | ||||
| | N-bit integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_addM( | ||||
|      uint_fast8_t size_words, | ||||
|      const uint32_t *aPtr, | ||||
|      const uint32_t *bPtr, | ||||
|      uint32_t *zPtr | ||||
|  ); | ||||
| void softfloat_addM(uint_fast8_t size_words, const uint32_t* aPtr, const uint32_t* bPtr, uint32_t* zPtr); | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_add96M | ||||
| @@ -912,7 +811,7 @@ void | ||||
| | This function or macro is the same as 'softfloat_addM' with 'size_words' | ||||
| | = 3 (N = 96). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_add96M( aPtr, bPtr, zPtr ) softfloat_addM( 3, aPtr, bPtr, zPtr ) | ||||
| #define softfloat_add96M(aPtr, bPtr, zPtr) softfloat_addM(3, aPtr, bPtr, zPtr) | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_add128M | ||||
| @@ -920,7 +819,7 @@ void | ||||
| | This function or macro is the same as 'softfloat_addM' with 'size_words' | ||||
| | = 4 (N = 128). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_add128M( aPtr, bPtr, zPtr ) softfloat_addM( 4, aPtr, bPtr, zPtr ) | ||||
| #define softfloat_add128M(aPtr, bPtr, zPtr) softfloat_addM(4, aPtr, bPtr, zPtr) | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_add160M | ||||
| @@ -928,7 +827,7 @@ void | ||||
| | This function or macro is the same as 'softfloat_addM' with 'size_words' | ||||
| | = 5 (N = 160). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_add160M( aPtr, bPtr, zPtr ) softfloat_addM( 5, aPtr, bPtr, zPtr ) | ||||
| #define softfloat_add160M(aPtr, bPtr, zPtr) softfloat_addM(5, aPtr, bPtr, zPtr) | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_addCarryM | ||||
| @@ -940,14 +839,7 @@ void | ||||
| | points to a 'size_words'-long array of 32-bit elements that concatenate in | ||||
| | the platform's normal endian order to form an N-bit integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast8_t | ||||
|  softfloat_addCarryM( | ||||
|      uint_fast8_t size_words, | ||||
|      const uint32_t *aPtr, | ||||
|      const uint32_t *bPtr, | ||||
|      uint_fast8_t carry, | ||||
|      uint32_t *zPtr | ||||
|  ); | ||||
| uint_fast8_t softfloat_addCarryM(uint_fast8_t size_words, const uint32_t* aPtr, const uint32_t* bPtr, uint_fast8_t carry, uint32_t* zPtr); | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_addComplCarryM | ||||
| @@ -956,14 +848,8 @@ uint_fast8_t | ||||
| | the value of the unsigned integer pointed to by 'bPtr' is bit-wise completed | ||||
| | before the addition. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast8_t | ||||
|  softfloat_addComplCarryM( | ||||
|      uint_fast8_t size_words, | ||||
|      const uint32_t *aPtr, | ||||
|      const uint32_t *bPtr, | ||||
|      uint_fast8_t carry, | ||||
|      uint32_t *zPtr | ||||
|  ); | ||||
| uint_fast8_t softfloat_addComplCarryM(uint_fast8_t size_words, const uint32_t* aPtr, const uint32_t* bPtr, uint_fast8_t carry, | ||||
|                                       uint32_t* zPtr); | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_addComplCarry96M | ||||
| @@ -971,7 +857,7 @@ uint_fast8_t | ||||
| | This function or macro is the same as 'softfloat_addComplCarryM' with | ||||
| | 'size_words' = 3 (N = 96). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_addComplCarry96M( aPtr, bPtr, carry, zPtr ) softfloat_addComplCarryM( 3, aPtr, bPtr, carry, zPtr ) | ||||
| #define softfloat_addComplCarry96M(aPtr, bPtr, carry, zPtr) softfloat_addComplCarryM(3, aPtr, bPtr, carry, zPtr) | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_negXM | ||||
| @@ -981,7 +867,7 @@ uint_fast8_t | ||||
| | points to a 'size_words'-long array of 32-bit elements that concatenate in | ||||
| | the platform's normal endian order to form an N-bit integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void softfloat_negXM( uint_fast8_t size_words, uint32_t *zPtr ); | ||||
| void softfloat_negXM(uint_fast8_t size_words, uint32_t* zPtr); | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_negX96M | ||||
| @@ -989,7 +875,7 @@ void softfloat_negXM( uint_fast8_t size_words, uint32_t *zPtr ); | ||||
| | This function or macro is the same as 'softfloat_negXM' with 'size_words' | ||||
| | = 3 (N = 96). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_negX96M( zPtr ) softfloat_negXM( 3, zPtr ) | ||||
| #define softfloat_negX96M(zPtr) softfloat_negXM(3, zPtr) | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_negX128M | ||||
| @@ -997,7 +883,7 @@ void softfloat_negXM( uint_fast8_t size_words, uint32_t *zPtr ); | ||||
| | This function or macro is the same as 'softfloat_negXM' with 'size_words' | ||||
| | = 4 (N = 128). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_negX128M( zPtr ) softfloat_negXM( 4, zPtr ) | ||||
| #define softfloat_negX128M(zPtr) softfloat_negXM(4, zPtr) | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_negX160M | ||||
| @@ -1005,7 +891,7 @@ void softfloat_negXM( uint_fast8_t size_words, uint32_t *zPtr ); | ||||
| | This function or macro is the same as 'softfloat_negXM' with 'size_words' | ||||
| | = 5 (N = 160). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_negX160M( zPtr ) softfloat_negXM( 5, zPtr ) | ||||
| #define softfloat_negX160M(zPtr) softfloat_negXM(5, zPtr) | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_negX256M | ||||
| @@ -1013,7 +899,7 @@ void softfloat_negXM( uint_fast8_t size_words, uint32_t *zPtr ); | ||||
| | This function or macro is the same as 'softfloat_negXM' with 'size_words' | ||||
| | = 8 (N = 256). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_negX256M( zPtr ) softfloat_negXM( 8, zPtr ) | ||||
| #define softfloat_negX256M(zPtr) softfloat_negXM(8, zPtr) | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_sub1XM | ||||
| @@ -1024,7 +910,7 @@ void softfloat_negXM( uint_fast8_t size_words, uint32_t *zPtr ); | ||||
| | elements that concatenate in the platform's normal endian order to form an | ||||
| | N-bit integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void softfloat_sub1XM( uint_fast8_t size_words, uint32_t *zPtr ); | ||||
| void softfloat_sub1XM(uint_fast8_t size_words, uint32_t* zPtr); | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_sub1X96M | ||||
| @@ -1032,7 +918,7 @@ void softfloat_sub1XM( uint_fast8_t size_words, uint32_t *zPtr ); | ||||
| | This function or macro is the same as 'softfloat_sub1XM' with 'size_words' | ||||
| | = 3 (N = 96). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_sub1X96M( zPtr ) softfloat_sub1XM( 3, zPtr ) | ||||
| #define softfloat_sub1X96M(zPtr) softfloat_sub1XM(3, zPtr) | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_sub1X160M | ||||
| @@ -1040,7 +926,7 @@ void softfloat_sub1XM( uint_fast8_t size_words, uint32_t *zPtr ); | ||||
| | This function or macro is the same as 'softfloat_sub1XM' with 'size_words' | ||||
| | = 5 (N = 160). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_sub1X160M( zPtr ) softfloat_sub1XM( 5, zPtr ) | ||||
| #define softfloat_sub1X160M(zPtr) softfloat_sub1XM(5, zPtr) | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_subM | ||||
| @@ -1052,13 +938,7 @@ void softfloat_sub1XM( uint_fast8_t size_words, uint32_t *zPtr ); | ||||
| | array of 32-bit elements that concatenate in the platform's normal endian | ||||
| | order to form an N-bit integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_subM( | ||||
|      uint_fast8_t size_words, | ||||
|      const uint32_t *aPtr, | ||||
|      const uint32_t *bPtr, | ||||
|      uint32_t *zPtr | ||||
|  ); | ||||
| void softfloat_subM(uint_fast8_t size_words, const uint32_t* aPtr, const uint32_t* bPtr, uint32_t* zPtr); | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_sub96M | ||||
| @@ -1066,7 +946,7 @@ void | ||||
| | This function or macro is the same as 'softfloat_subM' with 'size_words' | ||||
| | = 3 (N = 96). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_sub96M( aPtr, bPtr, zPtr ) softfloat_subM( 3, aPtr, bPtr, zPtr ) | ||||
| #define softfloat_sub96M(aPtr, bPtr, zPtr) softfloat_subM(3, aPtr, bPtr, zPtr) | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_sub128M | ||||
| @@ -1074,7 +954,7 @@ void | ||||
| | This function or macro is the same as 'softfloat_subM' with 'size_words' | ||||
| | = 4 (N = 128). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_sub128M( aPtr, bPtr, zPtr ) softfloat_subM( 4, aPtr, bPtr, zPtr ) | ||||
| #define softfloat_sub128M(aPtr, bPtr, zPtr) softfloat_subM(4, aPtr, bPtr, zPtr) | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_sub160M | ||||
| @@ -1082,7 +962,7 @@ void | ||||
| | This function or macro is the same as 'softfloat_subM' with 'size_words' | ||||
| | = 5 (N = 160). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_sub160M( aPtr, bPtr, zPtr ) softfloat_subM( 5, aPtr, bPtr, zPtr ) | ||||
| #define softfloat_sub160M(aPtr, bPtr, zPtr) softfloat_subM(5, aPtr, bPtr, zPtr) | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_mul64To128M | ||||
| @@ -1092,7 +972,7 @@ void | ||||
| | elements that concatenate in the platform's normal endian order to form a | ||||
| | 128-bit integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void softfloat_mul64To128M( uint64_t a, uint64_t b, uint32_t *zPtr ); | ||||
| void softfloat_mul64To128M(uint64_t a, uint64_t b, uint32_t* zPtr); | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_mul128MTo256M | ||||
| @@ -1104,9 +984,7 @@ void softfloat_mul64To128M( uint64_t a, uint64_t b, uint32_t *zPtr ); | ||||
| | Argument 'zPtr' points to an array of eight 32-bit elements that concatenate | ||||
| | to form a 256-bit integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_mul128MTo256M( | ||||
|      const uint32_t *aPtr, const uint32_t *bPtr, uint32_t *zPtr ); | ||||
| void softfloat_mul128MTo256M(const uint32_t* aPtr, const uint32_t* bPtr, uint32_t* zPtr); | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_remStepMBy32 | ||||
| @@ -1119,15 +997,8 @@ void | ||||
| | to a 'size_words'-long array of 32-bit elements that concatenate in the | ||||
| | platform's normal endian order to form an N-bit integer. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void | ||||
|  softfloat_remStepMBy32( | ||||
|      uint_fast8_t size_words, | ||||
|      const uint32_t *remPtr, | ||||
|      uint_fast8_t dist, | ||||
|      const uint32_t *bPtr, | ||||
|      uint32_t q, | ||||
|      uint32_t *zPtr | ||||
|  ); | ||||
| void softfloat_remStepMBy32(uint_fast8_t size_words, const uint32_t* remPtr, uint_fast8_t dist, const uint32_t* bPtr, uint32_t q, | ||||
|                             uint32_t* zPtr); | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_remStep96MBy32 | ||||
| @@ -1135,7 +1006,7 @@ void | ||||
| | This function or macro is the same as 'softfloat_remStepMBy32' with | ||||
| | 'size_words' = 3 (N = 96). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_remStep96MBy32( remPtr, dist, bPtr, q, zPtr ) softfloat_remStepMBy32( 3, remPtr, dist, bPtr, q, zPtr ) | ||||
| #define softfloat_remStep96MBy32(remPtr, dist, bPtr, q, zPtr) softfloat_remStepMBy32(3, remPtr, dist, bPtr, q, zPtr) | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_remStep128MBy32 | ||||
| @@ -1143,7 +1014,7 @@ void | ||||
| | This function or macro is the same as 'softfloat_remStepMBy32' with | ||||
| | 'size_words' = 4 (N = 128). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_remStep128MBy32( remPtr, dist, bPtr, q, zPtr ) softfloat_remStepMBy32( 4, remPtr, dist, bPtr, q, zPtr ) | ||||
| #define softfloat_remStep128MBy32(remPtr, dist, bPtr, q, zPtr) softfloat_remStepMBy32(4, remPtr, dist, bPtr, q, zPtr) | ||||
| #endif | ||||
|  | ||||
| #ifndef softfloat_remStep160MBy32 | ||||
| @@ -1151,10 +1022,9 @@ void | ||||
| | This function or macro is the same as 'softfloat_remStepMBy32' with | ||||
| | 'size_words' = 5 (N = 160). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #define softfloat_remStep160MBy32( remPtr, dist, bPtr, q, zPtr ) softfloat_remStepMBy32( 5, remPtr, dist, bPtr, q, zPtr ) | ||||
| #define softfloat_remStep160MBy32(remPtr, dist, bPtr, q, zPtr) softfloat_remStepMBy32(5, remPtr, dist, bPtr, q, zPtr) | ||||
| #endif | ||||
|  | ||||
| #endif | ||||
|  | ||||
| #endif | ||||
|  | ||||
|   | ||||
| @@ -34,7 +34,6 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| =============================================================================*/ | ||||
|  | ||||
|  | ||||
| /*============================================================================ | ||||
| | Note:  If SoftFloat is made available as a general library for programs to | ||||
| | use, it is strongly recommended that a platform-specific version of this | ||||
| @@ -42,13 +41,12 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| | eliminates all dependencies on compile-time macros. | ||||
| *============================================================================*/ | ||||
|  | ||||
|  | ||||
| #ifndef softfloat_h | ||||
| #define softfloat_h 1 | ||||
|  | ||||
| #include "softfloat_types.h" | ||||
| #include <stdbool.h> | ||||
| #include <stdint.h> | ||||
| #include "softfloat_types.h" | ||||
|  | ||||
| #ifndef THREAD_LOCAL | ||||
| #define THREAD_LOCAL | ||||
| @@ -58,10 +56,7 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| | Software floating-point underflow tininess-detection mode. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| extern THREAD_LOCAL uint_fast8_t softfloat_detectTininess; | ||||
| enum { | ||||
|     softfloat_tininess_beforeRounding = 0, | ||||
|     softfloat_tininess_afterRounding  = 1 | ||||
| }; | ||||
| enum { softfloat_tininess_beforeRounding = 0, softfloat_tininess_afterRounding = 1 }; | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Software floating-point rounding mode.  (Mode "odd" is supported only if | ||||
| @@ -69,175 +64,182 @@ enum { | ||||
| *----------------------------------------------------------------------------*/ | ||||
| extern THREAD_LOCAL uint_fast8_t softfloat_roundingMode; | ||||
| enum { | ||||
|     softfloat_round_near_even   = 0, | ||||
|     softfloat_round_minMag      = 1, | ||||
|     softfloat_round_min         = 2, | ||||
|     softfloat_round_max         = 3, | ||||
|     softfloat_round_near_even = 0, | ||||
|     softfloat_round_minMag = 1, | ||||
|     softfloat_round_min = 2, | ||||
|     softfloat_round_max = 3, | ||||
|     softfloat_round_near_maxMag = 4, | ||||
|     softfloat_round_odd         = 6 | ||||
|     softfloat_round_odd = 6 | ||||
| }; | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Software floating-point exception flags. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| extern THREAD_LOCAL uint_fast8_t softfloat_exceptionFlags; | ||||
| enum { | ||||
|     softfloat_flag_inexact   =  1, | ||||
|     softfloat_flag_underflow =  2, | ||||
|     softfloat_flag_overflow  =  4, | ||||
|     softfloat_flag_infinite  =  8, | ||||
|     softfloat_flag_invalid   = 16 | ||||
| }; | ||||
| typedef enum { | ||||
|     softfloat_flag_inexact = 1, | ||||
|     softfloat_flag_underflow = 2, | ||||
|     softfloat_flag_overflow = 4, | ||||
|     softfloat_flag_infinite = 8, | ||||
|     softfloat_flag_invalid = 16 | ||||
| } exceptionFlag_t; | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Routine to raise any or all of the software floating-point exception flags. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| void softfloat_raiseFlags( uint_fast8_t ); | ||||
| void softfloat_raiseFlags(uint_fast8_t); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Integer-to-floating-point conversion routines. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| float16_t ui32_to_f16( uint32_t ); | ||||
| float32_t ui32_to_f32( uint32_t ); | ||||
| float64_t ui32_to_f64( uint32_t ); | ||||
| float16_t ui32_to_f16(uint32_t); | ||||
| float32_t ui32_to_f32(uint32_t); | ||||
| float64_t ui32_to_f64(uint32_t); | ||||
| #ifdef SOFTFLOAT_FAST_INT64 | ||||
| extFloat80_t ui32_to_extF80( uint32_t ); | ||||
| float128_t ui32_to_f128( uint32_t ); | ||||
| extFloat80_t ui32_to_extF80(uint32_t); | ||||
| float128_t ui32_to_f128(uint32_t); | ||||
| #endif | ||||
| void ui32_to_extF80M( uint32_t, extFloat80_t * ); | ||||
| void ui32_to_f128M( uint32_t, float128_t * ); | ||||
| float16_t ui64_to_f16( uint64_t ); | ||||
| float32_t ui64_to_f32( uint64_t ); | ||||
| float64_t ui64_to_f64( uint64_t ); | ||||
| void ui32_to_extF80M(uint32_t, extFloat80_t*); | ||||
| void ui32_to_f128M(uint32_t, float128_t*); | ||||
| float16_t ui64_to_f16(uint64_t); | ||||
| float32_t ui64_to_f32(uint64_t); | ||||
| float64_t ui64_to_f64(uint64_t); | ||||
| #ifdef SOFTFLOAT_FAST_INT64 | ||||
| extFloat80_t ui64_to_extF80( uint64_t ); | ||||
| float128_t ui64_to_f128( uint64_t ); | ||||
| extFloat80_t ui64_to_extF80(uint64_t); | ||||
| float128_t ui64_to_f128(uint64_t); | ||||
| #endif | ||||
| void ui64_to_extF80M( uint64_t, extFloat80_t * ); | ||||
| void ui64_to_f128M( uint64_t, float128_t * ); | ||||
| float16_t i32_to_f16( int32_t ); | ||||
| float32_t i32_to_f32( int32_t ); | ||||
| float64_t i32_to_f64( int32_t ); | ||||
| void ui64_to_extF80M(uint64_t, extFloat80_t*); | ||||
| void ui64_to_f128M(uint64_t, float128_t*); | ||||
| float16_t i32_to_f16(int32_t); | ||||
| float32_t i32_to_f32(int32_t); | ||||
| float64_t i32_to_f64(int32_t); | ||||
| #ifdef SOFTFLOAT_FAST_INT64 | ||||
| extFloat80_t i32_to_extF80( int32_t ); | ||||
| float128_t i32_to_f128( int32_t ); | ||||
| extFloat80_t i32_to_extF80(int32_t); | ||||
| float128_t i32_to_f128(int32_t); | ||||
| #endif | ||||
| void i32_to_extF80M( int32_t, extFloat80_t * ); | ||||
| void i32_to_f128M( int32_t, float128_t * ); | ||||
| float16_t i64_to_f16( int64_t ); | ||||
| float32_t i64_to_f32( int64_t ); | ||||
| float64_t i64_to_f64( int64_t ); | ||||
| void i32_to_extF80M(int32_t, extFloat80_t*); | ||||
| void i32_to_f128M(int32_t, float128_t*); | ||||
| float16_t i64_to_f16(int64_t); | ||||
| float32_t i64_to_f32(int64_t); | ||||
| float64_t i64_to_f64(int64_t); | ||||
| #ifdef SOFTFLOAT_FAST_INT64 | ||||
| extFloat80_t i64_to_extF80( int64_t ); | ||||
| float128_t i64_to_f128( int64_t ); | ||||
| extFloat80_t i64_to_extF80(int64_t); | ||||
| float128_t i64_to_f128(int64_t); | ||||
| #endif | ||||
| void i64_to_extF80M( int64_t, extFloat80_t * ); | ||||
| void i64_to_f128M( int64_t, float128_t * ); | ||||
| void i64_to_extF80M(int64_t, extFloat80_t*); | ||||
| void i64_to_f128M(int64_t, float128_t*); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | 16-bit (half-precision) floating-point operations. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast32_t f16_to_ui32( float16_t, uint_fast8_t, bool ); | ||||
| uint_fast64_t f16_to_ui64( float16_t, uint_fast8_t, bool ); | ||||
| int_fast32_t f16_to_i32( float16_t, uint_fast8_t, bool ); | ||||
| int_fast64_t f16_to_i64( float16_t, uint_fast8_t, bool ); | ||||
| uint_fast32_t f16_to_ui32_r_minMag( float16_t, bool ); | ||||
| uint_fast64_t f16_to_ui64_r_minMag( float16_t, bool ); | ||||
| int_fast32_t f16_to_i32_r_minMag( float16_t, bool ); | ||||
| int_fast64_t f16_to_i64_r_minMag( float16_t, bool ); | ||||
| float32_t f16_to_f32( float16_t ); | ||||
| float64_t f16_to_f64( float16_t ); | ||||
| uint_fast32_t f16_to_ui32(float16_t, uint_fast8_t, bool); | ||||
| uint_fast64_t f16_to_ui64(float16_t, uint_fast8_t, bool); | ||||
| int_fast32_t f16_to_i32(float16_t, uint_fast8_t, bool); | ||||
| int_fast64_t f16_to_i64(float16_t, uint_fast8_t, bool); | ||||
| uint_fast32_t f16_to_ui32_r_minMag(float16_t, bool); | ||||
| uint_fast64_t f16_to_ui64_r_minMag(float16_t, bool); | ||||
| int_fast32_t f16_to_i32_r_minMag(float16_t, bool); | ||||
| int_fast64_t f16_to_i64_r_minMag(float16_t, bool); | ||||
| float32_t f16_to_f32(float16_t); | ||||
| float64_t f16_to_f64(float16_t); | ||||
| #ifdef SOFTFLOAT_FAST_INT64 | ||||
| extFloat80_t f16_to_extF80( float16_t ); | ||||
| float128_t f16_to_f128( float16_t ); | ||||
| extFloat80_t f16_to_extF80(float16_t); | ||||
| float128_t f16_to_f128(float16_t); | ||||
| #endif | ||||
| void f16_to_extF80M( float16_t, extFloat80_t * ); | ||||
| void f16_to_f128M( float16_t, float128_t * ); | ||||
| float16_t f16_roundToInt( float16_t, uint_fast8_t, bool ); | ||||
| float16_t f16_add( float16_t, float16_t ); | ||||
| float16_t f16_sub( float16_t, float16_t ); | ||||
| float16_t f16_mul( float16_t, float16_t ); | ||||
| float16_t f16_mulAdd( float16_t, float16_t, float16_t ); | ||||
| float16_t f16_div( float16_t, float16_t ); | ||||
| float16_t f16_rem( float16_t, float16_t ); | ||||
| float16_t f16_sqrt( float16_t ); | ||||
| bool f16_eq( float16_t, float16_t ); | ||||
| bool f16_le( float16_t, float16_t ); | ||||
| bool f16_lt( float16_t, float16_t ); | ||||
| bool f16_eq_signaling( float16_t, float16_t ); | ||||
| bool f16_le_quiet( float16_t, float16_t ); | ||||
| bool f16_lt_quiet( float16_t, float16_t ); | ||||
| bool f16_isSignalingNaN( float16_t ); | ||||
| void f16_to_extF80M(float16_t, extFloat80_t*); | ||||
| void f16_to_f128M(float16_t, float128_t*); | ||||
| float16_t f16_roundToInt(float16_t, uint_fast8_t, bool); | ||||
| float16_t f16_add(float16_t, float16_t); | ||||
| float16_t f16_sub(float16_t, float16_t); | ||||
| float16_t f16_mul(float16_t, float16_t); | ||||
| float16_t f16_mulAdd(float16_t, float16_t, float16_t); | ||||
| float16_t f16_div(float16_t, float16_t); | ||||
| float16_t f16_rem(float16_t, float16_t); | ||||
| float16_t f16_sqrt(float16_t); | ||||
| bool f16_eq(float16_t, float16_t); | ||||
| bool f16_le(float16_t, float16_t); | ||||
| bool f16_lt(float16_t, float16_t); | ||||
| bool f16_eq_signaling(float16_t, float16_t); | ||||
| bool f16_le_quiet(float16_t, float16_t); | ||||
| bool f16_lt_quiet(float16_t, float16_t); | ||||
| bool f16_isSignalingNaN(float16_t); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | 16-bit (brain float 16) floating-point operations. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| float32_t bf16_to_f32(bfloat16_t); | ||||
| bfloat16_t f32_to_bf16(float32_t); | ||||
| bool bf16_isSignalingNaN(bfloat16_t); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | 32-bit (single-precision) floating-point operations. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast32_t f32_to_ui32( float32_t, uint_fast8_t, bool ); | ||||
| uint_fast64_t f32_to_ui64( float32_t, uint_fast8_t, bool ); | ||||
| int_fast32_t f32_to_i32( float32_t, uint_fast8_t, bool ); | ||||
| int_fast64_t f32_to_i64( float32_t, uint_fast8_t, bool ); | ||||
| uint_fast32_t f32_to_ui32_r_minMag( float32_t, bool ); | ||||
| uint_fast64_t f32_to_ui64_r_minMag( float32_t, bool ); | ||||
| int_fast32_t f32_to_i32_r_minMag( float32_t, bool ); | ||||
| int_fast64_t f32_to_i64_r_minMag( float32_t, bool ); | ||||
| float16_t f32_to_f16( float32_t ); | ||||
| float64_t f32_to_f64( float32_t ); | ||||
| uint_fast32_t f32_to_ui32(float32_t, uint_fast8_t, bool); | ||||
| uint_fast64_t f32_to_ui64(float32_t, uint_fast8_t, bool); | ||||
| int_fast32_t f32_to_i32(float32_t, uint_fast8_t, bool); | ||||
| int_fast64_t f32_to_i64(float32_t, uint_fast8_t, bool); | ||||
| uint_fast32_t f32_to_ui32_r_minMag(float32_t, bool); | ||||
| uint_fast64_t f32_to_ui64_r_minMag(float32_t, bool); | ||||
| int_fast32_t f32_to_i32_r_minMag(float32_t, bool); | ||||
| int_fast64_t f32_to_i64_r_minMag(float32_t, bool); | ||||
| float16_t f32_to_f16(float32_t); | ||||
| float64_t f32_to_f64(float32_t); | ||||
| #ifdef SOFTFLOAT_FAST_INT64 | ||||
| extFloat80_t f32_to_extF80( float32_t ); | ||||
| float128_t f32_to_f128( float32_t ); | ||||
| extFloat80_t f32_to_extF80(float32_t); | ||||
| float128_t f32_to_f128(float32_t); | ||||
| #endif | ||||
| void f32_to_extF80M( float32_t, extFloat80_t * ); | ||||
| void f32_to_f128M( float32_t, float128_t * ); | ||||
| float32_t f32_roundToInt( float32_t, uint_fast8_t, bool ); | ||||
| float32_t f32_add( float32_t, float32_t ); | ||||
| float32_t f32_sub( float32_t, float32_t ); | ||||
| float32_t f32_mul( float32_t, float32_t ); | ||||
| float32_t f32_mulAdd( float32_t, float32_t, float32_t ); | ||||
| float32_t f32_div( float32_t, float32_t ); | ||||
| float32_t f32_rem( float32_t, float32_t ); | ||||
| float32_t f32_sqrt( float32_t ); | ||||
| bool f32_eq( float32_t, float32_t ); | ||||
| bool f32_le( float32_t, float32_t ); | ||||
| bool f32_lt( float32_t, float32_t ); | ||||
| bool f32_eq_signaling( float32_t, float32_t ); | ||||
| bool f32_le_quiet( float32_t, float32_t ); | ||||
| bool f32_lt_quiet( float32_t, float32_t ); | ||||
| bool f32_isSignalingNaN( float32_t ); | ||||
| void f32_to_extF80M(float32_t, extFloat80_t*); | ||||
| void f32_to_f128M(float32_t, float128_t*); | ||||
| float32_t f32_roundToInt(float32_t, uint_fast8_t, bool); | ||||
| float32_t f32_add(float32_t, float32_t); | ||||
| float32_t f32_sub(float32_t, float32_t); | ||||
| float32_t f32_mul(float32_t, float32_t); | ||||
| float32_t f32_mulAdd(float32_t, float32_t, float32_t); | ||||
| float32_t f32_div(float32_t, float32_t); | ||||
| float32_t f32_rem(float32_t, float32_t); | ||||
| float32_t f32_sqrt(float32_t); | ||||
| bool f32_eq(float32_t, float32_t); | ||||
| bool f32_le(float32_t, float32_t); | ||||
| bool f32_lt(float32_t, float32_t); | ||||
| bool f32_eq_signaling(float32_t, float32_t); | ||||
| bool f32_le_quiet(float32_t, float32_t); | ||||
| bool f32_lt_quiet(float32_t, float32_t); | ||||
| bool f32_isSignalingNaN(float32_t); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | 64-bit (double-precision) floating-point operations. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| uint_fast32_t f64_to_ui32( float64_t, uint_fast8_t, bool ); | ||||
| uint_fast64_t f64_to_ui64( float64_t, uint_fast8_t, bool ); | ||||
| int_fast32_t f64_to_i32( float64_t, uint_fast8_t, bool ); | ||||
| int_fast64_t f64_to_i64( float64_t, uint_fast8_t, bool ); | ||||
| uint_fast32_t f64_to_ui32_r_minMag( float64_t, bool ); | ||||
| uint_fast64_t f64_to_ui64_r_minMag( float64_t, bool ); | ||||
| int_fast32_t f64_to_i32_r_minMag( float64_t, bool ); | ||||
| int_fast64_t f64_to_i64_r_minMag( float64_t, bool ); | ||||
| float16_t f64_to_f16( float64_t ); | ||||
| float32_t f64_to_f32( float64_t ); | ||||
| uint_fast32_t f64_to_ui32(float64_t, uint_fast8_t, bool); | ||||
| uint_fast64_t f64_to_ui64(float64_t, uint_fast8_t, bool); | ||||
| int_fast32_t f64_to_i32(float64_t, uint_fast8_t, bool); | ||||
| int_fast64_t f64_to_i64(float64_t, uint_fast8_t, bool); | ||||
| uint_fast32_t f64_to_ui32_r_minMag(float64_t, bool); | ||||
| uint_fast64_t f64_to_ui64_r_minMag(float64_t, bool); | ||||
| int_fast32_t f64_to_i32_r_minMag(float64_t, bool); | ||||
| int_fast64_t f64_to_i64_r_minMag(float64_t, bool); | ||||
| float16_t f64_to_f16(float64_t); | ||||
| float32_t f64_to_f32(float64_t); | ||||
| #ifdef SOFTFLOAT_FAST_INT64 | ||||
| extFloat80_t f64_to_extF80( float64_t ); | ||||
| float128_t f64_to_f128( float64_t ); | ||||
| extFloat80_t f64_to_extF80(float64_t); | ||||
| float128_t f64_to_f128(float64_t); | ||||
| #endif | ||||
| void f64_to_extF80M( float64_t, extFloat80_t * ); | ||||
| void f64_to_f128M( float64_t, float128_t * ); | ||||
| float64_t f64_roundToInt( float64_t, uint_fast8_t, bool ); | ||||
| float64_t f64_add( float64_t, float64_t ); | ||||
| float64_t f64_sub( float64_t, float64_t ); | ||||
| float64_t f64_mul( float64_t, float64_t ); | ||||
| float64_t f64_mulAdd( float64_t, float64_t, float64_t ); | ||||
| float64_t f64_div( float64_t, float64_t ); | ||||
| float64_t f64_rem( float64_t, float64_t ); | ||||
| float64_t f64_sqrt( float64_t ); | ||||
| bool f64_eq( float64_t, float64_t ); | ||||
| bool f64_le( float64_t, float64_t ); | ||||
| bool f64_lt( float64_t, float64_t ); | ||||
| bool f64_eq_signaling( float64_t, float64_t ); | ||||
| bool f64_le_quiet( float64_t, float64_t ); | ||||
| bool f64_lt_quiet( float64_t, float64_t ); | ||||
| bool f64_isSignalingNaN( float64_t ); | ||||
| void f64_to_extF80M(float64_t, extFloat80_t*); | ||||
| void f64_to_f128M(float64_t, float128_t*); | ||||
| float64_t f64_roundToInt(float64_t, uint_fast8_t, bool); | ||||
| float64_t f64_add(float64_t, float64_t); | ||||
| float64_t f64_sub(float64_t, float64_t); | ||||
| float64_t f64_mul(float64_t, float64_t); | ||||
| float64_t f64_mulAdd(float64_t, float64_t, float64_t); | ||||
| float64_t f64_div(float64_t, float64_t); | ||||
| float64_t f64_rem(float64_t, float64_t); | ||||
| float64_t f64_sqrt(float64_t); | ||||
| bool f64_eq(float64_t, float64_t); | ||||
| bool f64_le(float64_t, float64_t); | ||||
| bool f64_lt(float64_t, float64_t); | ||||
| bool f64_eq_signaling(float64_t, float64_t); | ||||
| bool f64_le_quiet(float64_t, float64_t); | ||||
| bool f64_lt_quiet(float64_t, float64_t); | ||||
| bool f64_isSignalingNaN(float64_t); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | Rounding precision for 80-bit extended double-precision floating-point. | ||||
| @@ -249,124 +251,118 @@ extern THREAD_LOCAL uint_fast8_t extF80_roundingPrecision; | ||||
| | 80-bit extended double-precision floating-point operations. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #ifdef SOFTFLOAT_FAST_INT64 | ||||
| uint_fast32_t extF80_to_ui32( extFloat80_t, uint_fast8_t, bool ); | ||||
| uint_fast64_t extF80_to_ui64( extFloat80_t, uint_fast8_t, bool ); | ||||
| int_fast32_t extF80_to_i32( extFloat80_t, uint_fast8_t, bool ); | ||||
| int_fast64_t extF80_to_i64( extFloat80_t, uint_fast8_t, bool ); | ||||
| uint_fast32_t extF80_to_ui32_r_minMag( extFloat80_t, bool ); | ||||
| uint_fast64_t extF80_to_ui64_r_minMag( extFloat80_t, bool ); | ||||
| int_fast32_t extF80_to_i32_r_minMag( extFloat80_t, bool ); | ||||
| int_fast64_t extF80_to_i64_r_minMag( extFloat80_t, bool ); | ||||
| float16_t extF80_to_f16( extFloat80_t ); | ||||
| float32_t extF80_to_f32( extFloat80_t ); | ||||
| float64_t extF80_to_f64( extFloat80_t ); | ||||
| float128_t extF80_to_f128( extFloat80_t ); | ||||
| extFloat80_t extF80_roundToInt( extFloat80_t, uint_fast8_t, bool ); | ||||
| extFloat80_t extF80_add( extFloat80_t, extFloat80_t ); | ||||
| extFloat80_t extF80_sub( extFloat80_t, extFloat80_t ); | ||||
| extFloat80_t extF80_mul( extFloat80_t, extFloat80_t ); | ||||
| extFloat80_t extF80_div( extFloat80_t, extFloat80_t ); | ||||
| extFloat80_t extF80_rem( extFloat80_t, extFloat80_t ); | ||||
| extFloat80_t extF80_sqrt( extFloat80_t ); | ||||
| bool extF80_eq( extFloat80_t, extFloat80_t ); | ||||
| bool extF80_le( extFloat80_t, extFloat80_t ); | ||||
| bool extF80_lt( extFloat80_t, extFloat80_t ); | ||||
| bool extF80_eq_signaling( extFloat80_t, extFloat80_t ); | ||||
| bool extF80_le_quiet( extFloat80_t, extFloat80_t ); | ||||
| bool extF80_lt_quiet( extFloat80_t, extFloat80_t ); | ||||
| bool extF80_isSignalingNaN( extFloat80_t ); | ||||
| uint_fast32_t extF80_to_ui32(extFloat80_t, uint_fast8_t, bool); | ||||
| uint_fast64_t extF80_to_ui64(extFloat80_t, uint_fast8_t, bool); | ||||
| int_fast32_t extF80_to_i32(extFloat80_t, uint_fast8_t, bool); | ||||
| int_fast64_t extF80_to_i64(extFloat80_t, uint_fast8_t, bool); | ||||
| uint_fast32_t extF80_to_ui32_r_minMag(extFloat80_t, bool); | ||||
| uint_fast64_t extF80_to_ui64_r_minMag(extFloat80_t, bool); | ||||
| int_fast32_t extF80_to_i32_r_minMag(extFloat80_t, bool); | ||||
| int_fast64_t extF80_to_i64_r_minMag(extFloat80_t, bool); | ||||
| float16_t extF80_to_f16(extFloat80_t); | ||||
| float32_t extF80_to_f32(extFloat80_t); | ||||
| float64_t extF80_to_f64(extFloat80_t); | ||||
| float128_t extF80_to_f128(extFloat80_t); | ||||
| extFloat80_t extF80_roundToInt(extFloat80_t, uint_fast8_t, bool); | ||||
| extFloat80_t extF80_add(extFloat80_t, extFloat80_t); | ||||
| extFloat80_t extF80_sub(extFloat80_t, extFloat80_t); | ||||
| extFloat80_t extF80_mul(extFloat80_t, extFloat80_t); | ||||
| extFloat80_t extF80_div(extFloat80_t, extFloat80_t); | ||||
| extFloat80_t extF80_rem(extFloat80_t, extFloat80_t); | ||||
| extFloat80_t extF80_sqrt(extFloat80_t); | ||||
| bool extF80_eq(extFloat80_t, extFloat80_t); | ||||
| bool extF80_le(extFloat80_t, extFloat80_t); | ||||
| bool extF80_lt(extFloat80_t, extFloat80_t); | ||||
| bool extF80_eq_signaling(extFloat80_t, extFloat80_t); | ||||
| bool extF80_le_quiet(extFloat80_t, extFloat80_t); | ||||
| bool extF80_lt_quiet(extFloat80_t, extFloat80_t); | ||||
| bool extF80_isSignalingNaN(extFloat80_t); | ||||
| #endif | ||||
| uint_fast32_t extF80M_to_ui32( const extFloat80_t *, uint_fast8_t, bool ); | ||||
| uint_fast64_t extF80M_to_ui64( const extFloat80_t *, uint_fast8_t, bool ); | ||||
| int_fast32_t extF80M_to_i32( const extFloat80_t *, uint_fast8_t, bool ); | ||||
| int_fast64_t extF80M_to_i64( const extFloat80_t *, uint_fast8_t, bool ); | ||||
| uint_fast32_t extF80M_to_ui32_r_minMag( const extFloat80_t *, bool ); | ||||
| uint_fast64_t extF80M_to_ui64_r_minMag( const extFloat80_t *, bool ); | ||||
| int_fast32_t extF80M_to_i32_r_minMag( const extFloat80_t *, bool ); | ||||
| int_fast64_t extF80M_to_i64_r_minMag( const extFloat80_t *, bool ); | ||||
| float16_t extF80M_to_f16( const extFloat80_t * ); | ||||
| float32_t extF80M_to_f32( const extFloat80_t * ); | ||||
| float64_t extF80M_to_f64( const extFloat80_t * ); | ||||
| void extF80M_to_f128M( const extFloat80_t *, float128_t * ); | ||||
| void | ||||
|  extF80M_roundToInt( | ||||
|      const extFloat80_t *, uint_fast8_t, bool, extFloat80_t * ); | ||||
| void extF80M_add( const extFloat80_t *, const extFloat80_t *, extFloat80_t * ); | ||||
| void extF80M_sub( const extFloat80_t *, const extFloat80_t *, extFloat80_t * ); | ||||
| void extF80M_mul( const extFloat80_t *, const extFloat80_t *, extFloat80_t * ); | ||||
| void extF80M_div( const extFloat80_t *, const extFloat80_t *, extFloat80_t * ); | ||||
| void extF80M_rem( const extFloat80_t *, const extFloat80_t *, extFloat80_t * ); | ||||
| void extF80M_sqrt( const extFloat80_t *, extFloat80_t * ); | ||||
| bool extF80M_eq( const extFloat80_t *, const extFloat80_t * ); | ||||
| bool extF80M_le( const extFloat80_t *, const extFloat80_t * ); | ||||
| bool extF80M_lt( const extFloat80_t *, const extFloat80_t * ); | ||||
| bool extF80M_eq_signaling( const extFloat80_t *, const extFloat80_t * ); | ||||
| bool extF80M_le_quiet( const extFloat80_t *, const extFloat80_t * ); | ||||
| bool extF80M_lt_quiet( const extFloat80_t *, const extFloat80_t * ); | ||||
| bool extF80M_isSignalingNaN( const extFloat80_t * ); | ||||
| uint_fast32_t extF80M_to_ui32(const extFloat80_t*, uint_fast8_t, bool); | ||||
| uint_fast64_t extF80M_to_ui64(const extFloat80_t*, uint_fast8_t, bool); | ||||
| int_fast32_t extF80M_to_i32(const extFloat80_t*, uint_fast8_t, bool); | ||||
| int_fast64_t extF80M_to_i64(const extFloat80_t*, uint_fast8_t, bool); | ||||
| uint_fast32_t extF80M_to_ui32_r_minMag(const extFloat80_t*, bool); | ||||
| uint_fast64_t extF80M_to_ui64_r_minMag(const extFloat80_t*, bool); | ||||
| int_fast32_t extF80M_to_i32_r_minMag(const extFloat80_t*, bool); | ||||
| int_fast64_t extF80M_to_i64_r_minMag(const extFloat80_t*, bool); | ||||
| float16_t extF80M_to_f16(const extFloat80_t*); | ||||
| float32_t extF80M_to_f32(const extFloat80_t*); | ||||
| float64_t extF80M_to_f64(const extFloat80_t*); | ||||
| void extF80M_to_f128M(const extFloat80_t*, float128_t*); | ||||
| void extF80M_roundToInt(const extFloat80_t*, uint_fast8_t, bool, extFloat80_t*); | ||||
| void extF80M_add(const extFloat80_t*, const extFloat80_t*, extFloat80_t*); | ||||
| void extF80M_sub(const extFloat80_t*, const extFloat80_t*, extFloat80_t*); | ||||
| void extF80M_mul(const extFloat80_t*, const extFloat80_t*, extFloat80_t*); | ||||
| void extF80M_div(const extFloat80_t*, const extFloat80_t*, extFloat80_t*); | ||||
| void extF80M_rem(const extFloat80_t*, const extFloat80_t*, extFloat80_t*); | ||||
| void extF80M_sqrt(const extFloat80_t*, extFloat80_t*); | ||||
| bool extF80M_eq(const extFloat80_t*, const extFloat80_t*); | ||||
| bool extF80M_le(const extFloat80_t*, const extFloat80_t*); | ||||
| bool extF80M_lt(const extFloat80_t*, const extFloat80_t*); | ||||
| bool extF80M_eq_signaling(const extFloat80_t*, const extFloat80_t*); | ||||
| bool extF80M_le_quiet(const extFloat80_t*, const extFloat80_t*); | ||||
| bool extF80M_lt_quiet(const extFloat80_t*, const extFloat80_t*); | ||||
| bool extF80M_isSignalingNaN(const extFloat80_t*); | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | 128-bit (quadruple-precision) floating-point operations. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #ifdef SOFTFLOAT_FAST_INT64 | ||||
| uint_fast32_t f128_to_ui32( float128_t, uint_fast8_t, bool ); | ||||
| uint_fast64_t f128_to_ui64( float128_t, uint_fast8_t, bool ); | ||||
| int_fast32_t f128_to_i32( float128_t, uint_fast8_t, bool ); | ||||
| int_fast64_t f128_to_i64( float128_t, uint_fast8_t, bool ); | ||||
| uint_fast32_t f128_to_ui32_r_minMag( float128_t, bool ); | ||||
| uint_fast64_t f128_to_ui64_r_minMag( float128_t, bool ); | ||||
| int_fast32_t f128_to_i32_r_minMag( float128_t, bool ); | ||||
| int_fast64_t f128_to_i64_r_minMag( float128_t, bool ); | ||||
| float16_t f128_to_f16( float128_t ); | ||||
| float32_t f128_to_f32( float128_t ); | ||||
| float64_t f128_to_f64( float128_t ); | ||||
| extFloat80_t f128_to_extF80( float128_t ); | ||||
| float128_t f128_roundToInt( float128_t, uint_fast8_t, bool ); | ||||
| float128_t f128_add( float128_t, float128_t ); | ||||
| float128_t f128_sub( float128_t, float128_t ); | ||||
| float128_t f128_mul( float128_t, float128_t ); | ||||
| float128_t f128_mulAdd( float128_t, float128_t, float128_t ); | ||||
| float128_t f128_div( float128_t, float128_t ); | ||||
| float128_t f128_rem( float128_t, float128_t ); | ||||
| float128_t f128_sqrt( float128_t ); | ||||
| bool f128_eq( float128_t, float128_t ); | ||||
| bool f128_le( float128_t, float128_t ); | ||||
| bool f128_lt( float128_t, float128_t ); | ||||
| bool f128_eq_signaling( float128_t, float128_t ); | ||||
| bool f128_le_quiet( float128_t, float128_t ); | ||||
| bool f128_lt_quiet( float128_t, float128_t ); | ||||
| bool f128_isSignalingNaN( float128_t ); | ||||
| uint_fast32_t f128_to_ui32(float128_t, uint_fast8_t, bool); | ||||
| uint_fast64_t f128_to_ui64(float128_t, uint_fast8_t, bool); | ||||
| int_fast32_t f128_to_i32(float128_t, uint_fast8_t, bool); | ||||
| int_fast64_t f128_to_i64(float128_t, uint_fast8_t, bool); | ||||
| uint_fast32_t f128_to_ui32_r_minMag(float128_t, bool); | ||||
| uint_fast64_t f128_to_ui64_r_minMag(float128_t, bool); | ||||
| int_fast32_t f128_to_i32_r_minMag(float128_t, bool); | ||||
| int_fast64_t f128_to_i64_r_minMag(float128_t, bool); | ||||
| float16_t f128_to_f16(float128_t); | ||||
| float32_t f128_to_f32(float128_t); | ||||
| float64_t f128_to_f64(float128_t); | ||||
| extFloat80_t f128_to_extF80(float128_t); | ||||
| float128_t f128_roundToInt(float128_t, uint_fast8_t, bool); | ||||
| float128_t f128_add(float128_t, float128_t); | ||||
| float128_t f128_sub(float128_t, float128_t); | ||||
| float128_t f128_mul(float128_t, float128_t); | ||||
| float128_t f128_mulAdd(float128_t, float128_t, float128_t); | ||||
| float128_t f128_div(float128_t, float128_t); | ||||
| float128_t f128_rem(float128_t, float128_t); | ||||
| float128_t f128_sqrt(float128_t); | ||||
| bool f128_eq(float128_t, float128_t); | ||||
| bool f128_le(float128_t, float128_t); | ||||
| bool f128_lt(float128_t, float128_t); | ||||
| bool f128_eq_signaling(float128_t, float128_t); | ||||
| bool f128_le_quiet(float128_t, float128_t); | ||||
| bool f128_lt_quiet(float128_t, float128_t); | ||||
| bool f128_isSignalingNaN(float128_t); | ||||
| #endif | ||||
| uint_fast32_t f128M_to_ui32( const float128_t *, uint_fast8_t, bool ); | ||||
| uint_fast64_t f128M_to_ui64( const float128_t *, uint_fast8_t, bool ); | ||||
| int_fast32_t f128M_to_i32( const float128_t *, uint_fast8_t, bool ); | ||||
| int_fast64_t f128M_to_i64( const float128_t *, uint_fast8_t, bool ); | ||||
| uint_fast32_t f128M_to_ui32_r_minMag( const float128_t *, bool ); | ||||
| uint_fast64_t f128M_to_ui64_r_minMag( const float128_t *, bool ); | ||||
| int_fast32_t f128M_to_i32_r_minMag( const float128_t *, bool ); | ||||
| int_fast64_t f128M_to_i64_r_minMag( const float128_t *, bool ); | ||||
| float16_t f128M_to_f16( const float128_t * ); | ||||
| float32_t f128M_to_f32( const float128_t * ); | ||||
| float64_t f128M_to_f64( const float128_t * ); | ||||
| void f128M_to_extF80M( const float128_t *, extFloat80_t * ); | ||||
| void f128M_roundToInt( const float128_t *, uint_fast8_t, bool, float128_t * ); | ||||
| void f128M_add( const float128_t *, const float128_t *, float128_t * ); | ||||
| void f128M_sub( const float128_t *, const float128_t *, float128_t * ); | ||||
| void f128M_mul( const float128_t *, const float128_t *, float128_t * ); | ||||
| void | ||||
|  f128M_mulAdd( | ||||
|      const float128_t *, const float128_t *, const float128_t *, float128_t * | ||||
|  ); | ||||
| void f128M_div( const float128_t *, const float128_t *, float128_t * ); | ||||
| void f128M_rem( const float128_t *, const float128_t *, float128_t * ); | ||||
| void f128M_sqrt( const float128_t *, float128_t * ); | ||||
| bool f128M_eq( const float128_t *, const float128_t * ); | ||||
| bool f128M_le( const float128_t *, const float128_t * ); | ||||
| bool f128M_lt( const float128_t *, const float128_t * ); | ||||
| bool f128M_eq_signaling( const float128_t *, const float128_t * ); | ||||
| bool f128M_le_quiet( const float128_t *, const float128_t * ); | ||||
| bool f128M_lt_quiet( const float128_t *, const float128_t * ); | ||||
| bool f128M_isSignalingNaN( const float128_t * ); | ||||
| uint_fast32_t f128M_to_ui32(const float128_t*, uint_fast8_t, bool); | ||||
| uint_fast64_t f128M_to_ui64(const float128_t*, uint_fast8_t, bool); | ||||
| int_fast32_t f128M_to_i32(const float128_t*, uint_fast8_t, bool); | ||||
| int_fast64_t f128M_to_i64(const float128_t*, uint_fast8_t, bool); | ||||
| uint_fast32_t f128M_to_ui32_r_minMag(const float128_t*, bool); | ||||
| uint_fast64_t f128M_to_ui64_r_minMag(const float128_t*, bool); | ||||
| int_fast32_t f128M_to_i32_r_minMag(const float128_t*, bool); | ||||
| int_fast64_t f128M_to_i64_r_minMag(const float128_t*, bool); | ||||
| float16_t f128M_to_f16(const float128_t*); | ||||
| float32_t f128M_to_f32(const float128_t*); | ||||
| float64_t f128M_to_f64(const float128_t*); | ||||
| void f128M_to_extF80M(const float128_t*, extFloat80_t*); | ||||
| void f128M_roundToInt(const float128_t*, uint_fast8_t, bool, float128_t*); | ||||
| void f128M_add(const float128_t*, const float128_t*, float128_t*); | ||||
| void f128M_sub(const float128_t*, const float128_t*, float128_t*); | ||||
| void f128M_mul(const float128_t*, const float128_t*, float128_t*); | ||||
| void f128M_mulAdd(const float128_t*, const float128_t*, const float128_t*, float128_t*); | ||||
| void f128M_div(const float128_t*, const float128_t*, float128_t*); | ||||
| void f128M_rem(const float128_t*, const float128_t*, float128_t*); | ||||
| void f128M_sqrt(const float128_t*, float128_t*); | ||||
| bool f128M_eq(const float128_t*, const float128_t*); | ||||
| bool f128M_le(const float128_t*, const float128_t*); | ||||
| bool f128M_lt(const float128_t*, const float128_t*); | ||||
| bool f128M_eq_signaling(const float128_t*, const float128_t*); | ||||
| bool f128M_le_quiet(const float128_t*, const float128_t*); | ||||
| bool f128M_lt_quiet(const float128_t*, const float128_t*); | ||||
| bool f128M_isSignalingNaN(const float128_t*); | ||||
|  | ||||
| #endif | ||||
|  | ||||
|   | ||||
| @@ -47,10 +47,21 @@ SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
| | the types below may, if desired, be defined as aliases for the native types | ||||
| | (typically 'float' and 'double', and possibly 'long double'). | ||||
| *----------------------------------------------------------------------------*/ | ||||
| typedef struct { uint16_t v; } float16_t; | ||||
| typedef struct { uint32_t v; } float32_t; | ||||
| typedef struct { uint64_t v; } float64_t; | ||||
| typedef struct { uint64_t v[2]; } float128_t; | ||||
| typedef struct { | ||||
|     uint16_t v; | ||||
| } float16_t; | ||||
| typedef struct { | ||||
|     uint16_t v; | ||||
| } bfloat16_t; | ||||
| typedef struct { | ||||
|     uint32_t v; | ||||
| } float32_t; | ||||
| typedef struct { | ||||
|     uint64_t v; | ||||
| } float64_t; | ||||
| typedef struct { | ||||
|     uint64_t v[2]; | ||||
| } float128_t; | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| | The format of an 80-bit extended floating-point number in memory.  This | ||||
| @@ -58,9 +69,15 @@ typedef struct { uint64_t v[2]; } float128_t; | ||||
| | named 'signif'. | ||||
| *----------------------------------------------------------------------------*/ | ||||
| #ifdef LITTLEENDIAN | ||||
| struct extFloat80M { uint64_t signif; uint16_t signExp; }; | ||||
| struct extFloat80M { | ||||
|     uint64_t signif; | ||||
|     uint16_t signExp; | ||||
| }; | ||||
| #else | ||||
| struct extFloat80M { uint16_t signExp; uint64_t signif; }; | ||||
| struct extFloat80M { | ||||
|     uint16_t signExp; | ||||
|     uint64_t signif; | ||||
| }; | ||||
| #endif | ||||
|  | ||||
| /*---------------------------------------------------------------------------- | ||||
| @@ -78,4 +95,3 @@ struct extFloat80M { uint16_t signExp; uint64_t signif; }; | ||||
| typedef struct extFloat80M extFloat80_t; | ||||
|  | ||||
| #endif | ||||
|  | ||||
|   | ||||
| @@ -221,4 +221,3 @@ float32_t | ||||
|     return uZ.f; | ||||
|  | ||||
| } | ||||
|  | ||||
|   | ||||
							
								
								
									
										52
									
								
								softfloat/source/s_normSubnormalBF16Sig.c
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										52
									
								
								softfloat/source/s_normSubnormalBF16Sig.c
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,52 @@ | ||||
|  | ||||
| /*============================================================================ | ||||
|  | ||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| Package, Release 3e, by John R. Hauser. | ||||
|  | ||||
| Copyright 2011, 2012, 2013, 2014, 2015, 2016 The Regents of the University of | ||||
| California.  All rights reserved. | ||||
|  | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| modification, are permitted provided that the following conditions are met: | ||||
|  | ||||
|  1. Redistributions of source code must retain the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer. | ||||
|  | ||||
|  2. Redistributions in binary form must reproduce the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer in the documentation | ||||
|     and/or other materials provided with the distribution. | ||||
|  | ||||
|  3. Neither the name of the University nor the names of its contributors may | ||||
|     be used to endorse or promote products derived from this software without | ||||
|     specific prior written permission. | ||||
|  | ||||
| THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY | ||||
| EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | ||||
| WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE | ||||
| DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY | ||||
| DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | ||||
| (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | ||||
| LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND | ||||
| ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | ||||
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| =============================================================================*/ | ||||
|  | ||||
| #include <stdint.h> | ||||
| #include "platform.h" | ||||
| #include "internals.h" | ||||
|  | ||||
| struct exp8_sig16 softfloat_normSubnormalBF16Sig( uint_fast16_t sig ) | ||||
| { | ||||
|     int_fast8_t shiftDist; | ||||
|     struct exp8_sig16 z; | ||||
|  | ||||
|     shiftDist = softfloat_countLeadingZeros16( sig ) - 8; | ||||
|     z.exp = 1 - shiftDist; | ||||
|     z.sig = sig<<shiftDist; | ||||
|     return z; | ||||
|  | ||||
| } | ||||
|  | ||||
							
								
								
									
										114
									
								
								softfloat/source/s_roundPackToBF16.c
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										114
									
								
								softfloat/source/s_roundPackToBF16.c
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,114 @@ | ||||
|  | ||||
| /*============================================================================ | ||||
|  | ||||
| This C source file is part of the SoftFloat IEEE Floating-Point Arithmetic | ||||
| Package, Release 3e, by John R. Hauser. | ||||
|  | ||||
| Copyright 2011, 2012, 2013, 2014, 2015, 2017 The Regents of the University of | ||||
| California.  All rights reserved. | ||||
|  | ||||
| Redistribution and use in source and binary forms, with or without | ||||
| modification, are permitted provided that the following conditions are met: | ||||
|  | ||||
|  1. Redistributions of source code must retain the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer. | ||||
|  | ||||
|  2. Redistributions in binary form must reproduce the above copyright notice, | ||||
|     this list of conditions, and the following disclaimer in the documentation | ||||
|     and/or other materials provided with the distribution. | ||||
|  | ||||
|  3. Neither the name of the University nor the names of its contributors may | ||||
|     be used to endorse or promote products derived from this software without | ||||
|     specific prior written permission. | ||||
|  | ||||
| THIS SOFTWARE IS PROVIDED BY THE REGENTS AND CONTRIBUTORS "AS IS", AND ANY | ||||
| EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED | ||||
| WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE, ARE | ||||
| DISCLAIMED.  IN NO EVENT SHALL THE REGENTS OR CONTRIBUTORS BE LIABLE FOR ANY | ||||
| DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES | ||||
| (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; | ||||
| LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND | ||||
| ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | ||||
| (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS | ||||
| SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | ||||
|  | ||||
| =============================================================================*/ | ||||
|  | ||||
| #include <stdbool.h> | ||||
| #include <stdint.h> | ||||
| #include "platform.h" | ||||
| #include "internals.h" | ||||
| #include "softfloat.h" | ||||
|  | ||||
| /** sig last significant bit is sig[7], the 7 LSBs will be used for rounding */ | ||||
| bfloat16_t | ||||
|  softfloat_roundPackToBF16( bool sign, int_fast16_t exp, uint_fast16_t sig ) | ||||
| { | ||||
|     uint_fast8_t roundingMode; | ||||
|     bool roundNearEven; | ||||
|     uint_fast8_t roundIncrement, roundBits; | ||||
|     bool isTiny; | ||||
|     uint_fast16_t uiZ; | ||||
|     union ui16_bf16 uZ; | ||||
|  | ||||
|     /*------------------------------------------------------------------------ | ||||
|     *------------------------------------------------------------------------*/ | ||||
|     roundingMode = softfloat_roundingMode; | ||||
|     roundNearEven = (roundingMode == softfloat_round_near_even); | ||||
|     roundIncrement = 0x40; | ||||
|     if ( ! roundNearEven && (roundingMode != softfloat_round_near_maxMag) ) { | ||||
|         roundIncrement = | ||||
|             (roundingMode | ||||
|                  == (sign ? softfloat_round_min : softfloat_round_max)) | ||||
|                 ? 0x7F | ||||
|                 : 0; | ||||
|     } | ||||
|     roundBits = sig & 0x7F; | ||||
|     /*------------------------------------------------------------------------ | ||||
|     *------------------------------------------------------------------------*/ | ||||
|     if ( 0xFD <= (unsigned int) exp ) { | ||||
|         if ( exp < 0 ) { | ||||
|             /*---------------------------------------------------------------- | ||||
|             *----------------------------------------------------------------*/ | ||||
|             isTiny = | ||||
|                 (softfloat_detectTininess == softfloat_tininess_beforeRounding) | ||||
|                     || (exp < -1) || (sig + roundIncrement < 0x8000); | ||||
|             sig = softfloat_shiftRightJam32( sig, -exp ); | ||||
|             exp = 0; | ||||
|             roundBits = sig & 0x7F; | ||||
|             if ( isTiny && roundBits ) { | ||||
|                 softfloat_raiseFlags( softfloat_flag_underflow ); | ||||
|             } | ||||
|         } else if ( (0xFD < exp) || (0x8000 <= sig + roundIncrement) ) { | ||||
|             /*---------------------------------------------------------------- | ||||
|             *----------------------------------------------------------------*/ | ||||
|             softfloat_raiseFlags( | ||||
|                 softfloat_flag_overflow | softfloat_flag_inexact ); | ||||
|             uiZ = packToBF16UI( sign, 0xFF, 0 ) - ! roundIncrement; | ||||
|             goto uiZ; | ||||
|         } | ||||
|     } | ||||
|     /*------------------------------------------------------------------------ | ||||
|     *------------------------------------------------------------------------*/ | ||||
|     sig = (sig + roundIncrement)>>7; | ||||
|     if ( roundBits ) { | ||||
|         softfloat_exceptionFlags |= softfloat_flag_inexact; | ||||
| #ifdef SOFTFLOAT_ROUND_ODD | ||||
|         if ( roundingMode == softfloat_round_odd ) { | ||||
|             sig |= 1; | ||||
|             goto packReturn; | ||||
|         } | ||||
| #endif | ||||
|     } | ||||
|     sig &= ~(uint_fast16_t) (! (roundBits ^ 0x40) & roundNearEven); | ||||
|     if ( ! sig ) exp = 0; | ||||
|     /*------------------------------------------------------------------------ | ||||
|     *------------------------------------------------------------------------*/ | ||||
|  packReturn: | ||||
|     uiZ = packToBF16UI( sign, exp, sig ); | ||||
|  uiZ: | ||||
|     uZ.ui = uiZ; | ||||
|     return uZ.f; | ||||
|  | ||||
| } | ||||
|  | ||||
							
								
								
									
										35
									
								
								src/elfio.cpp
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										35
									
								
								src/elfio.cpp
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,35 @@ | ||||
| #ifdef _MSC_VER | ||||
| #define _SCL_SECURE_NO_WARNINGS | ||||
| #define ELFIO_NO_INTTYPES | ||||
| #endif | ||||
|  | ||||
| #include <elfio/elfio_dump.hpp> | ||||
| #include <iostream> | ||||
|  | ||||
| using namespace ELFIO; | ||||
|  | ||||
| int main(int argc, char** argv) { | ||||
|     if(argc != 2) { | ||||
|         printf("Usage: elfdump <file_name>\n"); | ||||
|         return 1; | ||||
|     } | ||||
|  | ||||
|     elfio reader; | ||||
|  | ||||
|     if(!reader.load(argv[1])) { | ||||
|         printf("File %s is not found or it is not an ELF file\n", argv[1]); | ||||
|         return 1; | ||||
|     } | ||||
|  | ||||
|     dump::header(std::cout, reader); | ||||
|     dump::section_headers(std::cout, reader); | ||||
|     dump::segment_headers(std::cout, reader); | ||||
|     dump::symbol_tables(std::cout, reader); | ||||
|     dump::notes(std::cout, reader); | ||||
|     dump::modinfo(std::cout, reader); | ||||
|     dump::dynamic_tags(std::cout, reader); | ||||
|     dump::section_datas(std::cout, reader); | ||||
|     dump::segment_datas(std::cout, reader); | ||||
|  | ||||
|     return 0; | ||||
| } | ||||
| @@ -35,6 +35,7 @@ | ||||
| #ifndef _RISCV_HART_M_P_HWL_H | ||||
| #define _RISCV_HART_M_P_HWL_H | ||||
|  | ||||
| #include "riscv_hart_common.h" | ||||
| #include <iss/vm_types.h> | ||||
|  | ||||
| namespace iss { | ||||
| @@ -50,45 +51,67 @@ public: | ||||
|     virtual ~hwl() = default; | ||||
|  | ||||
| protected: | ||||
|     iss::status read_custom_csr_reg(unsigned addr, reg_t &val) override; | ||||
|     iss::status write_custom_csr_reg(unsigned addr, reg_t val) override; | ||||
|     iss::status read_custom_csr(unsigned addr, reg_t& val) override; | ||||
|     iss::status write_custom_csr(unsigned addr, reg_t val) override; | ||||
| }; | ||||
|  | ||||
|  | ||||
| template<typename BASE> | ||||
| inline hwl<BASE>::hwl(feature_config cfg): BASE(cfg) { | ||||
|     for (unsigned addr = 0x800; addr < 0x803; ++addr){ | ||||
| template <typename BASE> | ||||
| inline hwl<BASE>::hwl(feature_config cfg) | ||||
| : BASE(cfg) { | ||||
|     for(unsigned addr = 0x800; addr < 0x803; ++addr) { | ||||
|         this->register_custom_csr_rd(addr); | ||||
|         this->register_custom_csr_wr(addr); | ||||
|     } | ||||
|     for (unsigned addr = 0x804; addr < 0x807; ++addr){ | ||||
|     for(unsigned addr = 0x804; addr < 0x807; ++addr) { | ||||
|         this->register_custom_csr_rd(addr); | ||||
|         this->register_custom_csr_wr(addr); | ||||
|     } | ||||
| } | ||||
|  | ||||
| template<typename BASE> | ||||
| inline iss::status iss::arch::hwl<BASE>::read_custom_csr_reg(unsigned addr, reg_t &val) { | ||||
|     switch(addr){ | ||||
|     case 0x800: val = this->reg.lpstart0; break; | ||||
|     case 0x801: val = this->reg.lpend0;   break; | ||||
|     case 0x802: val = this->reg.lpcount0; break; | ||||
|     case 0x804: val = this->reg.lpstart1; break; | ||||
|     case 0x805: val = this->reg.lpend1;   break; | ||||
|     case 0x806: val = this->reg.lpcount1; break; | ||||
| template <typename BASE> inline iss::status iss::arch::hwl<BASE>::read_custom_csr(unsigned addr, reg_t& val) { | ||||
|     switch(addr) { | ||||
|     case 0x800: | ||||
|         val = this->reg.lpstart0; | ||||
|         break; | ||||
|     case 0x801: | ||||
|         val = this->reg.lpend0; | ||||
|         break; | ||||
|     case 0x802: | ||||
|         val = this->reg.lpcount0; | ||||
|         break; | ||||
|     case 0x804: | ||||
|         val = this->reg.lpstart1; | ||||
|         break; | ||||
|     case 0x805: | ||||
|         val = this->reg.lpend1; | ||||
|         break; | ||||
|     case 0x806: | ||||
|         val = this->reg.lpcount1; | ||||
|         break; | ||||
|     } | ||||
|     return iss::Ok; | ||||
| } | ||||
|  | ||||
| template<typename BASE> | ||||
| inline iss::status iss::arch::hwl<BASE>::write_custom_csr_reg(unsigned addr, reg_t val) { | ||||
|     switch(addr){ | ||||
|     case 0x800: this->reg.lpstart0 = val; break; | ||||
|     case 0x801: this->reg.lpend0   = val; break; | ||||
|     case 0x802: this->reg.lpcount0 = val; break; | ||||
|     case 0x804: this->reg.lpstart1 = val; break; | ||||
|     case 0x805: this->reg.lpend1   = val; break; | ||||
|     case 0x806: this->reg.lpcount1 = val; break; | ||||
| template <typename BASE> inline iss::status iss::arch::hwl<BASE>::write_custom_csr(unsigned addr, reg_t val) { | ||||
|     switch(addr) { | ||||
|     case 0x800: | ||||
|         this->reg.lpstart0 = val; | ||||
|         break; | ||||
|     case 0x801: | ||||
|         this->reg.lpend0 = val; | ||||
|         break; | ||||
|     case 0x802: | ||||
|         this->reg.lpcount0 = val; | ||||
|         break; | ||||
|     case 0x804: | ||||
|         this->reg.lpstart1 = val; | ||||
|         break; | ||||
|     case 0x805: | ||||
|         this->reg.lpend1 = val; | ||||
|         break; | ||||
|     case 0x806: | ||||
|         this->reg.lpcount1 = val; | ||||
|         break; | ||||
|     } | ||||
|     return iss::Ok; | ||||
| } | ||||
| @@ -96,5 +119,4 @@ inline iss::status iss::arch::hwl<BASE>::write_custom_csr_reg(unsigned addr, reg | ||||
| } // namespace arch | ||||
| } // namespace iss | ||||
|  | ||||
|  | ||||
| #endif /* _RISCV_HART_M_P_H */ | ||||
|   | ||||
| @@ -35,15 +35,31 @@ | ||||
| #ifndef _RISCV_HART_COMMON | ||||
| #define _RISCV_HART_COMMON | ||||
|  | ||||
| #include "iss/arch_if.h" | ||||
| #include "iss/vm_types.h" | ||||
| #include <array> | ||||
| #include <cstdint> | ||||
| #include <elfio/elfio.hpp> | ||||
| #include <fmt/format.h> | ||||
| #include <iss/arch_if.h> | ||||
| #include <iss/log_categories.h> | ||||
| #include <limits> | ||||
| #include <sstream> | ||||
| #include <string> | ||||
| #include <unordered_map> | ||||
| #include <util/logging.h> | ||||
|  | ||||
| #if defined(__GNUC__) | ||||
| #define likely(x) ::__builtin_expect(!!(x), 1) | ||||
| #define unlikely(x) ::__builtin_expect(!!(x), 0) | ||||
| #else | ||||
| #define likely(x) x | ||||
| #define unlikely(x) x | ||||
| #endif | ||||
|  | ||||
| namespace iss { | ||||
| namespace arch { | ||||
|  | ||||
| enum { tohost_dflt = 0xF0001000, fromhost_dflt = 0xF0001040 }; | ||||
|  | ||||
| enum features_e{FEAT_NONE, FEAT_PMP=1, FEAT_EXT_N=2, FEAT_CLIC=4, FEAT_DEBUG=8, FEAT_TCM=16}; | ||||
| enum features_e { FEAT_NONE, FEAT_PMP = 1, FEAT_EXT_N = 2, FEAT_CLIC = 4, FEAT_DEBUG = 8, FEAT_TCM = 16 }; | ||||
|  | ||||
| enum riscv_csr { | ||||
|     /* user-level CSR */ | ||||
| @@ -51,17 +67,17 @@ enum riscv_csr { | ||||
|     ustatus = 0x000, | ||||
|     uie = 0x004, | ||||
|     utvec = 0x005, | ||||
|     utvt = 0x007, //CLIC | ||||
|     utvt = 0x007, // CLIC | ||||
|     // User Trap Handling | ||||
|     uscratch = 0x040, | ||||
|     uepc = 0x041, | ||||
|     ucause = 0x042, | ||||
|     utval = 0x043, | ||||
|     uip = 0x044, | ||||
|     uxnti = 0x045, //CLIC | ||||
|     uintstatus   = 0xCB1, // MRW Current interrupt levels (CLIC) - addr subject to change | ||||
|     uintthresh   = 0x047, // MRW Interrupt-level threshold (CLIC) - addr subject to change | ||||
|     uscratchcsw  = 0x048, // MRW Conditional scratch swap on priv mode change (CLIC) | ||||
|     uxnti = 0x045,        // CLIC | ||||
|     uintstatus = 0xCB1,   // MRW Current interrupt levels (CLIC) - addr subject to change | ||||
|     uintthresh = 0x047,   // MRW Interrupt-level threshold (CLIC) - addr subject to change | ||||
|     uscratchcsw = 0x048,  // MRW Conditional scratch swap on priv mode change (CLIC) | ||||
|     uscratchcswl = 0x049, // MRW Conditional scratch swap on level change (CLIC) | ||||
|     // User Floating-Point CSRs | ||||
|     fflags = 0x001, | ||||
| @@ -112,17 +128,17 @@ enum riscv_csr { | ||||
|     mie = 0x304, | ||||
|     mtvec = 0x305, | ||||
|     mcounteren = 0x306, | ||||
|     mtvt = 0x307, //CLIC | ||||
|     mtvt = 0x307, // CLIC | ||||
|     // Machine Trap Handling | ||||
|     mscratch = 0x340, | ||||
|     mepc = 0x341, | ||||
|     mcause = 0x342, | ||||
|     mtval = 0x343, | ||||
|     mip = 0x344, | ||||
|     mxnti = 0x345, //CLIC | ||||
|     mintstatus   = 0xFB1, // MRW Current interrupt levels (CLIC) - addr subject to change | ||||
|     mintthresh   = 0x347, // MRW Interrupt-level threshold (CLIC) - addr subject to change | ||||
|     mscratchcsw  = 0x348, // MRW Conditional scratch swap on priv mode change (CLIC) | ||||
|     mxnti = 0x345,        // CLIC | ||||
|     mintstatus = 0xFB1,   // MRW Current interrupt levels (CLIC) - addr subject to change | ||||
|     mintthresh = 0x347,   // MRW Interrupt-level threshold (CLIC) - addr subject to change | ||||
|     mscratchcsw = 0x348,  // MRW Conditional scratch swap on priv mode change (CLIC) | ||||
|     mscratchcswl = 0x349, // MRW Conditional scratch swap on level change (CLIC) | ||||
|     // Physical Memory Protection | ||||
|     pmpcfg0 = 0x3A0, | ||||
| @@ -175,7 +191,6 @@ enum riscv_csr { | ||||
|     dscratch1 = 0x7B3 | ||||
| }; | ||||
|  | ||||
|  | ||||
| enum { | ||||
|     PGSHIFT = 12, | ||||
|     PTE_PPN_SHIFT = 10, | ||||
| @@ -193,7 +208,7 @@ enum { | ||||
|  | ||||
| template <typename T> inline bool PTE_TABLE(T PTE) { return (((PTE) & (PTE_V | PTE_R | PTE_W | PTE_X)) == PTE_V); } | ||||
|  | ||||
| enum { PRIV_U = 0, PRIV_S = 1, PRIV_M = 3, PRIV_D = 4}; | ||||
| enum { PRIV_U = 0, PRIV_S = 1, PRIV_M = 3, PRIV_D = 4 }; | ||||
|  | ||||
| enum { | ||||
|     ISA_A = 1, | ||||
| @@ -256,49 +271,147 @@ public: | ||||
|     : trap_access(15 << 16, badaddr) {} | ||||
| }; | ||||
|  | ||||
| inline void read_reg_uint32(uint64_t offs, uint32_t& reg, uint8_t *const data, unsigned length) { | ||||
| inline void read_reg_uint32(uint64_t offs, uint32_t& reg, uint8_t* const data, unsigned length) { | ||||
|     auto reg_ptr = reinterpret_cast<uint8_t*>(®); | ||||
|     switch (offs & 0x3) { | ||||
|     switch(offs & 0x3) { | ||||
|     case 0: | ||||
|         for (auto i = 0U; i < length; ++i) | ||||
|         for(auto i = 0U; i < length; ++i) | ||||
|             *(data + i) = *(reg_ptr + i); | ||||
|     break; | ||||
|         break; | ||||
|     case 1: | ||||
|         for (auto i = 0U; i < length; ++i) | ||||
|         for(auto i = 0U; i < length; ++i) | ||||
|             *(data + i) = *(reg_ptr + 1 + i); | ||||
|     break; | ||||
|         break; | ||||
|     case 2: | ||||
|         for (auto i = 0U; i < length; ++i) | ||||
|         for(auto i = 0U; i < length; ++i) | ||||
|             *(data + i) = *(reg_ptr + 2 + i); | ||||
|     break; | ||||
|         break; | ||||
|     case 3: | ||||
|         *data = *(reg_ptr + 3); | ||||
|     break; | ||||
|         break; | ||||
|     } | ||||
| } | ||||
|  | ||||
| inline void write_reg_uint32(uint64_t offs, uint32_t& reg, const uint8_t *const data, unsigned length) { | ||||
| inline void write_reg_uint32(uint64_t offs, uint32_t& reg, const uint8_t* const data, unsigned length) { | ||||
|     auto reg_ptr = reinterpret_cast<uint8_t*>(®); | ||||
|     switch (offs & 0x3) { | ||||
|     switch(offs & 0x3) { | ||||
|     case 0: | ||||
|         for (auto i = 0U; i < length; ++i) | ||||
|         for(auto i = 0U; i < length; ++i) | ||||
|             *(reg_ptr + i) = *(data + i); | ||||
|     break; | ||||
|         break; | ||||
|     case 1: | ||||
|         for (auto i = 0U; i < length; ++i) | ||||
|         for(auto i = 0U; i < length; ++i) | ||||
|             *(reg_ptr + 1 + i) = *(data + i); | ||||
|     break; | ||||
|         break; | ||||
|     case 2: | ||||
|         for (auto i = 0U; i < length; ++i) | ||||
|         for(auto i = 0U; i < length; ++i) | ||||
|             *(reg_ptr + 2 + i) = *(data + i); | ||||
|     break; | ||||
|         break; | ||||
|     case 3: | ||||
|         *(reg_ptr + 3) = *data ; | ||||
|     break; | ||||
|         *(reg_ptr + 3) = *data; | ||||
|         break; | ||||
|     } | ||||
| } | ||||
| struct riscv_hart_common { | ||||
|     riscv_hart_common(){}; | ||||
|     ~riscv_hart_common() { | ||||
|         if(io_buf.str().length()) { | ||||
|             CPPLOG(INFO) << "tohost send '" << io_buf.str() << "'"; | ||||
|         } | ||||
|     }; | ||||
|     std::unordered_map<std::string, uint64_t> symbol_table; | ||||
|     uint64_t entry_address{0}; | ||||
|     uint64_t tohost = std::numeric_limits<uint64_t>::max(); | ||||
|     uint64_t fromhost = std::numeric_limits<uint64_t>::max(); | ||||
|     std::stringstream io_buf; | ||||
|  | ||||
| } | ||||
| } | ||||
|     bool read_elf_file(std::string name, uint8_t expected_elf_class, | ||||
|                        std::function<iss::status(uint64_t, uint64_t, const uint8_t* const)> cb) { | ||||
|         // Create elfio reader | ||||
|         ELFIO::elfio reader; | ||||
|         // Load ELF data | ||||
|         if(reader.load(name)) { | ||||
|             // check elf properties | ||||
|             if(reader.get_class() != expected_elf_class) | ||||
|                 return false; | ||||
|             if(reader.get_type() != ELFIO::ET_EXEC) | ||||
|                 return false; | ||||
|             if(reader.get_machine() != ELFIO::EM_RISCV) | ||||
|                 return false; | ||||
|             entry_address = reader.get_entry(); | ||||
|             for(const auto& pseg : reader.segments) { | ||||
|                 const auto fsize = pseg->get_file_size(); // 0x42c/0x0 | ||||
|                 const auto seg_data = pseg->get_data(); | ||||
|                 const auto type = pseg->get_type(); | ||||
|                 if(type == 1 && fsize > 0) { | ||||
|                     auto res = cb(pseg->get_physical_address(), fsize, reinterpret_cast<const uint8_t* const>(seg_data)); | ||||
|                     if(res != iss::Ok) | ||||
|                         CPPLOG(ERR) << "problem writing " << fsize << "bytes to 0x" << std::hex << pseg->get_physical_address(); | ||||
|                 } | ||||
|             } | ||||
|             const auto sym_sec = reader.sections[".symtab"]; | ||||
|             if(ELFIO::SHT_SYMTAB == sym_sec->get_type() || ELFIO::SHT_DYNSYM == sym_sec->get_type()) { | ||||
|                 ELFIO::symbol_section_accessor symbols(reader, sym_sec); | ||||
|                 auto sym_no = symbols.get_symbols_num(); | ||||
|                 std::string name; | ||||
|                 ELFIO::Elf64_Addr value = 0; | ||||
|                 ELFIO::Elf_Xword size = 0; | ||||
|                 unsigned char bind = 0; | ||||
|                 unsigned char type = 0; | ||||
|                 ELFIO::Elf_Half section = 0; | ||||
|                 unsigned char other = 0; | ||||
|                 for(auto i = 0U; i < sym_no; ++i) { | ||||
|                     symbols.get_symbol(i, name, value, size, bind, type, section, other); | ||||
|                     if(name != "") { | ||||
|                         this->symbol_table[name] = value; | ||||
| #ifndef NDEBUG | ||||
|                         CPPLOG(DEBUG) << "Found Symbol " << name; | ||||
| #endif | ||||
|                     } | ||||
|                 } | ||||
|                 try { | ||||
|                     tohost = symbol_table.at("tohost"); | ||||
|                 } catch(std::out_of_range& e) { | ||||
|                 } | ||||
|                 try { | ||||
|                     fromhost = symbol_table.at("fromhost"); | ||||
|                 } catch(std::out_of_range& e) { | ||||
|                 } | ||||
|             } | ||||
|             return true; | ||||
|         } | ||||
|         return false; | ||||
|     }; | ||||
|     iss::status execute_sys_write(arch_if* aif, const std::array<uint64_t, 8>& loaded_payload, unsigned mem_type) { | ||||
|         uint64_t fd = loaded_payload[1]; | ||||
|         uint64_t buf_ptr = loaded_payload[2]; | ||||
|         uint64_t len = loaded_payload[3]; | ||||
|         std::vector<char> buf(len); | ||||
|         if(aif->read(address_type::PHYSICAL, access_type::DEBUG_READ, mem_type, buf_ptr, len, reinterpret_cast<uint8_t*>(buf.data()))) { | ||||
|             CPPLOG(ERR) << "SYS_WRITE buffer read went wrong"; | ||||
|             return iss::Err; | ||||
|         } | ||||
|         // we disregard the fd and just log to stdout | ||||
|         for(size_t i = 0; i < len; i++) { | ||||
|             if(buf[i] == '\n' || buf[i] == '\0') { | ||||
|                 CPPLOG(INFO) << "tohost send '" << io_buf.str() << "'"; | ||||
|                 io_buf.str(""); | ||||
|             } else | ||||
|                 io_buf << buf[i]; | ||||
|         } | ||||
|  | ||||
|         // Not sure what the correct return value should be | ||||
|         uint8_t ret_val = 1; | ||||
|         if(fromhost != std::numeric_limits<uint64_t>::max()) | ||||
|             if(aif->write(address_type::PHYSICAL, access_type::DEBUG_WRITE, mem_type, fromhost, 1, &ret_val)) { | ||||
|                 CPPLOG(ERR) << "Fromhost write went wrong"; | ||||
|                 return iss::Err; | ||||
|             } | ||||
|         return iss::Ok; | ||||
|     } | ||||
| }; | ||||
|  | ||||
| } // namespace arch | ||||
| } // namespace iss | ||||
|  | ||||
| #endif | ||||
|   | ||||
										
											
												File diff suppressed because it is too large
												Load Diff
											
										
									
								
							
										
											
												File diff suppressed because it is too large
												Load Diff
											
										
									
								
							
										
											
												File diff suppressed because it is too large
												Load Diff
											
										
									
								
							| @@ -1,5 +1,5 @@ | ||||
| /******************************************************************************* | ||||
|  * Copyright (C) 2017 - 2020 MINRES Technologies GmbH | ||||
|  * Copyright (C) 2024 MINRES Technologies GmbH | ||||
|  * All rights reserved. | ||||
|  * | ||||
|  * Redistribution and use in source and binary forms, with or without | ||||
| @@ -30,6 +30,7 @@ | ||||
|  * | ||||
|  *******************************************************************************/ | ||||
|  | ||||
| // clang-format off | ||||
| #include "tgc5c.h" | ||||
| #include "util/ities.h" | ||||
| #include <util/logging.h> | ||||
| @@ -66,4 +67,4 @@ uint8_t *tgc5c::get_regs_base_ptr() { | ||||
| tgc5c::phys_addr_t tgc5c::virt2phys(const iss::addr_t &addr) { | ||||
|     return phys_addr_t(addr.access, addr.space, addr.val&traits<tgc5c>::addr_mask); | ||||
| } | ||||
|  | ||||
| // clang-format on | ||||
|   | ||||
										
											
												File diff suppressed because one or more lines are too long
											
										
									
								
							| @@ -15,36 +15,43 @@ using tgc5a_plat_type = iss::arch::riscv_hart_m_p<iss::arch::tgc5a>; | ||||
| using tgc5b_plat_type = iss::arch::riscv_hart_m_p<iss::arch::tgc5b>; | ||||
| #endif | ||||
| #ifdef CORE_TGC5C_XRB_NN | ||||
| #include "riscv_hart_m_p.h" | ||||
| #include "hwl.h" | ||||
| #include "riscv_hart_m_p.h" | ||||
| #include <iss/arch/tgc5c_xrb_nn.h> | ||||
| using tgc5c_xrb_nn_plat_type = iss::arch::hwl<iss::arch::riscv_hart_m_p<iss::arch::tgc5c_xrb_nn>>; | ||||
| #endif | ||||
| #ifdef CORE_TGC5D | ||||
| #include "riscv_hart_mu_p.h" | ||||
| #include <iss/arch/tgc5d.h> | ||||
| using tgc5d_plat_type = iss::arch::riscv_hart_mu_p<iss::arch::tgc5d, (iss::arch::features_e)(iss::arch::FEAT_PMP | iss::arch::FEAT_CLIC | iss::arch::FEAT_EXT_N)>; | ||||
| using tgc5d_plat_type = iss::arch::riscv_hart_mu_p<iss::arch::tgc5d, (iss::arch::features_e)(iss::arch::FEAT_PMP | iss::arch::FEAT_CLIC | | ||||
|                                                                                              iss::arch::FEAT_EXT_N)>; | ||||
| #endif | ||||
| #ifdef CORE_TGC5D_XRB_MAC | ||||
| #include "riscv_hart_mu_p.h" | ||||
| #include <iss/arch/tgc5d_xrb_mac.h> | ||||
| using tgc5d_xrb_mac_plat_type = iss::arch::riscv_hart_mu_p<iss::arch::tgc5d_xrb_mac, (iss::arch::features_e)(iss::arch::FEAT_PMP | iss::arch::FEAT_CLIC | iss::arch::FEAT_EXT_N)>; | ||||
| using tgc5d_xrb_mac_plat_type = | ||||
|     iss::arch::riscv_hart_mu_p<iss::arch::tgc5d_xrb_mac, | ||||
|                                (iss::arch::features_e)(iss::arch::FEAT_PMP | iss::arch::FEAT_CLIC | iss::arch::FEAT_EXT_N)>; | ||||
| #endif | ||||
| #ifdef CORE_TGC5D_XRB_NN | ||||
| #include "riscv_hart_mu_p.h" | ||||
| #include "hwl.h" | ||||
| #include "riscv_hart_mu_p.h" | ||||
| #include <iss/arch/tgc5d_xrb_nn.h> | ||||
| using tgc5d_xrb_nn_plat_type = iss::arch::hwl<iss::arch::riscv_hart_mu_p<iss::arch::tgc5d_xrb_nn, (iss::arch::features_e)(iss::arch::FEAT_PMP | iss::arch::FEAT_CLIC | iss::arch::FEAT_EXT_N)>>; | ||||
| using tgc5d_xrb_nn_plat_type = | ||||
|     iss::arch::hwl<iss::arch::riscv_hart_mu_p<iss::arch::tgc5d_xrb_nn, | ||||
|                                               (iss::arch::features_e)(iss::arch::FEAT_PMP | iss::arch::FEAT_CLIC | iss::arch::FEAT_EXT_N)>>; | ||||
| #endif | ||||
| #ifdef CORE_TGC5E | ||||
| #include "riscv_hart_mu_p.h" | ||||
| #include <iss/arch/tgc5e.h> | ||||
| using tgc5e_plat_type = iss::arch::riscv_hart_mu_p<iss::arch::tgc5e, (iss::arch::features_e)(iss::arch::FEAT_PMP | iss::arch::FEAT_CLIC | iss::arch::FEAT_EXT_N)>; | ||||
| using tgc5e_plat_type = iss::arch::riscv_hart_mu_p<iss::arch::tgc5e, (iss::arch::features_e)(iss::arch::FEAT_PMP | iss::arch::FEAT_CLIC | | ||||
|                                                                                              iss::arch::FEAT_EXT_N)>; | ||||
| #endif | ||||
| #ifdef CORE_TGC5X | ||||
| #include "riscv_hart_mu_p.h" | ||||
| #include <iss/arch/tgc5x.h> | ||||
| using tgc5x_plat_type = iss::arch::riscv_hart_mu_p<iss::arch::tgc5x, (iss::arch::features_e)(iss::arch::FEAT_PMP | iss::arch::FEAT_CLIC | iss::arch::FEAT_EXT_N | iss::arch::FEAT_TCM)>; | ||||
| using tgc5x_plat_type = iss::arch::riscv_hart_mu_p<iss::arch::tgc5x, (iss::arch::features_e)(iss::arch::FEAT_PMP | iss::arch::FEAT_CLIC | | ||||
|                                                                                              iss::arch::FEAT_EXT_N | iss::arch::FEAT_TCM)>; | ||||
| #endif | ||||
|  | ||||
| #endif | ||||
|   | ||||
| @@ -36,25 +36,27 @@ | ||||
| #define _RISCV_HART_M_P_WT_CACHE_H | ||||
|  | ||||
| #include <iss/vm_types.h> | ||||
| #include <util/ities.h> | ||||
| #include <vector> | ||||
| #include <map> | ||||
| #include <memory> | ||||
| #include <util/ities.h> | ||||
| #include <vector> | ||||
|  | ||||
| namespace iss { | ||||
| namespace arch { | ||||
| namespace cache { | ||||
|  | ||||
| enum class state { INVALID, VALID}; | ||||
| enum class state { INVALID, VALID }; | ||||
| struct line { | ||||
|     uint64_t tag_addr{0}; | ||||
|     state st{state::INVALID}; | ||||
|     std::vector<uint8_t> data; | ||||
|     line(unsigned line_sz):  data(line_sz) {} | ||||
|     line(unsigned line_sz) | ||||
|     : data(line_sz) {} | ||||
| }; | ||||
| struct set { | ||||
|     std::vector<line> ways; | ||||
|     set(unsigned ways_count, line const& l): ways(ways_count, l) {} | ||||
|     set(unsigned ways_count, line const& l) | ||||
|     : ways(ways_count, l) {} | ||||
| }; | ||||
| struct cache { | ||||
|     std::vector<set> sets; | ||||
| @@ -62,14 +64,14 @@ struct cache { | ||||
|     cache(unsigned size, unsigned line_sz, unsigned ways) { | ||||
|         line const ref_line{line_sz}; | ||||
|         set const ref_set{ways, ref_line}; | ||||
|         sets.resize(size/(ways*line_sz), ref_set); | ||||
|         sets.resize(size / (ways * line_sz), ref_set); | ||||
|     } | ||||
| }; | ||||
|  | ||||
| struct wt_policy { | ||||
|     bool is_cacheline_hit(cache& c ); | ||||
|     bool is_cacheline_hit(cache& c); | ||||
| }; | ||||
| } | ||||
| } // namespace cache | ||||
|  | ||||
| // write thru, allocate on read, direct mapped or set-associative with round-robin replacement policy | ||||
| template <typename BASE> class wt_cache : public BASE { | ||||
| @@ -85,82 +87,77 @@ public: | ||||
|     virtual ~wt_cache() = default; | ||||
|  | ||||
|     unsigned size{4096}; | ||||
|     unsigned line_sz{32}; | ||||
|     unsigned line_sz{64}; | ||||
|     unsigned ways{1}; | ||||
|     uint64_t io_address{0xf0000000}; | ||||
|     uint64_t io_addr_mask{0xf0000000}; | ||||
|  | ||||
| protected: | ||||
|     iss::status read_cache(phys_addr_t addr, unsigned, uint8_t *const); | ||||
|     iss::status write_cache(phys_addr_t addr, unsigned, uint8_t const *const); | ||||
|     iss::status read_cache(phys_addr_t addr, unsigned, uint8_t* const); | ||||
|     iss::status write_cache(phys_addr_t addr, unsigned, uint8_t const* const); | ||||
|     std::function<mem_read_f> cache_mem_rd_delegate; | ||||
|     std::function<mem_write_f> cache_mem_wr_delegate; | ||||
|     std::unique_ptr<cache::cache> dcache_ptr; | ||||
|     std::unique_ptr<cache::cache> icache_ptr; | ||||
|     size_t get_way_select() { | ||||
|         return 0; | ||||
|     } | ||||
|     size_t get_way_select() { return 0; } | ||||
| }; | ||||
|  | ||||
|  | ||||
| template<typename BASE> | ||||
| template <typename BASE> | ||||
| inline wt_cache<BASE>::wt_cache(feature_config cfg) | ||||
| :BASE(cfg) | ||||
| : BASE(cfg) | ||||
| , io_address{cfg.io_address} | ||||
| , io_addr_mask{cfg.io_addr_mask} | ||||
| { | ||||
| , io_addr_mask{cfg.io_addr_mask} { | ||||
|     auto cb = base_class::replace_mem_access( | ||||
|             [this](phys_addr_t a, unsigned l, uint8_t* const d) -> iss::status { return read_cache(a, l,d);}, | ||||
|             [this](phys_addr_t a, unsigned l, uint8_t const* const d) -> iss::status { return write_cache(a, l,d);}); | ||||
|         [this](phys_addr_t a, unsigned l, uint8_t* const d) -> iss::status { return read_cache(a, l, d); }, | ||||
|         [this](phys_addr_t a, unsigned l, uint8_t const* const d) -> iss::status { return write_cache(a, l, d); }); | ||||
|     cache_mem_rd_delegate = cb.first; | ||||
|     cache_mem_wr_delegate = cb.second; | ||||
| } | ||||
|  | ||||
| template<typename BASE> | ||||
| iss::status iss::arch::wt_cache<BASE>::read_cache(phys_addr_t a, unsigned l, uint8_t* const d) { | ||||
| template <typename BASE> iss::status iss::arch::wt_cache<BASE>::read_cache(phys_addr_t a, unsigned l, uint8_t* const d) { | ||||
|     if(!icache_ptr) { | ||||
|         icache_ptr.reset(new cache::cache(size, line_sz, ways)); | ||||
|         dcache_ptr.reset(new cache::cache(size, line_sz, ways)); | ||||
|     } | ||||
|     if((a.val&io_addr_mask) != io_address) { | ||||
|         auto set_addr=(a.val&(size-1))>>util::ilog2(line_sz*ways); | ||||
|         auto tag_addr=a.val>>util::ilog2(line_sz); | ||||
|         auto& set = (is_fetch(a.access)?icache_ptr:dcache_ptr)->sets[set_addr]; | ||||
|         for(auto& cl: set.ways) { | ||||
|             if(cl.st==cache::state::VALID && cl.tag_addr==tag_addr) { | ||||
|                 auto start_addr = a.val&(line_sz-1); | ||||
|                 for(auto i = 0U; i<l; ++i) | ||||
|                     d[i] = cl.data[start_addr+i]; | ||||
|     if((a.access & iss::access_type::FETCH) == iss::access_type::FETCH || (a.val & io_addr_mask) != io_address) { | ||||
|         auto set_addr = (a.val & (size - 1)) >> util::ilog2(line_sz * ways); | ||||
|         auto tag_addr = a.val >> util::ilog2(line_sz); | ||||
|         auto& set = (is_fetch(a.access) ? icache_ptr : dcache_ptr)->sets[set_addr]; | ||||
|         for(auto& cl : set.ways) { | ||||
|             if(cl.st == cache::state::VALID && cl.tag_addr == tag_addr) { | ||||
|                 auto start_addr = a.val & (line_sz - 1); | ||||
|                 for(auto i = 0U; i < l; ++i) | ||||
|                     d[i] = cl.data[start_addr + i]; | ||||
|                 return iss::Ok; | ||||
|             } | ||||
|         } | ||||
|         auto& cl = set.ways[get_way_select()]; | ||||
|         phys_addr_t cl_addr{a}; | ||||
|         cl_addr.val=tag_addr<<util::ilog2(line_sz); | ||||
|         cl_addr.val = tag_addr << util::ilog2(line_sz); | ||||
|         cache_mem_rd_delegate(cl_addr, line_sz, cl.data.data()); | ||||
|         cl.tag_addr=tag_addr; | ||||
|         cl.st=cache::state::VALID; | ||||
|         auto start_addr = a.val&(line_sz-1); | ||||
|         for(auto i = 0U; i<l; ++i) | ||||
|             d[i] = cl.data[start_addr+i]; | ||||
|         cl.tag_addr = tag_addr; | ||||
|         cl.st = cache::state::VALID; | ||||
|         auto start_addr = a.val & (line_sz - 1); | ||||
|         for(auto i = 0U; i < l; ++i) | ||||
|             d[i] = cl.data[start_addr + i]; | ||||
|         return iss::Ok; | ||||
|     } else | ||||
|         return cache_mem_rd_delegate(a, l, d); | ||||
| } | ||||
|  | ||||
| template<typename BASE> | ||||
| iss::status iss::arch::wt_cache<BASE>::write_cache(phys_addr_t a, unsigned l, const uint8_t* const d) { | ||||
| template <typename BASE> iss::status iss::arch::wt_cache<BASE>::write_cache(phys_addr_t a, unsigned l, const uint8_t* const d) { | ||||
|     if(!dcache_ptr) | ||||
|         dcache_ptr.reset(new cache::cache(size, line_sz, ways)); | ||||
|     auto res = cache_mem_wr_delegate(a, l, d); | ||||
|     if(res == iss::Ok && ((a.val&io_addr_mask) != io_address)) { | ||||
|         auto set_addr=(a.val&(size-1))>>util::ilog2(line_sz*ways); | ||||
|         auto tag_addr=a.val>>util::ilog2(line_sz); | ||||
|     if(res == iss::Ok && ((a.val & io_addr_mask) != io_address)) { | ||||
|         auto set_addr = (a.val & (size - 1)) >> util::ilog2(line_sz * ways); | ||||
|         auto tag_addr = a.val >> util::ilog2(line_sz); | ||||
|         auto& set = dcache_ptr->sets[set_addr]; | ||||
|         for(auto& cl: set.ways) { | ||||
|             if(cl.st==cache::state::VALID && cl.tag_addr==tag_addr) { | ||||
|                 auto start_addr = a.val&(line_sz-1); | ||||
|                 for(auto i = 0U; i<l; ++i) | ||||
|                     cl.data[start_addr+i] = d[i]; | ||||
|         for(auto& cl : set.ways) { | ||||
|             if(cl.st == cache::state::VALID && cl.tag_addr == tag_addr) { | ||||
|                 auto start_addr = a.val & (line_sz - 1); | ||||
|                 for(auto i = 0U; i < l; ++i) | ||||
|                     cl.data[start_addr + i] = d[i]; | ||||
|                 break; | ||||
|             } | ||||
|         } | ||||
| @@ -168,8 +165,6 @@ iss::status iss::arch::wt_cache<BASE>::write_cache(phys_addr_t a, unsigned l, co | ||||
|     return res; | ||||
| } | ||||
|  | ||||
|  | ||||
|  | ||||
| } // namespace arch | ||||
| } // namespace iss | ||||
|  | ||||
|   | ||||
							
								
								
									
										4108
									
								
								src/iss/debugger/csr_names.cpp
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										4108
									
								
								src/iss/debugger/csr_names.cpp
									
									
									
									
									
										Normal file
									
								
							
										
											
												File diff suppressed because it is too large
												Load Diff
											
										
									
								
							| @@ -30,8 +30,8 @@ | ||||
|  * | ||||
|  *******************************************************************************/ | ||||
|  | ||||
| #ifndef _ISS_DEBUGGER_RISCV_TARGET_ADAPTER_H_ | ||||
| #define _ISS_DEBUGGER_RISCV_TARGET_ADAPTER_H_ | ||||
| #ifndef _ISS_ARCH_DEBUGGER_RISCV_TARGET_ADAPTER_H_ | ||||
| #define _ISS_ARCH_DEBUGGER_RISCV_TARGET_ADAPTER_H_ | ||||
|  | ||||
| #include "iss/arch_if.h" | ||||
| #include <iss/arch/traits.h> | ||||
| @@ -48,25 +48,29 @@ | ||||
|  | ||||
| namespace iss { | ||||
| namespace debugger { | ||||
|  | ||||
| char const* const get_csr_name(unsigned); | ||||
| constexpr auto csr_offset = 100U; | ||||
|  | ||||
| using namespace iss::arch; | ||||
| using namespace iss::debugger; | ||||
|  | ||||
| template <typename ARCH> class riscv_target_adapter : public target_adapter_base { | ||||
| public: | ||||
|     riscv_target_adapter(server_if *srv, iss::arch_if *core) | ||||
|     riscv_target_adapter(server_if* srv, iss::arch_if* core) | ||||
|     : target_adapter_base(srv) | ||||
|     , core(core) {} | ||||
|  | ||||
|     /*============== Thread Control ===============================*/ | ||||
|  | ||||
|     /* Set generic thread */ | ||||
|     status set_gen_thread(rp_thread_ref &thread) override; | ||||
|     status set_gen_thread(rp_thread_ref& thread) override; | ||||
|  | ||||
|     /* Set control thread */ | ||||
|     status set_ctrl_thread(rp_thread_ref &thread) override; | ||||
|     status set_ctrl_thread(rp_thread_ref& thread) override; | ||||
|  | ||||
|     /* Get thread status */ | ||||
|     status is_thread_alive(rp_thread_ref &thread, bool &alive) override; | ||||
|     status is_thread_alive(rp_thread_ref& thread, bool& alive) override; | ||||
|  | ||||
|     /*============= Register Access ================================*/ | ||||
|  | ||||
| @@ -74,79 +78,83 @@ public: | ||||
|      target byte order. If  register is not available | ||||
|      corresponding bytes in avail_buf are 0, otherwise | ||||
|      avail buf is 1 */ | ||||
|     status read_registers(std::vector<uint8_t> &data, std::vector<uint8_t> &avail) override; | ||||
|     status read_registers(std::vector<uint8_t>& data, std::vector<uint8_t>& avail) override; | ||||
|  | ||||
|     /* Write all registers. buf is 4-byte aligned and it is in target | ||||
|      byte order */ | ||||
|     status write_registers(const std::vector<uint8_t> &data) override; | ||||
|     status write_registers(const std::vector<uint8_t>& data) override; | ||||
|  | ||||
|     /* Read one register. buf is 4-byte aligned and it is in | ||||
|      target byte order. If  register is not available | ||||
|      corresponding bytes in avail_buf are 0, otherwise | ||||
|      avail buf is 1 */ | ||||
|     status read_single_register(unsigned int reg_no, std::vector<uint8_t> &buf, | ||||
|             std::vector<uint8_t> &avail_buf) override; | ||||
|     status read_single_register(unsigned int reg_no, std::vector<uint8_t>& buf, std::vector<uint8_t>& avail_buf) override; | ||||
|  | ||||
|     /* Write one register. buf is 4-byte aligned and it is in target byte | ||||
|      order */ | ||||
|     status write_single_register(unsigned int reg_no, const std::vector<uint8_t> &buf) override; | ||||
|     status write_single_register(unsigned int reg_no, const std::vector<uint8_t>& buf) override; | ||||
|  | ||||
|     /*=================== Memory Access =====================*/ | ||||
|  | ||||
|     /* Read memory, buf is 4-bytes aligned and it is in target | ||||
|      byte order */ | ||||
|     status read_mem(uint64_t addr, std::vector<uint8_t> &buf) override; | ||||
|     status read_mem(uint64_t addr, std::vector<uint8_t>& buf) override; | ||||
|  | ||||
|     /* Write memory, buf is 4-bytes aligned and it is in target | ||||
|      byte order */ | ||||
|     status write_mem(uint64_t addr, const std::vector<uint8_t> &buf) override; | ||||
|     status write_mem(uint64_t addr, const std::vector<uint8_t>& buf) override; | ||||
|  | ||||
|     status process_query(unsigned int &mask, const rp_thread_ref &arg, rp_thread_info &info) override; | ||||
|     status process_query(unsigned int& mask, const rp_thread_ref& arg, rp_thread_info& info) override; | ||||
|  | ||||
|     status thread_list_query(int first, const rp_thread_ref &arg, std::vector<rp_thread_ref> &result, size_t max_num, | ||||
|             size_t &num, bool &done) override; | ||||
|     status thread_list_query(int first, const rp_thread_ref& arg, std::vector<rp_thread_ref>& result, size_t max_num, size_t& num, | ||||
|                              bool& done) override; | ||||
|  | ||||
|     status current_thread_query(rp_thread_ref &thread) override; | ||||
|     status current_thread_query(rp_thread_ref& thread) override; | ||||
|  | ||||
|     status offsets_query(uint64_t &text, uint64_t &data, uint64_t &bss) override; | ||||
|     status offsets_query(uint64_t& text, uint64_t& data, uint64_t& bss) override; | ||||
|  | ||||
|     status crc_query(uint64_t addr, size_t len, uint32_t &val) override; | ||||
|     status crc_query(uint64_t addr, size_t len, uint32_t& val) override; | ||||
|  | ||||
|     status raw_query(std::string in_buf, std::string &out_buf) override; | ||||
|     status raw_query(std::string in_buf, std::string& out_buf) override; | ||||
|  | ||||
|     status threadinfo_query(int first, std::string &out_buf) override; | ||||
|     status threadinfo_query(int first, std::string& out_buf) override; | ||||
|  | ||||
|     status threadextrainfo_query(const rp_thread_ref &thread, std::string &out_buf) override; | ||||
|     status threadextrainfo_query(const rp_thread_ref& thread, std::string& out_buf) override; | ||||
|  | ||||
|     status packetsize_query(std::string &out_buf) override; | ||||
|     status packetsize_query(std::string& out_buf) override; | ||||
|  | ||||
|     status add_break(break_type type, uint64_t addr, unsigned int length) override; | ||||
|  | ||||
|     status remove_break(break_type type, uint64_t addr, unsigned int length) override; | ||||
|  | ||||
|     status resume_from_addr(bool step, int sig, uint64_t addr, rp_thread_ref thread, | ||||
|             std::function<void(unsigned)> stop_callback) override; | ||||
|     status resume_from_addr(bool step, int sig, uint64_t addr, rp_thread_ref thread, std::function<void(unsigned)> stop_callback) override; | ||||
|  | ||||
|     status target_xml_query(std::string &out_buf) override; | ||||
|     status target_xml_query(std::string& out_buf) override; | ||||
|  | ||||
| protected: | ||||
|     static inline constexpr addr_t map_addr(const addr_t &i) { return i; } | ||||
|  | ||||
|     iss::arch_if *core; | ||||
|     static inline constexpr addr_t map_addr(const addr_t& i) { return i; } | ||||
|     std::string csr_xml; | ||||
|     iss::arch_if* core; | ||||
|     rp_thread_ref thread_idx; | ||||
| }; | ||||
|  | ||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::set_gen_thread(rp_thread_ref &thread) { | ||||
| template <typename ARCH> typename std::enable_if<iss::arch::traits<ARCH>::FLEN != 0, unsigned>::type get_f0_offset() { | ||||
|     return iss::arch::traits<ARCH>::F0; | ||||
| } | ||||
|  | ||||
| template <typename ARCH> typename std::enable_if<iss::arch::traits<ARCH>::FLEN == 0, unsigned>::type get_f0_offset() { return 0; } | ||||
|  | ||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::set_gen_thread(rp_thread_ref& thread) { | ||||
|     thread_idx = thread; | ||||
|     return Ok; | ||||
| } | ||||
|  | ||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::set_ctrl_thread(rp_thread_ref &thread) { | ||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::set_ctrl_thread(rp_thread_ref& thread) { | ||||
|     thread_idx = thread; | ||||
|     return Ok; | ||||
| } | ||||
|  | ||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::is_thread_alive(rp_thread_ref &thread, bool &alive) { | ||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::is_thread_alive(rp_thread_ref& thread, bool& alive) { | ||||
|     alive = 1; | ||||
|     return Ok; | ||||
| } | ||||
| @@ -158,10 +166,9 @@ template <typename ARCH> status riscv_target_adapter<ARCH>::is_thread_alive(rp_t | ||||
|  * set if all threads are processed. | ||||
|  */ | ||||
| template <typename ARCH> | ||||
| status riscv_target_adapter<ARCH>::thread_list_query(int first, const rp_thread_ref &arg, | ||||
|         std::vector<rp_thread_ref> &result, size_t max_num, size_t &num, | ||||
|         bool &done) { | ||||
|     if (first == 0) { | ||||
| status riscv_target_adapter<ARCH>::thread_list_query(int first, const rp_thread_ref& arg, std::vector<rp_thread_ref>& result, | ||||
|                                                      size_t max_num, size_t& num, bool& done) { | ||||
|     if(first == 0) { | ||||
|         result.clear(); | ||||
|         result.push_back(thread_idx); | ||||
|         num = 1; | ||||
| @@ -171,80 +178,81 @@ status riscv_target_adapter<ARCH>::thread_list_query(int first, const rp_thread_ | ||||
|         return NotSupported; | ||||
| } | ||||
|  | ||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::current_thread_query(rp_thread_ref &thread) { | ||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::current_thread_query(rp_thread_ref& thread) { | ||||
|     thread = thread_idx; | ||||
|     return Ok; | ||||
| } | ||||
|  | ||||
| template <typename ARCH> | ||||
| status riscv_target_adapter<ARCH>::read_registers(std::vector<uint8_t> &data, std::vector<uint8_t> &avail) { | ||||
|     LOG(TRACE) << "reading target registers"; | ||||
|     // return idx<0?:; | ||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::read_registers(std::vector<uint8_t>& data, std::vector<uint8_t>& avail) { | ||||
|     CPPLOG(TRACE) << "reading target registers"; | ||||
|     data.clear(); | ||||
|     avail.clear(); | ||||
|     const uint8_t *reg_base = core->get_regs_base_ptr(); | ||||
|     auto start_reg=arch::traits<ARCH>::X0; | ||||
|     for (size_t reg_no = start_reg; reg_no < start_reg+33/*arch::traits<ARCH>::NUM_REGS*/; ++reg_no) { | ||||
|         auto reg_width = arch::traits<ARCH>::reg_bit_widths[reg_no] / 8; | ||||
|         unsigned offset = traits<ARCH>::reg_byte_offsets[reg_no]; | ||||
|         for (size_t j = 0; j < reg_width; ++j) { | ||||
|             data.push_back(*(reg_base + offset + j)); | ||||
|             avail.push_back(0xff); | ||||
|     const uint8_t* reg_base = core->get_regs_base_ptr(); | ||||
|     auto start_reg = arch::traits<ARCH>::X0; | ||||
|     for(size_t i = 0; i < 33; ++i) { | ||||
|         if(i < arch::traits<ARCH>::RFS || i == arch::traits<ARCH>::PC) { | ||||
|             auto reg_no = i < 32 ? start_reg + i : arch::traits<ARCH>::PC; | ||||
|             unsigned offset = traits<ARCH>::reg_byte_offsets[reg_no]; | ||||
|             for(size_t j = 0; j < arch::traits<ARCH>::XLEN / 8; ++j) { | ||||
|                 data.push_back(*(reg_base + offset + j)); | ||||
|                 avail.push_back(0xff); | ||||
|             } | ||||
|         } else { | ||||
|             for(size_t j = 0; j < arch::traits<ARCH>::XLEN / 8; ++j) { | ||||
|                 data.push_back(0); | ||||
|                 avail.push_back(0); | ||||
|             } | ||||
|         } | ||||
|     } | ||||
|     if(iss::arch::traits<ARCH>::FLEN > 0) { | ||||
|         auto fstart_reg = get_f0_offset<ARCH>(); | ||||
|         for(size_t i = 0; i < 32; ++i) { | ||||
|             auto reg_no = fstart_reg + i; | ||||
|             auto reg_width = arch::traits<ARCH>::reg_bit_widths[reg_no] / 8; | ||||
|             unsigned offset = traits<ARCH>::reg_byte_offsets[reg_no]; | ||||
|             for(size_t j = 0; j < reg_width; ++j) { | ||||
|                 data.push_back(*(reg_base + offset + j)); | ||||
|                 avail.push_back(0xff); | ||||
|             } | ||||
|         } | ||||
|     } | ||||
|     // work around fill with F type registers | ||||
|     //    if (arch::traits<ARCH>::NUM_REGS < 65) { | ||||
|     //        auto reg_width = sizeof(typename arch::traits<ARCH>::reg_t); | ||||
|     //        for (size_t reg_no = 0; reg_no < 33; ++reg_no) { | ||||
|     //            for (size_t j = 0; j < reg_width; ++j) { | ||||
|     //                data.push_back(0x0); | ||||
|     //                avail.push_back(0x00); | ||||
|     //            } | ||||
|     //            // if(arch::traits<ARCH>::XLEN < 64) | ||||
|     //            //     for(unsigned j=0; j<4; ++j){ | ||||
|     //            //         data.push_back(0x0); | ||||
|     //            //         avail.push_back(0x00); | ||||
|     //            //     } | ||||
|     //        } | ||||
|     //    } | ||||
|     return Ok; | ||||
| } | ||||
|  | ||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::write_registers(const std::vector<uint8_t> &data) { | ||||
|     auto start_reg=arch::traits<ARCH>::X0; | ||||
|     auto *reg_base = core->get_regs_base_ptr(); | ||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::write_registers(const std::vector<uint8_t>& data) { | ||||
|     auto start_reg = arch::traits<ARCH>::X0; | ||||
|     auto* reg_base = core->get_regs_base_ptr(); | ||||
|     auto iter = data.data(); | ||||
|     bool e_ext = arch::traits<ARCH>::PC<32; | ||||
|     for (size_t reg_no = 0; reg_no < start_reg+33/*arch::traits<ARCH>::NUM_REGS*/; ++reg_no) { | ||||
|         if(e_ext && reg_no>15){ | ||||
|             if(reg_no==32){ | ||||
|                 auto reg_width = arch::traits<ARCH>::reg_bit_widths[arch::traits<ARCH>::PC] / 8; | ||||
|                 auto offset = traits<ARCH>::reg_byte_offsets[arch::traits<ARCH>::PC]; | ||||
|                 std::copy(iter, iter + reg_width, reg_base); | ||||
|             } else { | ||||
|                 const uint64_t zero_val=0; | ||||
|                 auto reg_width = arch::traits<ARCH>::reg_bit_widths[15] / 8; | ||||
|                 auto iter = (uint8_t*)&zero_val; | ||||
|                 std::copy(iter, iter + reg_width, reg_base); | ||||
|             } | ||||
|         } else { | ||||
|             auto reg_width = arch::traits<ARCH>::reg_bit_widths[reg_no] / 8; | ||||
|             auto offset = traits<ARCH>::reg_byte_offsets[reg_no]; | ||||
|             std::copy(iter, iter + reg_width, reg_base); | ||||
|             iter += 4; | ||||
|             reg_base += offset; | ||||
|     auto iter_end = data.data() + data.size(); | ||||
|     for(size_t i = 0; i < 33 && iter < iter_end; ++i) { | ||||
|         auto reg_width = arch::traits<ARCH>::XLEN / 8; | ||||
|         if(i < arch::traits<ARCH>::RFS) { | ||||
|             auto offset = traits<ARCH>::reg_byte_offsets[start_reg + i]; | ||||
|             std::copy(iter, iter + reg_width, reg_base + offset); | ||||
|         } else if(i == 32) { | ||||
|             auto offset = traits<ARCH>::reg_byte_offsets[arch::traits<ARCH>::PC]; | ||||
|             std::copy(iter, iter + reg_width, reg_base + offset); | ||||
|         } | ||||
|         iter += reg_width; | ||||
|     } | ||||
|     if(iss::arch::traits<ARCH>::FLEN > 0) { | ||||
|         auto fstart_reg = get_f0_offset<ARCH>(); | ||||
|         auto reg_width = arch::traits<ARCH>::FLEN / 8; | ||||
|         for(size_t i = 0; i < 32 && iter < iter_end; ++i) { | ||||
|             unsigned offset = traits<ARCH>::reg_byte_offsets[fstart_reg + i]; | ||||
|             std::copy(iter, iter + reg_width, reg_base + offset); | ||||
|             iter += reg_width; | ||||
|         } | ||||
|     } | ||||
|     return Ok; | ||||
| } | ||||
|  | ||||
| template <typename ARCH> | ||||
| status riscv_target_adapter<ARCH>::read_single_register(unsigned int reg_no, std::vector<uint8_t> &data, | ||||
|         std::vector<uint8_t> &avail) { | ||||
|     if (reg_no < 65) { | ||||
| status riscv_target_adapter<ARCH>::read_single_register(unsigned int reg_no, std::vector<uint8_t>& data, std::vector<uint8_t>& avail) { | ||||
|     if(reg_no < csr_offset) { | ||||
|         // auto reg_size = arch::traits<ARCH>::reg_bit_width(static_cast<typename | ||||
|         // arch::traits<ARCH>::reg_e>(reg_no))/8; | ||||
|         auto *reg_base = core->get_regs_base_ptr(); | ||||
|         auto* reg_base = core->get_regs_base_ptr(); | ||||
|         auto reg_width = arch::traits<ARCH>::reg_bit_widths[reg_no] / 8; | ||||
|         data.resize(reg_width); | ||||
|         avail.resize(reg_width); | ||||
| @@ -252,64 +260,59 @@ status riscv_target_adapter<ARCH>::read_single_register(unsigned int reg_no, std | ||||
|         std::copy(reg_base + offset, reg_base + offset + reg_width, data.begin()); | ||||
|         std::fill(avail.begin(), avail.end(), 0xff); | ||||
|     } else { | ||||
|         typed_addr_t<iss::address_type::PHYSICAL> a(iss::access_type::DEBUG_READ, traits<ARCH>::CSR, reg_no - 65); | ||||
|         typed_addr_t<iss::address_type::PHYSICAL> a(iss::access_type::DEBUG_READ, traits<ARCH>::CSR, reg_no - csr_offset); | ||||
|         data.resize(sizeof(typename traits<ARCH>::reg_t)); | ||||
|         avail.resize(sizeof(typename traits<ARCH>::reg_t)); | ||||
|         std::fill(avail.begin(), avail.end(), 0xff); | ||||
|         core->read(a, data.size(), data.data()); | ||||
|         std::fill(avail.begin(), avail.end(), 0xff); | ||||
|     } | ||||
|     return data.size() > 0 ? Ok : Err; | ||||
| } | ||||
|  | ||||
| template <typename ARCH> | ||||
| status riscv_target_adapter<ARCH>::write_single_register(unsigned int reg_no, const std::vector<uint8_t> &data) { | ||||
|     if (reg_no < 65) { | ||||
|         auto *reg_base = core->get_regs_base_ptr(); | ||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::write_single_register(unsigned int reg_no, const std::vector<uint8_t>& data) { | ||||
|     if(reg_no < csr_offset) { | ||||
|         auto* reg_base = core->get_regs_base_ptr(); | ||||
|         auto reg_width = arch::traits<ARCH>::reg_bit_widths[static_cast<typename arch::traits<ARCH>::reg_e>(reg_no)] / 8; | ||||
|         auto offset = traits<ARCH>::reg_byte_offsets[reg_no]; | ||||
|         std::copy(data.begin(), data.begin() + reg_width, reg_base + offset); | ||||
|     } else { | ||||
|         typed_addr_t<iss::address_type::PHYSICAL> a(iss::access_type::DEBUG_WRITE, traits<ARCH>::CSR, reg_no - 65); | ||||
|         typed_addr_t<iss::address_type::PHYSICAL> a(iss::access_type::DEBUG_WRITE, traits<ARCH>::CSR, reg_no - csr_offset); | ||||
|         core->write(a, data.size(), data.data()); | ||||
|     } | ||||
|     return Ok; | ||||
| } | ||||
|  | ||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::read_mem(uint64_t addr, std::vector<uint8_t> &data) { | ||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::read_mem(uint64_t addr, std::vector<uint8_t>& data) { | ||||
|     auto a = map_addr({iss::access_type::DEBUG_READ, iss::address_type::VIRTUAL, 0, addr}); | ||||
|     auto f = [&]() -> status { return core->read(a, data.size(), data.data()); }; | ||||
|     return srv->execute_syncronized(f); | ||||
| } | ||||
|  | ||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::write_mem(uint64_t addr, const std::vector<uint8_t> &data) { | ||||
|     auto a = map_addr({iss::access_type::DEBUG_READ, iss::address_type::VIRTUAL, 0, addr}); | ||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::write_mem(uint64_t addr, const std::vector<uint8_t>& data) { | ||||
|     auto a = map_addr({iss::access_type::DEBUG_WRITE, iss::address_type::VIRTUAL, 0, addr}); | ||||
|     auto f = [&]() -> status { return core->write(a, data.size(), data.data()); }; | ||||
|     return srv->execute_syncronized(f); | ||||
| } | ||||
|  | ||||
| template <typename ARCH> | ||||
| status riscv_target_adapter<ARCH>::process_query(unsigned int &mask, const rp_thread_ref &arg, rp_thread_info &info) { | ||||
| status riscv_target_adapter<ARCH>::process_query(unsigned int& mask, const rp_thread_ref& arg, rp_thread_info& info) { | ||||
|     return NotSupported; | ||||
| } | ||||
|  | ||||
| template <typename ARCH> | ||||
| status riscv_target_adapter<ARCH>::offsets_query(uint64_t &text, uint64_t &data, uint64_t &bss) { | ||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::offsets_query(uint64_t& text, uint64_t& data, uint64_t& bss) { | ||||
|     text = 0; | ||||
|     data = 0; | ||||
|     bss = 0; | ||||
|     return Ok; | ||||
| } | ||||
|  | ||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::crc_query(uint64_t addr, size_t len, uint32_t &val) { | ||||
|     return NotSupported; | ||||
| } | ||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::crc_query(uint64_t addr, size_t len, uint32_t& val) { return NotSupported; } | ||||
|  | ||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::raw_query(std::string in_buf, std::string &out_buf) { | ||||
|     return NotSupported; | ||||
| } | ||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::raw_query(std::string in_buf, std::string& out_buf) { return NotSupported; } | ||||
|  | ||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::threadinfo_query(int first, std::string &out_buf) { | ||||
|     if (first) { | ||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::threadinfo_query(int first, std::string& out_buf) { | ||||
|     if(first) { | ||||
|         out_buf = fmt::format("m{:x}", thread_idx.val); | ||||
|     } else { | ||||
|         out_buf = "l"; | ||||
| @@ -317,8 +320,7 @@ template <typename ARCH> status riscv_target_adapter<ARCH>::threadinfo_query(int | ||||
|     return Ok; | ||||
| } | ||||
|  | ||||
| template <typename ARCH> | ||||
| status riscv_target_adapter<ARCH>::threadextrainfo_query(const rp_thread_ref &thread, std::string &out_buf) { | ||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::threadextrainfo_query(const rp_thread_ref& thread, std::string& out_buf) { | ||||
|     std::array<char, 20> buf; | ||||
|     memset(buf.data(), 0, 20); | ||||
|     sprintf(buf.data(), "%02x%02x%02x%02x%02x%02x%02x%02x%02x", 'R', 'u', 'n', 'n', 'a', 'b', 'l', 'e', 0); | ||||
| @@ -326,7 +328,7 @@ status riscv_target_adapter<ARCH>::threadextrainfo_query(const rp_thread_ref &th | ||||
|     return Ok; | ||||
| } | ||||
|  | ||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::packetsize_query(std::string &out_buf) { | ||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::packetsize_query(std::string& out_buf) { | ||||
|     out_buf = "PacketSize=1000"; | ||||
|     return Ok; | ||||
| } | ||||
| @@ -340,9 +342,9 @@ template <typename ARCH> status riscv_target_adapter<ARCH>::add_break(break_type | ||||
|         auto saddr = map_addr({iss::access_type::FETCH, iss::address_type::PHYSICAL, 0, addr}); | ||||
|         auto eaddr = map_addr({iss::access_type::FETCH, iss::address_type::PHYSICAL, 0, addr + length}); | ||||
|         target_adapter_base::bp_lut.addEntry(++target_adapter_base::bp_count, saddr.val, eaddr.val - saddr.val); | ||||
|         LOG(TRACE) << "Adding breakpoint with handle " << target_adapter_base::bp_count << " for addr 0x" << std::hex | ||||
|                 << saddr.val << std::dec; | ||||
|         LOG(TRACE) << "Now having " << target_adapter_base::bp_lut.size() << " breakpoints"; | ||||
|         CPPLOG(TRACE) << "Adding breakpoint with handle " << target_adapter_base::bp_count << " for addr 0x" << std::hex << saddr.val | ||||
|                       << std::dec; | ||||
|         CPPLOG(TRACE) << "Now having " << target_adapter_base::bp_lut.size() << " breakpoints"; | ||||
|         return Ok; | ||||
|     } | ||||
|     } | ||||
| @@ -356,15 +358,14 @@ template <typename ARCH> status riscv_target_adapter<ARCH>::remove_break(break_t | ||||
|     case HW_EXEC: { | ||||
|         auto saddr = map_addr({iss::access_type::FETCH, iss::address_type::PHYSICAL, 0, addr}); | ||||
|         unsigned handle = target_adapter_base::bp_lut.getEntry(saddr.val); | ||||
|         if (handle) { | ||||
|             LOG(TRACE) << "Removing breakpoint with handle " << handle << " for addr 0x" << std::hex << saddr.val | ||||
|                     << std::dec; | ||||
|         if(handle) { | ||||
|             CPPLOG(TRACE) << "Removing breakpoint with handle " << handle << " for addr 0x" << std::hex << saddr.val << std::dec; | ||||
|             // TODO: check length of addr range | ||||
|             target_adapter_base::bp_lut.removeEntry(handle); | ||||
|             LOG(TRACE) << "Now having " << target_adapter_base::bp_lut.size() << " breakpoints"; | ||||
|             CPPLOG(TRACE) << "Now having " << target_adapter_base::bp_lut.size() << " breakpoints"; | ||||
|             return Ok; | ||||
|         } | ||||
|         LOG(TRACE) << "Now having " << target_adapter_base::bp_lut.size() << " breakpoints"; | ||||
|         CPPLOG(TRACE) << "Now having " << target_adapter_base::bp_lut.size() << " breakpoints"; | ||||
|         return Err; | ||||
|     } | ||||
|     } | ||||
| @@ -372,103 +373,67 @@ template <typename ARCH> status riscv_target_adapter<ARCH>::remove_break(break_t | ||||
|  | ||||
| template <typename ARCH> | ||||
| status riscv_target_adapter<ARCH>::resume_from_addr(bool step, int sig, uint64_t addr, rp_thread_ref thread, | ||||
|         std::function<void(unsigned)> stop_callback) { | ||||
|     auto *reg_base = core->get_regs_base_ptr(); | ||||
|                                                     std::function<void(unsigned)> stop_callback) { | ||||
|     auto* reg_base = core->get_regs_base_ptr(); | ||||
|     auto reg_width = arch::traits<ARCH>::reg_bit_widths[arch::traits<ARCH>::PC] / 8; | ||||
|     auto offset = traits<ARCH>::reg_byte_offsets[arch::traits<ARCH>::PC]; | ||||
|     const uint8_t *iter = reinterpret_cast<const uint8_t *>(&addr); | ||||
|     const uint8_t* iter = reinterpret_cast<const uint8_t*>(&addr); | ||||
|     std::copy(iter, iter + reg_width, reg_base); | ||||
|     return resume_from_current(step, sig, thread, stop_callback); | ||||
| } | ||||
|  | ||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::target_xml_query(std::string &out_buf) { | ||||
|     const std::string res{"<?xml version=\"1.0\"?><!DOCTYPE target SYSTEM \"gdb-target.dtd\">" | ||||
|         "<target><architecture>riscv:rv32</architecture>" | ||||
|         //"  <feature name=\"org.gnu.gdb.riscv.rv32i\">\n" | ||||
|         //"    <reg name=\"x0\"  bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x1\"  bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x2\"  bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x3\"  bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x4\"  bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x5\"  bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x6\"  bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x7\"  bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x8\"  bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x9\"  bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x10\" bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x11\" bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x12\" bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x13\" bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x14\" bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x15\" bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x16\" bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x17\" bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x18\" bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x19\" bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x20\" bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x21\" bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x22\" bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x23\" bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x24\" bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x25\" bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x26\" bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x27\" bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x28\" bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x29\" bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x30\" bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"    <reg name=\"x31\" bitsize=\"32\" group=\"general\"/>\n" | ||||
|         //"  </feature>\n" | ||||
|         "</target>"}; | ||||
|     out_buf = res; | ||||
| template <typename ARCH> status riscv_target_adapter<ARCH>::target_xml_query(std::string& out_buf) { | ||||
|     if(!csr_xml.size()) { | ||||
|         std::ostringstream oss; | ||||
|         oss << "<?xml version=\"1.0\"?><!DOCTYPE feature SYSTEM \"gdb-target.dtd\"><target version=\"1.0\">\n"; | ||||
|         if(iss::arch::traits<ARCH>::XLEN == 32) | ||||
|             oss << "<architecture>riscv:rv32</architecture>\n"; | ||||
|         else if(iss::arch::traits<ARCH>::XLEN == 64) | ||||
|             oss << "  <architectureriscv:rv64</architecture>\n"; | ||||
|         oss << "  <feature name=\"org.gnu.gdb.riscv.cpu\">\n"; | ||||
|         auto reg_base_num = iss::arch::traits<ARCH>::X0; | ||||
|         for(auto i = 0U; i < iss::arch::traits<ARCH>::RFS; ++i) { | ||||
|             oss << "    <reg name=\"x" << i << "\" bitsize=\"" << iss::arch::traits<ARCH>::reg_bit_widths[reg_base_num + i] | ||||
|                 << "\" type=\"int\" regnum=\"" << i << "\"/>\n"; | ||||
|         } | ||||
|         oss << "    <reg name=\"pc\" bitsize=\"" << iss::arch::traits<ARCH>::reg_bit_widths[iss::arch::traits<ARCH>::PC] | ||||
|             << "\" type=\"code_ptr\" regnum=\"" << 32U << "\"/>\n"; | ||||
|         oss << "  </feature>\n"; | ||||
|         if(iss::arch::traits<ARCH>::FLEN > 0) { | ||||
|             oss << "  <feature name=\"org.gnu.gdb.riscv.fpu\">\n"; | ||||
|             auto reg_base_num = get_f0_offset<ARCH>(); | ||||
|             auto type = iss::arch::traits<ARCH>::FLEN == 32 ? "ieee_single" : "riscv_double"; | ||||
|             for(auto i = 0U; i < 32; ++i) { | ||||
|                 oss << "    <reg name=\"f" << i << "\" bitsize=\"" << iss::arch::traits<ARCH>::reg_bit_widths[reg_base_num + i] | ||||
|                     << "\" type=\"" << type << "\" regnum=\"" << i + 33 << "\"/>\n"; | ||||
|             } | ||||
|             oss << "    <reg name=\"fcsr\" bitsize=\"" << iss::arch::traits<ARCH>::XLEN << "\" regnum=\"103\" type int/>\n"; | ||||
|             oss << "    <reg name=\"fflags\" bitsize=\"" << iss::arch::traits<ARCH>::XLEN << "\" regnum=\"101\" type int/>\n"; | ||||
|             oss << "    <reg name=\"frm\" bitsize=\"" << iss::arch::traits<ARCH>::XLEN << "\" regnum=\"102\" type int/>\n"; | ||||
|             oss << "  </feature>\n"; | ||||
|         } | ||||
|         oss << "  <feature name=\"org.gnu.gdb.riscv.csr\">\n"; | ||||
|         std::vector<uint8_t> data; | ||||
|         std::vector<uint8_t> avail; | ||||
|         data.resize(sizeof(typename traits<ARCH>::reg_t)); | ||||
|         avail.resize(sizeof(typename traits<ARCH>::reg_t)); | ||||
|         for(auto i = 0U; i < 4096; ++i) { | ||||
|             typed_addr_t<iss::address_type::PHYSICAL> a(iss::access_type::DEBUG_READ, traits<ARCH>::CSR, i); | ||||
|             std::fill(avail.begin(), avail.end(), 0xff); | ||||
|             auto res = core->read(a, data.size(), data.data()); | ||||
|             if(res == iss::Ok) { | ||||
|                 oss << "    <reg name=\"" << get_csr_name(i) << "\" bitsize=\"" << iss::arch::traits<ARCH>::XLEN | ||||
|                     << "\"  type=\"int\" regnum=\"" << (i + csr_offset) << "\"/>\n"; | ||||
|             } | ||||
|         } | ||||
|         oss << "  </feature>\n"; | ||||
|         oss << "</target>\n"; | ||||
|         csr_xml = oss.str(); | ||||
|     } | ||||
|     out_buf = csr_xml; | ||||
|     return Ok; | ||||
| } | ||||
| } // namespace debugger | ||||
| } // namespace iss | ||||
|  | ||||
| /* | ||||
|  * | ||||
| <?xml version="1.0"?> | ||||
| <!DOCTYPE target SYSTEM "gdb-target.dtd"> | ||||
| <target> | ||||
|   <architecture>riscv:rv32</architecture> | ||||
|  | ||||
|   <feature name="org.gnu.gdb.riscv.rv32i"> | ||||
|     <reg name="x0"  bitsize="32" group="general"/> | ||||
|     <reg name="x1"  bitsize="32" group="general"/> | ||||
|     <reg name="x2"  bitsize="32" group="general"/> | ||||
|     <reg name="x3"  bitsize="32" group="general"/> | ||||
|     <reg name="x4"  bitsize="32" group="general"/> | ||||
|     <reg name="x5"  bitsize="32" group="general"/> | ||||
|     <reg name="x6"  bitsize="32" group="general"/> | ||||
|     <reg name="x7"  bitsize="32" group="general"/> | ||||
|     <reg name="x8"  bitsize="32" group="general"/> | ||||
|     <reg name="x9"  bitsize="32" group="general"/> | ||||
|     <reg name="x10" bitsize="32" group="general"/> | ||||
|     <reg name="x11" bitsize="32" group="general"/> | ||||
|     <reg name="x12" bitsize="32" group="general"/> | ||||
|     <reg name="x13" bitsize="32" group="general"/> | ||||
|     <reg name="x14" bitsize="32" group="general"/> | ||||
|     <reg name="x15" bitsize="32" group="general"/> | ||||
|     <reg name="x16" bitsize="32" group="general"/> | ||||
|     <reg name="x17" bitsize="32" group="general"/> | ||||
|     <reg name="x18" bitsize="32" group="general"/> | ||||
|     <reg name="x19" bitsize="32" group="general"/> | ||||
|     <reg name="x20" bitsize="32" group="general"/> | ||||
|     <reg name="x21" bitsize="32" group="general"/> | ||||
|     <reg name="x22" bitsize="32" group="general"/> | ||||
|     <reg name="x23" bitsize="32" group="general"/> | ||||
|     <reg name="x24" bitsize="32" group="general"/> | ||||
|     <reg name="x25" bitsize="32" group="general"/> | ||||
|     <reg name="x26" bitsize="32" group="general"/> | ||||
|     <reg name="x27" bitsize="32" group="general"/> | ||||
|     <reg name="x28" bitsize="32" group="general"/> | ||||
|     <reg name="x29" bitsize="32" group="general"/> | ||||
|     <reg name="x30" bitsize="32" group="general"/> | ||||
|     <reg name="x31" bitsize="32" group="general"/> | ||||
|   </feature> | ||||
|  | ||||
| </target> | ||||
|  | ||||
|  */ | ||||
| } | ||||
| } | ||||
|  | ||||
| #endif /* _ISS_DEBUGGER_RISCV_TARGET_ADAPTER_H_ */ | ||||
| #endif /* _ISS_ARCH_DEBUGGER_RISCV_TARGET_ADAPTER_H_ */ | ||||
|   | ||||
| @@ -33,21 +33,20 @@ | ||||
| #ifndef _ISS_FACTORY_H_ | ||||
| #define _ISS_FACTORY_H_ | ||||
|  | ||||
| #include <algorithm> | ||||
| #include <functional> | ||||
| #include <iss/iss.h> | ||||
| #include <memory> | ||||
| #include <unordered_map> | ||||
| #include <functional> | ||||
| #include <string> | ||||
| #include <algorithm> | ||||
| #include <unordered_map> | ||||
| #include <vector> | ||||
|  | ||||
| namespace iss { | ||||
|  | ||||
| using cpu_ptr = std::unique_ptr<iss::arch_if>; | ||||
| using vm_ptr= std::unique_ptr<iss::vm_if>; | ||||
| using vm_ptr = std::unique_ptr<iss::vm_if>; | ||||
|  | ||||
| template<typename PLAT> | ||||
| std::tuple<cpu_ptr, vm_ptr> create_cpu(std::string const& backend, unsigned gdb_port){ | ||||
| template <typename PLAT> std::tuple<cpu_ptr, vm_ptr> create_cpu(std::string const& backend, unsigned gdb_port) { | ||||
|     using core_type = typename PLAT::core; | ||||
|     core_type* lcpu = new PLAT(); | ||||
|     if(backend == "interp") | ||||
| @@ -63,44 +62,45 @@ std::tuple<cpu_ptr, vm_ptr> create_cpu(std::string const& backend, unsigned gdb_ | ||||
|     return {nullptr, nullptr}; | ||||
| } | ||||
|  | ||||
|  | ||||
| class core_factory { | ||||
|     using cpu_ptr = std::unique_ptr<iss::arch_if>; | ||||
|     using vm_ptr= std::unique_ptr<iss::vm_if>; | ||||
|     using vm_ptr = std::unique_ptr<iss::vm_if>; | ||||
|     using base_t = std::tuple<cpu_ptr, vm_ptr>; | ||||
|     using create_fn = std::function<base_t(unsigned, void*) >; | ||||
|     using registry_t = std::unordered_map<std::string, create_fn> ; | ||||
|     using create_fn = std::function<base_t(unsigned, void*)>; | ||||
|     using registry_t = std::unordered_map<std::string, create_fn>; | ||||
|  | ||||
|     registry_t registry; | ||||
|  | ||||
|     core_factory() = default; | ||||
|     core_factory(const core_factory &) = delete; | ||||
|     core_factory & operator=(const core_factory &) = delete; | ||||
|     core_factory(const core_factory&) = delete; | ||||
|     core_factory& operator=(const core_factory&) = delete; | ||||
|  | ||||
| public: | ||||
|     static core_factory & instance() { static core_factory bf; return bf; } | ||||
|     static core_factory& instance() { | ||||
|         static core_factory bf; | ||||
|         return bf; | ||||
|     } | ||||
|  | ||||
|     bool register_creator(const std::string & className, create_fn const& fn) { | ||||
|     bool register_creator(const std::string& className, create_fn const& fn) { | ||||
|         registry[className] = fn; | ||||
|         return true; | ||||
|     } | ||||
|  | ||||
|     base_t create(std::string const& className, unsigned gdb_port=0, void* init_data=nullptr) const { | ||||
|     base_t create(std::string const& className, unsigned gdb_port = 0, void* init_data = nullptr) const { | ||||
|         registry_t::const_iterator regEntry = registry.find(className); | ||||
|         if (regEntry != registry.end()) | ||||
|         if(regEntry != registry.end()) | ||||
|             return regEntry->second(gdb_port, init_data); | ||||
|         return {nullptr, nullptr}; | ||||
|     } | ||||
|  | ||||
|     std::vector<std::string> get_names() { | ||||
|         std::vector<std::string> keys{registry.size()}; | ||||
|         std::transform(std::begin(registry), std::end(registry), std::begin(keys), [](std::pair<std::string, create_fn> const& p){ | ||||
|             return p.first; | ||||
|         }); | ||||
|         std::transform(std::begin(registry), std::end(registry), std::begin(keys), | ||||
|                        [](std::pair<std::string, create_fn> const& p) { return p.first; }); | ||||
|         return keys; | ||||
|     } | ||||
| }; | ||||
|  | ||||
| } | ||||
| } // namespace iss | ||||
|  | ||||
| #endif /* _ISS_FACTORY_H_ */ | ||||
|   | ||||
| @@ -1,4 +1,3 @@ | ||||
|  | ||||
| /******************************************************************************* | ||||
|  * Copyright (C) 2017 - 2023, MINRES Technologies GmbH | ||||
|  * All rights reserved. | ||||
| @@ -34,71 +33,82 @@ | ||||
|  ******************************************************************************/ | ||||
|  | ||||
| #include "cycle_estimate.h" | ||||
| #include <iss/plugin/calculator.h> | ||||
| #include <yaml-cpp/yaml.h> | ||||
|  | ||||
| #include <fstream> | ||||
| #include <iss/arch_if.h> | ||||
| #include <util/logging.h> | ||||
| #include <fstream> | ||||
|  | ||||
| using namespace std; | ||||
|  | ||||
| iss::plugin::cycle_estimate::cycle_estimate(string const& config_file_name) | ||||
| : instr_if(nullptr) | ||||
| , config_file_name(config_file_name) | ||||
| { | ||||
| } | ||||
| , config_file_name(config_file_name) {} | ||||
|  | ||||
| iss::plugin::cycle_estimate::~cycle_estimate() { | ||||
| } | ||||
| iss::plugin::cycle_estimate::~cycle_estimate() = default; | ||||
|  | ||||
| bool iss::plugin::cycle_estimate::registration(const char* const version, vm_if& vm) { | ||||
|     instr_if = vm.get_arch()->get_instrumentation_if(); | ||||
|     if(!instr_if) return false; | ||||
|     const string  core_name = instr_if->core_type_name(); | ||||
|     if (config_file_name.length() > 0) { | ||||
|     assert(instr_if && "No instrumentation interface available but callback executed"); | ||||
|     reg_base_ptr = reinterpret_cast<uint32_t*>(vm.get_arch()->get_regs_base_ptr()); | ||||
|     if(!instr_if) | ||||
|         return false; | ||||
|     const string core_name = instr_if->core_type_name(); | ||||
|     if(config_file_name.length() > 0) { | ||||
|         std::ifstream is(config_file_name); | ||||
|         if (is.is_open()) { | ||||
|         if(is.is_open()) { | ||||
|             try { | ||||
|                 auto root = YAML::LoadAll(is); | ||||
|                 if(root.size()!=1) { | ||||
|                     LOG(ERR) << "Too many root nodes in YAML file " << config_file_name; | ||||
|                 if(root.size() != 1) { | ||||
|                     CPPLOG(ERR) << "Too many root nodes in YAML file " << config_file_name; | ||||
|                 } | ||||
|                 for (auto p : root[0]) { | ||||
|                 for(auto p : root[0]) { | ||||
|                     auto isa_subset = p.first; | ||||
|                     auto instructions = p.second; | ||||
|                     for (auto const& instr : instructions) { | ||||
|                         instr_desc res; | ||||
|                     for(auto const& instr : instructions) { | ||||
|                         auto idx = instr.second["index"].as<unsigned>(); | ||||
|                         if(delays.size() <= idx) | ||||
|                             delays.resize(idx + 1); | ||||
|                         auto& res = delays[idx]; | ||||
|                         res.is_branch = instr.second["branch"].as<bool>(); | ||||
|                         auto delay = instr.second["delay"]; | ||||
|                         if(delay.IsSequence()) { | ||||
|                             res.not_taken = delay[0].as<uint64_t>(); | ||||
|                             res.taken = delay[1].as<uint64_t>(); | ||||
|                         } else { | ||||
|                             res.not_taken = delay.as<uint64_t>(); | ||||
|                             res.taken = res.not_taken; | ||||
|                             try { | ||||
|                                 res.not_taken = delay.as<uint64_t>(); | ||||
|                                 res.taken = res.not_taken; | ||||
|                             } catch(const YAML::BadConversion& e) { | ||||
|                                 res.f = iss::plugin::calculator(reg_base_ptr, delay.as<std::string>()); | ||||
|                             } | ||||
|                         } | ||||
|                         delays.push_back(std::move(res)); | ||||
|                     } | ||||
|                 } | ||||
|             } catch (YAML::ParserException &e) { | ||||
|                 LOG(ERR) << "Could not parse input file " << config_file_name << ", reason: " << e.what(); | ||||
|             } catch(YAML::ParserException& e) { | ||||
|                 CPPLOG(ERR) << "Could not parse input file " << config_file_name << ", reason: " << e.what(); | ||||
|                 return false; | ||||
|             } | ||||
|         } else { | ||||
|             LOG(ERR) << "Could not open input file " << config_file_name; | ||||
|             CPPLOG(ERR) << "Could not open input file " << config_file_name; | ||||
|             return false; | ||||
|         } | ||||
|     } | ||||
|     return true; | ||||
|  | ||||
| } | ||||
|  | ||||
| void iss::plugin::cycle_estimate::callback(instr_info_t instr_info) { | ||||
|     assert(instr_if && "No instrumentation interface available but callback executed"); | ||||
|     auto entry = delays[instr_info.instr_id]; | ||||
|     bool taken = instr_if->is_branch_taken(); | ||||
|     if (taken && (entry.taken > 1)) | ||||
|         instr_if->update_last_instr_cycles(entry.taken); | ||||
|     else if (entry.not_taken > 1) | ||||
|         instr_if->update_last_instr_cycles(entry.not_taken); | ||||
|     size_t instr_id = instr_info.instr_id; | ||||
|     auto& entry = instr_id < delays.size() ? delays[instr_id] : illegal_desc; | ||||
|     if(instr_info.phase_id == PRE_SYNC) { | ||||
|         if(entry.f) | ||||
|             current_delay = entry.f(instr_if->get_instr_word()); | ||||
|     } else { | ||||
|         if(!entry.f) | ||||
|             current_delay = instr_if->is_branch_taken() ? entry.taken : entry.not_taken; | ||||
|         if(current_delay > 1) | ||||
|             instr_if->update_last_instr_cycles(current_delay); | ||||
|         current_delay = 1; | ||||
|     } | ||||
| } | ||||
|   | ||||
| @@ -37,6 +37,7 @@ | ||||
|  | ||||
| #include "iss/instrumentation_if.h" | ||||
| #include "iss/vm_plugin.h" | ||||
| #include <functional> | ||||
| #include <string> | ||||
| #include <unordered_map> | ||||
| #include <vector> | ||||
| @@ -45,46 +46,44 @@ namespace iss { | ||||
|  | ||||
| namespace plugin { | ||||
|  | ||||
| class cycle_estimate: public vm_plugin { | ||||
| 	BEGIN_BF_DECL(instr_desc, uint32_t) | ||||
| 		BF_FIELD(taken, 24, 8) | ||||
| 		BF_FIELD(not_taken, 16, 8) | ||||
|         BF_FIELD(is_branch, 8, 8) | ||||
|         BF_FIELD(size, 0, 8) | ||||
| 		instr_desc(uint32_t size, uint32_t taken, uint32_t not_taken, bool branch): instr_desc() { | ||||
| 			this->size=size; | ||||
| 			this->taken=taken; | ||||
| 			this->not_taken=not_taken; | ||||
| 			this->is_branch=branch; | ||||
| 		} | ||||
| 	END_BF_DECL(); | ||||
| class cycle_estimate : public vm_plugin { | ||||
|     struct instr_desc { | ||||
|         size_t size{0}; | ||||
|         bool is_branch{false}; | ||||
|         unsigned not_taken{1}; | ||||
|         unsigned taken{1}; | ||||
|         std::function<unsigned(uint64_t)> f; | ||||
|     }; | ||||
|  | ||||
| public: | ||||
|     cycle_estimate() = delete; | ||||
|  | ||||
|     cycle_estimate(const cycle_estimate &) = delete; | ||||
|     cycle_estimate(const cycle_estimate&) = delete; | ||||
|  | ||||
|     cycle_estimate(const cycle_estimate &&) = delete; | ||||
|     cycle_estimate(const cycle_estimate&&) = delete; | ||||
|  | ||||
|     cycle_estimate(std::string const& config_file_name); | ||||
|  | ||||
|     virtual ~cycle_estimate(); | ||||
|  | ||||
|     cycle_estimate &operator=(const cycle_estimate &) = delete; | ||||
|     cycle_estimate& operator=(const cycle_estimate&) = delete; | ||||
|  | ||||
|     cycle_estimate &operator=(const cycle_estimate &&) = delete; | ||||
|     cycle_estimate& operator=(const cycle_estimate&&) = delete; | ||||
|  | ||||
|     bool registration(const char *const version, vm_if &arch) override; | ||||
|     bool registration(const char* const version, vm_if& arch) override; | ||||
|  | ||||
|     sync_type get_sync() override { return POST_SYNC; }; | ||||
|     sync_type get_sync() override { return ALL_SYNC; }; | ||||
|  | ||||
|     void callback(instr_info_t instr_info) override; | ||||
|  | ||||
| private: | ||||
|     iss::instrumentation_if *instr_if; | ||||
|     iss::instrumentation_if* instr_if{nullptr}; | ||||
|     uint32_t* reg_base_ptr{nullptr}; | ||||
|     instr_desc illegal_desc{}; | ||||
|     std::vector<instr_desc> delays; | ||||
|     unsigned current_delay{0}; | ||||
|     struct pair_hash { | ||||
|         size_t operator()(const std::pair<uint64_t, uint64_t> &p) const { | ||||
|         size_t operator()(const std::pair<uint64_t, uint64_t>& p) const { | ||||
|             std::hash<uint64_t> hash; | ||||
|             return hash(p.first) + hash(p.second); | ||||
|         } | ||||
| @@ -92,7 +91,7 @@ private: | ||||
|     std::unordered_map<std::pair<uint64_t, uint64_t>, uint64_t, pair_hash> blocks; | ||||
|     std::string config_file_name; | ||||
| }; | ||||
| } | ||||
| } | ||||
| } // namespace plugin | ||||
| } // namespace iss | ||||
|  | ||||
| #endif /* _ISS_PLUGIN_CYCLE_ESTIMATE_H_ */ | ||||
|   | ||||
| @@ -36,26 +36,26 @@ | ||||
| #include <iss/instrumentation_if.h> | ||||
| #include <yaml-cpp/yaml.h> | ||||
|  | ||||
| #include <fstream> | ||||
| #include <iss/arch_if.h> | ||||
| #include <util/logging.h> | ||||
| #include <fstream> | ||||
|  | ||||
| iss::plugin::instruction_count::instruction_count(std::string config_file_name) { | ||||
|     if (config_file_name.length() > 0) { | ||||
|     if(config_file_name.length() > 0) { | ||||
|         std::ifstream is(config_file_name); | ||||
|         if (is.is_open()) { | ||||
|         if(is.is_open()) { | ||||
|             try { | ||||
|                 auto root = YAML::LoadAll(is); | ||||
|                 if(root.size()!=1) { | ||||
|                     LOG(ERR) << "Too many rro nodes in YAML file " << config_file_name; | ||||
|                 if(root.size() != 1) { | ||||
|                     CPPLOG(ERR) << "Too many rro nodes in YAML file " << config_file_name; | ||||
|                 } | ||||
|                 for (auto p : root[0]) { | ||||
|                 for(auto p : root[0]) { | ||||
|                     auto isa_subset = p.first; | ||||
|                     auto instructions = p.second; | ||||
|                     for (auto const& instr : instructions) { | ||||
|                     for(auto const& instr : instructions) { | ||||
|                         instr_delay res; | ||||
|                         res.instr_name = instr.first.as<std::string>(); | ||||
|                         res.size = instr.second["encoding"].as<std::string>().size()-2; // not counting 0b | ||||
|                         res.size = instr.second["encoding"].as<std::string>().size() - 2; // not counting 0b | ||||
|                         auto delay = instr.second["delay"]; | ||||
|                         if(delay.IsSequence()) { | ||||
|                             res.not_taken_delay = delay[0].as<uint64_t>(); | ||||
| @@ -68,30 +68,29 @@ iss::plugin::instruction_count::instruction_count(std::string config_file_name) | ||||
|                     } | ||||
|                 } | ||||
|                 rep_counts.resize(delays.size()); | ||||
|             } catch (YAML::ParserException &e) { | ||||
|                 LOG(ERR) << "Could not parse input file " << config_file_name << ", reason: " << e.what(); | ||||
|             } catch(YAML::ParserException& e) { | ||||
|                 CPPLOG(ERR) << "Could not parse input file " << config_file_name << ", reason: " << e.what(); | ||||
|             } | ||||
|         } else { | ||||
|             LOG(ERR) << "Could not open input file " << config_file_name; | ||||
|             CPPLOG(ERR) << "Could not open input file " << config_file_name; | ||||
|         } | ||||
|     } | ||||
| } | ||||
|  | ||||
| iss::plugin::instruction_count::~instruction_count() { | ||||
| 	size_t idx=0; | ||||
| 	for(auto it:delays){ | ||||
| 		if(rep_counts[idx]>0 && it.instr_name.find("__"!=0)) | ||||
| 			LOG(INFO)<<it.instr_name<<";"<<rep_counts[idx]; | ||||
| 		idx++; | ||||
| 	} | ||||
|     size_t idx = 0; | ||||
|     for(auto it : delays) { | ||||
|         if(rep_counts[idx] > 0 && it.instr_name.find("__" != 0)) | ||||
|             CPPLOG(INFO) << it.instr_name << ";" << rep_counts[idx]; | ||||
|         idx++; | ||||
|     } | ||||
| } | ||||
|  | ||||
| bool iss::plugin::instruction_count::registration(const char* const version, vm_if& vm) { | ||||
|     auto instr_if = vm.get_arch()->get_instrumentation_if(); | ||||
|     if(!instr_if) return false; | ||||
| 	return true; | ||||
|     if(!instr_if) | ||||
|         return false; | ||||
|     return true; | ||||
| } | ||||
|  | ||||
| void iss::plugin::instruction_count::callback(instr_info_t instr_info) { | ||||
| 	rep_counts[instr_info.instr_id]++; | ||||
| } | ||||
| void iss::plugin::instruction_count::callback(instr_info_t instr_info) { rep_counts[instr_info.instr_id]++; } | ||||
|   | ||||
| @@ -53,19 +53,19 @@ class instruction_count : public iss::vm_plugin { | ||||
| public: | ||||
|     instruction_count() = delete; | ||||
|  | ||||
|     instruction_count(const instruction_count &) = delete; | ||||
|     instruction_count(const instruction_count&) = delete; | ||||
|  | ||||
|     instruction_count(const instruction_count &&) = delete; | ||||
|     instruction_count(const instruction_count&&) = delete; | ||||
|  | ||||
|     instruction_count(std::string config_file_name); | ||||
|  | ||||
|     virtual ~instruction_count(); | ||||
|  | ||||
|     instruction_count &operator=(const instruction_count &) = delete; | ||||
|     instruction_count& operator=(const instruction_count&) = delete; | ||||
|  | ||||
|     instruction_count &operator=(const instruction_count &&) = delete; | ||||
|     instruction_count& operator=(const instruction_count&&) = delete; | ||||
|  | ||||
|     bool registration(const char *const version, vm_if &arch) override; | ||||
|     bool registration(const char* const version, vm_if& arch) override; | ||||
|  | ||||
|     sync_type get_sync() override { return POST_SYNC; }; | ||||
|  | ||||
| @@ -75,7 +75,7 @@ private: | ||||
|     std::vector<instr_delay> delays; | ||||
|     std::vector<uint64_t> rep_counts; | ||||
| }; | ||||
| } | ||||
| } | ||||
| } // namespace plugin | ||||
| } // namespace iss | ||||
|  | ||||
| #endif /* _ISS_PLUGIN_INSTRUCTION_COUNTER_H_ */ | ||||
|   | ||||
							
								
								
									
										297
									
								
								src/iss/semihosting/semihosting.cpp
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										297
									
								
								src/iss/semihosting/semihosting.cpp
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,297 @@ | ||||
| #include "semihosting.h" | ||||
| #include <chrono> | ||||
| #include <cstdint> | ||||
| #include <iss/vm_types.h> | ||||
| #include <map> | ||||
| #include <stdexcept> | ||||
| // explanation of syscalls can be found at https://github.com/SpinalHDL/openocd_riscv/blob/riscv_spinal/src/target/semihosting_common.h | ||||
|  | ||||
| const char* SYS_OPEN_MODES_STRS[] = {"r", "rb", "r+", "r+b", "w", "wb", "w+", "w+b", "a", "ab", "a+", "a+b"}; | ||||
|  | ||||
| template <typename T> T sh_read_field(iss::arch_if* arch_if_ptr, T addr, int len = 4) { | ||||
|     uint8_t bytes[4]; | ||||
|     auto res = arch_if_ptr->read(iss::address_type::PHYSICAL, iss::access_type::DEBUG_READ, 0, addr, 4, &bytes[0]); | ||||
|     // auto res = arch_if_ptr->read(iss::address_type::PHYSICAL, iss::access_type::DEBUG_READ, 0, *parameter, 1, &character); | ||||
|  | ||||
|     if(res != iss::Ok) { | ||||
|         return 0; // TODO THROW ERROR | ||||
|     } else | ||||
|         return static_cast<T>(bytes[0]) | (static_cast<T>(bytes[1]) << 8) | (static_cast<T>(bytes[2]) << 16) | | ||||
|                (static_cast<T>(bytes[3]) << 24); | ||||
| } | ||||
|  | ||||
| template <typename T> std::string sh_read_string(iss::arch_if* arch_if_ptr, T addr, T str_len) { | ||||
|     std::vector<uint8_t> buffer(str_len); | ||||
|     for(int i = 0; i < str_len; i++) { | ||||
|         buffer[i] = sh_read_field(arch_if_ptr, addr + i, 1); | ||||
|     } | ||||
|     std::string str(buffer.begin(), buffer.end()); | ||||
|     return str; | ||||
| } | ||||
|  | ||||
| template <typename T> void semihosting_callback<T>::operator()(iss::arch_if* arch_if_ptr, T* call_number, T* parameter) { | ||||
|     static std::map<T, FILE*> openFiles; | ||||
|     static T file_count = 3; | ||||
|     static T semihostingErrno; | ||||
|  | ||||
|     switch(static_cast<semihosting_syscalls>(*call_number)) { | ||||
|     case semihosting_syscalls::SYS_CLOCK: { | ||||
|         auto end = std::chrono::high_resolution_clock::now(); // end measurement | ||||
|         auto elapsed = end - timeVar; | ||||
|         auto millis = std::chrono::duration_cast<std::chrono::milliseconds>(elapsed).count(); | ||||
|         *call_number = millis; // TODO get time now | ||||
|         break; | ||||
|     } | ||||
|     case semihosting_syscalls::SYS_CLOSE: { | ||||
|         T file_handle = *parameter; | ||||
|         if(openFiles.size() <= file_handle && file_handle < 0) { | ||||
|             semihostingErrno = EBADF; | ||||
|             return; | ||||
|         } | ||||
|         auto file = openFiles[file_handle]; | ||||
|         openFiles.erase(file_handle); | ||||
|         if(!(file == stdin || file == stdout || file == stderr)) { | ||||
|             int i = fclose(file); | ||||
|             *call_number = i; | ||||
|         } else { | ||||
|             *call_number = -1; | ||||
|             semihostingErrno = EINTR; | ||||
|         } | ||||
|         break; | ||||
|     } | ||||
|     case semihosting_syscalls::SYS_ELAPSED: { | ||||
|         throw std::runtime_error("Semihosting Call not Implemented"); | ||||
|         break; | ||||
|     } | ||||
|     case semihosting_syscalls::SYS_ERRNO: { | ||||
|         *call_number = semihostingErrno; | ||||
|         break; | ||||
|     } | ||||
|     case semihosting_syscalls::SYS_EXIT: { | ||||
|  | ||||
|         throw std::runtime_error("ISS terminated by Semihost: SYS_EXIT"); | ||||
|         break; | ||||
|     } | ||||
|     case semihosting_syscalls::SYS_EXIT_EXTENDED: { | ||||
|         throw std::runtime_error("ISS terminated by Semihost: SYS_EXIT_EXTENDED"); | ||||
|         break; | ||||
|     } | ||||
|     case semihosting_syscalls::SYS_FLEN: { | ||||
|         T file_handle = *parameter; | ||||
|         auto file = openFiles[file_handle]; | ||||
|  | ||||
|         size_t currentPos = ftell(file); | ||||
|         if(currentPos < 0) | ||||
|             throw std::runtime_error("SYS_FLEN negative value"); | ||||
|         fseek(file, 0, SEEK_END); | ||||
|         size_t length = ftell(file); | ||||
|         fseek(file, currentPos, SEEK_SET); | ||||
|         *call_number = (T)length; | ||||
|         break; | ||||
|     } | ||||
|     case semihosting_syscalls::SYS_GET_CMDLINE: { | ||||
|         throw std::runtime_error("Semihosting Call not Implemented"); | ||||
|         break; | ||||
|     } | ||||
|     case semihosting_syscalls::SYS_HEAPINFO: { | ||||
|         throw std::runtime_error("Semihosting Call not Implemented"); | ||||
|         break; | ||||
|     } | ||||
|     case semihosting_syscalls::SYS_ISERROR: { | ||||
|         T value = *parameter; | ||||
|         *call_number = (value != 0); | ||||
|         break; | ||||
|     } | ||||
|     case semihosting_syscalls::SYS_ISTTY: { | ||||
|         T file_handle = *parameter; | ||||
|         *call_number = (file_handle == 0 || file_handle == 1 || file_handle == 2); | ||||
|         break; | ||||
|     } | ||||
|     case semihosting_syscalls::SYS_OPEN: { | ||||
|         T path_str_addr = sh_read_field<T>(arch_if_ptr, *parameter); | ||||
|         T mode = sh_read_field<T>(arch_if_ptr, 4 + (*parameter)); | ||||
|         T path_len = sh_read_field<T>(arch_if_ptr, 8 + (*parameter)); | ||||
|  | ||||
|         std::string path_str = sh_read_string<T>(arch_if_ptr, path_str_addr, path_len); | ||||
|  | ||||
|         // TODO LOG INFO | ||||
|  | ||||
|         if(mode >= 12) { | ||||
|             // TODO throw ERROR | ||||
|             return; | ||||
|         } | ||||
|  | ||||
|         FILE* file = nullptr; | ||||
|         if(path_str == ":tt") { | ||||
|             if(mode < 4) | ||||
|                 file = stdin; | ||||
|             else if(mode < 8) | ||||
|                 file = stdout; | ||||
|             else | ||||
|                 file = stderr; | ||||
|         } else { | ||||
|             file = fopen(path_str.c_str(), SYS_OPEN_MODES_STRS[mode]); | ||||
|             if(file == nullptr) { | ||||
|                 // TODO throw error | ||||
|                 return; | ||||
|             } | ||||
|         } | ||||
|         T file_handle = file_count++; | ||||
|         openFiles[file_handle] = file; | ||||
|         *call_number = file_handle; | ||||
|         break; | ||||
|     } | ||||
|     case semihosting_syscalls::SYS_READ: { | ||||
|         T file_handle = sh_read_field<T>(arch_if_ptr, (*parameter) + 4); | ||||
|         T addr = sh_read_field<T>(arch_if_ptr, *parameter); | ||||
|         T count = sh_read_field<T>(arch_if_ptr, (*parameter) + 8); | ||||
|  | ||||
|         auto file = openFiles[file_handle]; | ||||
|  | ||||
|         std::vector<uint8_t> buffer(count); | ||||
|         size_t num_read = 0; | ||||
|         if(file == stdin) { | ||||
|             // when reading from stdin: mimic behaviour from read syscall | ||||
|             // and return on newline. | ||||
|             while(num_read < count) { | ||||
|                 char c = fgetc(file); | ||||
|                 buffer[num_read] = c; | ||||
|                 num_read++; | ||||
|                 if(c == '\n') | ||||
|                     break; | ||||
|             } | ||||
|         } else { | ||||
|             num_read = fread(buffer.data(), 1, count, file); | ||||
|         } | ||||
|         buffer.resize(num_read); | ||||
|         for(int i = 0; i < num_read; i++) { | ||||
|             auto res = arch_if_ptr->write(iss::address_type::PHYSICAL, iss::access_type::DEBUG_READ, 0, addr + i, 1, &buffer[i]); | ||||
|             if(res != iss::Ok) | ||||
|                 return; | ||||
|         } | ||||
|         *call_number = count - num_read; | ||||
|         break; | ||||
|     } | ||||
|     case semihosting_syscalls::SYS_READC: { | ||||
|         uint8_t character = getchar(); | ||||
|         // character = getchar(); | ||||
|         /*if(character != iss::Ok) | ||||
|             std::cout << "Not OK"; | ||||
|             return;*/ | ||||
|         *call_number = character; | ||||
|         break; | ||||
|     } | ||||
|     case semihosting_syscalls::SYS_REMOVE: { | ||||
|         T path_str_addr = sh_read_field<T>(arch_if_ptr, *parameter); | ||||
|         T path_len = sh_read_field<T>(arch_if_ptr, (*parameter) + 4); | ||||
|         std::string path_str = sh_read_string<T>(arch_if_ptr, path_str_addr, path_len); | ||||
|  | ||||
|         if(remove(path_str.c_str()) < 0) | ||||
|             *call_number = -1; | ||||
|         break; | ||||
|     } | ||||
|     case semihosting_syscalls::SYS_RENAME: { | ||||
|         T path_str_addr_old = sh_read_field<T>(arch_if_ptr, *parameter); | ||||
|         T path_len_old = sh_read_field<T>(arch_if_ptr, (*parameter) + 4); | ||||
|         T path_str_addr_new = sh_read_field<T>(arch_if_ptr, (*parameter) + 8); | ||||
|         T path_len_new = sh_read_field<T>(arch_if_ptr, (*parameter) + 12); | ||||
|  | ||||
|         std::string path_str_old = sh_read_string<T>(arch_if_ptr, path_str_addr_old, path_len_old); | ||||
|         std::string path_str_new = sh_read_string<T>(arch_if_ptr, path_str_addr_new, path_len_new); | ||||
|         rename(path_str_old.c_str(), path_str_new.c_str()); | ||||
|         break; | ||||
|     } | ||||
|     case semihosting_syscalls::SYS_SEEK: { | ||||
|         T file_handle = sh_read_field<T>(arch_if_ptr, *parameter); | ||||
|         T pos = sh_read_field<T>(arch_if_ptr, (*parameter) + 1); | ||||
|         auto file = openFiles[file_handle]; | ||||
|  | ||||
|         int retval = fseek(file, pos, SEEK_SET); | ||||
|         if(retval < 0) | ||||
|             throw std::runtime_error("SYS_SEEK negative return value"); | ||||
|  | ||||
|         break; | ||||
|     } | ||||
|     case semihosting_syscalls::SYS_SYSTEM: { | ||||
|         T cmd_addr = sh_read_field<T>(arch_if_ptr, *parameter); | ||||
|         T cmd_len = sh_read_field<T>(arch_if_ptr, (*parameter) + 1); | ||||
|         std::string cmd = sh_read_string<T>(arch_if_ptr, cmd_addr, cmd_len); | ||||
|         system(cmd.c_str()); | ||||
|         break; | ||||
|     } | ||||
|     case semihosting_syscalls::SYS_TICKFREQ: { | ||||
|         throw std::runtime_error("Semihosting Call not Implemented"); | ||||
|         break; | ||||
|     } | ||||
|     case semihosting_syscalls::SYS_TIME: { | ||||
|         // returns time in seconds scince 01.01.1970 00:00 | ||||
|         *call_number = time(NULL); | ||||
|         break; | ||||
|     } | ||||
|     case semihosting_syscalls::SYS_TMPNAM: { | ||||
|         T buffer_addr = sh_read_field<T>(arch_if_ptr, *parameter); | ||||
|         T identifier = sh_read_field<T>(arch_if_ptr, (*parameter) + 1); | ||||
|         T buffer_len = sh_read_field<T>(arch_if_ptr, (*parameter) + 2); | ||||
|  | ||||
|         if(identifier > 255) { | ||||
|             *call_number = -1; | ||||
|             return; | ||||
|         } | ||||
|         std::stringstream ss; | ||||
|         ss << "tmp/file-" << std::setfill('0') << std::setw(3) << identifier; | ||||
|         std::string filename = ss.str(); | ||||
|  | ||||
|         for(int i = 0; i < buffer_len; i++) { | ||||
|             uint8_t character = filename[i]; | ||||
|             auto res = arch_if_ptr->write(iss::address_type::PHYSICAL, iss::access_type::DEBUG_READ, 0, (*parameter) + i, 1, &character); | ||||
|             if(res != iss::Ok) | ||||
|                 return; | ||||
|         } | ||||
|         break; | ||||
|     } | ||||
|     case semihosting_syscalls::SYS_WRITE: { | ||||
|         T file_handle = sh_read_field<T>(arch_if_ptr, (*parameter) + 4); | ||||
|         T addr = sh_read_field<T>(arch_if_ptr, *parameter); | ||||
|         T count = sh_read_field<T>(arch_if_ptr, (*parameter) + 8); | ||||
|  | ||||
|         auto file = openFiles[file_handle]; | ||||
|         std::string str = sh_read_string<T>(arch_if_ptr, addr, count); | ||||
|         fwrite(&str[0], 1, count, file); | ||||
|         break; | ||||
|     } | ||||
|     case semihosting_syscalls::SYS_WRITEC: { | ||||
|         uint8_t character; | ||||
|         auto res = arch_if_ptr->read(iss::address_type::PHYSICAL, iss::access_type::DEBUG_READ, 0, *parameter, 1, &character); | ||||
|         if(res != iss::Ok) | ||||
|             return; | ||||
|         putchar(character); | ||||
|         break; | ||||
|     } | ||||
|     case semihosting_syscalls::SYS_WRITE0: { | ||||
|         uint8_t character; | ||||
|         while(1) { | ||||
|             auto res = arch_if_ptr->read(iss::address_type::PHYSICAL, iss::access_type::DEBUG_READ, 0, *parameter, 1, &character); | ||||
|             if(res != iss::Ok) | ||||
|                 return; | ||||
|             if(character == 0) | ||||
|                 break; | ||||
|             putchar(character); | ||||
|             (*parameter)++; | ||||
|         } | ||||
|         break; | ||||
|     } | ||||
|     case semihosting_syscalls::USER_CMD_0x100: { | ||||
|         throw std::runtime_error("Semihosting Call not Implemented"); | ||||
|         break; | ||||
|     } | ||||
|     case semihosting_syscalls::USER_CMD_0x1FF: { | ||||
|         throw std::runtime_error("Semihosting Call not Implemented"); | ||||
|         break; | ||||
|     } | ||||
|     default: | ||||
|         throw std::runtime_error("Semihosting Call not Implemented"); | ||||
|         break; | ||||
|     } | ||||
| } | ||||
| template class semihosting_callback<uint32_t>; | ||||
| template class semihosting_callback<uint64_t>; | ||||
							
								
								
									
										61
									
								
								src/iss/semihosting/semihosting.h
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										61
									
								
								src/iss/semihosting/semihosting.h
									
									
									
									
									
										Normal file
									
								
							| @@ -0,0 +1,61 @@ | ||||
| #ifndef _SEMIHOSTING_H_ | ||||
| #define _SEMIHOSTING_H_ | ||||
| #include <chrono> | ||||
| #include <functional> | ||||
| #include <iss/arch_if.h> | ||||
| /* | ||||
|  * According to: | ||||
|  * "Semihosting for AArch32 and AArch64, Release 2.0" | ||||
|  * https://static.docs.arm.com/100863/0200/semihosting.pdf | ||||
|  * from ARM Ltd. | ||||
|  * | ||||
|  * The available semihosting operation numbers passed in A0 are allocated | ||||
|  * as follows: | ||||
|  * - 0x00-0x31 Used by ARM. | ||||
|  * - 0x32-0xFF Reserved for future use by ARM. | ||||
|  * - 0x100-0x1FF Reserved for user applications. These are not used by ARM. | ||||
|  *   However, if you are writing your own SVC operations, you are advised | ||||
|  *   to use a different SVC number rather than using the semihosted | ||||
|  *   SVC number and these operation type numbers. | ||||
|  * - 0x200-0xFFFFFFFF Undefined and currently unused. It is recommended | ||||
|  *   that you do not use these. | ||||
|  */ | ||||
| enum class semihosting_syscalls { | ||||
|  | ||||
|     SYS_OPEN = 0x01, | ||||
|     SYS_CLOSE = 0x02, | ||||
|     SYS_WRITEC = 0x03, | ||||
|     SYS_WRITE0 = 0x04, | ||||
|     SYS_WRITE = 0x05, | ||||
|     SYS_READ = 0x06, | ||||
|     SYS_READC = 0x07, | ||||
|     SYS_ISERROR = 0x08, | ||||
|     SYS_ISTTY = 0x09, | ||||
|     SYS_SEEK = 0x0A, | ||||
|     SYS_FLEN = 0x0C, | ||||
|     SYS_TMPNAM = 0x0D, | ||||
|     SYS_REMOVE = 0x0E, | ||||
|     SYS_RENAME = 0x0F, | ||||
|     SYS_CLOCK = 0x10, | ||||
|     SYS_TIME = 0x11, | ||||
|     SYS_SYSTEM = 0x12, | ||||
|     SYS_ERRNO = 0x13, | ||||
|     SYS_GET_CMDLINE = 0x15, | ||||
|     SYS_HEAPINFO = 0x16, | ||||
|     SYS_EXIT = 0x18, | ||||
|     SYS_EXIT_EXTENDED = 0x20, | ||||
|     SYS_ELAPSED = 0x30, | ||||
|     SYS_TICKFREQ = 0x31, | ||||
|     USER_CMD_0x100 = 0x100, | ||||
|     USER_CMD_0x1FF = 0x1FF, | ||||
| }; | ||||
|  | ||||
| template <typename T> struct semihosting_callback { | ||||
|     std::chrono::high_resolution_clock::time_point timeVar; | ||||
|     semihosting_callback() | ||||
|     : timeVar(std::chrono::high_resolution_clock::now()) {} | ||||
|     void operator()(iss::arch_if* arch_if_ptr, T* call_number, T* parameter); | ||||
| }; | ||||
|  | ||||
| template <typename T> using semihosting_cb_t = std::function<void(iss::arch_if*, T*, T*)>; | ||||
| #endif | ||||
							
								
								
									
										159
									
								
								src/main.cpp
									
									
									
									
									
								
							
							
						
						
									
										159
									
								
								src/main.cpp
									
									
									
									
									
								
							| @@ -30,20 +30,24 @@ | ||||
|  * | ||||
|  *******************************************************************************/ | ||||
|  | ||||
| #include <iostream> | ||||
| #include <vector> | ||||
| #include <array> | ||||
| #include <cstdint> | ||||
| #include <iostream> | ||||
| #include <iss/factory.h> | ||||
| #include <iss/semihosting/semihosting.h> | ||||
| #include <string> | ||||
| #include <unordered_map> | ||||
| #include <vector> | ||||
|  | ||||
| #include "iss/arch/tgc_mapper.h" | ||||
| #include <boost/lexical_cast.hpp> | ||||
| #include <boost/program_options.hpp> | ||||
| #include "iss/arch/tgc_mapper.h" | ||||
| #ifdef WITH_LLVM | ||||
| #include <iss/llvm/jit_init.h> | ||||
| #endif | ||||
| #include <iss/log_categories.h> | ||||
| #include "iss/plugin/cycle_estimate.h" | ||||
| #include "iss/plugin/instruction_count.h" | ||||
| #include <iss/log_categories.h> | ||||
| #ifndef WIN32 | ||||
| #include <iss/plugin/loader.h> | ||||
| #endif | ||||
| @@ -52,8 +56,7 @@ | ||||
| #endif | ||||
|  | ||||
| namespace po = boost::program_options; | ||||
|  | ||||
| int main(int argc, char *argv[]) { | ||||
| int main(int argc, char* argv[]) { | ||||
|     /* | ||||
|      *  Define and parse the program options | ||||
|      */ | ||||
| @@ -66,25 +69,26 @@ int main(int argc, char *argv[]) { | ||||
|         ("logfile,l", po::value<std::string>(), "Sets default log file.") | ||||
|         ("disass,d", po::value<std::string>()->implicit_value(""), "Enables disassembly") | ||||
|         ("gdb-port,g", po::value<unsigned>()->default_value(0), "enable gdb server and specify port to use") | ||||
|         ("instructions,i", po::value<uint64_t>()->default_value(std::numeric_limits<uint64_t>::max()), "max. number of instructions to simulate") | ||||
|         ("ilimit,i", po::value<uint64_t>()->default_value(std::numeric_limits<uint64_t>::max()), "max. number of instructions to simulate") | ||||
|         ("flimit", po::value<uint64_t>()->default_value(std::numeric_limits<uint64_t>::max()), "max. number of fetches to simulate") | ||||
|         ("reset,r", po::value<std::string>(), "reset address") | ||||
|         ("dump-ir", "dump the intermediate representation") | ||||
|         ("elf,f", po::value<std::vector<std::string>>(), "ELF file(s) to load") | ||||
|         ("mem,m", po::value<std::string>(), "the memory input file") | ||||
|         ("plugin,p", po::value<std::vector<std::string>>(), "plugin to activate") | ||||
|         ("backend", po::value<std::string>()->default_value("interp"), "the ISS backend to use, options are: interp, tcc") | ||||
|         ("backend", po::value<std::string>()->default_value("interp"), "the ISS backend to use, options are: interp, llvm, tcc, asmjit") | ||||
|         ("isa", po::value<std::string>()->default_value("tgc5c"), "core or isa name to use for simulation, use '?' to get list"); | ||||
|     // clang-format on | ||||
|     auto parsed = po::command_line_parser(argc, argv).options(desc).allow_unregistered().run(); | ||||
|     try { | ||||
|         po::store(parsed, clim); // can throw | ||||
|         // --help option | ||||
|         if (clim.count("help")) { | ||||
|         if(clim.count("help")) { | ||||
|             std::cout << "DBT-RISE-TGC simulator for TGC RISC-V cores" << std::endl << desc << std::endl; | ||||
|             return 0; | ||||
|         } | ||||
|         po::notify(clim); // throws on error, so do after help in case | ||||
|     } catch (po::error &e) { | ||||
|     } catch(po::error& e) { | ||||
|         // there are problems | ||||
|         std::cerr << "ERROR: " << e.what() << std::endl << std::endl; | ||||
|         std::cerr << desc << std::endl; | ||||
| @@ -97,14 +101,14 @@ int main(int argc, char *argv[]) { | ||||
|     auto l = logging::as_log_level(clim["verbose"].as<int>()); | ||||
|     LOGGER(DEFAULT)::reporting_level() = l; | ||||
|     LOGGER(connection)::reporting_level() = l; | ||||
|     if (clim.count("logfile")) { | ||||
|     if(clim.count("logfile")) { | ||||
|         // configure the connection logger | ||||
|         auto f = fopen(clim["logfile"].as<std::string>().c_str(), "w"); | ||||
|         LOG_OUTPUT(DEFAULT)::stream() = f; | ||||
|         LOG_OUTPUT(connection)::stream() = f; | ||||
|     } | ||||
|  | ||||
|     std::vector<iss::vm_plugin *> plugin_list; | ||||
|     std::vector<iss::vm_plugin*> plugin_list; | ||||
|     auto res = 0; | ||||
|     try { | ||||
| #ifdef WITH_LLVM | ||||
| @@ -112,51 +116,57 @@ int main(int argc, char *argv[]) { | ||||
|         iss::init_jit_debug(argc, argv); | ||||
| #endif | ||||
|         bool dump = clim.count("dump-ir"); | ||||
|         auto & f = iss::core_factory::instance(); | ||||
|         auto& f = iss::core_factory::instance(); | ||||
|         // instantiate the simulator | ||||
|         iss::vm_ptr vm{nullptr}; | ||||
|         iss::cpu_ptr cpu{nullptr}; | ||||
|         semihosting_callback<uint32_t> cb{}; | ||||
|         semihosting_cb_t<uint32_t> semihosting_cb = [&cb](iss::arch_if* i, uint32_t* a0, uint32_t* a1) { cb(i, a0, a1); }; | ||||
|         std::string isa_opt(clim["isa"].as<std::string>()); | ||||
|         if(isa_opt.size()==0 || isa_opt == "?") { | ||||
|         if(isa_opt.size() == 0 || isa_opt == "?") { | ||||
|             auto list = f.get_names(); | ||||
|             std::sort(std::begin(list), std::end(list)); | ||||
|             std::cout<<"Available implementations (core|platform|backend):\n  - "<<util::join(list, "\n  - ")<<std::endl; | ||||
|             std::cout << "Available implementations (core|platform|backend):\n  - " << util::join(list, "\n  - ") << std::endl; | ||||
|             return 0; | ||||
|         } else if (isa_opt.find('|') != std::string::npos) { | ||||
|             std::tie(cpu, vm) = f.create(isa_opt+"|"+clim["backend"].as<std::string>(), clim["gdb-port"].as<unsigned>()); | ||||
|         } else if(isa_opt.find('|') != std::string::npos) { | ||||
|             std::tie(cpu, vm) = | ||||
|                 f.create(isa_opt + "|" + clim["backend"].as<std::string>(), clim["gdb-port"].as<unsigned>(), &semihosting_cb); | ||||
|         } else { | ||||
|             auto base_isa = isa_opt.substr(0, 5); | ||||
|             if(base_isa=="tgc5d" || base_isa=="tgc5e") { | ||||
|                 isa_opt += "|mu_p_clic_pmp|"+clim["backend"].as<std::string>(); | ||||
|             if(base_isa == "tgc5d" || base_isa == "tgc5e") { | ||||
|                 isa_opt += "|mu_p_clic_pmp|" + clim["backend"].as<std::string>(); | ||||
|             } else { | ||||
|                 isa_opt += "|m_p|"+clim["backend"].as<std::string>(); | ||||
|                 isa_opt += "|m_p|" + clim["backend"].as<std::string>(); | ||||
|             } | ||||
|             std::tie(cpu, vm) = f.create(isa_opt, clim["gdb-port"].as<unsigned>()); | ||||
|             std::tie(cpu, vm) = f.create(isa_opt, clim["gdb-port"].as<unsigned>(), &semihosting_cb); | ||||
|         } | ||||
|         if(!cpu ){ | ||||
|             LOG(ERR) << "Could not create cpu for isa " << isa_opt << " and backend " <<clim["backend"].as<std::string>()<< std::endl; | ||||
|         if(!cpu) { | ||||
|             auto list = f.get_names(); | ||||
|             std::sort(std::begin(list), std::end(list)); | ||||
|             CPPLOG(ERR) << "Could not create cpu for isa " << isa_opt << " and backend " << clim["backend"].as<std::string>() << "\n" | ||||
|                         << "Available implementations (core|platform|backend):\n  - " << util::join(list, "\n  - ") << std::endl; | ||||
|             return 127; | ||||
|         } | ||||
|         if(!vm ){ | ||||
|             LOG(ERR) << "Could not create vm for isa " << isa_opt << " and backend " <<clim["backend"].as<std::string>()<< std::endl; | ||||
|         if(!vm) { | ||||
|             CPPLOG(ERR) << "Could not create vm for isa " << isa_opt << " and backend " << clim["backend"].as<std::string>() << std::endl; | ||||
|             return 127; | ||||
|         } | ||||
|         if (clim.count("plugin")) { | ||||
|             for (std::string const& opt_val : clim["plugin"].as<std::vector<std::string>>()) { | ||||
|                 std::string plugin_name=opt_val; | ||||
|         if(clim.count("plugin")) { | ||||
|             for(std::string const& opt_val : clim["plugin"].as<std::vector<std::string>>()) { | ||||
|                 std::string plugin_name = opt_val; | ||||
|                 std::string arg{""}; | ||||
|                 std::size_t found = opt_val.find('='); | ||||
|                 if (found != std::string::npos) { | ||||
|                 if(found != std::string::npos) { | ||||
|                     plugin_name = opt_val.substr(0, found); | ||||
|                     arg = opt_val.substr(found + 1, opt_val.size()); | ||||
|                 } | ||||
| #if defined(WITH_PLUGINS) | ||||
|                 if (plugin_name == "ic") { | ||||
|                     auto *ic_plugin = new iss::plugin::instruction_count(arg); | ||||
|                 if(plugin_name == "ic") { | ||||
|                     auto* ic_plugin = new iss::plugin::instruction_count(arg); | ||||
|                     vm->register_plugin(*ic_plugin); | ||||
|                     plugin_list.push_back(ic_plugin); | ||||
|                 } else if (plugin_name == "ce") { | ||||
|                     auto *ce_plugin = new iss::plugin::cycle_estimate(arg); | ||||
|                 } else if(plugin_name == "ce") { | ||||
|                     auto* ce_plugin = new iss::plugin::cycle_estimate(arg); | ||||
|                     vm->register_plugin(*ce_plugin); | ||||
|                     plugin_list.push_back(ce_plugin); | ||||
|                 } else | ||||
| @@ -168,54 +178,101 @@ int main(int argc, char *argv[]) { | ||||
|                         a.push_back({arg.c_str()}); | ||||
|                     iss::plugin::loader l(plugin_name, {{"initPlugin"}}); | ||||
|                     auto* plugin = l.call_function<iss::vm_plugin*>("initPlugin", a.size(), a.data()); | ||||
|                     if(plugin){ | ||||
|                     if(plugin) { | ||||
|                         vm->register_plugin(*plugin); | ||||
|                         plugin_list.push_back(plugin); | ||||
|                     } else | ||||
| #endif | ||||
|                     { | ||||
|                         LOG(ERR) << "Unknown plugin name: " << plugin_name << ", valid names are 'ce', 'ic'" << std::endl; | ||||
|                         CPPLOG(ERR) << "Unknown plugin name: " << plugin_name << ", valid names are 'ce', 'ic'" << std::endl; | ||||
|                         return 127; | ||||
|                     } | ||||
|                 } | ||||
|             } | ||||
|         } | ||||
|         if (clim.count("disass")) { | ||||
|         if(clim.count("disass")) { | ||||
|             vm->setDisassEnabled(true); | ||||
|             LOGGER(disass)::reporting_level() = logging::INFO; | ||||
|             LOGGER(disass)::print_time() = false; | ||||
|             auto file_name = clim["disass"].as<std::string>(); | ||||
|             if (file_name.length() > 0) { | ||||
|             if(file_name.length() > 0) { | ||||
|                 LOG_OUTPUT(disass)::stream() = fopen(file_name.c_str(), "w"); | ||||
|                 LOGGER(disass)::print_severity() = false; | ||||
|             } | ||||
|         } | ||||
|         uint64_t start_address = 0; | ||||
|         if (clim.count("mem")) | ||||
|         if(clim.count("mem")) | ||||
|             vm->get_arch()->load_file(clim["mem"].as<std::string>()); | ||||
|         if (clim.count("elf")) | ||||
|             for (std::string input : clim["elf"].as<std::vector<std::string>>()) { | ||||
|         if(clim.count("elf")) | ||||
|             for(std::string input : clim["elf"].as<std::vector<std::string>>()) { | ||||
|                 auto start_addr = vm->get_arch()->load_file(input); | ||||
|                 if (start_addr.second) start_address = start_addr.first; | ||||
|                 if(start_addr.second) | ||||
|                     start_address = start_addr.first; | ||||
|                 else { | ||||
|                     LOG(ERR) << "Error occured while loading file " << input << std::endl; | ||||
|                     return 1; | ||||
|                 } | ||||
|             } | ||||
|         for (std::string input : args) { | ||||
|         for(std::string input : args) { | ||||
|             auto start_addr = vm->get_arch()->load_file(input); // treat remaining arguments as elf files | ||||
|             if (start_addr.second) start_address = start_addr.first; | ||||
|             if(start_addr.second) | ||||
|                 start_address = start_addr.first; | ||||
|             else { | ||||
|                 LOG(ERR) << "Error occured while loading file " << input << std::endl; | ||||
|                 return 1; | ||||
|             } | ||||
|         } | ||||
|         if (clim.count("reset")) { | ||||
|         if(clim.count("reset")) { | ||||
|             auto str = clim["reset"].as<std::string>(); | ||||
|             start_address = str.find("0x") == 0 ? std::stoull(str.substr(2), nullptr, 16) : std::stoull(str, nullptr, 10); | ||||
|         } | ||||
|         vm->reset(start_address); | ||||
|         auto cycles = clim["instructions"].as<uint64_t>(); | ||||
|         res = vm->start(cycles, dump); | ||||
|     } catch (std::exception &e) { | ||||
|         LOG(ERR) << "Unhandled Exception reached the top of main: " << e.what() << ", application will now exit" | ||||
|                    << std::endl; | ||||
|         auto limit = clim["ilimit"].as<uint64_t>(); | ||||
|         auto cond = iss::finish_cond_e::JUMP_TO_SELF; | ||||
|         if(clim.count("flimit")) { | ||||
|             cond = cond | iss::finish_cond_e::FCOUNT_LIMIT; | ||||
|             limit = clim["flimit"].as<uint64_t>(); | ||||
|         } else { | ||||
|             cond = cond | iss::finish_cond_e::ICOUNT_LIMIT; | ||||
|         } | ||||
|         res = vm->start(limit, dump, cond); | ||||
|  | ||||
|         auto instr_if = vm->get_arch()->get_instrumentation_if(); | ||||
|         // this assumes a single input file | ||||
|         std::unordered_map<std::string, uint64_t> sym_table; | ||||
|         if(args.empty()) | ||||
|             sym_table = instr_if->get_symbol_table(clim["elf"].as<std::vector<std::string>>()[0]); | ||||
|         else | ||||
|             sym_table = instr_if->get_symbol_table(args[0]); | ||||
|         if(sym_table.find("begin_signature") != std::end(sym_table) && sym_table.find("end_signature") != std::end(sym_table)) { | ||||
|             auto start_addr = sym_table["begin_signature"]; | ||||
|             auto end_addr = sym_table["end_signature"]; | ||||
|             std::array<uint8_t, 4> data; | ||||
|             std::ofstream file; | ||||
|             std::string filename = fmt::format("{}.signature", isa_opt); | ||||
|             std::replace(std::begin(filename), std::end(filename), '|', '_'); | ||||
|             // default riscof requires this filename | ||||
|             filename = "DUT-tgc.signature"; | ||||
|             file.open(filename, std::ios::out); | ||||
|             if(!file.is_open()) { | ||||
|                 LOG(ERR) << "Error opening file " << filename << std::endl; | ||||
|                 return 1; | ||||
|             } | ||||
|             for(auto addr = start_addr; addr < end_addr; addr += data.size()) { | ||||
|                 vm->get_arch()->read(iss::address_type::PHYSICAL, iss::access_type::DEBUG_READ, 0 /*MEM*/, addr, data.size(), | ||||
|                                      data.data()); // FIXME: get space from iss::arch::traits<ARCH>::mem_type_e::MEM | ||||
|  | ||||
|                 // TODO : obey Target endianess | ||||
|                 uint32_t to_print = (data[3] << 24) + (data[2] << 16) + (data[1] << 8) + data[0]; | ||||
|                 file << std::hex << fmt::format("{:08x}", to_print) << std::dec << std::endl; | ||||
|             } | ||||
|         } | ||||
|     } catch(std::exception& e) { | ||||
|         CPPLOG(ERR) << "Unhandled Exception reached the top of main: " << e.what() << ", application will now exit" << std::endl; | ||||
|         res = 2; | ||||
|     } | ||||
|     // cleanup to let plugins report of needed | ||||
|     for (auto *p : plugin_list) { | ||||
|     // cleanup to let plugins report if needed | ||||
|     for(auto* p : plugin_list) { | ||||
|         delete p; | ||||
|     } | ||||
|     return res; | ||||
|   | ||||
| @@ -42,20 +42,22 @@ | ||||
| #include <iss/plugin/loader.h> | ||||
| #endif | ||||
| #include "sc_core_adapter_if.h" | ||||
| #include <iss/arch/tgc_mapper.h> | ||||
| #include <scc/report.h> | ||||
| #include <util/ities.h> | ||||
| #include <iostream> | ||||
| #include <sstream> | ||||
| #include <array> | ||||
| #include <numeric> | ||||
| #include <iss/plugin/cycle_estimate.h> | ||||
| #include <iss/plugin/instruction_count.h> | ||||
|  | ||||
| // clang-format on | ||||
|  | ||||
| #define STR(X) #X | ||||
| #define CREATE_CORE(CN) \ | ||||
| if (type == STR(CN)) { std::tie(cpu, vm) = create_core<CN ## _plat_type>(backend, gdb_port, hart_id); } else | ||||
| #define CREATE_CORE(CN)                                                                                                                    \ | ||||
|     if(type == STR(CN)) {                                                                                                                  \ | ||||
|         std::tie(cpu, vm) = create_core<CN##_plat_type>(backend, gdb_port, hart_id);                                                       \ | ||||
|     } else | ||||
|  | ||||
| #ifdef HAS_SCV | ||||
| #include <scv.h> | ||||
| @@ -86,23 +88,22 @@ using namespace sc_core; | ||||
| namespace { | ||||
| iss::debugger::encoder_decoder encdec; | ||||
| std::array<const char, 4> lvl = {{'U', 'S', 'H', 'M'}}; | ||||
| } | ||||
| } // namespace | ||||
|  | ||||
| int cmd_sysc(int argc, char *argv[], debugger::out_func of, debugger::data_func df, | ||||
|              debugger::target_adapter_if *tgt_adapter) { | ||||
|     if (argc > 1) { | ||||
|         if (strcasecmp(argv[1], "print_time") == 0) { | ||||
| int cmd_sysc(int argc, char* argv[], debugger::out_func of, debugger::data_func df, debugger::target_adapter_if* tgt_adapter) { | ||||
|     if(argc > 1) { | ||||
|         if(strcasecmp(argv[1], "print_time") == 0) { | ||||
|             std::string t = sc_time_stamp().to_string(); | ||||
|             of(t.c_str()); | ||||
|             std::array<char, 64> buf; | ||||
|             encdec.enc_string(t.c_str(), buf.data(), 63); | ||||
|             df(buf.data()); | ||||
|             return Ok; | ||||
|         } else if (strcasecmp(argv[1], "break") == 0) { | ||||
|         } else if(strcasecmp(argv[1], "break") == 0) { | ||||
|             sc_time t; | ||||
|             if (argc == 4) { | ||||
|             if(argc == 4) { | ||||
|                 t = scc::parse_from_string(argv[2], argv[3]); | ||||
|             } else if (argc == 3) { | ||||
|             } else if(argc == 3) { | ||||
|                 t = scc::parse_from_string(argv[2]); | ||||
|             } else | ||||
|                 return Err; | ||||
| @@ -119,17 +120,19 @@ int cmd_sysc(int argc, char *argv[], debugger::out_func of, debugger::data_func | ||||
| } | ||||
|  | ||||
| using cpu_ptr = std::unique_ptr<iss::arch_if>; | ||||
| using vm_ptr= std::unique_ptr<iss::vm_if>; | ||||
| using vm_ptr = std::unique_ptr<iss::vm_if>; | ||||
|  | ||||
| class core_wrapper { | ||||
| public: | ||||
|     core_wrapper(core_complex *owner) : owner(owner) { } | ||||
|     core_wrapper(core_complex_if* owner) | ||||
|     : owner(owner) {} | ||||
|  | ||||
|     void reset(uint64_t addr){vm->reset(addr);} | ||||
|     inline void start(){vm->start();} | ||||
|     inline std::pair<uint64_t, bool> load_file(std::string const& name){ | ||||
|     void reset(uint64_t addr) { vm->reset(addr); } | ||||
|     inline void start(bool dump = false) { vm->start(std::numeric_limits<uint64_t>::max(), dump); } | ||||
|     inline std::pair<uint64_t, bool> load_file(std::string const& name) { | ||||
|         iss::arch_if* cc = cpu->get_arch_if(); | ||||
|         return cc->load_file(name);}; | ||||
|         return cc->load_file(name); | ||||
|     }; | ||||
|  | ||||
|     std::function<unsigned(void)> get_mode; | ||||
|     std::function<uint64_t(void)> get_state; | ||||
| @@ -137,26 +140,26 @@ public: | ||||
|     std::function<void(bool)> set_interrupt_execution; | ||||
|     std::function<void(short, bool)> local_irq; | ||||
|  | ||||
|     void create_cpu(std::string const& type, std::string const& backend, unsigned gdb_port, uint32_t hart_id){ | ||||
|         auto & f = sysc::iss_factory::instance(); | ||||
|         if(type.size()==0 || type == "?") { | ||||
|             std::cout<<"Available cores: "<<util::join(f.get_names(), ", ")<<std::endl; | ||||
|     void create_cpu(std::string const& type, std::string const& backend, unsigned gdb_port, uint32_t hart_id) { | ||||
|         auto& f = sysc::iss_factory::instance(); | ||||
|         if(type.size() == 0 || type == "?") { | ||||
|             std::cout << "Available cores: " << util::join(f.get_names(), ", ") << std::endl; | ||||
|             sc_core::sc_stop(); | ||||
|         } else if (type.find('|') != std::string::npos) { | ||||
|             std::tie(cpu, vm) = f.create(type+"|"+backend); | ||||
|         } else if(type.find('|') != std::string::npos) { | ||||
|             std::tie(cpu, vm) = f.create(type + "|" + backend); | ||||
|         } else { | ||||
|             auto base_isa = type.substr(0, 5); | ||||
|             if(base_isa=="tgc5d" || base_isa=="tgc5e") { | ||||
|                 std::tie(cpu, vm) = f.create(type + "|mu_p_clic_pmp|" + backend, gdb_port); | ||||
|             if(base_isa == "tgc5d" || base_isa == "tgc5e") { | ||||
|                 std::tie(cpu, vm) = f.create(type + "|mu_p_clic_pmp|" + backend, gdb_port, owner); | ||||
|             } else { | ||||
|                 std::tie(cpu, vm) = f.create(type + "|m_p|" + backend, gdb_port, owner); | ||||
|            } | ||||
|             } | ||||
|         } | ||||
|         if(!cpu ){ | ||||
|             SCCFATAL() << "Could not create cpu for isa " << type << " and backend " <<backend; | ||||
|         if(!cpu) { | ||||
|             SCCFATAL() << "Could not create cpu for isa " << type << " and backend " << backend; | ||||
|         } | ||||
|         if(!vm ){ | ||||
|             SCCFATAL() << "Could not create vm for isa " << type << " and backend " <<backend; | ||||
|         if(!vm) { | ||||
|             SCCFATAL() << "Could not create vm for isa " << type << " and backend " << backend; | ||||
|         } | ||||
|         auto* sc_cpu_if = reinterpret_cast<sc_core_adapter_if*>(cpu.get()); | ||||
|         sc_cpu_if->set_mhartid(hart_id); | ||||
| @@ -166,63 +169,64 @@ public: | ||||
|         set_interrupt_execution = [sc_cpu_if](bool b) { return sc_cpu_if->set_interrupt_execution(b); }; | ||||
|         local_irq = [sc_cpu_if](short s, bool b) { return sc_cpu_if->local_irq(s, b); }; | ||||
|  | ||||
|         auto *srv = debugger::server<debugger::gdb_session>::get(); | ||||
|         if (srv) tgt_adapter = srv->get_target(); | ||||
|         if (tgt_adapter) | ||||
|             tgt_adapter->add_custom_command( | ||||
|                 {"sysc", [this](int argc, char *argv[], debugger::out_func of, | ||||
|                                 debugger::data_func df) -> int { return cmd_sysc(argc, argv, of, df, tgt_adapter); }, | ||||
|                  "SystemC sub-commands: break <time>, print_time"}); | ||||
|  | ||||
|         auto* srv = debugger::server<debugger::gdb_session>::get(); | ||||
|         if(srv) | ||||
|             tgt_adapter = srv->get_target(); | ||||
|         if(tgt_adapter) | ||||
|             tgt_adapter->add_custom_command({"sysc", | ||||
|                                              [this](int argc, char* argv[], debugger::out_func of, debugger::data_func df) -> int { | ||||
|                                                  return cmd_sysc(argc, argv, of, df, tgt_adapter); | ||||
|                                              }, | ||||
|                                              "SystemC sub-commands: break <time>, print_time"}); | ||||
|     } | ||||
|  | ||||
|     core_complex * const owner; | ||||
|     core_complex_if* const owner; | ||||
|     vm_ptr vm{nullptr}; | ||||
|     sc_cpu_ptr cpu{nullptr}; | ||||
|     iss::debugger::target_adapter_if *tgt_adapter{nullptr}; | ||||
|     iss::debugger::target_adapter_if* tgt_adapter{nullptr}; | ||||
| }; | ||||
|  | ||||
| struct core_trace { | ||||
|     //! transaction recording database | ||||
|     scv_tr_db *m_db{nullptr}; | ||||
|     scv_tr_db* m_db{nullptr}; | ||||
|     //! blocking transaction recording stream handle | ||||
|     scv_tr_stream *stream_handle{nullptr}; | ||||
|     scv_tr_stream* stream_handle{nullptr}; | ||||
|     //! transaction generator handle for blocking transactions | ||||
|     scv_tr_generator<_scv_tr_generator_default_data, _scv_tr_generator_default_data> *instr_tr_handle{nullptr}; | ||||
|     scv_tr_generator<_scv_tr_generator_default_data, _scv_tr_generator_default_data>* instr_tr_handle{nullptr}; | ||||
|     scv_tr_handle tr_handle; | ||||
| }; | ||||
|  | ||||
| SC_HAS_PROCESS(core_complex);// NOLINT | ||||
| #ifndef CWR_SYSTEMC | ||||
| core_complex::core_complex(sc_module_name const& name) | ||||
| template <unsigned int BUSWIDTH> | ||||
| core_complex<BUSWIDTH>::core_complex(sc_module_name const& name) | ||||
| : sc_module(name) | ||||
| , fetch_lut(tlm_dmi_ext()) | ||||
| , read_lut(tlm_dmi_ext()) | ||||
| , write_lut(tlm_dmi_ext()) | ||||
| { | ||||
| 	init(); | ||||
| , write_lut(tlm_dmi_ext()) { | ||||
|     init(); | ||||
| } | ||||
| #endif | ||||
|  | ||||
| void core_complex::init(){ | ||||
| 	trc=new core_trace(); | ||||
| template <unsigned int BUSWIDTH> void core_complex<BUSWIDTH>::init() { | ||||
|     trc = new core_trace(); | ||||
|     ibus.register_invalidate_direct_mem_ptr([=](uint64_t start, uint64_t end) -> void { | ||||
|         auto lut_entry = fetch_lut.getEntry(start); | ||||
|         if (lut_entry.get_granted_access() != tlm::tlm_dmi::DMI_ACCESS_NONE && end <= lut_entry.get_end_address() + 1) { | ||||
|         if(lut_entry.get_granted_access() != tlm::tlm_dmi::DMI_ACCESS_NONE && end <= lut_entry.get_end_address() + 1) { | ||||
|             fetch_lut.removeEntry(lut_entry); | ||||
|         } | ||||
|     }); | ||||
|     dbus.register_invalidate_direct_mem_ptr([=](uint64_t start, uint64_t end) -> void { | ||||
|         auto lut_entry = read_lut.getEntry(start); | ||||
|         if (lut_entry.get_granted_access() != tlm::tlm_dmi::DMI_ACCESS_NONE && end <= lut_entry.get_end_address() + 1) { | ||||
|         if(lut_entry.get_granted_access() != tlm::tlm_dmi::DMI_ACCESS_NONE && end <= lut_entry.get_end_address() + 1) { | ||||
|             read_lut.removeEntry(lut_entry); | ||||
|         } | ||||
|         lut_entry = write_lut.getEntry(start); | ||||
|         if (lut_entry.get_granted_access() != tlm::tlm_dmi::DMI_ACCESS_NONE && end <= lut_entry.get_end_address() + 1) { | ||||
|         if(lut_entry.get_granted_access() != tlm::tlm_dmi::DMI_ACCESS_NONE && end <= lut_entry.get_end_address() + 1) { | ||||
|             write_lut.removeEntry(lut_entry); | ||||
|         } | ||||
|     }); | ||||
|  | ||||
|     SC_HAS_PROCESS(core_complex<BUSWIDTH>); // NOLINT | ||||
|     SC_THREAD(run); | ||||
|     SC_METHOD(rst_cb); | ||||
|     sensitive << rst_i; | ||||
| @@ -233,53 +237,53 @@ void core_complex::init(){ | ||||
|     SC_METHOD(ext_irq_cb); | ||||
|     sensitive << ext_irq_i; | ||||
|     SC_METHOD(local_irq_cb); | ||||
|     for(auto pin:local_irq_i) | ||||
|     for(auto pin : local_irq_i) | ||||
|         sensitive << pin; | ||||
|     trc->m_db=scv_tr_db::get_default_db(); | ||||
|     trc->m_db = scv_tr_db::get_default_db(); | ||||
|  | ||||
| 	SC_METHOD(forward); | ||||
|     SC_METHOD(forward); | ||||
| #ifndef CWR_SYSTEMC | ||||
| 	sensitive<<clk_i; | ||||
|     sensitive << clk_i; | ||||
| #else | ||||
| 	sensitive<<curr_clk; | ||||
| 	t2t.reset(new scc::tick2time{"t2t"}); | ||||
| 	t2t->clk_i(clk_i); | ||||
| 	t2t->clk_o(curr_clk); | ||||
|     sensitive << curr_clk; | ||||
|     t2t.reset(new scc::tick2time{"t2t"}); | ||||
|     t2t->clk_i(clk_i); | ||||
|     t2t->clk_o(curr_clk); | ||||
| #endif | ||||
| } | ||||
|  | ||||
| core_complex::~core_complex(){ | ||||
| template <unsigned int BUSWIDTH> core_complex<BUSWIDTH>::~core_complex() { | ||||
|     delete cpu; | ||||
|     delete trc; | ||||
|     for (auto *p : plugin_list) | ||||
|     for(auto* p : plugin_list) | ||||
|         delete p; | ||||
| } | ||||
|  | ||||
| void core_complex::trace(sc_trace_file *trf) const {} | ||||
| template <unsigned int BUSWIDTH> void core_complex<BUSWIDTH>::trace(sc_trace_file* trf) const {} | ||||
|  | ||||
| void core_complex::before_end_of_elaboration() { | ||||
|     SCCDEBUG(SCMOD)<<"instantiating iss::arch::tgf with "<<GET_PROP_VALUE(backend)<<" backend"; | ||||
| template <unsigned int BUSWIDTH> void core_complex<BUSWIDTH>::before_end_of_elaboration() { | ||||
|     SCCDEBUG(SCMOD) << "instantiating iss::arch::tgf with " << GET_PROP_VALUE(backend) << " backend"; | ||||
|     // cpu = scc::make_unique<core_wrapper>(this); | ||||
|     cpu = new core_wrapper(this); | ||||
|     cpu->create_cpu(GET_PROP_VALUE(core_type), GET_PROP_VALUE(backend), GET_PROP_VALUE(gdb_server_port), GET_PROP_VALUE(mhartid)); | ||||
|     sc_assert(cpu->vm!=nullptr); | ||||
|     sc_assert(cpu->vm != nullptr); | ||||
|     cpu->vm->setDisassEnabled(GET_PROP_VALUE(enable_disass) || trc->m_db != nullptr); | ||||
|     if (GET_PROP_VALUE(plugins).length()) { | ||||
|     if(GET_PROP_VALUE(plugins).length()) { | ||||
|         auto p = util::split(GET_PROP_VALUE(plugins), ';'); | ||||
|         for (std::string const& opt_val : p) { | ||||
|             std::string plugin_name=opt_val; | ||||
|         for(std::string const& opt_val : p) { | ||||
|             std::string plugin_name = opt_val; | ||||
|             std::string filename{"cycles.txt"}; | ||||
|             std::size_t found = opt_val.find('='); | ||||
|             if (found != std::string::npos) { | ||||
|             if(found != std::string::npos) { | ||||
|                 plugin_name = opt_val.substr(0, found); | ||||
|                 filename = opt_val.substr(found + 1, opt_val.size()); | ||||
|             } | ||||
|             if (plugin_name == "ic") { | ||||
|                 auto *plugin = new iss::plugin::instruction_count(filename); | ||||
|             if(plugin_name == "ic") { | ||||
|                 auto* plugin = new iss::plugin::instruction_count(filename); | ||||
|                 cpu->vm->register_plugin(*plugin); | ||||
|                 plugin_list.push_back(plugin); | ||||
|             } else if (plugin_name == "ce") { | ||||
|                 auto *plugin = new iss::plugin::cycle_estimate(filename); | ||||
|             } else if(plugin_name == "ce") { | ||||
|                 auto* plugin = new iss::plugin::cycle_estimate(filename); | ||||
|                 cpu->vm->register_plugin(*plugin); | ||||
|                 plugin_list.push_back(plugin); | ||||
|             } else { | ||||
| @@ -287,7 +291,7 @@ void core_complex::before_end_of_elaboration() { | ||||
|                 std::array<char const*, 1> a{{filename.c_str()}}; | ||||
|                 iss::plugin::loader l(plugin_name, {{"initPlugin"}}); | ||||
|                 auto* plugin = l.call_function<iss::vm_plugin*>("initPlugin", a.size(), a.data()); | ||||
|                 if(plugin){ | ||||
|                 if(plugin) { | ||||
|                     cpu->vm->register_plugin(*plugin); | ||||
|                     plugin_list.push_back(plugin); | ||||
|                 } else | ||||
| @@ -296,35 +300,36 @@ void core_complex::before_end_of_elaboration() { | ||||
|             } | ||||
|         } | ||||
|     } | ||||
|  | ||||
| } | ||||
|  | ||||
| void core_complex::start_of_simulation() { | ||||
| template <unsigned int BUSWIDTH> void core_complex<BUSWIDTH>::start_of_simulation() { | ||||
|     // quantum_keeper.reset(); | ||||
|     if (GET_PROP_VALUE(elf_file).size() > 0) { | ||||
|     if(GET_PROP_VALUE(elf_file).size() > 0) { | ||||
|         istringstream is(GET_PROP_VALUE(elf_file)); | ||||
|         string s; | ||||
|         while (getline(is, s, ',')) { | ||||
|         while(getline(is, s, ',')) { | ||||
|             std::pair<uint64_t, bool> start_addr = cpu->load_file(s); | ||||
| #ifndef CWR_SYSTEMC | ||||
|             if (reset_address.is_default_value() && start_addr.second == true) | ||||
|             if(reset_address.is_default_value() && start_addr.second == true) | ||||
|                 reset_address.set_value(start_addr.first); | ||||
| #else | ||||
|             if (start_addr.second == true) | ||||
|                 reset_address=start_addr.first; | ||||
|             if(start_addr.second == true) | ||||
|                 reset_address = start_addr.first; | ||||
| #endif | ||||
|         } | ||||
|     } | ||||
|     if (trc->m_db != nullptr && trc->stream_handle == nullptr) { | ||||
|     if(trc->m_db != nullptr && trc->stream_handle == nullptr) { | ||||
|         string basename(this->name()); | ||||
|         trc->stream_handle = new scv_tr_stream((basename + ".instr").c_str(), "TRANSACTOR", trc->m_db); | ||||
|         trc->instr_tr_handle = new scv_tr_generator<>("execute", *trc->stream_handle); | ||||
|     } | ||||
| } | ||||
|  | ||||
| bool core_complex::disass_output(uint64_t pc, const std::string instr_str) { | ||||
|     if (trc->m_db == nullptr) return false; | ||||
|     if (trc->tr_handle.is_active()) trc->tr_handle.end_transaction(); | ||||
| template <unsigned int BUSWIDTH> bool core_complex<BUSWIDTH>::disass_output(uint64_t pc, const std::string instr_str) { | ||||
|     if(trc->m_db == nullptr) | ||||
|         return false; | ||||
|     if(trc->tr_handle.is_active()) | ||||
|         trc->tr_handle.end_transaction(); | ||||
|     trc->tr_handle = trc->instr_tr_handle->begin_transaction(); | ||||
|     trc->tr_handle.record_attribute("PC", pc); | ||||
|     trc->tr_handle.record_attribute("INSTR", instr_str); | ||||
| @@ -334,111 +339,122 @@ bool core_complex::disass_output(uint64_t pc, const std::string instr_str) { | ||||
|     return true; | ||||
| } | ||||
|  | ||||
| void core_complex::forward() { | ||||
| template <unsigned int BUSWIDTH> void core_complex<BUSWIDTH>::forward() { | ||||
| #ifndef CWR_SYSTEMC | ||||
| 	set_clock_period(clk_i.read()); | ||||
|     set_clock_period(clk_i.read()); | ||||
| #else | ||||
| 	set_clock_period(curr_clk.read()); | ||||
|     set_clock_period(curr_clk.read()); | ||||
|  | ||||
| #endif | ||||
| } | ||||
|  | ||||
| void core_complex::set_clock_period(sc_core::sc_time period) { | ||||
| 	curr_clk = period; | ||||
|     if (period == SC_ZERO_TIME) cpu->set_interrupt_execution(true); | ||||
| template <unsigned int BUSWIDTH> void core_complex<BUSWIDTH>::set_clock_period(sc_core::sc_time period) { | ||||
|     curr_clk = period; | ||||
|     if(period == SC_ZERO_TIME) | ||||
|         cpu->set_interrupt_execution(true); | ||||
| } | ||||
|  | ||||
| void core_complex::rst_cb() { | ||||
|     if (rst_i.read()) cpu->set_interrupt_execution(true); | ||||
| template <unsigned int BUSWIDTH> void core_complex<BUSWIDTH>::rst_cb() { | ||||
|     if(rst_i.read()) | ||||
|         cpu->set_interrupt_execution(true); | ||||
| } | ||||
|  | ||||
| void core_complex::sw_irq_cb() { cpu->local_irq(3, sw_irq_i.read()); } | ||||
| template <unsigned int BUSWIDTH> void core_complex<BUSWIDTH>::sw_irq_cb() { cpu->local_irq(3, sw_irq_i.read()); } | ||||
|  | ||||
| void core_complex::timer_irq_cb() { cpu->local_irq(7, timer_irq_i.read()); } | ||||
| template <unsigned int BUSWIDTH> void core_complex<BUSWIDTH>::timer_irq_cb() { cpu->local_irq(7, timer_irq_i.read()); } | ||||
|  | ||||
| void core_complex::ext_irq_cb() { cpu->local_irq(11, ext_irq_i.read()); } | ||||
| template <unsigned int BUSWIDTH> void core_complex<BUSWIDTH>::ext_irq_cb() { cpu->local_irq(11, ext_irq_i.read()); } | ||||
|  | ||||
| void core_complex::local_irq_cb() { | ||||
|     for(auto i=0U; i<local_irq_i.size(); ++i) { | ||||
| template <unsigned int BUSWIDTH> void core_complex<BUSWIDTH>::local_irq_cb() { | ||||
|     for(auto i = 0U; i < local_irq_i.size(); ++i) { | ||||
|         if(local_irq_i[i].event()) { | ||||
|             cpu->local_irq(16+i, local_irq_i[i].read()); | ||||
|             cpu->local_irq(16 + i, local_irq_i[i].read()); | ||||
|         } | ||||
|     } | ||||
| } | ||||
|  | ||||
| void core_complex::run() { | ||||
| template <unsigned int BUSWIDTH> void core_complex<BUSWIDTH>::run() { | ||||
|     wait(SC_ZERO_TIME); // separate from elaboration phase | ||||
|     do { | ||||
|         wait(SC_ZERO_TIME); | ||||
|         if (rst_i.read()) { | ||||
|         if(rst_i.read()) { | ||||
|             cpu->reset(GET_PROP_VALUE(reset_address)); | ||||
|             wait(rst_i.negedge_event()); | ||||
|         } | ||||
|         while (curr_clk.read() == SC_ZERO_TIME) { | ||||
|         while(curr_clk.read() == SC_ZERO_TIME) { | ||||
|             wait(curr_clk.value_changed_event()); | ||||
|         } | ||||
|         quantum_keeper.reset(); | ||||
|         cpu->set_interrupt_execution(false); | ||||
|         cpu->start(); | ||||
|     } while (cpu->get_interrupt_execution()); | ||||
|         cpu->start(dump_ir); | ||||
|     } while(cpu->get_interrupt_execution()); | ||||
|     sc_stop(); | ||||
| } | ||||
|  | ||||
| bool core_complex::read_mem(uint64_t addr, unsigned length, uint8_t *const data, bool is_fetch) { | ||||
|     auto& dmi_lut = is_fetch?fetch_lut:read_lut; | ||||
| template <unsigned int BUSWIDTH> bool core_complex<BUSWIDTH>::read_mem(uint64_t addr, unsigned length, uint8_t* const data, bool is_fetch) { | ||||
|     auto& dmi_lut = is_fetch ? fetch_lut : read_lut; | ||||
|     auto lut_entry = dmi_lut.getEntry(addr); | ||||
|     if (lut_entry.get_granted_access() != tlm::tlm_dmi::DMI_ACCESS_NONE && addr + length <= lut_entry.get_end_address() + 1) { | ||||
|     if(lut_entry.get_granted_access() != tlm::tlm_dmi::DMI_ACCESS_NONE && addr + length <= lut_entry.get_end_address() + 1) { | ||||
|         auto offset = addr - lut_entry.get_start_address(); | ||||
|         std::copy(lut_entry.get_dmi_ptr() + offset, lut_entry.get_dmi_ptr() + offset + length, data); | ||||
|         quantum_keeper.inc(lut_entry.get_read_latency()); | ||||
|         if(is_fetch) | ||||
|             ibus_inc += lut_entry.get_read_latency() / curr_clk; | ||||
|         else | ||||
|             dbus_inc += lut_entry.get_read_latency() / curr_clk; | ||||
|         return true; | ||||
|     } else { | ||||
|         auto& sckt = is_fetch? ibus : dbus; | ||||
|         auto& sckt = is_fetch ? ibus : dbus; | ||||
|         tlm::tlm_generic_payload gp; | ||||
|         gp.set_command(tlm::TLM_READ_COMMAND); | ||||
|         gp.set_address(addr); | ||||
|         gp.set_data_ptr(data); | ||||
|         gp.set_data_length(length); | ||||
|         gp.set_streaming_width(length); | ||||
|         sc_time delay=quantum_keeper.get_local_time(); | ||||
|         if (trc->m_db != nullptr && trc->tr_handle.is_valid()) { | ||||
|             if (is_fetch && trc->tr_handle.is_active()) { | ||||
|         sc_time delay = quantum_keeper.get_local_time(); | ||||
|         if(trc->m_db != nullptr && trc->tr_handle.is_valid()) { | ||||
|             if(is_fetch && trc->tr_handle.is_active()) { | ||||
|                 trc->tr_handle.end_transaction(); | ||||
|             } | ||||
|             auto preExt = new tlm::scc::scv::tlm_recording_extension(trc->tr_handle, this); | ||||
|             gp.set_extension(preExt); | ||||
|         } | ||||
|         sckt->b_transport(gp, delay); | ||||
|         auto incr = delay-quantum_keeper.get_local_time(); | ||||
|         if(is_fetch) | ||||
|             ibus_inc+=incr; | ||||
|         else | ||||
|             dbus_inc+=incr; | ||||
|         SCCTRACE(this->name()) << "[local time: "<<delay<<"]: finish read_mem(0x" << std::hex << addr << ") : 0x" << (length==4?*(uint32_t*)data:length==2?*(uint16_t*)data:(unsigned)*data); | ||||
|         if (gp.get_response_status() != tlm::TLM_OK_RESPONSE) { | ||||
|         auto pre_delay = delay; | ||||
|         dbus->b_transport(gp, delay); | ||||
|         if(pre_delay > delay) { | ||||
|             quantum_keeper.reset(); | ||||
|         } else { | ||||
|             auto incr = (delay - quantum_keeper.get_local_time()) / curr_clk; | ||||
|             if(is_fetch) | ||||
|                 ibus_inc += incr; | ||||
|             else | ||||
|                 dbus_inc += incr; | ||||
|         } | ||||
|         SCCTRACE(this->name()) << "[local time: " << delay << "]: finish read_mem(0x" << std::hex << addr << ") : 0x" | ||||
|                                << (length == 4   ? *(uint32_t*)data | ||||
|                                    : length == 2 ? *(uint16_t*)data | ||||
|                                                  : (unsigned)*data); | ||||
|         if(gp.get_response_status() != tlm::TLM_OK_RESPONSE) { | ||||
|             return false; | ||||
|         } | ||||
|         if (gp.is_dmi_allowed()) { | ||||
|         if(gp.is_dmi_allowed() && !GET_PROP_VALUE(disable_dmi)) { | ||||
|             gp.set_command(tlm::TLM_READ_COMMAND); | ||||
|             gp.set_address(addr); | ||||
|             tlm_dmi_ext dmi_data; | ||||
|             if (sckt->get_direct_mem_ptr(gp, dmi_data)) { | ||||
|                 if (dmi_data.is_read_allowed()) | ||||
|                     dmi_lut.addEntry(dmi_data, dmi_data.get_start_address(), | ||||
|                                       dmi_data.get_end_address() - dmi_data.get_start_address() + 1); | ||||
|             if(sckt->get_direct_mem_ptr(gp, dmi_data)) { | ||||
|                 if(dmi_data.is_read_allowed()) | ||||
|                     dmi_lut.addEntry(dmi_data, dmi_data.get_start_address(), dmi_data.get_end_address() - dmi_data.get_start_address() + 1); | ||||
|             } | ||||
|         } | ||||
|         return true; | ||||
|     } | ||||
| } | ||||
|  | ||||
| bool core_complex::write_mem(uint64_t addr, unsigned length, const uint8_t *const data) { | ||||
| template <unsigned int BUSWIDTH> bool core_complex<BUSWIDTH>::write_mem(uint64_t addr, unsigned length, const uint8_t* const data) { | ||||
|     auto lut_entry = write_lut.getEntry(addr); | ||||
|     if (lut_entry.get_granted_access() != tlm::tlm_dmi::DMI_ACCESS_NONE && | ||||
|         addr + length <= lut_entry.get_end_address() + 1) { | ||||
|     if(lut_entry.get_granted_access() != tlm::tlm_dmi::DMI_ACCESS_NONE && addr + length <= lut_entry.get_end_address() + 1) { | ||||
|         auto offset = addr - lut_entry.get_start_address(); | ||||
|         std::copy(data, data + length, lut_entry.get_dmi_ptr() + offset); | ||||
|         quantum_keeper.inc(lut_entry.get_read_latency()); | ||||
|         dbus_inc += lut_entry.get_write_latency() / curr_clk; | ||||
|         return true; | ||||
|     } else { | ||||
|         write_buf.resize(length); | ||||
| @@ -449,23 +465,30 @@ bool core_complex::write_mem(uint64_t addr, unsigned length, const uint8_t *cons | ||||
|         gp.set_data_ptr(write_buf.data()); | ||||
|         gp.set_data_length(length); | ||||
|         gp.set_streaming_width(length); | ||||
|         sc_time delay=quantum_keeper.get_local_time(); | ||||
|         if (trc->m_db != nullptr && trc->tr_handle.is_valid()) { | ||||
|         sc_time delay = quantum_keeper.get_local_time(); | ||||
|         if(trc->m_db != nullptr && trc->tr_handle.is_valid()) { | ||||
|             auto preExt = new tlm::scc::scv::tlm_recording_extension(trc->tr_handle, this); | ||||
|             gp.set_extension(preExt); | ||||
|         } | ||||
|         auto pre_delay = delay; | ||||
|         dbus->b_transport(gp, delay); | ||||
|         dbus_inc+=delay-quantum_keeper.get_local_time(); | ||||
|         SCCTRACE() << "[local time: "<<delay<<"]: finish write_mem(0x" << std::hex << addr << ") : 0x" << (length==4?*(uint32_t*)data:length==2?*(uint16_t*)data:(unsigned)*data); | ||||
|         if (gp.get_response_status() != tlm::TLM_OK_RESPONSE) { | ||||
|         if(pre_delay > delay) | ||||
|             quantum_keeper.reset(); | ||||
|         else | ||||
|             dbus_inc += (delay - quantum_keeper.get_local_time()) / curr_clk; | ||||
|         SCCTRACE() << "[local time: " << delay << "]: finish write_mem(0x" << std::hex << addr << ") : 0x" | ||||
|                    << (length == 4   ? *(uint32_t*)data | ||||
|                        : length == 2 ? *(uint16_t*)data | ||||
|                                      : (unsigned)*data); | ||||
|         if(gp.get_response_status() != tlm::TLM_OK_RESPONSE) { | ||||
|             return false; | ||||
|         } | ||||
|         if (gp.is_dmi_allowed()) { | ||||
|         if(gp.is_dmi_allowed() && !GET_PROP_VALUE(disable_dmi)) { | ||||
|             gp.set_command(tlm::TLM_READ_COMMAND); | ||||
|             gp.set_address(addr); | ||||
|             tlm_dmi_ext dmi_data; | ||||
|             if (dbus->get_direct_mem_ptr(gp, dmi_data)) { | ||||
|                 if (dmi_data.is_write_allowed()) | ||||
|             if(dbus->get_direct_mem_ptr(gp, dmi_data)) { | ||||
|                 if(dmi_data.is_write_allowed()) | ||||
|                     write_lut.addEntry(dmi_data, dmi_data.get_start_address(), | ||||
|                                        dmi_data.get_end_address() - dmi_data.get_start_address() + 1); | ||||
|             } | ||||
| @@ -474,7 +497,7 @@ bool core_complex::write_mem(uint64_t addr, unsigned length, const uint8_t *cons | ||||
|     } | ||||
| } | ||||
|  | ||||
| bool core_complex::read_mem_dbg(uint64_t addr, unsigned length, uint8_t *const data) { | ||||
| template <unsigned int BUSWIDTH> bool core_complex<BUSWIDTH>::read_mem_dbg(uint64_t addr, unsigned length, uint8_t* const data) { | ||||
|     tlm::tlm_generic_payload gp; | ||||
|     gp.set_command(tlm::TLM_READ_COMMAND); | ||||
|     gp.set_address(addr); | ||||
| @@ -484,7 +507,7 @@ bool core_complex::read_mem_dbg(uint64_t addr, unsigned length, uint8_t *const d | ||||
|     return dbus->transport_dbg(gp) == length; | ||||
| } | ||||
|  | ||||
| bool core_complex::write_mem_dbg(uint64_t addr, unsigned length, const uint8_t *const data) { | ||||
| template <unsigned int BUSWIDTH> bool core_complex<BUSWIDTH>::write_mem_dbg(uint64_t addr, unsigned length, const uint8_t* const data) { | ||||
|     write_buf.resize(length); | ||||
|     std::copy(data, data + length, write_buf.begin()); // need to copy as TLM does not guarantee data integrity | ||||
|     tlm::tlm_generic_payload gp; | ||||
| @@ -495,5 +518,10 @@ bool core_complex::write_mem_dbg(uint64_t addr, unsigned length, const uint8_t * | ||||
|     gp.set_streaming_width(length); | ||||
|     return dbus->transport_dbg(gp) == length; | ||||
| } | ||||
|  | ||||
| template class core_complex<scc::LT>; | ||||
| template class core_complex<32>; | ||||
| template class core_complex<64>; | ||||
|  | ||||
| } /* namespace tgfs */ | ||||
| } /* namespace sysc */ | ||||
|   | ||||
| @@ -33,47 +33,69 @@ | ||||
| #ifndef _SYSC_CORE_COMPLEX_H_ | ||||
| #define _SYSC_CORE_COMPLEX_H_ | ||||
|  | ||||
| #include <tlm/scc/initiator_mixin.h> | ||||
| #include <scc/traceable.h> | ||||
| #include <scc/signal_opt_ports.h> | ||||
| #include <scc/tick2time.h> | ||||
| #include <scc/traceable.h> | ||||
| #include <scc/utilities.h> | ||||
| #include <tlm/scc/initiator_mixin.h> | ||||
| #include <tlm/scc/scv/tlm_rec_initiator_socket.h> | ||||
| #ifdef CWR_SYSTEMC | ||||
| #include <scmlinc/scml_property.h> | ||||
| #define SOCKET_WIDTH 32 | ||||
| #else | ||||
| #include <cci_configuration> | ||||
| #define SOCKET_WIDTH scc::LT | ||||
| #endif | ||||
| #include <memory> | ||||
| #include <tlm> | ||||
| #include <tlm_utils/tlm_quantumkeeper.h> | ||||
| #include <util/range_lut.h> | ||||
| #include <memory> | ||||
|  | ||||
| namespace iss { | ||||
|     class vm_plugin; | ||||
| class vm_plugin; | ||||
| } | ||||
| namespace sysc { | ||||
|  | ||||
| class tlm_dmi_ext : public tlm::tlm_dmi { | ||||
| public: | ||||
|     bool operator==(const tlm_dmi_ext &o) const { | ||||
|         return this->get_granted_access() == o.get_granted_access() && | ||||
|                this->get_start_address() == o.get_start_address() && this->get_end_address() == o.get_end_address(); | ||||
|     bool operator==(const tlm_dmi_ext& o) const { | ||||
|         return this->get_granted_access() == o.get_granted_access() && this->get_start_address() == o.get_start_address() && | ||||
|                this->get_end_address() == o.get_end_address(); | ||||
|     } | ||||
|  | ||||
|     bool operator!=(const tlm_dmi_ext &o) const { return !operator==(o); } | ||||
|     bool operator!=(const tlm_dmi_ext& o) const { return !operator==(o); } | ||||
| }; | ||||
|  | ||||
| namespace tgfs { | ||||
| class core_wrapper; | ||||
| struct core_trace; | ||||
| struct core_complex_if { | ||||
|  | ||||
| class core_complex : public sc_core::sc_module, public scc::traceable { | ||||
|     virtual ~core_complex_if() = default; | ||||
|  | ||||
|     virtual bool read_mem(uint64_t addr, unsigned length, uint8_t* const data, bool is_fetch) = 0; | ||||
|  | ||||
|     virtual bool write_mem(uint64_t addr, unsigned length, const uint8_t* const data) = 0; | ||||
|  | ||||
|     virtual bool read_mem_dbg(uint64_t addr, unsigned length, uint8_t* const data) = 0; | ||||
|  | ||||
|     virtual bool write_mem_dbg(uint64_t addr, unsigned length, const uint8_t* const data) = 0; | ||||
|  | ||||
|     virtual bool disass_output(uint64_t pc, const std::string instr) = 0; | ||||
|  | ||||
|     virtual unsigned get_last_bus_cycles() = 0; | ||||
|  | ||||
|     //! Allow quantum keeper handling | ||||
|     virtual void sync(uint64_t) = 0; | ||||
|  | ||||
|     virtual char const* hier_name() = 0; | ||||
|  | ||||
|     scc::sc_in_opt<uint64_t> mtime_i{"mtime_i"}; | ||||
| }; | ||||
|  | ||||
| template <unsigned int BUSWIDTH = scc::LT> class core_complex : public sc_core::sc_module, public scc::traceable, public core_complex_if { | ||||
| public: | ||||
|     tlm::scc::initiator_mixin<tlm::tlm_initiator_socket<SOCKET_WIDTH>> ibus{"ibus"}; | ||||
|     tlm::scc::initiator_mixin<tlm::tlm_initiator_socket<BUSWIDTH>> ibus{"ibus"}; | ||||
|  | ||||
|     tlm::scc::initiator_mixin<tlm::tlm_initiator_socket<SOCKET_WIDTH>> dbus{"dbus"}; | ||||
|     tlm::scc::initiator_mixin<tlm::tlm_initiator_socket<BUSWIDTH>> dbus{"dbus"}; | ||||
|  | ||||
|     sc_core::sc_in<bool> rst_i{"rst_i"}; | ||||
|  | ||||
| @@ -86,14 +108,14 @@ public: | ||||
|     sc_core::sc_vector<sc_core::sc_in<bool>> local_irq_i{"local_irq_i", 16}; | ||||
|  | ||||
| #ifndef CWR_SYSTEMC | ||||
| 	sc_core::sc_in<sc_core::sc_time> clk_i{"clk_i"}; | ||||
|  | ||||
|     sc_core::sc_port<tlm::tlm_peek_if<uint64_t>, 1, sc_core::SC_ZERO_OR_MORE_BOUND> mtime_o{"mtime_o"}; | ||||
|     sc_core::sc_in<sc_core::sc_time> clk_i{"clk_i"}; | ||||
|  | ||||
|     cci::cci_param<std::string> elf_file{"elf_file", ""}; | ||||
|  | ||||
|     cci::cci_param<bool> enable_disass{"enable_disass", false}; | ||||
|  | ||||
|     cci::cci_param<bool> disable_dmi{"disable_dmi", false}; | ||||
|  | ||||
|     cci::cci_param<uint64_t> reset_address{"reset_address", 0ULL}; | ||||
|  | ||||
|     cci::cci_param<std::string> core_type{"core_type", "tgc5c"}; | ||||
| @@ -111,14 +133,14 @@ public: | ||||
|     core_complex(sc_core::sc_module_name const& name); | ||||
|  | ||||
| #else | ||||
| 	sc_core::sc_in<bool> clk_i{"clk_i"}; | ||||
|     sc_core::sc_in<bool> clk_i{"clk_i"}; | ||||
|  | ||||
| 	sc_core::sc_in<uint64_t> mtime_i{"mtime_i"}; | ||||
|  | ||||
| 	scml_property<std::string> elf_file{"elf_file", ""}; | ||||
|     scml_property<std::string> elf_file{"elf_file", ""}; | ||||
|  | ||||
|     scml_property<bool> enable_disass{"enable_disass", false}; | ||||
|  | ||||
|     scml_property<bool> disable_dmi{"disable_dmi", false}; | ||||
|  | ||||
|     scml_property<unsigned long long> reset_address{"reset_address", 0ULL}; | ||||
|  | ||||
|     scml_property<std::string> core_type{"core_type", "tgc5c"}; | ||||
| @@ -147,45 +169,50 @@ public: | ||||
|     , plugins{"plugins", ""} | ||||
|     , fetch_lut(tlm_dmi_ext()) | ||||
|     , read_lut(tlm_dmi_ext()) | ||||
|     , write_lut(tlm_dmi_ext()) | ||||
|     { | ||||
|     	init(); | ||||
|     , write_lut(tlm_dmi_ext()) { | ||||
|         init(); | ||||
|     } | ||||
|  | ||||
| #endif | ||||
|  | ||||
|     ~core_complex(); | ||||
|  | ||||
|     inline void sync(uint64_t cycle) { | ||||
|     unsigned get_last_bus_cycles() override { | ||||
|         auto mem_incr = std::max(ibus_inc, dbus_inc); | ||||
|         ibus_inc = dbus_inc = 0; | ||||
|         return mem_incr > 1 ? mem_incr : 1; | ||||
|     } | ||||
|  | ||||
|     void sync(uint64_t cycle) override { | ||||
|         auto core_inc = curr_clk * (cycle - last_sync_cycle); | ||||
|         auto incr = std::max(core_inc, std::max(ibus_inc, dbus_inc)); | ||||
|         quantum_keeper.inc(incr); | ||||
|         if (quantum_keeper.need_sync()) { | ||||
|         quantum_keeper.inc(core_inc); | ||||
|         if(quantum_keeper.need_sync()) { | ||||
|             wait(quantum_keeper.get_local_time()); | ||||
|             quantum_keeper.reset(); | ||||
|         } | ||||
|         last_sync_cycle = cycle; | ||||
|         ibus_inc = sc_core::SC_ZERO_TIME; | ||||
|         dbus_inc = sc_core::SC_ZERO_TIME; | ||||
|     } | ||||
|  | ||||
|     bool read_mem(uint64_t addr, unsigned length, uint8_t *const data, bool is_fetch); | ||||
|     bool read_mem(uint64_t addr, unsigned length, uint8_t* const data, bool is_fetch) override; | ||||
|  | ||||
|     bool write_mem(uint64_t addr, unsigned length, const uint8_t *const data); | ||||
|     bool write_mem(uint64_t addr, unsigned length, const uint8_t* const data) override; | ||||
|  | ||||
|     bool read_mem_dbg(uint64_t addr, unsigned length, uint8_t *const data); | ||||
|     bool read_mem_dbg(uint64_t addr, unsigned length, uint8_t* const data) override; | ||||
|  | ||||
|     bool write_mem_dbg(uint64_t addr, unsigned length, const uint8_t *const data); | ||||
|     bool write_mem_dbg(uint64_t addr, unsigned length, const uint8_t* const data) override; | ||||
|  | ||||
|     void trace(sc_core::sc_trace_file *trf) const override; | ||||
|     void trace(sc_core::sc_trace_file* trf) const override; | ||||
|  | ||||
|     bool disass_output(uint64_t pc, const std::string instr); | ||||
|     bool disass_output(uint64_t pc, const std::string instr) override; | ||||
|  | ||||
|     void set_clock_period(sc_core::sc_time period); | ||||
|  | ||||
|     char const* hier_name() override { return name(); } | ||||
|  | ||||
| protected: | ||||
|     void before_end_of_elaboration() override; | ||||
|     void start_of_simulation() override; | ||||
| 	void forward(); | ||||
|     void forward(); | ||||
|     void run(); | ||||
|     void rst_cb(); | ||||
|     void sw_irq_cb(); | ||||
| @@ -198,13 +225,13 @@ protected: | ||||
|     std::vector<uint8_t> write_buf; | ||||
|     core_wrapper* cpu{nullptr}; | ||||
|     sc_core::sc_signal<sc_core::sc_time> curr_clk; | ||||
|     sc_core::sc_time ibus_inc, dbus_inc; | ||||
|     uint64_t ibus_inc{0}, dbus_inc{0}; | ||||
|     core_trace* trc{nullptr}; | ||||
|     std::unique_ptr<scc::tick2time> t2t; | ||||
|  | ||||
| private: | ||||
|     void init(); | ||||
|     std::vector<iss::vm_plugin *> plugin_list; | ||||
|  | ||||
|     std::vector<iss::vm_plugin*> plugin_list; | ||||
| }; | ||||
| } /* namespace tgfs */ | ||||
| } /* namespace sysc */ | ||||
|   | ||||
| @@ -33,56 +33,58 @@ | ||||
| #ifndef _ISS_FACTORY_H_ | ||||
| #define _ISS_FACTORY_H_ | ||||
|  | ||||
| #include <iss/iss.h> | ||||
| #include "sc_core_adapter_if.h" | ||||
| #include <memory> | ||||
| #include <unordered_map> | ||||
| #include <functional> | ||||
| #include <string> | ||||
| #include <algorithm> | ||||
| #include <functional> | ||||
| #include <iss/iss.h> | ||||
| #include <memory> | ||||
| #include <string> | ||||
| #include <unordered_map> | ||||
| #include <vector> | ||||
|  | ||||
| namespace sysc { | ||||
|  | ||||
| using sc_cpu_ptr = std::unique_ptr<sc_core_adapter_if>; | ||||
| using vm_ptr= std::unique_ptr<iss::vm_if>; | ||||
| using vm_ptr = std::unique_ptr<iss::vm_if>; | ||||
|  | ||||
| class iss_factory { | ||||
| public: | ||||
|     using base_t = std::tuple<sc_cpu_ptr, vm_ptr>; | ||||
|     using create_fn = std::function<base_t(unsigned, void*) >; | ||||
|     using registry_t = std::unordered_map<std::string, create_fn> ; | ||||
|     using create_fn = std::function<base_t(unsigned, void*)>; | ||||
|     using registry_t = std::unordered_map<std::string, create_fn>; | ||||
|  | ||||
|     iss_factory() = default; | ||||
|     iss_factory(const iss_factory &) = delete; | ||||
|     iss_factory & operator=(const iss_factory &) = delete; | ||||
|     iss_factory(const iss_factory&) = delete; | ||||
|     iss_factory& operator=(const iss_factory&) = delete; | ||||
|  | ||||
|     static iss_factory & instance() { static iss_factory bf; return bf; } | ||||
|     static iss_factory& instance() { | ||||
|         static iss_factory bf; | ||||
|         return bf; | ||||
|     } | ||||
|  | ||||
|     bool register_creator(const std::string & className, create_fn const& fn) { | ||||
|     bool register_creator(const std::string& className, create_fn const& fn) { | ||||
|         registry[className] = fn; | ||||
|         return true; | ||||
|     } | ||||
|  | ||||
|     base_t create(std::string const& className, unsigned gdb_port=0, void* init_data=nullptr) const { | ||||
|     base_t create(std::string const& className, unsigned gdb_port = 0, void* init_data = nullptr) const { | ||||
|         registry_t::const_iterator regEntry = registry.find(className); | ||||
|         if (regEntry != registry.end()) | ||||
|         if(regEntry != registry.end()) | ||||
|             return regEntry->second(gdb_port, init_data); | ||||
|         return {nullptr, nullptr}; | ||||
|     } | ||||
|  | ||||
|     std::vector<std::string> get_names() { | ||||
|         std::vector<std::string> keys{registry.size()}; | ||||
|         std::transform(std::begin(registry), std::end(registry), std::begin(keys), [](std::pair<std::string, create_fn> const& p){ | ||||
|             return p.first; | ||||
|         }); | ||||
|         std::transform(std::begin(registry), std::end(registry), std::begin(keys), | ||||
|                        [](std::pair<std::string, create_fn> const& p) { return p.first; }); | ||||
|         return keys; | ||||
|     } | ||||
|  | ||||
| private: | ||||
|     registry_t registry; | ||||
|  | ||||
| }; | ||||
|  | ||||
| } | ||||
| } // namespace sysc | ||||
|  | ||||
| #endif /* _ISS_FACTORY_H_ */ | ||||
|   | ||||
| @@ -30,6 +30,7 @@ | ||||
|  * | ||||
|  *******************************************************************************/ | ||||
|  | ||||
| // clang-format off | ||||
| #include "iss_factory.h" | ||||
| #include <iss/arch/tgc5c.h> | ||||
| #include <iss/arch/riscv_hart_m_p.h> | ||||
| @@ -37,38 +38,73 @@ | ||||
| #include "sc_core_adapter.h" | ||||
| #include "core_complex.h" | ||||
| #include <array> | ||||
| // clang-format on | ||||
|  | ||||
| namespace iss { | ||||
| namespace interp { | ||||
| using namespace sysc; | ||||
| volatile std::array<bool, 2> tgc_init = { | ||||
|         iss_factory::instance().register_creator("tgc5c|m_p|interp", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||
|             auto cc = reinterpret_cast<sysc::tgfs::core_complex*>(data); | ||||
|             auto* cpu = new sc_core_adapter<arch::riscv_hart_m_p<arch::tgc5c>>(cc); | ||||
|             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::tgc5c*>(cpu), gdb_port)}}; | ||||
|         }), | ||||
|         iss_factory::instance().register_creator("tgc5c|mu_p|interp", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||
|             auto cc = reinterpret_cast<sysc::tgfs::core_complex*>(data); | ||||
|             auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::tgc5c>>(cc); | ||||
|             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::tgc5c*>(cpu), gdb_port)}}; | ||||
|         }) | ||||
| }; | ||||
| } | ||||
|     iss_factory::instance().register_creator("tgc5c|m_p|interp", | ||||
|                                              [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||
|                                                  auto cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||
|                                                  auto* cpu = new sc_core_adapter<arch::riscv_hart_m_p<arch::tgc5c>>(cc); | ||||
|                                                  return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::tgc5c*>(cpu), gdb_port)}}; | ||||
|                                              }), | ||||
|     iss_factory::instance().register_creator("tgc5c|mu_p|interp", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||
|         auto cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||
|         auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::tgc5c>>(cc); | ||||
|         return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::tgc5c*>(cpu), gdb_port)}}; | ||||
|     })}; | ||||
| } // namespace interp | ||||
| #if defined(WITH_LLVM) | ||||
| namespace llvm { | ||||
| using namespace sysc; | ||||
| volatile std::array<bool, 2> tgc_init = { | ||||
|     iss_factory::instance().register_creator("tgc5c|m_p|llvm", | ||||
|                                              [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||
|                                                  auto cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||
|                                                  auto* cpu = new sc_core_adapter<arch::riscv_hart_m_p<arch::tgc5c>>(cc); | ||||
|                                                  return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::tgc5c*>(cpu), gdb_port)}}; | ||||
|                                              }), | ||||
|     iss_factory::instance().register_creator("tgc5c|mu_p|llvm", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||
|         auto cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||
|         auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::tgc5c>>(cc); | ||||
|         return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::tgc5c*>(cpu), gdb_port)}}; | ||||
|     })}; | ||||
| } // namespace llvm | ||||
| #endif | ||||
| #if defined(WITH_TCC) | ||||
| namespace tcc { | ||||
| using namespace sysc; | ||||
| volatile std::array<bool, 2> tgc_init = { | ||||
|         iss_factory::instance().register_creator("tgc5c|m_p|tcc", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||
|             auto cc = reinterpret_cast<sysc::tgfs::core_complex*>(data); | ||||
|             auto* cpu = new sc_core_adapter<arch::riscv_hart_m_p<arch::tgc5c>>(cc); | ||||
|             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::tgc5c*>(cpu), gdb_port)}}; | ||||
|         }), | ||||
|         iss_factory::instance().register_creator("tgc5c|mu_p|tcc", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||
|             auto cc = reinterpret_cast<sysc::tgfs::core_complex*>(data); | ||||
|             auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::tgc5c>>(cc); | ||||
|             return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::tgc5c*>(cpu), gdb_port)}}; | ||||
|         }) | ||||
| }; | ||||
| } | ||||
|     iss_factory::instance().register_creator("tgc5c|m_p|tcc", | ||||
|                                              [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||
|                                                  auto cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||
|                                                  auto* cpu = new sc_core_adapter<arch::riscv_hart_m_p<arch::tgc5c>>(cc); | ||||
|                                                  return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::tgc5c*>(cpu), gdb_port)}}; | ||||
|                                              }), | ||||
|     iss_factory::instance().register_creator("tgc5c|mu_p|tcc", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||
|         auto cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||
|         auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::tgc5c>>(cc); | ||||
|         return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::tgc5c*>(cpu), gdb_port)}}; | ||||
|     })}; | ||||
| } // namespace tcc | ||||
| #endif | ||||
| } | ||||
| #if defined(WITH_ASMJIT) | ||||
| namespace asmjit { | ||||
| using namespace sysc; | ||||
| volatile std::array<bool, 2> tgc_init = { | ||||
|     iss_factory::instance().register_creator("tgc5c|m_p|asmjit", | ||||
|                                              [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||
|                                                  auto cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||
|                                                  auto* cpu = new sc_core_adapter<arch::riscv_hart_m_p<arch::tgc5c>>(cc); | ||||
|                                                  return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::tgc5c*>(cpu), gdb_port)}}; | ||||
|                                              }), | ||||
|     iss_factory::instance().register_creator("tgc5c|mu_p|asmjit", [](unsigned gdb_port, void* data) -> iss_factory::base_t { | ||||
|         auto cc = reinterpret_cast<sysc::tgfs::core_complex_if*>(data); | ||||
|         auto* cpu = new sc_core_adapter<arch::riscv_hart_mu_p<arch::tgc5c>>(cc); | ||||
|         return {sysc::sc_cpu_ptr{cpu}, vm_ptr{create(static_cast<arch::tgc5c*>(cpu), gdb_port)}}; | ||||
|     })}; | ||||
| } // namespace asmjit | ||||
| #endif | ||||
| } // namespace iss | ||||
|   | ||||
| @@ -8,109 +8,127 @@ | ||||
| #ifndef _SYSC_SC_CORE_ADAPTER_H_ | ||||
| #define _SYSC_SC_CORE_ADAPTER_H_ | ||||
|  | ||||
|  | ||||
| #include <scc/report.h> | ||||
| #include <util/ities.h> | ||||
| #include "sc_core_adapter_if.h" | ||||
| #include <iostream> | ||||
| #include <iss/iss.h> | ||||
| #include <iss/vm_types.h> | ||||
| #include <iostream> | ||||
| #include <scc/report.h> | ||||
| #include <util/ities.h> | ||||
|  | ||||
| namespace sysc { | ||||
| template<typename PLAT> | ||||
| class sc_core_adapter : public PLAT, public sc_core_adapter_if { | ||||
| template <typename PLAT> class sc_core_adapter : public PLAT, public sc_core_adapter_if { | ||||
| public: | ||||
|     using reg_t       = typename iss::arch::traits<typename PLAT::core>::reg_t; | ||||
|     using reg_t = typename iss::arch::traits<typename PLAT::core>::reg_t; | ||||
|     using phys_addr_t = typename iss::arch::traits<typename PLAT::core>::phys_addr_t; | ||||
|     using heart_state_t = typename PLAT::hart_state_type; | ||||
|     sc_core_adapter(sysc::tgfs::core_complex *owner) | ||||
|     : owner(owner) { } | ||||
|     sc_core_adapter(sysc::tgfs::core_complex_if* owner) | ||||
|     : owner(owner) {} | ||||
|  | ||||
|     iss::arch_if* get_arch_if() override { return this;} | ||||
|     iss::arch_if* get_arch_if() override { return this; } | ||||
|  | ||||
|     void set_mhartid(unsigned id) override { PLAT::set_mhartid(id); } | ||||
|  | ||||
|     uint32_t get_mode() override { return this->reg.PRIV; } | ||||
|  | ||||
|     void set_interrupt_execution(bool v) override { this->interrupt_sim = v?1:0; } | ||||
|     void set_interrupt_execution(bool v) override { this->interrupt_sim = v ? 1 : 0; } | ||||
|  | ||||
|     bool get_interrupt_execution() override { return this->interrupt_sim; } | ||||
|  | ||||
|     uint64_t get_state() override { return this->state.mstatus.backing.val; } | ||||
|  | ||||
|     void notify_phase(iss::arch_if::exec_phase p) override { | ||||
|         if (p == iss::arch_if::ISTART) | ||||
|         if(p == iss::arch_if::ISTART && !first) { | ||||
|             auto cycle_incr = owner->get_last_bus_cycles(); | ||||
|             if(cycle_incr > 1) | ||||
|                 this->instr_if.update_last_instr_cycles(cycle_incr); | ||||
|             owner->sync(this->instr_if.get_total_cycles()); | ||||
|         } | ||||
|         first = false; | ||||
|     } | ||||
|  | ||||
|     iss::sync_type needed_sync() const override { return iss::PRE_SYNC; } | ||||
|  | ||||
|     void disass_output(uint64_t pc, const std::string instr) override { | ||||
|         static constexpr std::array<const char, 4> lvl = {{'U', 'S', 'H', 'M'}}; | ||||
|         if (!owner->disass_output(pc, instr)) { | ||||
|         if(!owner->disass_output(pc, instr)) { | ||||
|             std::stringstream s; | ||||
|             s << "[p:" << lvl[this->reg.PRIV] << ";s:0x" << std::hex << std::setfill('0') | ||||
|               << std::setw(sizeof(reg_t) * 2) << (reg_t)this->state.mstatus << std::dec << ";c:" | ||||
|               << this->reg.icount + this->cycle_offset << "]"; | ||||
|             SCCDEBUG(owner->name())<<"disass: " | ||||
|                 << "0x" << std::setw(16) << std::right << std::setfill('0') << std::hex << pc << "\t\t" << std::setw(40) | ||||
|                 << std::setfill(' ') << std::left << instr << s.str(); | ||||
|             s << "[p:" << lvl[this->reg.PRIV] << ";s:0x" << std::hex << std::setfill('0') << std::setw(sizeof(reg_t) * 2) | ||||
|               << (reg_t)this->state.mstatus << std::dec << ";c:" << this->reg.icount + this->cycle_offset << "]"; | ||||
|             SCCDEBUG(owner->hier_name()) << "disass: " | ||||
|                                          << "0x" << std::setw(16) << std::right << std::setfill('0') << std::hex << pc << "\t\t" | ||||
|                                          << std::setw(40) << std::setfill(' ') << std::left << instr << s.str(); | ||||
|         } | ||||
|     }; | ||||
|  | ||||
|     iss::status read_mem(phys_addr_t addr, unsigned length, uint8_t *const data) override { | ||||
|         if (addr.access && iss::access_type::DEBUG) | ||||
|     iss::status read_mem(phys_addr_t addr, unsigned length, uint8_t* const data) override { | ||||
|         if(addr.access && iss::access_type::DEBUG) | ||||
|             return owner->read_mem_dbg(addr.val, length, data) ? iss::Ok : iss::Err; | ||||
|         else { | ||||
|             return owner->read_mem(addr.val, length, data, is_fetch(addr.access)) ? iss::Ok : iss::Err; | ||||
|         } | ||||
|     } | ||||
|  | ||||
|     iss::status write_mem(phys_addr_t addr, unsigned length, const uint8_t *const data) override { | ||||
|         if (addr.access && iss::access_type::DEBUG) | ||||
|     iss::status write_mem(phys_addr_t addr, unsigned length, const uint8_t* const data) override { | ||||
|         if(addr.access && iss::access_type::DEBUG) | ||||
|             return owner->write_mem_dbg(addr.val, length, data) ? iss::Ok : iss::Err; | ||||
|         else { | ||||
|             auto res = owner->write_mem(addr.val, length, data) ? iss::Ok : iss::Err; | ||||
|             // clear MTIP on mtimecmp write | ||||
|             if (addr.val == 0x2004000) { | ||||
|                 reg_t val; | ||||
|                 this->read_csr(iss::arch::mip, val); | ||||
|                 if (val & (1ULL << 7)) this->write_csr(iss::arch::mip, val & ~(1ULL << 7)); | ||||
|             auto tohost_upper = (sizeof(reg_t) == 4 && addr.val == (this->tohost + 4)) || (sizeof(reg_t) == 8 && addr.val == this->tohost); | ||||
|             auto tohost_lower = (sizeof(reg_t) == 4 && addr.val == this->tohost) || (sizeof(reg_t) == 64 && addr.val == this->tohost); | ||||
|             if(tohost_lower || tohost_upper) { | ||||
|                 if(tohost_upper || (tohost_lower && to_host_wr_cnt > 0)) { | ||||
|                     switch(hostvar >> 48) { | ||||
|                     case 0: | ||||
|                         if(hostvar != 0x1) { | ||||
|                             SCCINFO(owner->hier_name()) | ||||
|                                 << "tohost value is 0x" << std::hex << hostvar << std::dec << " (" << hostvar << "), stopping simulation"; | ||||
|                         } else { | ||||
|                             SCCINFO(owner->hier_name()) | ||||
|                                 << "tohost value is 0x" << std::hex << hostvar << std::dec << " (" << hostvar << "), stopping simulation"; | ||||
|                         } | ||||
|                         this->reg.trap_state = std::numeric_limits<uint32_t>::max(); | ||||
|                         this->interrupt_sim = hostvar; | ||||
| #ifndef WITH_TCC | ||||
|                         throw(iss::simulation_stopped(hostvar)); | ||||
| #endif | ||||
|                         break; | ||||
|                     default: | ||||
|                         break; | ||||
|                     } | ||||
|                 } else if(tohost_lower) | ||||
|                     to_host_wr_cnt++; | ||||
|                 return iss::Ok; | ||||
|             } else { | ||||
|                 auto res = owner->write_mem(addr.val, length, data) ? iss::Ok : iss::Err; | ||||
|                 // clear MTIP on mtimecmp write | ||||
|                 if(addr.val == 0x2004000) { | ||||
|                     reg_t val; | ||||
|                     this->read_csr(iss::arch::mip, val); | ||||
|                     if(val & (1ULL << 7)) | ||||
|                         this->write_csr(iss::arch::mip, val & ~(1ULL << 7)); | ||||
|                 } | ||||
|                 return res; | ||||
|             } | ||||
|             return res; | ||||
|         } | ||||
|     } | ||||
|  | ||||
|     iss::status read_csr(unsigned addr, reg_t &val) override { | ||||
| #ifndef CWR_SYSTEMC | ||||
|         if((addr==iss::arch::time || addr==iss::arch::timeh) && owner->mtime_o.get_interface(0)){ | ||||
|             uint64_t time_val; | ||||
|             bool ret = owner->mtime_o->nb_peek(time_val); | ||||
|             if (addr == iss::arch::time) { | ||||
|     iss::status read_csr(unsigned addr, reg_t& val) override { | ||||
|         if((addr == iss::arch::time || addr == iss::arch::timeh)) { | ||||
|             uint64_t time_val = owner->mtime_i.get_interface() ? owner->mtime_i.read() : 0; | ||||
|             if(addr == iss::arch::time) { | ||||
|                 val = static_cast<reg_t>(time_val); | ||||
|             } else if (addr == iss::arch::timeh) { | ||||
|                 if (sizeof(reg_t) != 4) return iss::Err; | ||||
|                 val = static_cast<reg_t>(time_val >> 32); | ||||
|             } | ||||
|             return ret?iss::Ok:iss::Err; | ||||
| #else | ||||
|         if((addr==iss::arch::time || addr==iss::arch::timeh)){ | ||||
|             uint64_t time_val = owner->mtime_i.read(); | ||||
|             if (addr == iss::arch::time) { | ||||
|                 val = static_cast<reg_t>(time_val); | ||||
|             } else if (addr == iss::arch::timeh) { | ||||
|                 if (sizeof(reg_t) != 4) return iss::Err; | ||||
|             } else if(addr == iss::arch::timeh) { | ||||
|                 if(sizeof(reg_t) != 4) | ||||
|                     return iss::Err; | ||||
|                 val = static_cast<reg_t>(time_val >> 32); | ||||
|             } | ||||
|             return iss::Ok; | ||||
| #endif | ||||
|         } else { | ||||
|             return PLAT::read_csr(addr, val); | ||||
|         } | ||||
|     } | ||||
|  | ||||
|     void wait_until(uint64_t flags) override { | ||||
|         SCCDEBUG(owner->name()) << "Sleeping until interrupt"; | ||||
|         SCCDEBUG(owner->hier_name()) << "Sleeping until interrupt"; | ||||
|         while(this->reg.pending_trap == 0 && (this->csr[iss::arch::mip] & this->csr[iss::arch::mie]) == 0) { | ||||
|             sc_core::wait(wfi_evt); | ||||
|         } | ||||
| @@ -119,7 +137,7 @@ public: | ||||
|  | ||||
|     void local_irq(short id, bool value) override { | ||||
|         reg_t mask = 0; | ||||
|         switch (id) { | ||||
|         switch(id) { | ||||
|         case 3: // SW | ||||
|             mask = 1 << 3; | ||||
|             break; | ||||
| @@ -130,22 +148,26 @@ public: | ||||
|             mask = 1 << 11; | ||||
|             break; | ||||
|         default: | ||||
|             if(id>15) mask = 1 << id; | ||||
|             if(id > 15) | ||||
|                 mask = 1 << id; | ||||
|             break; | ||||
|         } | ||||
|         if (value) { | ||||
|         if(value) { | ||||
|             this->csr[iss::arch::mip] |= mask; | ||||
|             wfi_evt.notify(); | ||||
|         } else | ||||
|             this->csr[iss::arch::mip] &= ~mask; | ||||
|         this->check_interrupt(); | ||||
|         if(value) | ||||
|             SCCTRACE(owner->name()) << "Triggering interrupt " << id << " Pending trap: " << this->reg.pending_trap; | ||||
|             SCCTRACE(owner->hier_name()) << "Triggering interrupt " << id << " Pending trap: " << this->reg.pending_trap; | ||||
|     } | ||||
|  | ||||
| private: | ||||
|     sysc::tgfs::core_complex *const owner; | ||||
|     sysc::tgfs::core_complex_if* const owner{nullptr}; | ||||
|     sc_core::sc_event wfi_evt; | ||||
|     uint64_t hostvar{std::numeric_limits<uint64_t>::max()}; | ||||
|     unsigned to_host_wr_cnt = 0; | ||||
|     bool first{true}; | ||||
| }; | ||||
| } | ||||
| } // namespace sysc | ||||
| #endif /* _SYSC_SC_CORE_ADAPTER_H_ */ | ||||
|   | ||||
| @@ -8,13 +8,12 @@ | ||||
| #ifndef _SYSC_SC_CORE_ADAPTER_IF_H_ | ||||
| #define _SYSC_SC_CORE_ADAPTER_IF_H_ | ||||
|  | ||||
|  | ||||
| #include <scc/report.h> | ||||
| #include <util/ities.h> | ||||
| #include "core_complex.h" | ||||
| #include <iostream> | ||||
| #include <iss/iss.h> | ||||
| #include <iss/vm_types.h> | ||||
| #include <iostream> | ||||
| #include <scc/report.h> | ||||
| #include <util/ities.h> | ||||
|  | ||||
| namespace sysc { | ||||
| struct sc_core_adapter_if { | ||||
| @@ -27,5 +26,5 @@ struct sc_core_adapter_if { | ||||
|     virtual void local_irq(short id, bool value) = 0; | ||||
|     virtual ~sc_core_adapter_if() = default; | ||||
| }; | ||||
| } | ||||
| } // namespace sysc | ||||
| #endif /* _SYSC_SC_CORE_ADAPTER_IF_H_ */ | ||||
|   | ||||
							
								
								
									
										4929
									
								
								src/vm/asmjit/vm_tgc5c.cpp
									
									
									
									
									
										Normal file
									
								
							
							
						
						
									
										4929
									
								
								src/vm/asmjit/vm_tgc5c.cpp
									
									
									
									
									
										Normal file
									
								
							
										
											
												File diff suppressed because it is too large
												Load Diff
											
										
									
								
							| @@ -33,99 +33,94 @@ | ||||
| //////////////////////////////////////////////////////////////////////////////// | ||||
|  | ||||
| #include "fp_functions.h" | ||||
| #include <array> | ||||
|  | ||||
| extern "C" { | ||||
| #include <softfloat.h> | ||||
| #include "internals.h" | ||||
| #include "specialize.h" | ||||
| #include <softfloat.h> | ||||
| } | ||||
|  | ||||
| #include <limits> | ||||
|  | ||||
| using this_t = uint8_t *; | ||||
| const uint8_t rmm_map[] = { | ||||
|         softfloat_round_near_even /*RNE*/, | ||||
|         softfloat_round_minMag/*RTZ*/, | ||||
|         softfloat_round_min/*RDN*/, | ||||
|         softfloat_round_max/*RUP?*/, | ||||
|         softfloat_round_near_maxMag /*RMM*/, | ||||
|         softfloat_round_max/*RTZ*/, | ||||
|         softfloat_round_max/*RTZ*/, | ||||
|         softfloat_round_max/*RTZ*/, | ||||
| using this_t = uint8_t*; | ||||
| // this does not inlcude any reserved rm or the DYN rm, as DYN rm should be taken care of in the vm_impl | ||||
| const std::array<uint8_t, 5> rmm_map = { | ||||
|     softfloat_round_near_even /*RNE*/, softfloat_round_minMag /*RTZ*/, softfloat_round_min /*RDN*/, softfloat_round_max /*RUP?*/, | ||||
|     softfloat_round_near_maxMag /*RMM*/ | ||||
| }; | ||||
|  | ||||
| const uint32_t quiet_nan32=0x7fC00000; | ||||
| const uint32_t quiet_nan32 = 0x7fC00000; | ||||
|  | ||||
| extern "C" { | ||||
|  | ||||
| uint32_t fget_flags(){ | ||||
|     return softfloat_exceptionFlags&0x1f; | ||||
| } | ||||
| uint32_t fget_flags() { return softfloat_exceptionFlags & 0x1f; } | ||||
|  | ||||
| uint32_t fadd_s(uint32_t v1, uint32_t v2, uint8_t mode) { | ||||
|     float32_t v1f{v1},v2f{v2}; | ||||
|     softfloat_roundingMode=rmm_map[mode&0x7]; | ||||
|     softfloat_exceptionFlags=0; | ||||
|     float32_t r =f32_add(v1f, v2f); | ||||
|     float32_t v1f{v1}, v2f{v2}; | ||||
|     softfloat_roundingMode = rmm_map.at(mode); | ||||
|     softfloat_exceptionFlags = 0; | ||||
|     float32_t r = f32_add(v1f, v2f); | ||||
|     return r.v; | ||||
| } | ||||
|  | ||||
| uint32_t fsub_s(uint32_t v1, uint32_t v2, uint8_t mode) { | ||||
|     float32_t v1f{v1},v2f{v2}; | ||||
|     softfloat_roundingMode=rmm_map[mode&0x7]; | ||||
|     softfloat_exceptionFlags=0; | ||||
|     float32_t r=f32_sub(v1f, v2f); | ||||
|     float32_t v1f{v1}, v2f{v2}; | ||||
|     softfloat_roundingMode = rmm_map.at(mode); | ||||
|     softfloat_exceptionFlags = 0; | ||||
|     float32_t r = f32_sub(v1f, v2f); | ||||
|     return r.v; | ||||
| } | ||||
|  | ||||
| uint32_t fmul_s(uint32_t v1, uint32_t v2, uint8_t mode) { | ||||
|     float32_t v1f{v1},v2f{v2}; | ||||
|     softfloat_roundingMode=rmm_map[mode&0x7]; | ||||
|     softfloat_exceptionFlags=0; | ||||
|     float32_t r=f32_mul(v1f, v2f); | ||||
|     float32_t v1f{v1}, v2f{v2}; | ||||
|     softfloat_roundingMode = rmm_map.at(mode); | ||||
|     softfloat_exceptionFlags = 0; | ||||
|     float32_t r = f32_mul(v1f, v2f); | ||||
|     return r.v; | ||||
| } | ||||
|  | ||||
| uint32_t fdiv_s(uint32_t v1, uint32_t v2, uint8_t mode) { | ||||
|     float32_t v1f{v1},v2f{v2}; | ||||
|     softfloat_roundingMode=rmm_map[mode&0x7]; | ||||
|     softfloat_exceptionFlags=0; | ||||
|     float32_t r=f32_div(v1f, v2f); | ||||
|     float32_t v1f{v1}, v2f{v2}; | ||||
|     softfloat_roundingMode = rmm_map.at(mode); | ||||
|     softfloat_exceptionFlags = 0; | ||||
|     float32_t r = f32_div(v1f, v2f); | ||||
|     return r.v; | ||||
| } | ||||
|  | ||||
| uint32_t fsqrt_s(uint32_t v1, uint8_t mode) { | ||||
|     float32_t v1f{v1}; | ||||
|     softfloat_roundingMode=rmm_map[mode&0x7]; | ||||
|     softfloat_exceptionFlags=0; | ||||
|     float32_t r=f32_sqrt(v1f); | ||||
|     softfloat_roundingMode = rmm_map.at(mode); | ||||
|     softfloat_exceptionFlags = 0; | ||||
|     float32_t r = f32_sqrt(v1f); | ||||
|     return r.v; | ||||
| } | ||||
|  | ||||
| uint32_t fcmp_s(uint32_t v1, uint32_t v2, uint32_t op) { | ||||
|     float32_t v1f{v1},v2f{v2}; | ||||
|     softfloat_exceptionFlags=0; | ||||
|     bool nan = (v1&defaultNaNF32UI)==quiet_nan32 || (v2&defaultNaNF32UI)==quiet_nan32; | ||||
|     float32_t v1f{v1}, v2f{v2}; | ||||
|     softfloat_exceptionFlags = 0; | ||||
|     bool nan = (v1 & defaultNaNF32UI) == quiet_nan32 || (v2 & defaultNaNF32UI) == quiet_nan32; | ||||
|     bool snan = softfloat_isSigNaNF32UI(v1) || softfloat_isSigNaNF32UI(v2); | ||||
|     switch(op){ | ||||
|     switch(op) { | ||||
|     case 0: | ||||
|         if(nan | snan){ | ||||
|             if(snan) softfloat_raiseFlags(softfloat_flag_invalid); | ||||
|         if(nan | snan) { | ||||
|             if(snan) | ||||
|                 softfloat_raiseFlags(softfloat_flag_invalid); | ||||
|             return 0; | ||||
|         } else | ||||
|             return f32_eq(v1f,v2f )?1:0; | ||||
|             return f32_eq(v1f, v2f) ? 1 : 0; | ||||
|     case 1: | ||||
|         if(nan | snan){ | ||||
|         if(nan | snan) { | ||||
|             softfloat_raiseFlags(softfloat_flag_invalid); | ||||
|             return 0; | ||||
|         } else | ||||
|             return f32_le(v1f,v2f )?1:0; | ||||
|             return f32_le(v1f, v2f) ? 1 : 0; | ||||
|     case 2: | ||||
|         if(nan | snan){ | ||||
|         if(nan | snan) { | ||||
|             softfloat_raiseFlags(softfloat_flag_invalid); | ||||
|             return 0; | ||||
|         } else | ||||
|             return f32_lt(v1f,v2f )?1:0; | ||||
|             return f32_lt(v1f, v2f) ? 1 : 0; | ||||
|     default: | ||||
|         break; | ||||
|     } | ||||
| @@ -134,33 +129,46 @@ uint32_t fcmp_s(uint32_t v1, uint32_t v2, uint32_t op) { | ||||
|  | ||||
| uint32_t fcvt_s(uint32_t v1, uint32_t op, uint8_t mode) { | ||||
|     float32_t v1f{v1}; | ||||
|     softfloat_exceptionFlags=0; | ||||
|     softfloat_exceptionFlags = 0; | ||||
|     float32_t r; | ||||
|     switch(op){ | ||||
|     case 0:{ //w->s, fp to int32 | ||||
|         uint_fast32_t res = f32_to_i32(v1f,rmm_map[mode&0x7],true); | ||||
|     switch(op) { | ||||
|     case 0: { // FCVT__W__S | ||||
|         uint_fast32_t res = f32_to_i32(v1f, rmm_map.at(mode), true); | ||||
|         return (uint32_t)res; | ||||
|     } | ||||
|     case 1:{ //wu->s | ||||
|         uint_fast32_t res = f32_to_ui32(v1f,rmm_map[mode&0x7],true); | ||||
|     case 1: { // FCVT__WU__S | ||||
|         uint_fast32_t res = f32_to_ui32(v1f, rmm_map.at(mode), true); | ||||
|         return (uint32_t)res; | ||||
|     } | ||||
|     case 2: //s->w | ||||
|         r=i32_to_f32(v1); | ||||
|     case 2: // FCVT__S__W | ||||
|         r = i32_to_f32((int32_t)v1); | ||||
|         return r.v; | ||||
|     case 3: //s->wu | ||||
|         r=ui32_to_f32(v1); | ||||
|     case 3: // FCVT__S__WU | ||||
|         r = ui32_to_f32(v1); | ||||
|         return r.v; | ||||
|     } | ||||
|     return 0; | ||||
| } | ||||
|  | ||||
| uint32_t fmadd_s(uint32_t v1, uint32_t v2, uint32_t v3, uint32_t op, uint8_t mode) { | ||||
|     // op should be {softfloat_mulAdd_subProd(2), softfloat_mulAdd_subC(1)} | ||||
|     softfloat_roundingMode=rmm_map[mode&0x7]; | ||||
|     softfloat_exceptionFlags=0; | ||||
|     float32_t res = softfloat_mulAddF32(v1, v2, v3, op&0x1); | ||||
|     if(op>1) res.v ^= 1ULL<<31; | ||||
|     uint32_t F32_SIGN = 1UL << 31; | ||||
|     switch(op) { | ||||
|     case 0: // FMADD_S | ||||
|         break; | ||||
|     case 1: // FMSUB_S | ||||
|         v3 ^= F32_SIGN; | ||||
|         break; | ||||
|     case 2: // FNMADD_S | ||||
|         v1 ^= F32_SIGN; | ||||
|         v3 ^= F32_SIGN; | ||||
|         break; | ||||
|     case 3: // FNMSUB_S | ||||
|         v1 ^= F32_SIGN; | ||||
|         break; | ||||
|     } | ||||
|     softfloat_roundingMode = rmm_map.at(mode); | ||||
|     softfloat_exceptionFlags = 0; | ||||
|     float32_t res = softfloat_mulAddF32(v1, v2, v3, 0); | ||||
|     return res.v; | ||||
| } | ||||
|  | ||||
| @@ -170,23 +178,23 @@ uint32_t fsel_s(uint32_t v1, uint32_t v2, uint32_t op) { | ||||
|     bool v2_nan = (v2 & defaultNaNF32UI) == defaultNaNF32UI; | ||||
|     bool v1_snan = softfloat_isSigNaNF32UI(v1); | ||||
|     bool v2_snan = softfloat_isSigNaNF32UI(v2); | ||||
|     if (v1_snan || v2_snan) softfloat_raiseFlags(softfloat_flag_invalid); | ||||
|     if (v1_nan || v1_snan) | ||||
|     if(v1_snan || v2_snan) | ||||
|         softfloat_raiseFlags(softfloat_flag_invalid); | ||||
|     if(v1_nan || v1_snan) | ||||
|         return (v2_nan || v2_snan) ? defaultNaNF32UI : v2; | ||||
|     else | ||||
|         if (v2_nan || v2_snan) | ||||
|             return v1; | ||||
|         else { | ||||
|             if ((v1 & 0x7fffffff) == 0 && (v2 & 0x7fffffff) == 0) { | ||||
|                 return op == 0 ? ((v1 & 0x80000000) ? v1 : v2) : ((v1 & 0x80000000) ? v2 : v1); | ||||
|             } else { | ||||
|                 float32_t v1f{ v1 }, v2f{ v2 }; | ||||
|                 return op == 0 ? (f32_lt(v1f, v2f) ? v1 : v2) : (f32_lt(v1f, v2f) ? v2 : v1); | ||||
|             } | ||||
|     else if(v2_nan || v2_snan) | ||||
|         return v1; | ||||
|     else { | ||||
|         if((v1 & 0x7fffffff) == 0 && (v2 & 0x7fffffff) == 0) { | ||||
|             return op == 0 ? ((v1 & 0x80000000) ? v1 : v2) : ((v1 & 0x80000000) ? v2 : v1); | ||||
|         } else { | ||||
|             float32_t v1f{v1}, v2f{v2}; | ||||
|             return op == 0 ? (f32_lt(v1f, v2f) ? v1 : v2) : (f32_lt(v1f, v2f) ? v2 : v1); | ||||
|         } | ||||
|     } | ||||
| } | ||||
|  | ||||
| uint32_t fclass_s( uint32_t v1 ){ | ||||
| uint32_t fclass_s(uint32_t v1) { | ||||
|  | ||||
|     float32_t a{v1}; | ||||
|     union ui32_f32 uA; | ||||
| @@ -195,30 +203,27 @@ uint32_t fclass_s( uint32_t v1 ){ | ||||
|     uA.f = a; | ||||
|     uiA = uA.ui; | ||||
|  | ||||
|     uint_fast16_t infOrNaN = expF32UI( uiA ) == 0xFF; | ||||
|     uint_fast16_t subnormalOrZero = expF32UI( uiA ) == 0; | ||||
|     bool sign = signF32UI( uiA ); | ||||
|     bool fracZero = fracF32UI( uiA ) == 0; | ||||
|     bool isNaN = isNaNF32UI( uiA ); | ||||
|     bool isSNaN = softfloat_isSigNaNF32UI( uiA ); | ||||
|     bool infOrNaN = expF32UI(uiA) == 0xFF; | ||||
|     bool subnormalOrZero = expF32UI(uiA) == 0; | ||||
|     bool sign = signF32UI(uiA); | ||||
|     bool fracZero = fracF32UI(uiA) == 0; | ||||
|     bool isNaN = isNaNF32UI(uiA); | ||||
|     bool isSNaN = softfloat_isSigNaNF32UI(uiA); | ||||
|  | ||||
|     return | ||||
|         (  sign && infOrNaN && fracZero )          << 0 | | ||||
|         (  sign && !infOrNaN && !subnormalOrZero ) << 1 | | ||||
|         (  sign && subnormalOrZero && !fracZero )  << 2 | | ||||
|         (  sign && subnormalOrZero && fracZero )   << 3 | | ||||
|         ( !sign && infOrNaN && fracZero )          << 7 | | ||||
|         ( !sign && !infOrNaN && !subnormalOrZero ) << 6 | | ||||
|         ( !sign && subnormalOrZero && !fracZero )  << 5 | | ||||
|         ( !sign && subnormalOrZero && fracZero )   << 4 | | ||||
|         ( isNaN &&  isSNaN )                       << 8 | | ||||
|         ( isNaN && !isSNaN )                       << 9; | ||||
|     return (sign && infOrNaN && fracZero) << 0 | (sign && !infOrNaN && !subnormalOrZero) << 1 | | ||||
|            (sign && subnormalOrZero && !fracZero) << 2 | (sign && subnormalOrZero && fracZero) << 3 | (!sign && infOrNaN && fracZero) << 7 | | ||||
|            (!sign && !infOrNaN && !subnormalOrZero) << 6 | (!sign && subnormalOrZero && !fracZero) << 5 | | ||||
|            (!sign && subnormalOrZero && fracZero) << 4 | (isNaN && isSNaN) << 8 | (isNaN && !isSNaN) << 9; | ||||
| } | ||||
|  | ||||
| uint32_t fconv_d2f(uint64_t v1, uint8_t mode){ | ||||
|     softfloat_roundingMode=rmm_map[mode&0x7]; | ||||
|     bool nan = (v1 & defaultNaNF64UI)==defaultNaNF64UI; | ||||
|     if(nan){ | ||||
| uint32_t fconv_d2f(uint64_t v1, uint8_t mode) { | ||||
|     bool isNan = isNaNF64UI(v1); | ||||
|     bool isSNaN = softfloat_isSigNaNF64UI(v1); | ||||
|     softfloat_roundingMode = rmm_map.at(mode); | ||||
|     softfloat_exceptionFlags = 0; | ||||
|     if(isNan) { | ||||
|         if(isSNaN) | ||||
|             softfloat_raiseFlags(softfloat_flag_invalid); | ||||
|         return defaultNaNF32UI; | ||||
|     } else { | ||||
|         float32_t res = f64_to_f32(float64_t{v1}); | ||||
| @@ -226,83 +231,84 @@ uint32_t fconv_d2f(uint64_t v1, uint8_t mode){ | ||||
|     } | ||||
| } | ||||
|  | ||||
| uint64_t fconv_f2d(uint32_t v1, uint8_t mode){ | ||||
|     bool nan = (v1 & defaultNaNF32UI)==defaultNaNF32UI; | ||||
|     if(nan){ | ||||
| uint64_t fconv_f2d(uint32_t v1, uint8_t mode) { | ||||
|     bool infOrNaN = expF32UI(v1) == 0xFF; | ||||
|     bool subnormalOrZero = expF32UI(v1) == 0; | ||||
|     if(infOrNaN || subnormalOrZero) { | ||||
|         return defaultNaNF64UI; | ||||
|     } else { | ||||
|         softfloat_roundingMode=rmm_map[mode&0x7]; | ||||
|         float64_t res = f32_to_f64(float32_t{v1}); | ||||
|         return res.v; | ||||
|     } | ||||
| } | ||||
|  | ||||
| uint64_t fadd_d(uint64_t v1, uint64_t v2, uint8_t mode) { | ||||
|     bool nan = (v1&defaultNaNF32UI)==quiet_nan32; | ||||
|     bool nan = (v1 & defaultNaNF32UI) == quiet_nan32; | ||||
|     bool snan = softfloat_isSigNaNF32UI(v1); | ||||
|    float64_t v1f{v1},v2f{v2}; | ||||
|     softfloat_roundingMode=rmm_map[mode&0x7]; | ||||
|     softfloat_exceptionFlags=0; | ||||
|     float64_t r =f64_add(v1f, v2f); | ||||
|     float64_t v1f{v1}, v2f{v2}; | ||||
|     softfloat_roundingMode = rmm_map.at(mode); | ||||
|     softfloat_exceptionFlags = 0; | ||||
|     float64_t r = f64_add(v1f, v2f); | ||||
|     return r.v; | ||||
| } | ||||
|  | ||||
| uint64_t fsub_d(uint64_t v1, uint64_t v2, uint8_t mode) { | ||||
|     float64_t v1f{v1},v2f{v2}; | ||||
|     softfloat_roundingMode=rmm_map[mode&0x7]; | ||||
|     softfloat_exceptionFlags=0; | ||||
|     float64_t r=f64_sub(v1f, v2f); | ||||
|     float64_t v1f{v1}, v2f{v2}; | ||||
|     softfloat_roundingMode = rmm_map.at(mode); | ||||
|     softfloat_exceptionFlags = 0; | ||||
|     float64_t r = f64_sub(v1f, v2f); | ||||
|     return r.v; | ||||
| } | ||||
|  | ||||
| uint64_t fmul_d(uint64_t v1, uint64_t v2, uint8_t mode) { | ||||
|     float64_t v1f{v1},v2f{v2}; | ||||
|     softfloat_roundingMode=rmm_map[mode&0x7]; | ||||
|     softfloat_exceptionFlags=0; | ||||
|     float64_t r=f64_mul(v1f, v2f); | ||||
|     float64_t v1f{v1}, v2f{v2}; | ||||
|     softfloat_roundingMode = rmm_map.at(mode); | ||||
|     softfloat_exceptionFlags = 0; | ||||
|     float64_t r = f64_mul(v1f, v2f); | ||||
|     return r.v; | ||||
| } | ||||
|  | ||||
| uint64_t fdiv_d(uint64_t v1, uint64_t v2, uint8_t mode) { | ||||
|     float64_t v1f{v1},v2f{v2}; | ||||
|     softfloat_roundingMode=rmm_map[mode&0x7]; | ||||
|     softfloat_exceptionFlags=0; | ||||
|     float64_t r=f64_div(v1f, v2f); | ||||
|     float64_t v1f{v1}, v2f{v2}; | ||||
|     softfloat_roundingMode = rmm_map.at(mode); | ||||
|     softfloat_exceptionFlags = 0; | ||||
|     float64_t r = f64_div(v1f, v2f); | ||||
|     return r.v; | ||||
| } | ||||
|  | ||||
| uint64_t fsqrt_d(uint64_t v1, uint8_t mode) { | ||||
|     float64_t v1f{v1}; | ||||
|     softfloat_roundingMode=rmm_map[mode&0x7]; | ||||
|     softfloat_exceptionFlags=0; | ||||
|     float64_t r=f64_sqrt(v1f); | ||||
|     softfloat_roundingMode = rmm_map.at(mode); | ||||
|     softfloat_exceptionFlags = 0; | ||||
|     float64_t r = f64_sqrt(v1f); | ||||
|     return r.v; | ||||
| } | ||||
|  | ||||
| uint64_t fcmp_d(uint64_t v1, uint64_t v2, uint32_t op) { | ||||
|     float64_t v1f{v1},v2f{v2}; | ||||
|     softfloat_exceptionFlags=0; | ||||
|     bool nan = (v1&defaultNaNF64UI)==quiet_nan32 || (v2&defaultNaNF64UI)==quiet_nan32; | ||||
|     float64_t v1f{v1}, v2f{v2}; | ||||
|     softfloat_exceptionFlags = 0; | ||||
|     bool nan = (v1 & defaultNaNF64UI) == quiet_nan32 || (v2 & defaultNaNF64UI) == quiet_nan32; | ||||
|     bool snan = softfloat_isSigNaNF64UI(v1) || softfloat_isSigNaNF64UI(v2); | ||||
|     switch(op){ | ||||
|     switch(op) { | ||||
|     case 0: | ||||
|         if(nan | snan){ | ||||
|             if(snan) softfloat_raiseFlags(softfloat_flag_invalid); | ||||
|         if(nan | snan) { | ||||
|             if(snan) | ||||
|                 softfloat_raiseFlags(softfloat_flag_invalid); | ||||
|             return 0; | ||||
|         } else | ||||
|             return f64_eq(v1f,v2f )?1:0; | ||||
|             return f64_eq(v1f, v2f) ? 1 : 0; | ||||
|     case 1: | ||||
|         if(nan | snan){ | ||||
|         if(nan | snan) { | ||||
|             softfloat_raiseFlags(softfloat_flag_invalid); | ||||
|             return 0; | ||||
|         } else | ||||
|             return f64_le(v1f,v2f )?1:0; | ||||
|             return f64_le(v1f, v2f) ? 1 : 0; | ||||
|     case 2: | ||||
|         if(nan | snan){ | ||||
|         if(nan | snan) { | ||||
|             softfloat_raiseFlags(softfloat_flag_invalid); | ||||
|             return 0; | ||||
|         } else | ||||
|             return f64_lt(v1f,v2f )?1:0; | ||||
|             return f64_lt(v1f, v2f) ? 1 : 0; | ||||
|     default: | ||||
|         break; | ||||
|     } | ||||
| @@ -310,34 +316,48 @@ uint64_t fcmp_d(uint64_t v1, uint64_t v2, uint32_t op) { | ||||
| } | ||||
|  | ||||
| uint64_t fcvt_d(uint64_t v1, uint32_t op, uint8_t mode) { | ||||
|  | ||||
|     float64_t v1f{v1}; | ||||
|     softfloat_exceptionFlags=0; | ||||
|     softfloat_exceptionFlags = 0; | ||||
|     float64_t r; | ||||
|     switch(op){ | ||||
|     case 0:{ //l->d, fp to int32 | ||||
|         int64_t res = f64_to_i64(v1f,rmm_map[mode&0x7],true); | ||||
|     switch(op) { | ||||
|     case 0: { // l from d | ||||
|         int64_t res = f64_to_i64(v1f, rmm_map.at(mode), true); | ||||
|         return (uint64_t)res; | ||||
|     } | ||||
|     case 1:{ //lu->s | ||||
|         uint64_t res = f64_to_ui64(v1f,rmm_map[mode&0x7],true); | ||||
|     case 1: { // lu from d | ||||
|         uint64_t res = f64_to_ui64(v1f, rmm_map.at(mode), true); | ||||
|         return res; | ||||
|     } | ||||
|     case 2: //s->l | ||||
|         r=i64_to_f64(v1); | ||||
|     case 2: // d from l | ||||
|         r = i64_to_f64(v1); | ||||
|         return r.v; | ||||
|     case 3: //s->lu | ||||
|         r=ui64_to_f64(v1); | ||||
|     case 3: // d from lu | ||||
|         r = ui64_to_f64(v1); | ||||
|         return r.v; | ||||
|     } | ||||
|     return 0; | ||||
| } | ||||
|  | ||||
| uint64_t fmadd_d(uint64_t v1, uint64_t v2, uint64_t v3, uint32_t op, uint8_t mode) { | ||||
|     // op should be {softfloat_mulAdd_subProd(2), softfloat_mulAdd_subC(1)} | ||||
|     softfloat_roundingMode=rmm_map[mode&0x7]; | ||||
|     softfloat_exceptionFlags=0; | ||||
|     float64_t res = softfloat_mulAddF64(v1, v2, v3, op&0x1); | ||||
|     if(op>1) res.v ^= 1ULL<<63; | ||||
|     uint64_t F64_SIGN = 1ULL << 63; | ||||
|     switch(op) { | ||||
|     case 0: // FMADD_D | ||||
|         break; | ||||
|     case 1: // FMSUB_D | ||||
|         v3 ^= F64_SIGN; | ||||
|         break; | ||||
|     case 2: // FNMADD_D | ||||
|         v1 ^= F64_SIGN; | ||||
|         v3 ^= F64_SIGN; | ||||
|         break; | ||||
|     case 3: // FNMSUB_D | ||||
|         v1 ^= F64_SIGN; | ||||
|         break; | ||||
|     } | ||||
|     softfloat_roundingMode = rmm_map.at(mode); | ||||
|     softfloat_exceptionFlags = 0; | ||||
|     float64_t res = softfloat_mulAddF64(v1, v2, v3, 0); | ||||
|     return res.v; | ||||
| } | ||||
|  | ||||
| @@ -347,27 +367,24 @@ uint64_t fsel_d(uint64_t v1, uint64_t v2, uint32_t op) { | ||||
|     bool v2_nan = (v2 & defaultNaNF64UI) == defaultNaNF64UI; | ||||
|     bool v1_snan = softfloat_isSigNaNF64UI(v1); | ||||
|     bool v2_snan = softfloat_isSigNaNF64UI(v2); | ||||
|     if (v1_snan || v2_snan) softfloat_raiseFlags(softfloat_flag_invalid); | ||||
|     if (v1_nan || v1_snan) | ||||
|     if(v1_snan || v2_snan) | ||||
|         softfloat_raiseFlags(softfloat_flag_invalid); | ||||
|     if(v1_nan || v1_snan) | ||||
|         return (v2_nan || v2_snan) ? defaultNaNF64UI : v2; | ||||
|     else | ||||
|         if (v2_nan || v2_snan) | ||||
|             return v1; | ||||
|         else { | ||||
|             if ((v1 & std::numeric_limits<int64_t>::max()) == 0 && (v2 & std::numeric_limits<int64_t>::max()) == 0) { | ||||
|                 return op == 0 ? | ||||
|                         ((v1 & std::numeric_limits<int64_t>::min()) ? v1 : v2) : | ||||
|                         ((v1 & std::numeric_limits<int64_t>::min()) ? v2 : v1); | ||||
|             } else { | ||||
|                 float64_t v1f{ v1 }, v2f{ v2 }; | ||||
|                 return op == 0 ? | ||||
|                         (f64_lt(v1f, v2f) ? v1 : v2) : | ||||
|                         (f64_lt(v1f, v2f) ? v2 : v1); | ||||
|             } | ||||
|     else if(v2_nan || v2_snan) | ||||
|         return v1; | ||||
|     else { | ||||
|         if((v1 & std::numeric_limits<int64_t>::max()) == 0 && (v2 & std::numeric_limits<int64_t>::max()) == 0) { | ||||
|             return op == 0 ? ((v1 & std::numeric_limits<int64_t>::min()) ? v1 : v2) | ||||
|                            : ((v1 & std::numeric_limits<int64_t>::min()) ? v2 : v1); | ||||
|         } else { | ||||
|             float64_t v1f{v1}, v2f{v2}; | ||||
|             return op == 0 ? (f64_lt(v1f, v2f) ? v1 : v2) : (f64_lt(v1f, v2f) ? v2 : v1); | ||||
|         } | ||||
|     } | ||||
| } | ||||
|  | ||||
| uint64_t fclass_d(uint64_t v1  ){ | ||||
| uint64_t fclass_d(uint64_t v1) { | ||||
|  | ||||
|     float64_t a{v1}; | ||||
|     union ui64_f64 uA; | ||||
| @@ -376,68 +393,61 @@ uint64_t fclass_d(uint64_t v1  ){ | ||||
|     uA.f = a; | ||||
|     uiA = uA.ui; | ||||
|  | ||||
|     uint_fast16_t infOrNaN = expF64UI( uiA ) == 0x7FF; | ||||
|     uint_fast16_t subnormalOrZero = expF64UI( uiA ) == 0; | ||||
|     bool sign = signF64UI( uiA ); | ||||
|     bool fracZero = fracF64UI( uiA ) == 0; | ||||
|     bool isNaN = isNaNF64UI( uiA ); | ||||
|     bool isSNaN = softfloat_isSigNaNF64UI( uiA ); | ||||
|     bool infOrNaN = expF64UI(uiA) == 0x7FF; | ||||
|     bool subnormalOrZero = expF64UI(uiA) == 0; | ||||
|     bool sign = signF64UI(uiA); | ||||
|     bool fracZero = fracF64UI(uiA) == 0; | ||||
|     bool isNaN = isNaNF64UI(uiA); | ||||
|     bool isSNaN = softfloat_isSigNaNF64UI(uiA); | ||||
|  | ||||
|     return | ||||
|         (  sign && infOrNaN && fracZero )          << 0 | | ||||
|         (  sign && !infOrNaN && !subnormalOrZero ) << 1 | | ||||
|         (  sign && subnormalOrZero && !fracZero )  << 2 | | ||||
|         (  sign && subnormalOrZero && fracZero )   << 3 | | ||||
|         ( !sign && infOrNaN && fracZero )          << 7 | | ||||
|         ( !sign && !infOrNaN && !subnormalOrZero ) << 6 | | ||||
|         ( !sign && subnormalOrZero && !fracZero )  << 5 | | ||||
|         ( !sign && subnormalOrZero && fracZero )   << 4 | | ||||
|         ( isNaN &&  isSNaN )                       << 8 | | ||||
|         ( isNaN && !isSNaN )                       << 9; | ||||
|     return (sign && infOrNaN && fracZero) << 0 | (sign && !infOrNaN && !subnormalOrZero) << 1 | | ||||
|            (sign && subnormalOrZero && !fracZero) << 2 | (sign && subnormalOrZero && fracZero) << 3 | (!sign && infOrNaN && fracZero) << 7 | | ||||
|            (!sign && !infOrNaN && !subnormalOrZero) << 6 | (!sign && subnormalOrZero && !fracZero) << 5 | | ||||
|            (!sign && subnormalOrZero && fracZero) << 4 | (isNaN && isSNaN) << 8 | (isNaN && !isSNaN) << 9; | ||||
| } | ||||
|  | ||||
| uint64_t fcvt_32_64(uint32_t v1, uint32_t op, uint8_t mode) { | ||||
|     float32_t v1f{v1}; | ||||
|     softfloat_exceptionFlags=0; | ||||
|     softfloat_exceptionFlags = 0; | ||||
|     float64_t r; | ||||
|     switch(op){ | ||||
|     case 0: //l->s, fp to int32 | ||||
|         return f32_to_i64(v1f,rmm_map[mode&0x7],true); | ||||
|     case 1: //wu->s | ||||
|         return f32_to_ui64(v1f,rmm_map[mode&0x7],true); | ||||
|     case 2: //s->w | ||||
|         r=i32_to_f64(v1); | ||||
|     switch(op) { | ||||
|     case 0: // l->s, fp to int32 | ||||
|         return f32_to_i64(v1f, rmm_map.at(mode), true); | ||||
|     case 1: // wu->s | ||||
|         return f32_to_ui64(v1f, rmm_map.at(mode), true); | ||||
|     case 2: // s->w | ||||
|         r = i32_to_f64(v1); | ||||
|         return r.v; | ||||
|     case 3: //s->wu | ||||
|         r=ui32_to_f64(v1); | ||||
|     case 3: // s->wu | ||||
|         r = ui32_to_f64(v1); | ||||
|         return r.v; | ||||
|     } | ||||
|     return 0; | ||||
| } | ||||
|  | ||||
| uint32_t fcvt_64_32(uint64_t v1, uint32_t op, uint8_t mode) { | ||||
|     softfloat_exceptionFlags=0; | ||||
|     softfloat_exceptionFlags = 0; | ||||
|     float32_t r; | ||||
|     switch(op){ | ||||
|     case 0:{ //wu->s | ||||
|         int32_t r=f64_to_i32(float64_t{v1}, rmm_map[mode&0x7],true); | ||||
|     switch(op) { | ||||
|     case 0: { // wu->s | ||||
|         int32_t r = f64_to_i32(float64_t{v1}, rmm_map.at(mode), true); | ||||
|         return r; | ||||
|     } | ||||
|     case 1:{ //wu->s | ||||
|         uint32_t r=f64_to_ui32(float64_t{v1}, rmm_map[mode&0x7],true); | ||||
|     case 1: { // wu->s | ||||
|         uint32_t r = f64_to_ui32(float64_t{v1}, rmm_map.at(mode), true); | ||||
|         return r; | ||||
|     } | ||||
|     case 2: //l->s, fp to int32 | ||||
|         r=i64_to_f32(v1); | ||||
|     case 2: // l->s, fp to int32 | ||||
|         r = i64_to_f32(v1); | ||||
|         return r.v; | ||||
|     case 3: //wu->s | ||||
|         r=ui64_to_f32(v1); | ||||
|     case 3: // wu->s | ||||
|         r = ui64_to_f32(v1); | ||||
|         return r.v; | ||||
|     } | ||||
|     return 0; | ||||
| } | ||||
|  | ||||
| uint32_t unbox_s(uint64_t v){ | ||||
| uint32_t unbox_s(uint64_t v) { | ||||
|     constexpr uint64_t mask = std::numeric_limits<uint64_t>::max() & ~((uint64_t)std::numeric_limits<uint32_t>::max()); | ||||
|     if((v & mask) != mask) | ||||
|         return 0x7fc00000; | ||||
| @@ -445,4 +455,3 @@ uint32_t unbox_s(uint64_t v){ | ||||
|         return v & std::numeric_limits<uint32_t>::max(); | ||||
| } | ||||
| } | ||||
|  | ||||
|   | ||||
| @@ -44,11 +44,11 @@ uint32_t fsub_s(uint32_t v1, uint32_t v2, uint8_t mode); | ||||
| uint32_t fmul_s(uint32_t v1, uint32_t v2, uint8_t mode); | ||||
| uint32_t fdiv_s(uint32_t v1, uint32_t v2, uint8_t mode); | ||||
| uint32_t fsqrt_s(uint32_t v1, uint8_t mode); | ||||
| uint32_t fcmp_s(uint32_t v1, uint32_t v2, uint32_t op) ; | ||||
| uint32_t fcmp_s(uint32_t v1, uint32_t v2, uint32_t op); | ||||
| uint32_t fcvt_s(uint32_t v1, uint32_t op, uint8_t mode); | ||||
| uint32_t fmadd_s(uint32_t v1, uint32_t v2, uint32_t v3, uint32_t op, uint8_t mode); | ||||
| uint32_t fsel_s(uint32_t v1, uint32_t v2, uint32_t op); | ||||
| uint32_t fclass_s( uint32_t v1 ); | ||||
| uint32_t fclass_s(uint32_t v1); | ||||
| uint32_t fconv_d2f(uint64_t v1, uint8_t mode); | ||||
| uint64_t fconv_f2d(uint32_t v1, uint8_t mode); | ||||
| uint64_t fadd_d(uint64_t v1, uint64_t v2, uint8_t mode); | ||||
| @@ -59,8 +59,8 @@ uint64_t fsqrt_d(uint64_t v1, uint8_t mode); | ||||
| uint64_t fcmp_d(uint64_t v1, uint64_t v2, uint32_t op); | ||||
| uint64_t fcvt_d(uint64_t v1, uint32_t op, uint8_t mode); | ||||
| uint64_t fmadd_d(uint64_t v1, uint64_t v2, uint64_t v3, uint32_t op, uint8_t mode); | ||||
| uint64_t fsel_d(uint64_t v1, uint64_t v2, uint32_t op) ; | ||||
| uint64_t fclass_d(uint64_t v1  ); | ||||
| uint64_t fsel_d(uint64_t v1, uint64_t v2, uint32_t op); | ||||
| uint64_t fclass_d(uint64_t v1); | ||||
| uint64_t fcvt_32_64(uint32_t v1, uint32_t op, uint8_t mode); | ||||
| uint32_t fcvt_64_32(uint64_t v1, uint32_t op, uint8_t mode); | ||||
| uint32_t unbox_s(uint64_t v); | ||||
|   | ||||
										
											
												File diff suppressed because it is too large
												Load Diff
											
										
									
								
							| @@ -36,9 +36,9 @@ | ||||
| #include <iss/llvm/vm_base.h> | ||||
|  | ||||
| extern "C" { | ||||
| #include <softfloat.h> | ||||
| #include "internals.h" | ||||
| #include "specialize.h" | ||||
| #include <softfloat.h> | ||||
| } | ||||
|  | ||||
| #include <limits> | ||||
| @@ -50,60 +50,58 @@ namespace fp_impl { | ||||
| using namespace std; | ||||
| using namespace ::llvm; | ||||
|  | ||||
| #define INT_TYPE(L)   Type::getIntNTy(mod->getContext(), L) | ||||
| #define FLOAT_TYPE    Type::getFloatTy(mod->getContext()) | ||||
| #define DOUBLE_TYPE   Type::getDoubleTy(mod->getContext()) | ||||
| #define VOID_TYPE     Type::getVoidTy(mod->getContext()) | ||||
| #define INT_TYPE(L) Type::getIntNTy(mod->getContext(), L) | ||||
| #define FLOAT_TYPE Type::getFloatTy(mod->getContext()) | ||||
| #define DOUBLE_TYPE Type::getDoubleTy(mod->getContext()) | ||||
| #define VOID_TYPE Type::getVoidTy(mod->getContext()) | ||||
| #define THIS_PTR_TYPE Type::getIntNPtrTy(mod->getContext(), 8) | ||||
| #define FDECLL(NAME, RET, ...)                                                                                         \ | ||||
|     Function *NAME##_func = CurrentModule->getFunction(#NAME);                                                         \ | ||||
|     if (!NAME##_func) {                                                                                                \ | ||||
|         std::vector<Type *> NAME##_args{__VA_ARGS__};                                                                  \ | ||||
|         FunctionType *NAME##_type = FunctionType::get(RET, NAME##_args, false);                                        \ | ||||
|         NAME##_func = Function::Create(NAME##_type, GlobalValue::ExternalLinkage, #NAME, CurrentModule);               \ | ||||
|         NAME##_func->setCallingConv(CallingConv::C);                                                                   \ | ||||
| #define FDECLL(NAME, RET, ...)                                                                                                             \ | ||||
|     Function* NAME##_func = CurrentModule->getFunction(#NAME);                                                                             \ | ||||
|     if(!NAME##_func) {                                                                                                                     \ | ||||
|         std::vector<Type*> NAME##_args{__VA_ARGS__};                                                                                       \ | ||||
|         FunctionType* NAME##_type = FunctionType::get(RET, NAME##_args, false);                                                            \ | ||||
|         NAME##_func = Function::Create(NAME##_type, GlobalValue::ExternalLinkage, #NAME, CurrentModule);                                   \ | ||||
|         NAME##_func->setCallingConv(CallingConv::C);                                                                                       \ | ||||
|     } | ||||
|  | ||||
| #define FDECL(NAME, RET, ...)                                                                                          \ | ||||
|     std::vector<Type *> NAME##_args{__VA_ARGS__};                                                                      \ | ||||
|     FunctionType *NAME##_type = FunctionType::get(RET, NAME##_args, false);                                      \ | ||||
| #define FDECL(NAME, RET, ...)                                                                                                              \ | ||||
|     std::vector<Type*> NAME##_args{__VA_ARGS__};                                                                                           \ | ||||
|     FunctionType* NAME##_type = FunctionType::get(RET, NAME##_args, false);                                                                \ | ||||
|     mod->getOrInsertFunction(#NAME, NAME##_type); | ||||
|  | ||||
|  | ||||
| void add_fp_functions_2_module(Module *mod, uint32_t flen, uint32_t xlen) { | ||||
|     if(flen){ | ||||
| void add_fp_functions_2_module(Module* mod, uint32_t flen, uint32_t xlen) { | ||||
|     if(flen) { | ||||
|         FDECL(fget_flags, INT_TYPE(32)); | ||||
|         FDECL(fadd_s,     INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); | ||||
|         FDECL(fsub_s,     INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); | ||||
|         FDECL(fmul_s,     INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); | ||||
|         FDECL(fdiv_s,     INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); | ||||
|         FDECL(fsqrt_s,    INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); | ||||
|         FDECL(fcmp_s,     INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(32)); | ||||
|         FDECL(fcvt_s,     INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); | ||||
|         FDECL(fmadd_s,    INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); | ||||
|         FDECL(fsel_s,     INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(32)); | ||||
|         FDECL(fclass_s,   INT_TYPE(32), INT_TYPE(32)); | ||||
|         FDECL(fcvt_32_64,     INT_TYPE(64), INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); | ||||
|         FDECL(fcvt_64_32,     INT_TYPE(32), INT_TYPE(64), INT_TYPE(32), INT_TYPE(8)); | ||||
|         if(flen>32){ | ||||
|             FDECL(fconv_d2f,  INT_TYPE(32), INT_TYPE(64), INT_TYPE(8)); | ||||
|             FDECL(fconv_f2d,  INT_TYPE(64), INT_TYPE(32), INT_TYPE(8)); | ||||
|             FDECL(fadd_d,     INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(8)); | ||||
|             FDECL(fsub_d,     INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(8)); | ||||
|             FDECL(fmul_d,     INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(8)); | ||||
|             FDECL(fdiv_d,     INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(8)); | ||||
|             FDECL(fsqrt_d,    INT_TYPE(64), INT_TYPE(64), INT_TYPE(8)); | ||||
|             FDECL(fcmp_d,     INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(32)); | ||||
|             FDECL(fcvt_d,     INT_TYPE(64), INT_TYPE(64), INT_TYPE(32), INT_TYPE(8)); | ||||
|             FDECL(fmadd_d,    INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(32), INT_TYPE(8)); | ||||
|             FDECL(fsel_d,     INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(32)); | ||||
|             FDECL(fclass_d,   INT_TYPE(64), INT_TYPE(64)); | ||||
|             FDECL(unbox_s,      INT_TYPE(32), INT_TYPE(64)); | ||||
|  | ||||
|         FDECL(fadd_s, INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); | ||||
|         FDECL(fsub_s, INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); | ||||
|         FDECL(fmul_s, INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); | ||||
|         FDECL(fdiv_s, INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); | ||||
|         FDECL(fsqrt_s, INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); | ||||
|         FDECL(fcmp_s, INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(32)); | ||||
|         FDECL(fcvt_s, INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); | ||||
|         FDECL(fmadd_s, INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); | ||||
|         FDECL(fsel_s, INT_TYPE(32), INT_TYPE(32), INT_TYPE(32), INT_TYPE(32)); | ||||
|         FDECL(fclass_s, INT_TYPE(32), INT_TYPE(32)); | ||||
|         FDECL(fcvt_32_64, INT_TYPE(64), INT_TYPE(32), INT_TYPE(32), INT_TYPE(8)); | ||||
|         FDECL(fcvt_64_32, INT_TYPE(32), INT_TYPE(64), INT_TYPE(32), INT_TYPE(8)); | ||||
|         if(flen > 32) { | ||||
|             FDECL(fconv_d2f, INT_TYPE(32), INT_TYPE(64), INT_TYPE(8)); | ||||
|             FDECL(fconv_f2d, INT_TYPE(64), INT_TYPE(32), INT_TYPE(8)); | ||||
|             FDECL(fadd_d, INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(8)); | ||||
|             FDECL(fsub_d, INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(8)); | ||||
|             FDECL(fmul_d, INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(8)); | ||||
|             FDECL(fdiv_d, INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(8)); | ||||
|             FDECL(fsqrt_d, INT_TYPE(64), INT_TYPE(64), INT_TYPE(8)); | ||||
|             FDECL(fcmp_d, INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(32)); | ||||
|             FDECL(fcvt_d, INT_TYPE(64), INT_TYPE(64), INT_TYPE(32), INT_TYPE(8)); | ||||
|             FDECL(fmadd_d, INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(32), INT_TYPE(8)); | ||||
|             FDECL(fsel_d, INT_TYPE(64), INT_TYPE(64), INT_TYPE(64), INT_TYPE(32)); | ||||
|             FDECL(fclass_d, INT_TYPE(64), INT_TYPE(64)); | ||||
|             FDECL(unbox_s, INT_TYPE(32), INT_TYPE(64)); | ||||
|         } | ||||
|     } | ||||
| } | ||||
|  | ||||
| } | ||||
| } | ||||
| } | ||||
| } // namespace fp_impl | ||||
| } // namespace llvm | ||||
| } // namespace iss | ||||
|   | ||||
										
											
												File diff suppressed because it is too large
												Load Diff
											
										
									
								
							
										
											
												File diff suppressed because it is too large
												Load Diff
											
										
									
								
							
		Reference in New Issue
	
	Block a user