diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml index e3943e4..a1b3300 100644 --- a/.github/workflows/ci.yml +++ b/.github/workflows/ci.yml @@ -23,12 +23,16 @@ jobs: run: python -m pip install Jinja2 - name: Installing pytest run: python -m pip install pytest + - name: Update submodules (Linux) + run: | + git submodule update --init + git submodule foreach 'git checkout main' - name: Running cmake (Linux) run: | ls ${{github.workspace}} mkdir build cd build - cmake -DCMAKE_BUILD_TYPE=Debug .. + cmake -DCMAKE_BUILD_TYPE=Debug -DUSE_FMA_INTRINSIC=1 .. - name: Build Solution (Linux) run: | cd build diff --git a/.gitmodules b/.gitmodules new file mode 100644 index 0000000..c847bd4 --- /dev/null +++ b/.gitmodules @@ -0,0 +1,12 @@ +[submodule "extern/interflop"] + path = extern/interflop + url = https://github.com/a-hamitouche/interflop-stdlib.git +[submodule "extern/interflop-backend-ieee"] + path = extern/interflop-backend-ieee + url = https://github.com/a-hamitouche/interflop-backend-ieee.git +[submodule "extern/interflop-backend-verrou"] + path = extern/interflop-backend-verrou + url = https://github.com/a-hamitouche/interflop-backend-verrou.git +[submodule "extern/interflop-backend-vprec"] + path = extern/interflop-backend-vprec + url = https://github.com/a-hamitouche/interflop-backend-vprec.git diff --git a/CMakeLists.txt b/CMakeLists.txt index 7fdf7a8..3678fdd 100644 --- a/CMakeLists.txt +++ b/CMakeLists.txt @@ -91,6 +91,12 @@ endif() # Include sub-projects. 
+if(UNIX) + include_directories("extern") + include_directories("extern/interflop") + add_subdirectory ("extern") +endif() + include_directories("include") include_directories("include/replace/backend/backend_verrou") add_subdirectory("code_generator") @@ -105,3 +111,4 @@ add_subdirectory ("Test/cpp_unit") add_subdirectory ("Test/test_backend") add_subdirectory ("Test/test_backend_verrou") + diff --git a/README.md b/README.md index 6d500ee..71faa5b 100644 --- a/README.md +++ b/README.md @@ -25,7 +25,9 @@ To do so, run via your command line on Linux or your powershell on Windows: ```shell cd [PENE repository] -cmake . +git submodule update --init +git submodule foreach 'git checkout main' +cmake -DUSE_FMA_INTRINSIC=1 . cmake --build . ctest -C Debug ``` @@ -47,6 +49,9 @@ Without specifying any options, this command will execute your code under PENE w # How to instrument your code with PENE? +PENE offers two ways to instrument code: a cross-platform one based on the [Verrou](https://github.com/edf-hpc/verrou) backend, named **fp-replace**, and one based on [Interflop](https://github.com/interflop), available on Linux only. + +## **FP-REPLACE** mode To instrument your code, you can use the **fp-replace** option: ```shell @@ -70,6 +75,43 @@ where: - rounding-mode = 4 : rounding to zero - rounding-mode = 5 : random rounding +## **INTERFLOP** mode (Linux only) + +The interflop mode allows dynamically loading up to 16 backends and making them work separately. Available backends are: + +| Backend | Description | +|---------------------------------------------------------------------------|--------------------------------------------------------------------------------------------------------------------------------------| +|[backend ieee](https://github.com/a-hamitouche/interflop-backend-ieee) | The IEEE backend implements straightforward IEEE-754 arithmetic. It should have no effect on the output and behavior of your program. 
| +|[backend verrou](https://github.com/a-hamitouche/interflop-backend-verrou) | The Verrou backend implements a software counterpart of all IEEE-754 standard rounding modes | +|[backend vprec](https://github.com/a-hamitouche/interflop-backend-vprec) | The VPREC backend simulates any floating-point format that can fit into the IEEE-754 double precision format, with rounding to nearest.| + +Each of these backends accepts different arguments and exhibits distinct behavior. To learn more, please consult the README.md file of each backend (located in the `extern` subfolder or on their GitHub page). +With this mode, backends can be used in scalar mode (by devectorizing operations) or in vector mode to reduce instrumentation overhead. + +Usage: + +```bash +VFC_BACKENDS="libbackend.so [option]" path/to/pin -t path/to/pene.so/or/pene.so -interflop -- path/to/executable +``` + +Example of usage with Verrou: + + +```bash +#Scalar mode +VFC_BACKENDS="libinterflop_verrou.so --rounding-mode=upward" path/to/pin -t path/to/pene.so/or/pene.so -interflop -- path/to/executable + +#Vector mode +VFC_BACKENDS="libinterflop_verrou.so --rounding-mode=downward" path/to/pin -t path/to/pene.so/or/pene.so -interflop -vector-mode -- path/to/executable + +#Multiple backends +VFC_BACKENDS="libinterflop_verrou.so --rounding-mode=upward; libinterflop_vprec.so --mode=full --precision-binary32=23 --debug" path/to/pin -t path/to/pene.so/or/pene.so -interflop -- path/to/executable +``` + +/!\ Note: +- Proposed backends fully work only in scalar mode +- For backend Verrou, only nearest, upward and downward modes are available in vector mode + ## How to exclude parts of the code from instrumentation? You can filter which parts of the code your want to instrument using the option `-exclude` along with an exclusion file containing a list of the functions you want to exclude. 
# Shared build settings for the Interflop sub-projects (argp, interflop and
# its backends).  The CRT_* variables and OUTPUT_DIRECTORY defined here are
# read by the CMakeLists.txt of each sub-directory added further down.
project("Interflop")

include_directories("${CMAKE_CURRENT_SOURCE_DIR}")
include_directories("${CMAKE_CURRENT_SOURCE_DIR}/interflop")

# Optional FMA support, requested with -DUSE_FMA_INTRINSIC=1 (or ON).
# if(<variable>) is used instead of if(DEFINED ...) so that an explicit
# -DUSE_FMA_INTRINSIC=0 / OFF really leaves FMA disabled.
if(USE_FMA_INTRINSIC)
  message(STATUS "Using FMA Intrinsic")
  # HAVE_FMA_INTRINSIC is expanded verbatim inside CRT_COMPILE_DEFINITIONS
  # below, so it has to hold the complete -D flag.
  # NOTE(review): the macro name is inferred from the variable name --
  # confirm it is the one the interflop backends test for.
  set(HAVE_FMA_INTRINSIC "-DHAVE_FMA_INTRINSIC=1 ")
  set(FMA_FLAGS "-mfma")
endif()

set(CRT_COMPILE_DEFINITIONS
    # Preprocessor definitions
    "-D__PIN__=1 -DPIN_CRT=1 "
    "-DTARGET_IA32E -DHOST_IA32E "
    "-DTARGET_LINUX "
    ${HAVE_FMA_INTRINSIC}               # empty unless USE_FMA_INTRINSIC is on
    "-DHAVE_FENV_H "
    "-D__PENE_FRONTEND__ "
)
set(CRT_COMPILE_OPTIONS
    # Compiler (middle end)
    "-funwind-tables"                   # Code generation option
    "-fasynchronous-unwind-tables"      # Code generation option
    "-fomit-frame-pointer"              # Code optimization option
    "-fno-strict-aliasing"              # Code optimization option
    "-fno-stack-protector"              # Instrumentation option
    ${FMA_FLAGS}                        # empty unless USE_FMA_INTRINSIC is on
    "-fPIC"
)
set(CRT_PREPROCESS_OPTIONS
    # Preprocessor (front end): header search paths inside the Pin kit
    "-isystem ${PIN_ROOT}/extras/stlport/include "
    "-isystem ${PIN_ROOT}/extras/libstdc++/include "
    "-isystem ${PIN_ROOT}/extras/crt/include "
    "-isystem ${PIN_ROOT}/extras/crt/include/arch-x86_64 "
    "-isystem ${PIN_ROOT}/extras/crt/include/kernel/uapi "
    "-isystem ${PIN_ROOT}/extras/crt/include/kernel/uapi/asm-x86 "
    "-I${PIN_ROOT}/source/include/pin "
    "-I${PIN_ROOT}/source/include/pin/gen "
    "-I${PIN_ROOT}/extras/components/include "
    "-I${PIN_ROOT}/extras/xed-intel64/include/xed "
)
set(CRT_CXX_COMPILE_OPTIONS
    "-fno-exceptions"
    "-fno-rtti"
    "-fPIC"
    "-faligned-new"
)
set(CRT_LINK_OPTIONS
    "-fPIC"
    "-Wl,--hash-style=sysv"
)

set(CRT_LINK_LIBRARIES
    "-L${PIN_ROOT}/intel64/runtime/pincrt"
    "-L${PIN_ROOT}/intel64/lib-ext"
    "-nostdlib" "c-dynamic" "m-dynamic" "stlport-dynamic" "pin3dwarf" "dl-dynamic"
)

# Directory the sub-projects use as their library output directory.
set(OUTPUT_DIRECTORY "${PIN_ROOT}/intel64/lib-ext")

add_subdirectory ("argp")
add_subdirectory ("interflop")
+add_subdirectory ("interflop-backend-verrou") +add_subdirectory ("interflop-backend-vprec") +add_subdirectory ("interflop-backend-ieee") + +get_directory_property(CRT_COMPILE_DEFINITIONS DIRECTORY interflop VARIABLES CRT_COMPILE_DEFINITIONS + DIRECTORY interflop-backend-verrou VARIABLES CRT_COMPILE_DEFINITIONS + DIRECTORY interflop-backend-vprec VARIABLES CRT_COMPILE_DEFINITIONS + DIRECTORY interflop-backend-ieee VARIABLES CRT_COMPILE_DEFINITIONS + DIRECTORY argp VARIABLES CRT_COMPILE_DEFINITIONS +) +get_directory_property(CRT_COMPILE_OPTIONS DIRECTORY interflop VARIABLES CRT_COMPILE_OPTIONS + DIRECTORY interflop-backend-verrou VARIABLES CRT_COMPILE_OPTIONS + DIRECTORY interflop-backend-vprec VARIABLES CRT_COMPILE_OPTIONS + DIRECTORY interflop-backend-ieee VARIABLES CRT_COMPILE_OPTIONS + DIRECTORY argp VARIABLES CRT_COMPILE_OPTIONS +) +get_directory_property(CRT_CXX_COMPILE_OPTIONS DIRECTORY interflop VARIABLES CRT_CXX_COMPILE_OPTIONS + DIRECTORY interflop-backend-verrou VARIABLES CRT_CXX_COMPILE_OPTIONS + DIRECTORY interflop-backend-vprec VARIABLES CRT_CXX_COMPILE_OPTIONS + DIRECTORY interflop-backend-ieee VARIABLES CRT_CXX_COMPILE_OPTIONS + DIRECTORY argp VARIABLES CRT_CXX_COMPILE_OPTIONS +) +get_directory_property(CRT_PREPROCESS_OPTIONS DIRECTORY interflop VARIABLES CRT_PREPROCESS_OPTIONS + DIRECTORY interflop-backend-verrou VARIABLES CRT_PREPROCESS_OPTIONS + DIRECTORY interflop-backend-vprec VARIABLES CRT_PREPROCESS_OPTIONS + DIRECTORY interflop-backend-ieee VARIABLES CRT_PREPROCESS_OPTIONS + DIRECTORY argp VARIABLES CRT_PREPROCESS_OPTIONS +) +get_directory_property(CRT_LINK_OPTIONS DIRECTORY interflop VARIABLES CRT_LINK_OPTIONS + DIRECTORY interflop VARIABLES CRT_LINK_OPTIONS + DIRECTORY interflop-backend-verrou VARIABLES CRT_LINK_OPTIONS + DIRECTORY interflop-backend-vprec VARIABLES CRT_LINK_OPTIONS + DIRECTORY interflop-backend-ieee VARIABLES CRT_LINK_OPTIONS + DIRECTORY argp VARIABLES CRT_LINK_OPTIONS +) +get_directory_property(CRT_LINK_LIBRARIES DIRECTORY 
interflop VARIABLES CRT_LINK_LIBRARIES + DIRECTORY interflop-backend-verrou VARIABLES CRT_LINK_LIBRARIES + DIRECTORY interflop-backend-vprec VARIABLES CRT_LINK_LIBRARIES + DIRECTORY interflop-backend-ieee VARIABLES CRT_LINK_LIBRARIES + DIRECTORY argp VARIABLES CRT_LINK_LIBRARIES +) + +get_directory_property( OUTPUT_DIRECTORY DIRECTORY interflop VARIABLES OUTPUT_DIRECTORY + DIRECTORY interflop-backend-verrou VARIABLES OUTPUT_DIRECTORY + DIRECTORY interflop-backend-vprec VARIABLES OUTPUT_DIRECTORY + DIRECTORY interflop-backend-ieee VARIABLES OUTPUT_DIRECTORY + DIRECTORY argp VARIABLES OUTPUT_DIRECTORY +) diff --git a/extern/argp/CMakeLists.txt b/extern/argp/CMakeLists.txt new file mode 100644 index 0000000..83b8f2a --- /dev/null +++ b/extern/argp/CMakeLists.txt @@ -0,0 +1,17 @@ +project("argp") + +cmake_minimum_required(VERSION 3.20) + +set (ARGP_C_SRC + "argp-parse.c" +) + +add_library(argp_c OBJECT ${ARGP_C_SRC}) +target_compile_definitions(argp_c PRIVATE ${CRT_COMPILE_DEFINITIONS}) +target_compile_options (argp_c PRIVATE ${CRT_PREPROCESS_OPTIONS} ${CRT_COMPILE_OPTIONS} "-fPIC") + +set(CMAKE_LIBRARY_OUTPUT_DIRECTORY ${OUTPUT_DIRECTORY}) +add_library (argp SHARED $) +target_link_options (argp PRIVATE ${CRT_LINK_OPTIONS}) +target_link_libraries (argp ${CRT_LINK_LIBRARIES}) + diff --git a/extern/argp/argp-namefrob.h b/extern/argp/argp-namefrob.h new file mode 100644 index 0000000..39f9684 --- /dev/null +++ b/extern/argp/argp-namefrob.h @@ -0,0 +1,149 @@ +/* Name frobnication for compiling argp outside of glibc + Copyright (C) 1997-2023 Free Software Foundation, Inc. + This file is part of the GNU C Library. + Written by Miles Bader . + + The GNU C Library is free software; you can redistribute it and/or + modify it under the terms of the GNU Lesser General Public + License as published by the Free Software Foundation; either + version 2.1 of the License, or (at your option) any later version. 
+ + The GNU C Library is distributed in the hope that it will be useful, + but WITHOUT ANY WARRANTY; without even the implied warranty of + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + Lesser General Public License for more details. + + You should have received a copy of the GNU Lesser General Public + License along with the GNU C Library; if not, see + . */ + +#if !_LIBC +/* This code is written for inclusion in gnu-libc, and uses names in the + namespace reserved for libc. If we're not compiling in libc, define those + names to be the normal ones instead. */ + +/* argp-parse functions */ +#undef __argp_parse +#define __argp_parse argp_parse +#undef __option_is_end +#define __option_is_end _option_is_end +#undef __option_is_short +#define __option_is_short _option_is_short +#undef __argp_input +#define __argp_input _argp_input + +/* argp-help functions */ +#undef __argp_help +#define __argp_help argp_help +#undef __argp_error +#define __argp_error argp_error +#undef __argp_failure +#define __argp_failure argp_failure +#undef __argp_state_help +#define __argp_state_help argp_state_help +#undef __argp_usage +#define __argp_usage argp_usage + +/* argp-fmtstream functions */ +#undef __argp_make_fmtstream +#define __argp_make_fmtstream argp_make_fmtstream +#undef __argp_fmtstream_free +#define __argp_fmtstream_free argp_fmtstream_free +#undef __argp_fmtstream_putc +#define __argp_fmtstream_putc argp_fmtstream_putc +#undef __argp_fmtstream_puts +#define __argp_fmtstream_puts argp_fmtstream_puts +#undef __argp_fmtstream_write +#define __argp_fmtstream_write argp_fmtstream_write +#undef __argp_fmtstream_printf +#define __argp_fmtstream_printf argp_fmtstream_printf +#undef __argp_fmtstream_set_lmargin +#define __argp_fmtstream_set_lmargin argp_fmtstream_set_lmargin +#undef __argp_fmtstream_set_rmargin +#define __argp_fmtstream_set_rmargin argp_fmtstream_set_rmargin +#undef __argp_fmtstream_set_wmargin +#define __argp_fmtstream_set_wmargin 
argp_fmtstream_set_wmargin +#undef __argp_fmtstream_point +#define __argp_fmtstream_point argp_fmtstream_point +#undef __argp_fmtstream_update +#define __argp_fmtstream_update _argp_fmtstream_update +#undef __argp_fmtstream_ensure +#define __argp_fmtstream_ensure _argp_fmtstream_ensure +#undef __argp_fmtstream_lmargin +#define __argp_fmtstream_lmargin argp_fmtstream_lmargin +#undef __argp_fmtstream_rmargin +#define __argp_fmtstream_rmargin argp_fmtstream_rmargin +#undef __argp_fmtstream_wmargin +#define __argp_fmtstream_wmargin argp_fmtstream_wmargin + +/* normal libc functions we call */ +#undef __flockfile +#define __flockfile flockfile +#undef __funlockfile +#define __funlockfile funlockfile +#undef __mempcpy +#define __mempcpy mempcpy +#undef __sleep +#define __sleep sleep +#undef __strcasecmp +#define __strcasecmp strcasecmp +#undef __strchrnul +#define __strchrnul strchrnul +#undef __strerror_r +#define __strerror_r strerror_r +#undef __strndup +#define __strndup strndup + +#if defined(HAVE_DECL_CLEARERR_UNLOCKED) && !HAVE_DECL_CLEARERR_UNLOCKED +# define clearerr_unlocked(x) clearerr (x) +#endif +#if defined(HAVE_DECL_FEOF_UNLOCKED) && !HAVE_DECL_FEOF_UNLOCKED +# define feof_unlocked(x) feof (x) +# endif +#if defined(HAVE_DECL_FERROR_UNLOCKED) && !HAVE_DECL_FERROR_UNLOCKED +# define ferror_unlocked(x) ferror (x) +# endif +#if defined(HAVE_DECL_FFLUSH_UNLOCKED) && !HAVE_DECL_FFLUSH_UNLOCKED +# define fflush_unlocked(x) fflush (x) +# endif +#if defined(HAVE_DECL_FGETS_UNLOCKED) && !HAVE_DECL_FGETS_UNLOCKED +# define fgets_unlocked(x,y,z) fgets (x,y,z) +# endif +#if defined(HAVE_DECL_FPUTC_UNLOCKED) && !HAVE_DECL_FPUTC_UNLOCKED +# define fputc_unlocked(x,y) fputc (x,y) +# endif +#if defined(HAVE_DECL_FPUTS_UNLOCKED) && !HAVE_DECL_FPUTS_UNLOCKED +# define fputs_unlocked(x,y) fputs (x,y) +# endif +#if defined(HAVE_DECL_FREAD_UNLOCKED) && !HAVE_DECL_FREAD_UNLOCKED +# define fread_unlocked(w,x,y,z) fread (w,x,y,z) +# endif +#if defined(HAVE_DECL_FWRITE_UNLOCKED) && 
!HAVE_DECL_FWRITE_UNLOCKED +# define fwrite_unlocked(w,x,y,z) fwrite (w,x,y,z) +# endif +#if defined(HAVE_DECL_GETC_UNLOCKED) && !HAVE_DECL_GETC_UNLOCKED +# define getc_unlocked(x) getc (x) +# endif +#if defined(HAVE_DECL_GETCHAR_UNLOCKED) && !HAVE_DECL_GETCHAR_UNLOCKED +# define getchar_unlocked() getchar () +# endif +#if defined(HAVE_DECL_PUTC_UNLOCKED) && !HAVE_DECL_PUTC_UNLOCKED +# define putc_unlocked(x,y) putc (x,y) +# endif +#if defined(HAVE_DECL_PUTCHAR_UNLOCKED) && !HAVE_DECL_PUTCHAR_UNLOCKED +# define putchar_unlocked(x) putchar (x) +# endif + +extern char *__argp_basename (char *name); + +#endif /* !_LIBC */ + +#ifndef __set_errno +#define __set_errno(e) (errno = (e)) +#endif + +#if defined _LIBC || HAVE_DECL_PROGRAM_INVOCATION_SHORT_NAME +# define __argp_short_program_name() (program_invocation_short_name) +#else +extern char *__argp_short_program_name (void); +#endif diff --git a/extern/argp/argp-parse.c b/extern/argp/argp-parse.c new file mode 100644 index 0000000..85fc9b1 --- /dev/null +++ b/extern/argp/argp-parse.c @@ -0,0 +1,86 @@ +/* Hierarchial argument parsing, layered over getopt + Copyright (C) 1995-2023 Free Software Foundation, Inc. + This file is part of the GNU C Library. + Written by Miles Bader . + + The GNU C Library is free software; you can redistribute it and/or + modify it under the terms of the GNU Lesser General Public + License as published by the Free Software Foundation; either + version 2.1 of the License, or (at your option) any later version. + + The GNU C Library is distributed in the hope that it will be useful, + but WITHOUT ANY WARRANTY; without even the implied warranty of + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + Lesser General Public License for more details. + + You should have received a copy of the GNU Lesser General Public + License along with the GNU C Library; if not, see + . 
*/ + +#include +#include +#include +#include +#include +#include +#include "getopt_int.h" + + +#include "argp.h" +#include "argp-namefrob.h" + + +int argp_end_options(struct argp_option opt) { + return !opt.name && + !opt.key && + !opt.arg && + !opt.flags && + !opt.doc && + !opt.group; + return 0; +} + +/* Parse the options strings in ARGC & ARGV according to the argp in ARGP. + FLAGS is one of the ARGP_ flags above. If END_INDEX is non-NULL, the + index in ARGV of the first unparsed option is returned in it. If an + unknown option is present, EINVAL is returned; if some parser routine + returned a non-zero value, it is returned; otherwise 0 is returned. */ +error_t +argp_parse (const struct argp *argp, int argc, char **argv, unsigned flags, + int *end_index, void *input) +{ + error_t err; + const struct argp * backend_argp = argp; + struct argp_state state = {backend_argp,argc,argv,0,flags,0,0,input,0,0,argv[0],0,0,0}; + void *child_inputs[16]; + state.child_inputs = child_inputs; + + char buf[256]; + for (int i = 1; i < argc; i++) { + strcpy ( buf, argv[i]); + char *arg = buf; + + char *equal_sign = strchr(arg, '='); + char *param = NULL, *value = NULL; + if (equal_sign) { + *equal_sign = '\0'; + param = arg + 2; + value = equal_sign + 1; + } + else { + param = arg+2; + } + + int argp_argc = 0; + + while( argp_end_options( backend_argp->options[argp_argc]) == 0) { + + if ( strcasecmp( backend_argp->options[argp_argc].name, param) == 0) + { + backend_argp->parser(backend_argp->options[argp_argc].key, value, &state); + } + argp_argc++; + } + } + return 0; +} diff --git a/extern/argp/argp.h b/extern/argp/argp.h new file mode 100644 index 0000000..b3fdae7 --- /dev/null +++ b/extern/argp/argp.h @@ -0,0 +1,564 @@ +/* Hierarchical argument parsing, layered over getopt. + Copyright (C) 1995-2022 Free Software Foundation, Inc. + This file is part of the GNU C Library. + Written by Miles Bader . 
+ + The GNU C Library is free software; you can redistribute it and/or + modify it under the terms of the GNU Lesser General Public + License as published by the Free Software Foundation; either + version 2.1 of the License, or (at your option) any later version. + + The GNU C Library is distributed in the hope that it will be useful, + but WITHOUT ANY WARRANTY; without even the implied warranty of + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + Lesser General Public License for more details. + + You should have received a copy of the GNU Lesser General Public + License along with the GNU C Library; if not, see + . */ + +#ifndef _ARGP_H +#define _ARGP_H + +#include +#include +#include +#include +#include + +__BEGIN_DECLS + +/* error_t may or may not be available from errno.h, depending on the + operating system. */ +#ifndef __error_t_defined +# define __error_t_defined 1 +typedef int error_t; +#endif + +/* A description of a particular option. A pointer to an array of + these is passed in the OPTIONS field of an argp structure. Each option + entry can correspond to one long option and/or one short option; more + names for the same option can be added by following an entry in an option + array with options having the OPTION_ALIAS flag set. */ +struct argp_option +{ + /* The long option name. For more than one name for the same option, you + can use following options with the OPTION_ALIAS flag set. */ + const char *name; + + /* What key is returned for this option. If > 0 and printable, then it's + also accepted as a short option. */ + int key; + + /* If non-NULL, this is the name of the argument associated with this + option, which is required unless the OPTION_ARG_OPTIONAL flag is set. */ + const char *arg; + + /* OPTION_ flags. */ + int flags; + + /* The doc string for this option. 
If both NAME and KEY are 0, This string + will be printed outdented from the normal option column, making it + useful as a group header (it will be the first thing printed in its + group); in this usage, it's conventional to end the string with a `:'. */ + const char *doc; + + /* The group this option is in. In a long help message, options are sorted + alphabetically within each group, and the groups presented in the order + 0, 1, 2, ..., n, -m, ..., -2, -1. Every entry in an options array with + if this field 0 will inherit the group number of the previous entry, or + zero if it's the first one, unless its a group header (NAME and KEY both + 0), in which case, the previous entry + 1 is the default. Automagic + options such as --help are put into group -1. */ + int group; +}; + +/* The argument associated with this option is optional. */ +#define OPTION_ARG_OPTIONAL 0x1 + +/* This option isn't displayed in any help messages. */ +#define OPTION_HIDDEN 0x2 + +/* This option is an alias for the closest previous non-alias option. This + means that it will be displayed in the same help entry, and will inherit + fields other than NAME and KEY from the aliased option. */ +#define OPTION_ALIAS 0x4 + +/* This option isn't actually an option (and so should be ignored by the + actual option parser), but rather an arbitrary piece of documentation that + should be displayed in much the same manner as the options. If this flag + is set, then the option NAME field is displayed unmodified (e.g., no `--' + prefix is added) at the left-margin (where a *short* option would normally + be displayed), and the documentation string in the normal place. For + purposes of sorting, any leading whitespace and punctuation is ignored, + except that if the first non-whitespace character is not `-', this entry + is displayed after all options (and OPTION_DOC entries with a leading `-') + in the same group. 
*/ +#define OPTION_DOC 0x8 + +/* This option shouldn't be included in `long' usage messages (but is still + included in help messages). This is mainly intended for options that are + completely documented in an argp's ARGS_DOC field, in which case including + the option in the generic usage list would be redundant. For instance, + if ARGS_DOC is "FOO BAR\n-x BLAH", and the `-x' option's purpose is to + distinguish these two cases, -x should probably be marked + OPTION_NO_USAGE. */ +#define OPTION_NO_USAGE 0x10 + +struct argp; /* fwd declare this type */ +struct argp_state; /* " */ +struct argp_child; /* " */ + +/* The type of a pointer to an argp parsing function. */ +typedef error_t (*argp_parser_t) (int __key, char *__arg, + struct argp_state *__state); + +/* What to return for unrecognized keys. For special ARGP_KEY_ keys, such + returns will simply be ignored. For user keys, this error will be turned + into EINVAL (if the call to argp_parse is such that errors are propagated + back to the user instead of exiting); returning EINVAL itself would result + in an immediate stop to parsing in *all* cases. */ +#define ARGP_ERR_UNKNOWN E2BIG /* Hurd should never need E2BIG. XXX */ + +/* Special values for the KEY argument to an argument parsing function. + ARGP_ERR_UNKNOWN should be returned if they aren't understood. + + The sequence of keys to a parsing function is either (where each + uppercased word should be prefixed by `ARGP_KEY_' and opt is a user key): + + INIT opt... NO_ARGS END SUCCESS -- No non-option arguments at all + or INIT (opt | ARG)... END SUCCESS -- All non-option args parsed + or INIT (opt | ARG)... SUCCESS -- Some non-option arg unrecognized + + The third case is where every parser returned ARGP_KEY_UNKNOWN for an + argument, in which case parsing stops at that argument (returning the + unparsed arguments to the caller of argp_parse if requested, or stopping + with an error message if not). 
+ + If an error occurs (either detected by argp, or because the parsing + function returned an error value), then the parser is called with + ARGP_KEY_ERROR, and no further calls are made. */ + +/* This is not an option at all, but rather a command line argument. If a + parser receiving this key returns success, the fact is recorded, and the + ARGP_KEY_NO_ARGS case won't be used. HOWEVER, if while processing the + argument, a parser function decrements the NEXT field of the state it's + passed, the option won't be considered processed; this is to allow you to + actually modify the argument (perhaps into an option), and have it + processed again. */ +#define ARGP_KEY_ARG 0 +/* There are remaining arguments not parsed by any parser, which may be found + starting at (STATE->argv + STATE->next). If success is returned, but + STATE->next left untouched, it's assumed that all arguments were consume, + otherwise, the parser should adjust STATE->next to reflect any arguments + consumed. */ +#define ARGP_KEY_ARGS 0x1000006 +/* There are no more command line arguments at all. */ +#define ARGP_KEY_END 0x1000001 +/* Because it's common to want to do some special processing if there aren't + any non-option args, user parsers are called with this key if they didn't + successfully process any non-option arguments. Called just before + ARGP_KEY_END (where more general validity checks on previously parsed + arguments can take place). */ +#define ARGP_KEY_NO_ARGS 0x1000002 +/* Passed in before any parsing is done. Afterwards, the values of each + element of the CHILD_INPUT field, if any, in the state structure is + copied to each child's state to be the initial value of the INPUT field. */ +#define ARGP_KEY_INIT 0x1000003 +/* Use after all other keys, including SUCCESS & END. */ +#define ARGP_KEY_FINI 0x1000007 +/* Passed in when parsing has successfully been completed (even if there are + still arguments remaining). 
*/ +#define ARGP_KEY_SUCCESS 0x1000004 +/* Passed in if an error occurs. */ +#define ARGP_KEY_ERROR 0x1000005 + +/* An argp structure contains a set of options declarations, a function to + deal with parsing one, documentation string, a possible vector of child + argp's, and perhaps a function to filter help output. When actually + parsing options, getopt is called with the union of all the argp + structures chained together through their CHILD pointers, with conflicts + being resolved in favor of the first occurrence in the chain. */ +struct argp +{ + /* An array of argp_option structures, terminated by an entry with both + NAME and KEY having a value of 0. */ + const struct argp_option *options; + + /* What to do with an option from this structure. KEY is the key + associated with the option, and ARG is any associated argument (NULL if + none was supplied). If KEY isn't understood, ARGP_ERR_UNKNOWN should be + returned. If a non-zero, non-ARGP_ERR_UNKNOWN value is returned, then + parsing is stopped immediately, and that value is returned from + argp_parse(). For special (non-user-supplied) values of KEY, see the + ARGP_KEY_ definitions below. */ + argp_parser_t parser; + + /* A string describing what other arguments are wanted by this program. It + is only used by argp_usage to print the `Usage:' message. If it + contains newlines, the strings separated by them are considered + alternative usage patterns, and printed on separate lines (lines after + the first are prefix by ` or: ' instead of `Usage:'). */ + const char *args_doc; + + /* If non-NULL, a string containing extra text to be printed before and + after the options in a long help message (separated by a vertical tab + `\v' character). */ + const char *doc; + + /* A vector of argp_children structures, terminated by a member with a 0 + argp field, pointing to child argps should be parsed with this one. Any + conflicts are resolved in favor of this argp, or early argps in the + CHILDREN list. 
This field is useful if you use libraries that supply + their own argp structure, which you want to use in conjunction with your + own. */ + const struct argp_child *children; + + /* If non-zero, this should be a function to filter the output of help + messages. KEY is either a key from an option, in which case TEXT is + that option's help text, or a special key from the ARGP_KEY_HELP_ + defines, below, describing which other help text TEXT is. The function + should return either TEXT, if it should be used as-is, a replacement + string, which should be malloced, and will be freed by argp, or NULL, + meaning `print nothing'. The value for TEXT is *after* any translation + has been done, so if any of the replacement text also needs translation, + that should be done by the filter function. INPUT is either the input + supplied to argp_parse, or NULL, if argp_help was called directly. */ + char *(*help_filter) (int __key, const char *__text, void *__input); + + /* If non-zero the strings used in the argp library are translated using + the domain described by this string. Otherwise the currently installed + default domain is used. */ + const char *argp_domain; +}; + +/* Possible KEY arguments to a help filter function. */ +#define ARGP_KEY_HELP_PRE_DOC 0x2000001 /* Help text preceding options. */ +#define ARGP_KEY_HELP_POST_DOC 0x2000002 /* Help text following options. */ +#define ARGP_KEY_HELP_HEADER 0x2000003 /* Option header string. */ +#define ARGP_KEY_HELP_EXTRA 0x2000004 /* After all other documentation; + TEXT is NULL for this key. */ +/* Explanatory note emitted when duplicate option arguments have been + suppressed. */ +#define ARGP_KEY_HELP_DUP_ARGS_NOTE 0x2000005 +#define ARGP_KEY_HELP_ARGS_DOC 0x2000006 /* Argument doc string. */ + +/* When an argp has a non-zero CHILDREN field, it should point to a vector of + argp_child structures, each of which describes a subsidiary argp. */ +struct argp_child +{ + /* The child parser. 
*/ + const struct argp *argp; + + /* Flags for this child. */ + int flags; + + /* If non-zero, an optional header to be printed in help output before the + child options. As a side-effect, a non-zero value forces the child + options to be grouped together; to achieve this effect without actually + printing a header string, use a value of "". */ + const char *header; + + /* Where to group the child options relative to the other (`consolidated') + options in the parent argp; the values are the same as the GROUP field + in argp_option structs, but all child-groupings follow parent options at + a particular group level. If both this field and HEADER are zero, then + they aren't grouped at all, but rather merged with the parent options + (merging the child's grouping levels with the parents). */ + int group; +}; + +/* Parsing state. This is provided to parsing functions called by argp, + which may examine and, as noted, modify fields. */ +struct argp_state +{ + /* The top level ARGP being parsed. */ + const struct argp *root_argp; + + /* The argument vector being parsed. May be modified. */ + int argc; + char **argv; + + /* The index in ARGV of the next arg to be parsed. May be modified. */ + int next; + + /* The flags supplied to argp_parse. May be modified. */ + unsigned flags; + + /* While calling a parsing function with a key of ARGP_KEY_ARG, this is the + number of the current arg, starting at zero, and incremented after each + such call returns. At all other times, this is the number of such + arguments that have been processed. */ + unsigned arg_num; + + /* If non-zero, the index in ARGV of the first argument following a special + `--' argument (which prevents anything following being interpreted as an + option). Only set once argument parsing has proceeded past this point. */ + int quoted; + + /* An arbitrary pointer passed in from the user. */ + void *input; + /* Values to pass to child parsers. 
This vector will be the same length as + the number of children for the current parser. */ + void **child_inputs; + + /* For the parser's use. Initialized to 0. */ + void *hook; + + /* The name used when printing messages. This is initialized to ARGV[0], + or PROGRAM_INVOCATION_NAME if that is unavailable. */ + char *name; + + /* Streams used when argp prints something. */ + FILE *err_stream; /* For errors; initialized to stderr. */ + FILE *out_stream; /* For information; initialized to stdout. */ + + void *pstate; /* Private, for use by argp. */ +}; + +/* Flags for argp_parse (note that the defaults are those that are + convenient for program command line parsing): */ + +/* Don't ignore the first element of ARGV. Normally (and always unless + ARGP_NO_ERRS is set) the first element of the argument vector is + skipped for option parsing purposes, as it corresponds to the program name + in a command line. */ +#define ARGP_PARSE_ARGV0 0x01 + +/* Don't print error messages for unknown options to stderr; unless this flag + is set, ARGP_PARSE_ARGV0 is ignored, as ARGV[0] is used as the program + name in the error messages. This flag implies ARGP_NO_EXIT (on the + assumption that silent exiting upon errors is bad behaviour). */ +#define ARGP_NO_ERRS 0x02 + +/* Don't parse any non-option args. Normally non-option args are parsed by + calling the parse functions with a key of ARGP_KEY_ARG, and the actual arg + as the value. Since it's impossible to know which parse function wants to + handle it, each one is called in turn, until one returns 0 or an error + other than ARGP_ERR_UNKNOWN; if an argument is handled by no one, the + argp_parse returns prematurely (but with a return value of 0). If all + args have been parsed without error, all parsing functions are called one + last time with a key of ARGP_KEY_END. This flag needn't normally be set, + as the normal behavior is to stop parsing as soon as some argument can't + be handled. 
*/ +#define ARGP_NO_ARGS 0x04 + +/* Parse options and arguments in the same order they occur on the command + line -- normally they're rearranged so that all options come first. */ +#define ARGP_IN_ORDER 0x08 + +/* Don't provide the standard long option --help, which causes usage and + option help information to be output to stdout, and exit (0) called. */ +#define ARGP_NO_HELP 0x10 + +/* Don't exit on errors (they may still result in error messages). */ +#define ARGP_NO_EXIT 0x20 + +/* Use the gnu getopt `long-only' rules for parsing arguments. */ +#define ARGP_LONG_ONLY 0x40 + +/* Turns off any message-printing/exiting options. */ +#define ARGP_SILENT (ARGP_NO_EXIT | ARGP_NO_ERRS | ARGP_NO_HELP) + +/* Parse the options strings in ARGC & ARGV according to the options in ARGP. + FLAGS is one of the ARGP_ flags above. If ARG_INDEX is non-NULL, the + index in ARGV of the first unparsed option is returned in it. If an + unknown option is present, ARGP_ERR_UNKNOWN is returned; if some parser + routine returned a non-zero value, it is returned; otherwise 0 is + returned. This function may also call exit unless the ARGP_NO_HELP flag + is set. INPUT is a pointer to a value to be passed in to the parser. */ +extern error_t argp_parse (const struct argp *__restrict __argp, + int __argc, char **__restrict __argv, + unsigned __flags, int *__restrict __arg_index, + void *__restrict __input); +extern error_t __argp_parse (const struct argp *__restrict __argp, + int __argc, char **__restrict __argv, + unsigned __flags, int *__restrict __arg_index, + void *__restrict __input); + +/* Global variables. */ + +/* If defined or set by the user program to a non-zero value, then a default + option --version is added (unless the ARGP_NO_HELP flag is used), which + will print this string followed by a newline and exit (unless the + ARGP_NO_EXIT flag is used). Overridden by ARGP_PROGRAM_VERSION_HOOK. 
*/ +extern const char *argp_program_version; + +/* If defined or set by the user program to a non-zero value, then a default + option --version is added (unless the ARGP_NO_HELP flag is used), which + calls this function with a stream to print the version to and a pointer to + the current parsing state, and then exits (unless the ARGP_NO_EXIT flag is + used). This variable takes precedence over ARGP_PROGRAM_VERSION. */ +extern void (*argp_program_version_hook) (FILE *__restrict __stream, + struct argp_state *__restrict + __state); + +/* If defined or set by the user program, it should point to a string that is + the bug-reporting address for the program. It will be printed by + argp_help if the ARGP_HELP_BUG_ADDR flag is set (as it is by various + standard help messages), embedded in a sentence that says something like + `Report bugs to ADDR.'. */ +extern const char *argp_program_bug_address; + +/* The exit status that argp will use when exiting due to a parsing error. + If not defined or set by the user program, this defaults to EX_USAGE from + <sysexits.h>. */ +extern error_t argp_err_exit_status; + +/* Flags for argp_help. */ +#define ARGP_HELP_USAGE 0x01 /* a Usage: message. */ +#define ARGP_HELP_SHORT_USAGE 0x02 /* " but don't actually print options. */ +#define ARGP_HELP_SEE 0x04 /* a `Try ... for more help' message. */ +#define ARGP_HELP_LONG 0x08 /* a long help message. */ +#define ARGP_HELP_PRE_DOC 0x10 /* doc string preceding long help. */ +#define ARGP_HELP_POST_DOC 0x20 /* doc string following long help. */ +#define ARGP_HELP_DOC (ARGP_HELP_PRE_DOC | ARGP_HELP_POST_DOC) +#define ARGP_HELP_BUG_ADDR 0x40 /* bug report address */ +#define ARGP_HELP_LONG_ONLY 0x80 /* modify output appropriately to + reflect ARGP_LONG_ONLY mode. */ + +/* These ARGP_HELP flags are only understood by argp_state_help. */ +#define ARGP_HELP_EXIT_ERR 0x100 /* Call exit(1) instead of returning. */ +#define ARGP_HELP_EXIT_OK 0x200 /* Call exit(0) instead of returning. 
*/ + +/* The standard thing to do after a program command line parsing error, if an + error message has already been printed. */ +#define ARGP_HELP_STD_ERR \ + (ARGP_HELP_SEE | ARGP_HELP_EXIT_ERR) +/* The standard thing to do after a program command line parsing error, if no + more specific error message has been printed. */ +#define ARGP_HELP_STD_USAGE \ + (ARGP_HELP_SHORT_USAGE | ARGP_HELP_SEE | ARGP_HELP_EXIT_ERR) +/* The standard thing to do in response to a --help option. */ +#define ARGP_HELP_STD_HELP \ + (ARGP_HELP_SHORT_USAGE | ARGP_HELP_LONG | ARGP_HELP_EXIT_OK \ + | ARGP_HELP_DOC | ARGP_HELP_BUG_ADDR) + +/* Output a usage message for ARGP to STREAM. FLAGS are from the set + ARGP_HELP_*. */ +extern void argp_help (const struct argp *__restrict __argp, + FILE *__restrict __stream, + unsigned __flags, char *__restrict __name); +extern void __argp_help (const struct argp *__restrict __argp, + FILE *__restrict __stream, unsigned __flags, + char *__name); + +/* The following routines are intended to be called from within an argp + parsing routine (thus taking an argp_state structure as the first + argument). They may or may not print an error message and exit, depending + on the flags in STATE -- in any case, the caller should be prepared for + them *not* to exit, and should return an appropriate error after calling + them. [argp_usage & argp_error should probably be called argp_state_..., + but they're used often enough that they should be short] */ + +/* Output, if appropriate, a usage message for STATE to STREAM. FLAGS are + from the set ARGP_HELP_*. */ +extern void argp_state_help (const struct argp_state *__restrict __state, + FILE *__restrict __stream, + unsigned int __flags); +extern void __argp_state_help (const struct argp_state *__restrict __state, + FILE *__restrict __stream, + unsigned int __flags); + +/* Possibly output the standard usage message for ARGP to stderr and exit. 
*/ +extern void argp_usage (const struct argp_state *__state); +extern void __argp_usage (const struct argp_state *__state); + +/* If appropriate, print the printf string FMT and following args, preceded + by the program name and `:', to stderr, and followed by a `Try ... --help' + message, then exit (1). */ +extern void argp_error (const struct argp_state *__restrict __state, + const char *__restrict __fmt, ...) + __attribute__ ((__format__ (__printf__, 2, 3))); +extern void __argp_error (const struct argp_state *__restrict __state, + const char *__restrict __fmt, ...) + __attribute__ ((__format__ (__printf__, 2, 3))); + +/* Similar to the standard gnu error-reporting function error(), but will + respect the ARGP_NO_EXIT and ARGP_NO_ERRS flags in STATE, and will print + to STATE->err_stream. This is useful for argument parsing code that is + shared between program startup (when exiting is desired) and runtime + option parsing (when typically an error code is returned instead). The + difference between this function and argp_error is that the latter is for + *parsing errors*, and the former is for other problems that occur during + parsing but don't reflect a (syntactic) problem with the input. */ +extern void argp_failure (const struct argp_state *__restrict __state, + int __status, int __errnum, + const char *__restrict __fmt, ...) + __attribute__ ((__format__ (__printf__, 4, 5))); +extern void __argp_failure (const struct argp_state *__restrict __state, + int __status, int __errnum, + const char *__restrict __fmt, ...) + __attribute__ ((__format__ (__printf__, 4, 5))); + +/* Returns true if the option OPT is a valid short option. */ +extern int _option_is_short (const struct argp_option *__opt); +extern int __option_is_short (const struct argp_option *__opt); + +/* Returns true if the option OPT is in fact the last (unused) entry in an + options array. 
*/ +extern int _option_is_end (const struct argp_option *__opt); +extern int __option_is_end (const struct argp_option *__opt); + +/* Return the input field for ARGP in the parser corresponding to STATE; used + by the help routines. */ +extern void *_argp_input (const struct argp *__restrict __argp, + const struct argp_state *__restrict __state) + ; +extern void *__argp_input (const struct argp *__restrict __argp, + const struct argp_state *__restrict __state) + ; + +#ifdef __USE_EXTERN_INLINES + +# if !(defined _LIBC && _LIBC) +# define __argp_usage argp_usage +# define __argp_state_help argp_state_help +# define __option_is_short _option_is_short +# define __option_is_end _option_is_end +# endif + +# ifndef ARGP_EI +# define ARGP_EI __extern_inline +# endif + /* Inline version of __argp_usage (named argp_usage outside libc, per the #defines above). The forwarding call to __argp_state_help is commented out below, so this version prints nothing and never exits. */ +ARGP_EI void +__argp_usage (const struct argp_state *__state) +{ + //~ __argp_state_help (__state, stderr, ARGP_HELP_STD_USAGE); +} + /* An option is short when it is not flagged OPTION_DOC and its key is a printable character in the range 1..UCHAR_MAX. */ +ARGP_EI int +__NTH (__option_is_short (const struct argp_option *__opt)) +{ + if (__opt->flags & OPTION_DOC) + return 0; + else + { + int __key = __opt->key; + return __key > 0 && __key <= UCHAR_MAX && isprint (__key); + } +} + /* The end-of-options entry is the one whose key, name, doc and group are all zero. */ +ARGP_EI int +__NTH (__option_is_end (const struct argp_option *__opt)) +{ + return !__opt->key && !__opt->name && !__opt->doc && !__opt->group; +} + +# if !(defined _LIBC && _LIBC) +# undef __argp_usage +# undef __argp_state_help +# undef __option_is_short +# undef __option_is_end +# endif +#endif /* Use extern inlines. 
*/ + +#include +#if defined __LDBL_COMPAT || __LDOUBLE_REDIRECTS_TO_FLOAT128_ABI == 1 +# include +#endif + +__END_DECLS + +#endif /* argp.h */ diff --git a/extern/argp/getopt_int.h b/extern/argp/getopt_int.h new file mode 100644 index 0000000..4d9e24b --- /dev/null +++ b/extern/argp/getopt_int.h @@ -0,0 +1,118 @@ +/* Internal declarations for getopt. + Copyright (C) 1989-2023 Free Software Foundation, Inc. + This file is part of the GNU C Library and is also part of gnulib. + Patches to this file should be submitted to both projects. 
+ + The GNU C Library is free software; you can redistribute it and/or + modify it under the terms of the GNU Lesser General Public + License as published by the Free Software Foundation; either + version 2.1 of the License, or (at your option) any later version. + + The GNU C Library is distributed in the hope that it will be useful, + but WITHOUT ANY WARRANTY; without even the implied warranty of + MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU + Lesser General Public License for more details. + + You should have received a copy of the GNU Lesser General Public + License along with the GNU C Library; if not, see + . */ + +#ifndef _GETOPT_INT_H +#define _GETOPT_INT_H 1 + +#include + +extern int _getopt_internal (int ___argc, char **___argv, + const char *__shortopts, + const struct option *__longopts, int *__longind, + int __long_only, int __posixly_correct); + + +/* Reentrant versions which can handle parsing multiple argument + vectors at the same time. */ + +/* Describe how to deal with options that follow non-option ARGV-elements. + + REQUIRE_ORDER means don't recognize them as options; stop option + processing when the first non-option is seen. This is what POSIX + specifies should happen. + + PERMUTE means permute the contents of ARGV as we scan, so that + eventually all the non-options are at the end. This allows options + to be given in any order, even with programs that were not written + to expect this. + + RETURN_IN_ORDER is an option available to programs that were + written to expect options and other ARGV-elements in any order + and that care about the ordering of the two. We describe each + non-option ARGV-element as if it were the argument of an option + with character code 1. + + The special argument '--' forces an end of option-scanning regardless + of the value of 'ordering'. In the case of RETURN_IN_ORDER, only + '--' can cause 'getopt' to return -1 with 'optind' != ARGC. 
*/ + /* The three ordering modes documented in the comment above. */ +enum __ord + { + REQUIRE_ORDER, PERMUTE, RETURN_IN_ORDER + }; + +/* Data type for reentrant functions: it carries, per scan, the values that the non-reentrant getopt keeps in global variables, plus private scanner state. */ +struct _getopt_data +{ + /* These have exactly the same meaning as the corresponding global + variables, except that they are used for the reentrant + versions of getopt. */ + int optind; + int opterr; + int optopt; + char *optarg; + + /* Internal members. */ + + /* True if the internal members have been initialized. */ + int __initialized; + + /* The next char to be scanned in the option-element + in which the last option character we returned was found. + This allows us to pick up the scan where we left off. + + If this is zero, or a null string, it means resume the scan + by advancing to the next ARGV-element. */ + char *__nextchar; + + /* See __ord above. */ + enum __ord __ordering; + + /* Handle permutation of arguments. */ + + /* Describe the part of ARGV that contains non-options that have + been skipped. '__first_nonopt' is the index in ARGV of the first + of them; '__last_nonopt' is the index after the last of them. */ + + int __first_nonopt; + int __last_nonopt; +}; + +/* The initializer is necessary to set OPTIND and OPTERR to their + default values and to clear the initialization flag. 
*/ +#define _GETOPT_DATA_INITIALIZER { 1, 1 } + +extern int _getopt_internal_r (int ___argc, char **___argv, + const char *__shortopts, + const struct option *__longopts, int *__longind, + int __long_only, struct _getopt_data *__data, + int __posixly_correct); + +extern int _getopt_long_r (int ___argc, char **___argv, + const char *__shortopts, + const struct option *__longopts, int *__longind, + struct _getopt_data *__data); + +extern int _getopt_long_only_r (int ___argc, char **___argv, + const char *__shortopts, + const struct option *__longopts, + int *__longind, + struct _getopt_data *__data); + +#endif /* getopt_int.h */ diff --git a/extern/interflop b/extern/interflop new file mode 160000 index 0000000..fc7ebdd --- /dev/null +++ b/extern/interflop @@ -0,0 +1 @@ +Subproject commit fc7ebdda53497624a8c73811187b70bf9080a8e9 diff --git a/extern/interflop-backend-ieee b/extern/interflop-backend-ieee new file mode 160000 index 0000000..a4fc711 --- /dev/null +++ b/extern/interflop-backend-ieee @@ -0,0 +1 @@ +Subproject commit a4fc711079aa7d2dca1b55f7a609d1d3f996be15 diff --git a/extern/interflop-backend-verrou b/extern/interflop-backend-verrou new file mode 160000 index 0000000..f7eeaa4 --- /dev/null +++ b/extern/interflop-backend-verrou @@ -0,0 +1 @@ +Subproject commit f7eeaa468f2907aefcb9d0dd6726890001b21222 diff --git a/extern/interflop-backend-vprec b/extern/interflop-backend-vprec new file mode 160000 index 0000000..4995b25 --- /dev/null +++ b/extern/interflop-backend-vprec @@ -0,0 +1 @@ +Subproject commit 4995b255802a0c99b5d9157adbb24735737e0e93 diff --git a/include/interflop_module.h b/include/interflop_module.h new file mode 100644 index 0000000..4e44b01 --- /dev/null +++ b/include/interflop_module.h @@ -0,0 +1,32 @@ +#pragma once + +#include + +#include "module.h" +#include "pin_utils/instrumenter.h" + +#define MAX_BACKENDS 16 +#define MAX_ARGS 256 + +namespace pene { + class interflop_module : public module + { + KNOB KnobInterflop; + KNOB 
KnobVectorInterflop; + pin_utils::instrumenter* data; + + public: + + interflop_module(); + void init() override; + // virtual bool validate() override; + const std::string& name() override; + + + + static void panic (const char *msg); + + static void _interflop_err(int eval, const char *fmt, ...); + private: + }; +} diff --git a/include/replace/wrappers/vfc_avx.h b/include/replace/wrappers/vfc_avx.h new file mode 100644 index 0000000..d096ea7 --- /dev/null +++ b/include/replace/wrappers/vfc_avx.h @@ -0,0 +1,572 @@ +#pragma once +#include +extern "C" +{ +# include +} +#include + +namespace pene +{ + namespace replace + { + namespace vfc_wrappers + { + namespace avx + { + + template + void arithmetic_wrapper(T* const a, T* const b, T* c, interflop_backend_interface_t * backends, void** contexts, int loaded_backends, op_t op) + { + void (*interflop_call[MAX_BACKENDS])(float *, float *, float *, void *); + switch (op) + { + case ADD_1: + for (int i = 0; i < loaded_backends; i++) + { + + interflop_call[i] = backends[i].vbackend.vector256.add.op_vector_float_1; + } + break; + case ADD_4: + for (int i = 0; i < loaded_backends; i++) + { + + interflop_call[i] = backends[i].vbackend.vector256.add.op_vector_float_4; + } + break; + case ADD_8: + for (int i = 0; i < loaded_backends; i++) + { + + interflop_call[i] = backends[i].vbackend.vector256.add.op_vector_float_8; + } + break; + case ADD_16: + for (int i = 0; i < loaded_backends; i++) + { + + interflop_call[i] = backends[i].vbackend.vector256.add.op_vector_float_16; + } + break; + case SUB_1: + for (int i = 0; i < loaded_backends; i++) + { + + interflop_call[i] = backends[i].vbackend.vector256.sub.op_vector_float_1; + } + break; + case SUB_4: + for (int i = 0; i < loaded_backends; i++) + { + + interflop_call[i] = backends[i].vbackend.vector256.sub.op_vector_float_4; + } + break; + case SUB_8: + for (int i = 0; i < loaded_backends; i++) + { + + interflop_call[i] = backends[i].vbackend.vector256.sub.op_vector_float_8; + } + 
break; + case SUB_16: + for (int i = 0; i < loaded_backends; i++) + { + + interflop_call[i] = backends[i].vbackend.vector256.sub.op_vector_float_16; + } + break; + case MUL_1: + for (int i = 0; i < loaded_backends; i++) + { + + interflop_call[i] = backends[i].vbackend.vector256.mul.op_vector_float_1; + } + break; + case MUL_4: + for (int i = 0; i < loaded_backends; i++) + { + + interflop_call[i] = backends[i].vbackend.vector256.mul.op_vector_float_4; + } + break; + case MUL_8: + for (int i = 0; i < loaded_backends; i++) + { + + interflop_call[i] = backends[i].vbackend.vector256.mul.op_vector_float_8; + } + break; + case MUL_16: + for (int i = 0; i < loaded_backends; i++) + { + + interflop_call[i] = backends[i].vbackend.vector256.mul.op_vector_float_16; + } + break; + case DIV_1: + for (int i = 0; i < loaded_backends; i++) + { + + interflop_call[i] = backends[i].vbackend.vector256.div.op_vector_float_1; + } + break; + case DIV_4: + for (int i = 0; i < loaded_backends; i++) + { + + interflop_call[i] = backends[i].vbackend.vector256.div.op_vector_float_4; + } + break; + case DIV_8: + for (int i = 0; i < loaded_backends; i++) + { + + interflop_call[i] = backends[i].vbackend.vector256.div.op_vector_float_8; + } + break; + case DIV_16: + for (int i = 0; i < loaded_backends; i++) + { + + interflop_call[i] = backends[i].vbackend.vector256.div.op_vector_float_16; + } + break; + default: + break; + } + for (int i = 0; i < loaded_backends; i++) + { + interflop_call[i](a, b, c, contexts[i]); + } + + } + + void instrument(int loaded_backends, interflop_backend_interface_t* backends, void** contexts, INS ins) + { + auto xed = INS_XedDec(ins); // TODO check that pointer does not need to be freed + auto iform = xed_decoded_inst_get_iform_enum(xed); + + switch (iform) + { + case xed_iform_enum_t::XED_IFORM_VADDPS_YMMqq_YMMqq_MEMqq: + { + { + INS_InsertCall(ins,IPOINT_BEFORE,(AFUNPTR)arithmetic_wrapper, + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,1), + IARG_MEMORYREAD_EA, + 
IARG_REG_REFERENCE, INS_OperandReg(ins,0), + IARG_PTR, backends, + IARG_PTR, contexts, + IARG_UINT32, loaded_backends, + IARG_UINT32, ADD_8, + IARG_END + ); + } + INS_Delete(ins); + break; + } + + + case xed_iform_enum_t::XED_IFORM_VADDPS_YMMqq_YMMqq_YMMqq: + { + { + INS_InsertCall(ins,IPOINT_BEFORE,(AFUNPTR)arithmetic_wrapper, + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,1), + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,2), + IARG_REG_REFERENCE, INS_OperandReg(ins,0), + IARG_PTR, backends, + IARG_PTR, contexts, + IARG_UINT32, loaded_backends, + IARG_UINT32, ADD_8, + IARG_END + ); + } + INS_Delete(ins); + break; + } + case xed_iform_enum_t::XED_IFORM_VADDPS_XMMdq_XMMdq_MEMdq: + { + { + INS_InsertCall(ins,IPOINT_BEFORE,(AFUNPTR)arithmetic_wrapper, + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,1), + IARG_MEMORYREAD_EA, + IARG_REG_REFERENCE, INS_OperandReg(ins,0), + IARG_PTR, backends, + IARG_PTR, contexts, + IARG_UINT32, loaded_backends, + IARG_UINT32, ADD_4, + IARG_END + ); + } + INS_Delete(ins); + break; + } + + + case xed_iform_enum_t::XED_IFORM_VADDPS_XMMdq_XMMdq_XMMdq: + { + { + INS_InsertCall(ins,IPOINT_BEFORE,(AFUNPTR)arithmetic_wrapper, + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,1), + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,2), + IARG_REG_REFERENCE, INS_OperandReg(ins,0), + IARG_PTR, backends, + IARG_PTR, contexts, + IARG_UINT32, loaded_backends, + IARG_UINT32, ADD_4, + IARG_END + ); + } + INS_Delete(ins); + break; + } + case xed_iform_enum_t::XED_IFORM_VADDSS_XMMdq_XMMdq_MEMd: + { + INS_InsertCall(ins,IPOINT_BEFORE,(AFUNPTR)arithmetic_wrapper, + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,1), + IARG_MEMORYREAD_EA, + IARG_REG_REFERENCE, INS_OperandReg(ins,0), + IARG_PTR, backends, + IARG_PTR, contexts, + IARG_UINT32, loaded_backends, + IARG_UINT32, ADD_1, + IARG_END + ); + } + INS_Delete(ins); + break; + case xed_iform_enum_t::XED_IFORM_VADDSS_XMMdq_XMMdq_XMMd: + { + INS_InsertCall(ins,IPOINT_BEFORE,(AFUNPTR)arithmetic_wrapper, + 
IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,1), + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,2), + IARG_REG_REFERENCE, INS_OperandReg(ins,0), + IARG_PTR, backends, + IARG_PTR, contexts, + IARG_UINT32, loaded_backends, + IARG_UINT32, ADD_1, + IARG_END + ); + } + INS_Delete(ins); + break; + case xed_iform_enum_t::XED_IFORM_VSUBPS_YMMqq_YMMqq_MEMqq: + { + { + INS_InsertCall(ins,IPOINT_BEFORE,(AFUNPTR)arithmetic_wrapper, + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,1), + IARG_MEMORYREAD_EA, + IARG_REG_REFERENCE, INS_OperandReg(ins,0), + IARG_PTR, backends, + IARG_PTR, contexts, + IARG_UINT32, loaded_backends, + IARG_UINT32, SUB_8, + IARG_END + ); + } + INS_Delete(ins); + break; + } + + + case xed_iform_enum_t::XED_IFORM_VSUBPS_YMMqq_YMMqq_YMMqq: + { + { + INS_InsertCall(ins,IPOINT_BEFORE,(AFUNPTR)arithmetic_wrapper, + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,1), + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,2), + IARG_REG_REFERENCE, INS_OperandReg(ins,0), + IARG_PTR, backends, + IARG_PTR, contexts, + IARG_UINT32, loaded_backends, + IARG_UINT32, SUB_8, + IARG_END + ); + } + INS_Delete(ins); + break; + } + case xed_iform_enum_t::XED_IFORM_VSUBPS_XMMdq_XMMdq_MEMdq: + { + { + INS_InsertCall(ins,IPOINT_BEFORE,(AFUNPTR)arithmetic_wrapper, + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,1), + IARG_MEMORYREAD_EA, + IARG_REG_REFERENCE, INS_OperandReg(ins,0), + IARG_PTR, backends, + IARG_PTR, contexts, + IARG_UINT32, loaded_backends, + IARG_UINT32, SUB_4, + IARG_END + ); + } + INS_Delete(ins); + break; + } + + + case xed_iform_enum_t::XED_IFORM_VSUBPS_XMMdq_XMMdq_XMMdq: + { + { + INS_InsertCall(ins,IPOINT_BEFORE,(AFUNPTR)arithmetic_wrapper, + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,1), + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,2), + IARG_REG_REFERENCE, INS_OperandReg(ins,0), + IARG_PTR, backends, + IARG_PTR, contexts, + IARG_UINT32, loaded_backends, + IARG_UINT32, SUB_4, + IARG_END + ); + } + INS_Delete(ins); + break; + } + case 
xed_iform_enum_t::XED_IFORM_VSUBSS_XMMdq_XMMdq_MEMd: + { + INS_InsertCall(ins,IPOINT_BEFORE,(AFUNPTR)arithmetic_wrapper, + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,1), + IARG_MEMORYREAD_EA, + IARG_REG_REFERENCE, INS_OperandReg(ins,0), + IARG_PTR, backends, + IARG_PTR, contexts, + IARG_UINT32, loaded_backends, + IARG_UINT32, SUB_1, + IARG_END + ); + } + INS_Delete(ins); + break; + case xed_iform_enum_t::XED_IFORM_VSUBSS_XMMdq_XMMdq_XMMd: + { + INS_InsertCall(ins,IPOINT_BEFORE,(AFUNPTR)arithmetic_wrapper, + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,1), + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,2), + IARG_REG_REFERENCE, INS_OperandReg(ins,0), + IARG_PTR, backends, + IARG_PTR, contexts, + IARG_UINT32, loaded_backends, + IARG_UINT32, SUB_1, + IARG_END + ); + } + INS_Delete(ins); + break; + case xed_iform_enum_t::XED_IFORM_VMULPS_YMMqq_YMMqq_MEMqq: + { + { + INS_InsertCall(ins,IPOINT_BEFORE,(AFUNPTR)arithmetic_wrapper, + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,1), + IARG_MEMORYREAD_EA, + IARG_REG_REFERENCE, INS_OperandReg(ins,0), + IARG_PTR, backends, + IARG_PTR, contexts, + IARG_UINT32, loaded_backends, + IARG_UINT32, MUL_8, + IARG_END + ); + } + INS_Delete(ins); + break; + } + + + case xed_iform_enum_t::XED_IFORM_VMULPS_YMMqq_YMMqq_YMMqq: + { + { + INS_InsertCall(ins,IPOINT_BEFORE,(AFUNPTR)arithmetic_wrapper, + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,1), + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,2), + IARG_REG_REFERENCE, INS_OperandReg(ins,0), + IARG_PTR, backends, + IARG_PTR, contexts, + IARG_UINT32, loaded_backends, + IARG_UINT32, MUL_8, + IARG_END + ); + } + INS_Delete(ins); + break; + } + case xed_iform_enum_t::XED_IFORM_VMULPS_XMMdq_XMMdq_MEMdq: + { + { + INS_InsertCall(ins,IPOINT_BEFORE,(AFUNPTR)arithmetic_wrapper, + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,1), + IARG_MEMORYREAD_EA, + IARG_REG_REFERENCE, INS_OperandReg(ins,0), + IARG_PTR, backends, + IARG_PTR, contexts, + IARG_UINT32, loaded_backends, + IARG_UINT32, MUL_4, + 
IARG_END + ); + } + INS_Delete(ins); + break; + } + + + case xed_iform_enum_t::XED_IFORM_VMULPS_XMMdq_XMMdq_XMMdq: + { + { + INS_InsertCall(ins,IPOINT_BEFORE,(AFUNPTR)arithmetic_wrapper, + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,1), + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,2), + IARG_REG_REFERENCE, INS_OperandReg(ins,0), + IARG_PTR, backends, + IARG_PTR, contexts, + IARG_UINT32, loaded_backends, + IARG_UINT32, MUL_4, + IARG_END + ); + } + INS_Delete(ins); + break; + } + case xed_iform_enum_t::XED_IFORM_VMULSS_XMMdq_XMMdq_MEMd: + { + INS_InsertCall(ins,IPOINT_BEFORE,(AFUNPTR)arithmetic_wrapper, + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,1), + IARG_MEMORYREAD_EA, + IARG_REG_REFERENCE, INS_OperandReg(ins,0), + IARG_PTR, backends, + IARG_PTR, contexts, + IARG_UINT32, loaded_backends, + IARG_UINT32, MUL_1, + IARG_END + ); + } + INS_Delete(ins); + break; + case xed_iform_enum_t::XED_IFORM_VMULSS_XMMdq_XMMdq_XMMd: + { + INS_InsertCall(ins,IPOINT_BEFORE,(AFUNPTR)arithmetic_wrapper, + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,1), + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,2), + IARG_REG_REFERENCE, INS_OperandReg(ins,0), + IARG_PTR, backends, + IARG_PTR, contexts, + IARG_UINT32, loaded_backends, + IARG_UINT32, MUL_1, + IARG_END + ); + } + INS_Delete(ins); + break; + case xed_iform_enum_t::XED_IFORM_VDIVPS_YMMqq_YMMqq_MEMqq: + { + { + INS_InsertCall(ins,IPOINT_BEFORE,(AFUNPTR)arithmetic_wrapper, + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,1), + IARG_MEMORYREAD_EA, + IARG_REG_REFERENCE, INS_OperandReg(ins,0), + IARG_PTR, backends, + IARG_PTR, contexts, + IARG_UINT32, loaded_backends, + IARG_UINT32, DIV_8, + IARG_END + ); + } + INS_Delete(ins); + break; + } + + + case xed_iform_enum_t::XED_IFORM_VDIVPS_YMMqq_YMMqq_YMMqq: + { + { + INS_InsertCall(ins,IPOINT_BEFORE,(AFUNPTR)arithmetic_wrapper, + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,1), + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,2), + IARG_REG_REFERENCE, INS_OperandReg(ins,0), + IARG_PTR, 
backends, + IARG_PTR, contexts, + IARG_UINT32, loaded_backends, + IARG_UINT32, DIV_8, + IARG_END + ); + } + INS_Delete(ins); + break; + } + case xed_iform_enum_t::XED_IFORM_VDIVPS_XMMdq_XMMdq_MEMdq: + { + { + INS_InsertCall(ins,IPOINT_BEFORE,(AFUNPTR)arithmetic_wrapper, + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,1), + IARG_MEMORYREAD_EA, + IARG_REG_REFERENCE, INS_OperandReg(ins,0), + IARG_PTR, backends, + IARG_PTR, contexts, + IARG_UINT32, loaded_backends, + IARG_UINT32, DIV_4, + IARG_END + ); + } + INS_Delete(ins); + break; + } + + + case xed_iform_enum_t::XED_IFORM_VDIVPS_XMMdq_XMMdq_XMMdq: + { + { + INS_InsertCall(ins,IPOINT_BEFORE,(AFUNPTR)arithmetic_wrapper, + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,1), + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,2), + IARG_REG_REFERENCE, INS_OperandReg(ins,0), + IARG_PTR, backends, + IARG_PTR, contexts, + IARG_UINT32, loaded_backends, + IARG_UINT32, DIV_4, + IARG_END + ); + } + INS_Delete(ins); + break; + } + case xed_iform_enum_t::XED_IFORM_VDIVSS_XMMdq_XMMdq_MEMd: + { + INS_InsertCall(ins,IPOINT_BEFORE,(AFUNPTR)arithmetic_wrapper, + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,1), + IARG_MEMORYREAD_EA, + IARG_REG_REFERENCE, INS_OperandReg(ins,0), + IARG_PTR, backends, + IARG_PTR, contexts, + IARG_UINT32, loaded_backends, + IARG_UINT32, DIV_1, + IARG_END + ); + } + INS_Delete(ins); + break; + case xed_iform_enum_t::XED_IFORM_VDIVSS_XMMdq_XMMdq_XMMd: + { + INS_InsertCall(ins,IPOINT_BEFORE,(AFUNPTR)arithmetic_wrapper, + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,1), + IARG_REG_CONST_REFERENCE, INS_OperandReg(ins,2), + IARG_REG_REFERENCE, INS_OperandReg(ins,0), + IARG_PTR, backends, + IARG_PTR, contexts, + IARG_UINT32, loaded_backends, + IARG_UINT32, DIV_1, + IARG_END + ); + } + INS_Delete(ins); + break; + default: break; + + + + } + } + + + } + } + } +} diff --git a/include/replace/wrappers/vfc_sse.h b/include/replace/wrappers/vfc_sse.h new file mode 100644 index 0000000..9625b72 --- /dev/null +++ 
b/include/replace/wrappers/vfc_sse.h
@@ -0,0 +1,132 @@
+#pragma once
+#include
+extern "C"
+{
+# include
+}
+#include
+
+namespace pene::replace::vfc_wrappers::sse
+{
+    /// Signature of the 128-bit float vector callbacks exposed by an Interflop
+    /// backend: (first source, second source, destination, backend context).
+    using vector_float_fn = void (*)(float*, float*, float*, void*);
+
+    /// Looks up the callback that `backend` registered for `op`.
+    /// Returns nullptr when `op` is not one of the float ADD/SUB/MUL/DIV
+    /// selectors listed here, so callers never dispatch through an unset pointer.
+    inline vector_float_fn select_vector_op(const interflop_backend_interface_t& backend, op_t op)
+    {
+        const auto& ops = backend.vbackend.vector128;
+        switch (op)
+        {
+        case ADD_1:  return ops.add.op_vector_float_1;
+        case ADD_4:  return ops.add.op_vector_float_4;
+        case ADD_8:  return ops.add.op_vector_float_8;
+        case ADD_16: return ops.add.op_vector_float_16;
+        case SUB_1:  return ops.sub.op_vector_float_1;
+        case SUB_4:  return ops.sub.op_vector_float_4;
+        case SUB_8:  return ops.sub.op_vector_float_8;
+        case SUB_16: return ops.sub.op_vector_float_16;
+        case MUL_1:  return ops.mul.op_vector_float_1;
+        case MUL_4:  return ops.mul.op_vector_float_4;
+        case MUL_8:  return ops.mul.op_vector_float_8;
+        case MUL_16: return ops.mul.op_vector_float_16;
+        case DIV_1:  return ops.div.op_vector_float_1;
+        case DIV_4:  return ops.div.op_vector_float_4;
+        case DIV_8:  return ops.div.op_vector_float_8;
+        case DIV_16: return ops.div.op_vector_float_16;
+        default:     return nullptr;
+        }
+    }
+
+    /// Analysis routine executed in place of a deleted SSE float instruction.
+    /// Calls, in load order, the callback each backend registered for `op`, all
+    /// with the same operands. A backend without a callback for `op`, or an `op`
+    /// unknown to select_vector_op, is skipped rather than called through an
+    /// unset pointer.
+    /// @param a               first source operand
+    /// @param b               second source operand
+    /// @param c               destination operand, written by each backend call
+    /// @param backends        table of loaded backend interfaces
+    /// @param contexts        per-backend context, indexed like `backends`
+    /// @param loaded_backends number of entries used in both tables
+    /// @param op              operation selector (ADD_1 ... DIV_16)
+    template <typename T>
+    void arithmetic_wrapper(T* const a, T* const b, T* c, interflop_backend_interface_t* backends, void** contexts, int loaded_backends, op_t op)
+    {
+        for (int i = 0; i < loaded_backends; i++)
+        {
+            const vector_float_fn call = select_vector_op(backends[i], op);
+            if (call != nullptr)
+            {
+                call(a, b, c, contexts[i]);
+            }
+        }
+    }
+
+    /// Replaces SSE float add/sub/mul/div instructions (packed PS and scalar SS,
+    /// register or memory second operand) with a call to arithmetic_wrapper and
+    /// deletes the original instruction; any other instruction is left untouched.
+    /// Declared inline so that including this header from several translation
+    /// units does not produce duplicate definitions.
+    inline void instrument(int loaded_backends, interflop_backend_interface_t* backends, void** contexts, INS ins)
+    {
+        // NOTE(review): the wrapper is instantiated for float, the only element
+        // type the float callbacks accept - confirm against the callers.
+        const AFUNPTR wrapper = reinterpret_cast<AFUNPTR>(&arithmetic_wrapper<float>);
+
+        // Operand 0 is both the first source and the destination; the second
+        // source is either the memory operand or register operand 1.
+        const auto replace = [&](bool rhs_in_memory, op_t op)
+        {
+            if (rhs_in_memory)
+            {
+                INS_InsertCall(ins, IPOINT_BEFORE, wrapper,
+                    IARG_REG_CONST_REFERENCE, INS_OperandReg(ins, 0),
+                    IARG_MEMORYREAD_EA,
+                    IARG_REG_REFERENCE, INS_OperandReg(ins, 0),
+                    IARG_PTR, backends,
+                    IARG_PTR, contexts,
+                    IARG_UINT32, loaded_backends,
+                    IARG_UINT32, op,
+                    IARG_END);
+            }
+            else
+            {
+                INS_InsertCall(ins, IPOINT_BEFORE, wrapper,
+                    IARG_REG_CONST_REFERENCE, INS_OperandReg(ins, 0),
+                    IARG_REG_CONST_REFERENCE, INS_OperandReg(ins, 1),
+                    IARG_REG_REFERENCE, INS_OperandReg(ins, 0),
+                    IARG_PTR, backends,
+                    IARG_PTR, contexts,
+                    IARG_UINT32, loaded_backends,
+                    IARG_UINT32, op,
+                    IARG_END);
+            }
+            INS_Delete(ins);
+        };
+
+        auto xed = INS_XedDec(ins); // TODO check that pointer does not need to be freed
+        switch (xed_decoded_inst_get_iform_enum(xed))
+        {
+        case xed_iform_enum_t::XED_IFORM_ADDPS_XMMps_MEMps: replace(true,  ADD_4); break;
+        case xed_iform_enum_t::XED_IFORM_ADDPS_XMMps_XMMps: replace(false, ADD_4); break;
+        case xed_iform_enum_t::XED_IFORM_ADDSS_XMMss_MEMss: replace(true,  ADD_1); break;
+        case xed_iform_enum_t::XED_IFORM_ADDSS_XMMss_XMMss: replace(false, ADD_1); break;
+        case xed_iform_enum_t::XED_IFORM_SUBPS_XMMps_MEMps: replace(true,  SUB_4); break;
+        case xed_iform_enum_t::XED_IFORM_SUBPS_XMMps_XMMps: replace(false, SUB_4); break;
+        case xed_iform_enum_t::XED_IFORM_SUBSS_XMMss_MEMss: replace(true,  SUB_1); break;
+        case xed_iform_enum_t::XED_IFORM_SUBSS_XMMss_XMMss: replace(false, SUB_1); break;
+        case xed_iform_enum_t::XED_IFORM_MULPS_XMMps_MEMps: replace(true,  MUL_4); break;
+        case xed_iform_enum_t::XED_IFORM_MULPS_XMMps_XMMps: replace(false, MUL_4); break;
+        case xed_iform_enum_t::XED_IFORM_MULSS_XMMss_MEMss: replace(true,  MUL_1); break;
+        case xed_iform_enum_t::XED_IFORM_MULSS_XMMss_XMMss: replace(false, MUL_1); break;
+        case xed_iform_enum_t::XED_IFORM_DIVPS_XMMps_MEMps: replace(true,  DIV_4); break;
+        case xed_iform_enum_t::XED_IFORM_DIVPS_XMMps_XMMps: replace(false, DIV_4); break;
+        case xed_iform_enum_t::XED_IFORM_DIVSS_XMMss_MEMss: replace(true,  DIV_1); break;
+        case xed_iform_enum_t::XED_IFORM_DIVSS_XMMss_XMMss: replace(false, DIV_1); break;
+        default: break;
+        }
+    }
+}
diff --git a/include/replace/wrappers/vfc_wrapper_avx.h b/include/replace/wrappers/vfc_wrapper_avx.h
new file
mode 100644
index 0000000..f59df63
--- /dev/null
+++ b/include/replace/wrappers/vfc_wrapper_avx.h
@@ -0,0 +1,137 @@
+#pragma once
+#include
+extern "C"
+{
+# include
+}
+#include
+
+namespace pene::replace::vfc_wrappers::devectorized_avx
+{
+    /// Signature of the scalar float callbacks exposed by an Interflop backend:
+    /// (first source, second source, destination, backend context).
+    using scalar_float_fn = void (*)(float, float, float*, void*);
+
+    /// Looks up the scalar callback that `backend` registered for the arithmetic
+    /// family of `op` (the _1/_4/_8 suffix only selects the lane count).
+    /// Returns nullptr for any other `op`, so callers never dispatch through an
+    /// unset pointer.
+    inline scalar_float_fn select_scalar_op(const interflop_backend_interface_t& backend, op_t op)
+    {
+        switch (op)
+        {
+        case ADD_1: case ADD_4: case ADD_8: return backend.interflop_add_float;
+        case SUB_1: case SUB_4: case SUB_8: return backend.interflop_sub_float;
+        case MUL_1: case MUL_4: case MUL_8: return backend.interflop_mul_float;
+        case DIV_1: case DIV_4: case DIV_8: return backend.interflop_div_float;
+        default:                            return nullptr;
+        }
+    }
+
+    /// Analysis routine executed in place of a deleted AVX float instruction.
+    /// The vector operation is split into N scalar calls per backend: lane s of
+    /// `a` and `b` is passed by value and the result is written to lane s of `c`.
+    /// A backend without a callback for `op`, or an `op` unknown to
+    /// select_scalar_op, is skipped rather than called through an unset pointer.
+    /// @tparam T element type of the operands (the callbacks take float)
+    /// @tparam N number of lanes processed
+    /// @param a               first source operand (N lanes)
+    /// @param b               second source operand (N lanes)
+    /// @param c               destination operand (N lanes)
+    /// @param backends        table of loaded backend interfaces
+    /// @param contexts        per-backend context, indexed like `backends`
+    /// @param loaded_backends number of entries used in both tables
+    /// @param op              operation selector (ADD_1 ... DIV_8)
+    template <typename T, int N>
+    void arithmetic_wrapper(T* const a, T* const b, T* c, interflop_backend_interface_t* backends, void** contexts, int loaded_backends, op_t op)
+    {
+        for (int i = 0; i < loaded_backends; i++)
+        {
+            const scalar_float_fn call = select_scalar_op(backends[i], op);
+            if (call == nullptr)
+            {
+                continue;
+            }
+            for (int s = 0; s < N; s++)
+            {
+                call(a[s], b[s], c + s, contexts[i]);
+            }
+        }
+    }
+
+    /// Replaces AVX float add/sub/mul/div instructions (256-bit and 128-bit packed
+    /// PS, scalar SS, register or memory second source) with a call to
+    /// arithmetic_wrapper and deletes the original instruction; any other
+    /// instruction is left untouched.
+    /// Declared inline so that including this header from several translation
+    /// units does not produce duplicate definitions.
+    inline void instrument(int loaded_backends, interflop_backend_interface_t* backends, void** contexts, INS ins)
+    {
+        // NOTE(review): lane counts are taken from the op suffix (_8/_4/_1) and the
+        // element type is float - confirm against the callers.
+        const AFUNPTR wrap8 = reinterpret_cast<AFUNPTR>(&arithmetic_wrapper<float, 8>);
+        const AFUNPTR wrap4 = reinterpret_cast<AFUNPTR>(&arithmetic_wrapper<float, 4>);
+        const AFUNPTR wrap1 = reinterpret_cast<AFUNPTR>(&arithmetic_wrapper<float, 1>);
+
+        // Operand 0 is the destination and operand 1 the first source; the second
+        // source is either the memory operand or register operand 2.
+        const auto replace = [&](AFUNPTR wrapper, bool rhs_in_memory, op_t op)
+        {
+            if (rhs_in_memory)
+            {
+                INS_InsertCall(ins, IPOINT_BEFORE, wrapper,
+                    IARG_REG_CONST_REFERENCE, INS_OperandReg(ins, 1),
+                    IARG_MEMORYREAD_EA,
+                    IARG_REG_REFERENCE, INS_OperandReg(ins, 0),
+                    IARG_PTR, backends,
+                    IARG_PTR, contexts,
+                    IARG_UINT32, loaded_backends,
+                    IARG_UINT32, op,
+                    IARG_END);
+            }
+            else
+            {
+                INS_InsertCall(ins, IPOINT_BEFORE, wrapper,
+                    IARG_REG_CONST_REFERENCE, INS_OperandReg(ins, 1),
+                    IARG_REG_CONST_REFERENCE, INS_OperandReg(ins, 2),
+                    IARG_REG_REFERENCE, INS_OperandReg(ins, 0),
+                    IARG_PTR, backends,
+                    IARG_PTR, contexts,
+                    IARG_UINT32, loaded_backends,
+                    IARG_UINT32, op,
+                    IARG_END);
+            }
+            INS_Delete(ins);
+        };
+
+        auto xed = INS_XedDec(ins); // TODO check that pointer does not need to be freed
+        switch (xed_decoded_inst_get_iform_enum(xed))
+        {
+        case xed_iform_enum_t::XED_IFORM_VADDPS_YMMqq_YMMqq_MEMqq: replace(wrap8, true,  ADD_8); break;
+        case xed_iform_enum_t::XED_IFORM_VADDPS_YMMqq_YMMqq_YMMqq: replace(wrap8, false, ADD_8); break;
+        case xed_iform_enum_t::XED_IFORM_VADDPS_XMMdq_XMMdq_MEMdq: replace(wrap4, true,  ADD_4); break;
+        case xed_iform_enum_t::XED_IFORM_VADDPS_XMMdq_XMMdq_XMMdq: replace(wrap4, false, ADD_4); break;
+        case xed_iform_enum_t::XED_IFORM_VADDSS_XMMdq_XMMdq_MEMd:  replace(wrap1, true,  ADD_1); break;
+        case xed_iform_enum_t::XED_IFORM_VADDSS_XMMdq_XMMdq_XMMd:  replace(wrap1, false, ADD_1); break;
+        case xed_iform_enum_t::XED_IFORM_VSUBPS_YMMqq_YMMqq_MEMqq: replace(wrap8, true,  SUB_8); break;
+        case xed_iform_enum_t::XED_IFORM_VSUBPS_YMMqq_YMMqq_YMMqq: replace(wrap8, false, SUB_8); break;
+        case xed_iform_enum_t::XED_IFORM_VSUBPS_XMMdq_XMMdq_MEMdq: replace(wrap4, true,  SUB_4); break;
+        case xed_iform_enum_t::XED_IFORM_VSUBPS_XMMdq_XMMdq_XMMdq: replace(wrap4, false, SUB_4); break;
+        case xed_iform_enum_t::XED_IFORM_VSUBSS_XMMdq_XMMdq_MEMd:  replace(wrap1, true,  SUB_1); break;
+        case xed_iform_enum_t::XED_IFORM_VSUBSS_XMMdq_XMMdq_XMMd:  replace(wrap1, false, SUB_1); break;
+        case xed_iform_enum_t::XED_IFORM_VMULPS_YMMqq_YMMqq_MEMqq: replace(wrap8, true,  MUL_8); break;
+        case xed_iform_enum_t::XED_IFORM_VMULPS_YMMqq_YMMqq_YMMqq: replace(wrap8, false, MUL_8); break;
+        case xed_iform_enum_t::XED_IFORM_VMULPS_XMMdq_XMMdq_MEMdq: replace(wrap4, true,  MUL_4); break;
+        case xed_iform_enum_t::XED_IFORM_VMULPS_XMMdq_XMMdq_XMMdq: replace(wrap4, false, MUL_4); break;
+        case xed_iform_enum_t::XED_IFORM_VMULSS_XMMdq_XMMdq_MEMd:  replace(wrap1, true,  MUL_1); break;
+        case xed_iform_enum_t::XED_IFORM_VMULSS_XMMdq_XMMdq_XMMd:  replace(wrap1, false, MUL_1); break;
+        case xed_iform_enum_t::XED_IFORM_VDIVPS_YMMqq_YMMqq_MEMqq: replace(wrap8, true,  DIV_8); break;
+        case xed_iform_enum_t::XED_IFORM_VDIVPS_YMMqq_YMMqq_YMMqq: replace(wrap8, false, DIV_8); break;
+        case xed_iform_enum_t::XED_IFORM_VDIVPS_XMMdq_XMMdq_MEMdq: replace(wrap4, true,  DIV_4); break;
+        case xed_iform_enum_t::XED_IFORM_VDIVPS_XMMdq_XMMdq_XMMdq: replace(wrap4, false, DIV_4); break;
+        case xed_iform_enum_t::XED_IFORM_VDIVSS_XMMdq_XMMdq_MEMd:  replace(wrap1, true,  DIV_1); break;
+        case xed_iform_enum_t::XED_IFORM_VDIVSS_XMMdq_XMMdq_XMMd:  replace(wrap1, false, DIV_1); break;
+        default: break;
+        }
+    }
+}
diff --git a/include/replace/wrappers/vfc_wrapper_sse.h b/include/replace/wrappers/vfc_wrapper_sse.h
new file mode 100644
index 0000000..46f3707
--- /dev/null
+++ b/include/replace/wrappers/vfc_wrapper_sse.h
@@ -0,0 +1,127 @@
+#pragma once
+#include
+extern "C"
+{
+# include
+}
+#include
+
+namespace pene::replace::vfc_wrappers::devectorized_sse
+{
+    /// Signature of the scalar float callbacks exposed by an Interflop backend:
+    /// (first source, second source, destination, backend context).
+    using scalar_float_fn = void (*)(float, float, float*, void*);
+
+    /// Looks up the scalar callback that `backend` registered for the arithmetic
+    /// family of `op` (the _1/_4 suffix only selects the lane count).
+    /// Returns nullptr for any other `op`, so callers never dispatch through an
+    /// unset pointer.
+    inline scalar_float_fn select_scalar_op(const interflop_backend_interface_t& backend, op_t op)
+    {
+        switch (op)
+        {
+        case ADD_1: case ADD_4: return backend.interflop_add_float;
+        case SUB_1: case SUB_4: return backend.interflop_sub_float;
+        case MUL_1: case MUL_4: return backend.interflop_mul_float;
+        case DIV_1: case DIV_4: return backend.interflop_div_float;
+        default:                return nullptr;
+        }
+    }
+
+    /// Analysis routine executed in place of a deleted SSE float instruction.
+    /// The vector operation is split into N scalar calls per backend: lane s of
+    /// `a` and `b` is passed by value and the result is written to lane s of `c`.
+    /// A backend without a callback for `op`, or an `op` unknown to
+    /// select_scalar_op, is skipped rather than called through an unset pointer.
+    /// @tparam T element type of the operands (the callbacks take float)
+    /// @tparam N number of lanes processed
+    /// @param a               first source operand (N lanes)
+    /// @param b               second source operand (N lanes)
+    /// @param c               destination operand (N lanes)
+    /// @param backends        table of loaded backend interfaces
+    /// @param contexts        per-backend context, indexed like `backends`
+    /// @param loaded_backends number of entries used in both tables
+    /// @param op              operation selector (ADD_1 ... DIV_4)
+    template <typename T, int N>
+    void arithmetic_wrapper(T* const a, T* const b, T* c, interflop_backend_interface_t* backends, void** contexts, int loaded_backends, op_t op)
+    {
+        for (int i = 0; i < loaded_backends; i++)
+        {
+            const scalar_float_fn call = select_scalar_op(backends[i], op);
+            if (call == nullptr)
+            {
+                continue;
+            }
+            for (int s = 0; s < N; s++)
+            {
+                call(a[s], b[s], c + s, contexts[i]);
+            }
+        }
+    }
+
+    /// Replaces SSE float add/sub/mul/div instructions (packed PS and scalar SS,
+    /// register or memory second operand) with a call to arithmetic_wrapper and
+    /// deletes the original instruction; any other instruction is left untouched.
+    /// Declared inline so that including this header from several translation
+    /// units does not produce duplicate definitions.
+    inline void instrument(int loaded_backends, interflop_backend_interface_t* backends, void** contexts, INS ins)
+    {
+        // NOTE(review): lane counts are taken from the op suffix (_4/_1) and the
+        // element type is float - confirm against the callers.
+        const AFUNPTR wrap4 = reinterpret_cast<AFUNPTR>(&arithmetic_wrapper<float, 4>);
+        const AFUNPTR wrap1 = reinterpret_cast<AFUNPTR>(&arithmetic_wrapper<float, 1>);
+
+        // Operand 0 is both the first source and the destination; the second
+        // source is either the memory operand or register operand 1.
+        const auto replace = [&](AFUNPTR wrapper, bool rhs_in_memory, op_t op)
+        {
+            if (rhs_in_memory)
+            {
+                INS_InsertCall(ins, IPOINT_BEFORE, wrapper,
+                    IARG_REG_CONST_REFERENCE, INS_OperandReg(ins, 0),
+                    IARG_MEMORYREAD_EA,
+                    IARG_REG_REFERENCE, INS_OperandReg(ins, 0),
+                    IARG_PTR, backends,
+                    IARG_PTR, contexts,
+                    IARG_UINT32, loaded_backends,
+                    IARG_UINT32, op,
+                    IARG_END);
+            }
+            else
+            {
+                INS_InsertCall(ins, IPOINT_BEFORE, wrapper,
+                    IARG_REG_CONST_REFERENCE, INS_OperandReg(ins, 0),
+                    IARG_REG_CONST_REFERENCE, INS_OperandReg(ins, 1),
+                    IARG_REG_REFERENCE, INS_OperandReg(ins, 0),
+                    IARG_PTR, backends,
+                    IARG_PTR, contexts,
+                    IARG_UINT32, loaded_backends,
+                    IARG_UINT32, op,
+                    IARG_END);
+            }
+            INS_Delete(ins);
+        };
+
+        auto xed = INS_XedDec(ins); // TODO check that pointer does not need to be freed
+        switch (xed_decoded_inst_get_iform_enum(xed))
+        {
+        case xed_iform_enum_t::XED_IFORM_ADDPS_XMMps_MEMps: replace(wrap4, true,  ADD_4); break;
+        case xed_iform_enum_t::XED_IFORM_ADDPS_XMMps_XMMps: replace(wrap4, false, ADD_4); break;
+        case xed_iform_enum_t::XED_IFORM_ADDSS_XMMss_MEMss: replace(wrap1, true,  ADD_1); break;
+        case xed_iform_enum_t::XED_IFORM_ADDSS_XMMss_XMMss: replace(wrap1, false, ADD_1); break;
+        case xed_iform_enum_t::XED_IFORM_SUBPS_XMMps_MEMps: replace(wrap4, true,  SUB_4); break;
+        case xed_iform_enum_t::XED_IFORM_SUBPS_XMMps_XMMps: replace(wrap4, false, SUB_4); break;
+        case xed_iform_enum_t::XED_IFORM_SUBSS_XMMss_MEMss: replace(wrap1, true,  SUB_1); break;
+        case xed_iform_enum_t::XED_IFORM_SUBSS_XMMss_XMMss: replace(wrap1, false, SUB_1); break;
+        case xed_iform_enum_t::XED_IFORM_MULPS_XMMps_MEMps: replace(wrap4, true,  MUL_4); break;
+        case xed_iform_enum_t::XED_IFORM_MULPS_XMMps_XMMps: replace(wrap4, false, MUL_4); break;
+        case xed_iform_enum_t::XED_IFORM_MULSS_XMMss_MEMss: replace(wrap1, true,  MUL_1); break;
+        case xed_iform_enum_t::XED_IFORM_MULSS_XMMss_XMMss: replace(wrap1, false, MUL_1); break;
+        case xed_iform_enum_t::XED_IFORM_DIVPS_XMMps_MEMps: replace(wrap4, true,  DIV_4); break;
+        case xed_iform_enum_t::XED_IFORM_DIVPS_XMMps_XMMps: replace(wrap4, false, DIV_4); break;
+        case xed_iform_enum_t::XED_IFORM_DIVSS_XMMss_MEMss: replace(wrap1, true,  DIV_1); break;
+        case xed_iform_enum_t::XED_IFORM_DIVSS_XMMss_XMMss: replace(wrap1, false, DIV_1); break;
+        default: break;
+        }
+    }
+}
diff --git a/src/CMakeLists.txt b/src/CMakeLists.txt
index
5fbc393..8ac5ade 100644 --- a/src/CMakeLists.txt +++ b/src/CMakeLists.txt @@ -23,20 +23,28 @@ include_directories(${CMAKE_CURRENT_SOURCE_DIR}) # Set source files set(SOURCES "pene.cpp" "module.cpp" "version_module.cpp" "utils/match.cpp" "counters.cpp" "counters_module.cpp" "update_counters.cpp" - "symbol_list_generator_module.cpp" "replace_module.cpp" + "symbol_list_generator_module.cpp" "replace_module.cpp" "interflop_module.cpp" "pin_utils/instrumenter.cpp" "pin_utils/filter.cpp" "pin_utils/element_instrumenter.cpp" "pin_utils/symbol_filter.cpp" "pin_utils/source_filter.cpp" "replace/backend/backend_verrou/interflop_verrou.cpp" "replace/backend/backend_verrou/tinymt64.cpp" - ) +) + set(PIN_TOOL pene) + # Add target add_library (${PIN_TOOL} SHARED ${SOURCES}) set_property(TARGET ${PIN_TOOL} PROPERTY CXX_STANDARD 17) + +target_compile_definitions(${PIN_TOOL} PRIVATE "-DHAVE_FMA_INTRINSIC") target_link_libraries(${PIN_TOOL} ${PIN_LIBRARIES}) +if(UNIX) +target_link_libraries(${PIN_TOOL} instr argp interflop_stdlib) +else() target_link_libraries(${PIN_TOOL} instr) +endif(UNIX) target_link_options(${PIN_TOOL} PUBLIC ${PIN_LDFLAGS}) install(TARGETS ${PIN_TOOL}) diff --git a/src/interflop_module.cpp b/src/interflop_module.cpp new file mode 100644 index 0000000..dc9b22c --- /dev/null +++ b/src/interflop_module.cpp @@ -0,0 +1,692 @@ +#if defined(_WIN32) +/* Windows build: stub module. The constructor registers the "interflop" and "vector-mode" knobs (both default "0") and leaves data null; init() only prints a notice. */ +#include +#include "interflop_module.h" + +namespace pene { + using namespace pin_utils; + interflop_module::interflop_module() : module(), + KnobInterflop(KNOB_MODE_WRITEONCE, "pintool", "interflop", "0", "use interflop dynamic backend (should not be used on windows target)"), + KnobVectorInterflop(KNOB_MODE_WRITEONCE, "pintool", "vector-mode", "0", "use interflop dynamic backend (should not be used on windows target)"), + data(nullptr) + {} + /* Reports on stderr that the interflop backends are disabled and unsupported on Windows; performs no other initialization. */ + void interflop_module::init() + { + std::cerr << "Initialization: interflop module."
<< std::endl; + std::cerr << " Interflop verificarlo's dynamic backends : " << "disabled" << std::endl; + std::cerr << " Backends working mode : none" << std::endl; + std::cerr << " /!\\ Feature not supported on Windows" << std::endl; + } + /* Returns the module identifier "interflop_module", held in a function-local static string. */ + const std::string& interflop_module::name() + { + static const std::string name_("interflop_module"); + return name_; + } +} + +#else +extern "C" +{ + #include "argp/argp.h" + #include + #include + #include + #include + #include + #include + //#include + #include + #include + #include + #include + #include + #include + #include + #include + #include + #include + #include +} + + + +#include +#include "interflop_module.h" + +extern "C"{ +#include "interflop.h" +#include "interflop_stdlib.h" +#include "iostream/logger.h" +} +// Part of Verificarlo project +// Taken from +// https://github.com/interflop/verificarlo/blob/master/src/vfcwrapper/main.c.in + + +#include "interflop/interflop.h" +#include "interflop/interflop_stdlib.h" + +/* In delta-debug we retrieve the return address of + * instrumented operations.
Call op size allows us + * to compute the previous instruction so that the + * user sees the address of the actual operation */ +#ifdef __x86_64__ +#define CALL_OP_SIZE 5 +#else +/* On other architectures we assume an instruction is + * 4 bytes */ +#define CALL_OP_SIZE 4 +#endif + +// #if @LLVM_VERSION_MAJOR@ <= 7 +// #define ADDR2LINE_BIN "addr2line" +// #define ADDR2LINE_PATH "/usr/bin/addr2line" +// #else +// #define ADDR2LINE_BIN "@LLVM_BINDIR@/llvm-addr2line" +// #define ADDR2LINE_PATH "@LLVM_BINDIR@/llvm-addr2line" +// #endif + +// typedef int int2 __attribute__((ext_vector_type(2))); +// typedef int int4 __attribute__((ext_vector_type(4))); +// typedef int int8 __attribute__((ext_vector_type(8))); +// typedef int int16 __attribute__((ext_vector_type(16))); + +// typedef float float2 __attribute__((ext_vector_type(2))); +// typedef float float4 __attribute__((ext_vector_type(4))); +// typedef float float8 __attribute__((ext_vector_type(8))); +// typedef float float16 __attribute__((ext_vector_type(16))); + +// typedef double double2 __attribute__((ext_vector_type(2))); +// typedef double double4 __attribute__((ext_vector_type(4))); +// typedef double double8 __attribute__((ext_vector_type(8))); +// typedef double double16 __attribute__((ext_vector_type(16))); + +typedef struct interflop_backend_interface_t (*interflop_init_t)(void *context); + +typedef void (*interflop_pre_init_t)(interflop_panic_t panic, FILE *stream, + void **context); +typedef void (*interflop_cli_t)(int argc, char **argv, void *context); +typedef void (*interflop_panic_t)(const char *msg); + +#define MAX_BACKENDS 16 +#define MAX_ARGS 256 + +#define XSTR(X) STR(X) +#define STR(X) #X + +struct interflop_backend_interface_t backends[MAX_BACKENDS]; +void *contexts[MAX_BACKENDS] = {NULL}; +unsigned char loaded_backends = 0; +unsigned char already_initialized = 0; + +/* Logger functions */ + +void logger_init(interflop_panic_t panic, File *stream, const char *name); +void logger_info(const char 
*fmt, ...); +void logger_warning(const char *fmt, ...); +void logger_error(const char *fmt, ...); + +__attribute__((unused)) static char *dd_exclude_path = NULL; +__attribute__((unused)) static char *dd_include_path = NULL; +__attribute__((unused)) static char *dd_generate_path = NULL; + +/* Function instrumentation prototypes */ + +void vfc_init_func_inst(); + +void vfc_quit_func_inst(); + +/* Hashmap header */ + +#define __VFC_HASHMAP_HEADER__ + +struct vfc_hashmap_st { + size_t nbits; + size_t mask; + + size_t capacity; + size_t *items; + size_t nitems; + size_t n_deleted_items; +}; + +typedef struct vfc_hashmap_st *vfc_hashmap_t; +// allocate and initialize the map +vfc_hashmap_t vfc_hashmap_create(); + +// free the map +void vfc_hashmap_destroy(vfc_hashmap_t map); + +// get the value at an index of a map +size_t get_value_at(size_t *items, size_t i); + +// get the key at an index of a map +size_t get_key_at(size_t *items, size_t i); + +// set the value at an index of a map +void set_value_at(size_t *items, size_t value, size_t i); + +// set the key at an index of a map +void set_key_at(size_t *items, size_t key, size_t i); + +// insert an element in the map +void vfc_hashmap_insert(vfc_hashmap_t map, size_t key, void *item); + +// remove an element of the map +void vfc_hashmap_remove(vfc_hashmap_t map, size_t key); + +// test if an element is in the map +char vfc_hashmap_have(vfc_hashmap_t map, size_t key); + +// get an element of the map +void *vfc_hashmap_get(vfc_hashmap_t map, size_t key); + +// get the number of elements in the map +size_t vfc_hashmap_num_items(vfc_hashmap_t map); + +// Hash function for strings +size_t vfc_hashmap_str_function(const char *id); + +// Free the hashmap +void vfc_hashmap_free(vfc_hashmap_t map); + +/* dd_must_instrument is used to apply and generate include DD filters */ +/* dd_mustnot_instrument is used to apply exclude DD filters */ +vfc_hashmap_t dd_must_instrument; +vfc_hashmap_t dd_mustnot_instrument; + +/* +void 
ddebug_generate_inclusion(char *dd_generate_path, vfc_hashmap_t map) { + int output = open(dd_generate_path, O_WRONLY | O_CREAT, S_IWUSR | S_IRUSR); + if (output == -1) { + logger_error("cannot open DDEBUG_GEN file %s", dd_generate_path); + } + for (size_t i = 0; i < map->capacity; i++) { + if (get_value_at(map->items, i) != 0 && get_value_at(map->items, i) != 1) { + pid_t pid = fork(); + if (pid == 0) { + char addr[19]; + char executable[64]; + snprintf(addr, 19, "%p", + (void *)(get_value_at(map->items, i) - CALL_OP_SIZE)); + snprintf(executable, 64, "/proc/%d/exe", getppid()); + dup2(output, 1); + execlp(ADDR2LINE_BIN, ADDR2LINE_PATH, + "-fpaCs", "-e", executable, addr, NULL); + logger_error("error running " ADDR2LINE_BIN); + } else { + int status; + wait(&status); + assert(status == 0); + } + } + } + close(output); +} +*/ + +/* Destructor hook: calls interflop_finalize(context) on every loaded backend + * that provides one. The DDEBUG and INST_FUNC sections are only compiled when + * those macros are defined. + * NOTE(review): the DDEBUG section calls ddebug_generate_inclusion(), which is + * commented out above -- presumably it no longer builds with DDEBUG defined; + * confirm before enabling it. */ +__attribute__((destructor(0))) static void vfc_atexit(void) { + + /* Send finalize message to backends */ + for (int i = 0; i < loaded_backends; i++) + if (backends[i].interflop_finalize) + backends[i].interflop_finalize(contexts[i]); + +#ifdef DDEBUG + if (dd_generate_path) { + ddebug_generate_inclusion(dd_generate_path, dd_must_instrument); + logger_info("ddebug: generated complete inclusion file at %s\n", + dd_generate_path); + } + vfc_hashmap_destroy(dd_must_instrument); + vfc_hashmap_destroy(dd_mustnot_instrument); +#endif + +#ifdef INST_FUNC + vfc_quit_func_inst(); +#endif +} + +/* Checks that at least one of the loaded backends implements the chosen + * operation at a given precision: scans backends[0..loaded_backends) for a + * non-null interflop_<operation>_<precision> entry and calls logger_error + * when none is found */ +#define check_backends_implements(precision, operation) \ + do { \ + int res = 0; \ + for (unsigned char i = 0; i < loaded_backends; i++) { \ + if (backends[i].interflop_##operation##_##precision) { \ + res = 1; \ + break; \ + } \ + } \ + if (res == 0) \ + logger_error("No backend instruments " #operation " for " #precision \ + ".\n" \ + "Include one backend in VFC_BACKENDS that provides it"); \ + } while (0) + +#if DDEBUG +/* vfc_read_filter_file
reads an inclusion/exclusion ddebug file and returns + * an address map */ +static void vfc_read_filter_file(const char *dd_filter_path, + vfc_hashmap_t map) { + FILE *input = fopen(dd_filter_path, "r"); + if (input) { + void *addr; + char line[2048]; + int lineno = 0; + while (fgets(line, sizeof line, input)) { + lineno++; + if (sscanf(line, "%p", &addr) == 1) { + vfc_hashmap_insert(map, (size_t)addr + CALL_OP_SIZE, + addr + CALL_OP_SIZE); + } else { + logger_error( + "ddebug: error parsing VFC_DDEBUG_[INCLUDE/EXCLUDE] %s at line %d", + dd_filter_path, lineno); + } + } + } +} +#endif + +/* Parse the different VFC_BACKENDS variables per priorty order */ +/* 1- VFC_BACKENDS */ +/* 2- VFC_BACKENDS_FROM_FILE */ +/* Set the backends read in vfc_backends */ +/* Set the name of the environment variable read in vfc_backends_env */ +void parse_vfc_backends_env(char **vfc_backends, char **vfc_backends_env) { + + /* Parse VFC_BACKENDS */ + *vfc_backends_env = (char *)malloc(sizeof(char) * 256); + *vfc_backends = (char *)malloc(sizeof(char) * 256); + + sprintf(*vfc_backends_env, "VFC_BACKENDS"); + *vfc_backends = getenv(*vfc_backends_env); + + /* Parse VFC_BACKENDS_FROM_FILE if VFC_BACKENDS is empty*/ + if (*vfc_backends == NULL) { + sprintf(*vfc_backends_env, "VFC_BACKENDS_FROM_FILE"); + char *vfc_backends_fromfile_file = getenv(*vfc_backends_env); + if (vfc_backends_fromfile_file != NULL) { + FILE *fi = fopen(vfc_backends_fromfile_file, "r"); + if (fi == NULL) { + logger_error("Error while opening file pointed by %s: %s", + *vfc_backends_env, strerror(errno)); + } else { + size_t len = 0; + ssize_t nread; + nread = getline(vfc_backends, &len, fi); + if (nread == -1) { + logger_error("Error while reading file pointed by %s: %s", + *vfc_backends_env, strerror(errno)); + } else { + if ((*vfc_backends)[nread - 1] == '\n') { + (*vfc_backends)[nread - 1] = '\0'; + } + } + } + } + } +} + +long _vfc_strtol(const char *nptr, char **endptr, int *error) { + *error = 0; + errno = 0; + 
long val = strtoll(nptr, endptr, 10); + if (errno != 0) { + *error = 1; + } + return val; +} + +double _vfc_strtod(const char *nptr, char **endptr, int *error) { + *error = 0; + errno = 0; + double val = strtod(nptr, endptr); + if (errno != 0) { + *error = 1; + } + return val; +} + +/* Load the function in .so of name */ +void *load_function(const char *token, void *handle, const char *function) { + /* reset dl errors */ + dlerror(); + /* get the address of the interflop_pre_init function */ + void *handler = dlsym(handle, function); + const char *dlsym_error = dlerror(); + if (dlsym_error) { + logger_error("No %s function in backend %s: %s", function, token, + strerror(errno)); + } + /* reset dl errors */ + dlerror(); + return handler; +} + +pid_t get_tid() { return syscall(__NR_gettid); } + +void _vfc_inf_handler(void) { + +} + +void _vfc_nan_handler(void) { + +} + +void _vfc_cancellation_handler(int unused) { + +} + +void _vfc_denormal_handler(void) { + +} + +void _vfc_floatmax_handler(void) { + +} + +void vfc_set_handlers(const char *token, void *handle) { + + interflop_set_handler_t set_handler = (interflop_set_handler_t)load_function( + token, handle, "interflop_set_handler"); + set_handler("getenv", (void*) getenv); + set_handler("sprintf", (void*) sprintf); + set_handler("strerror", (void*) strerror); + set_handler("gettid", (void*) get_tid); + set_handler("fopen", (void*) fopen); + set_handler("strcasecmp", (void*) strcasecmp); + set_handler("vwarnx", (void*) vwarnx); + set_handler("fprintf", (void*) fprintf); + set_handler("exit", (void*) exit); + set_handler("vfprintf", (void*) vfprintf); + set_handler("malloc", (void*) malloc); + set_handler("strcmp", (void*) strcmp); + set_handler("strtol", (void*) _vfc_strtol); + set_handler("strtod", (void*) _vfc_strtod); + set_handler("strcpy", (void*) strcpy); + set_handler("fclose", (void*) fclose); + set_handler("fgets", (void*) fgets); + set_handler("strtok_r", (void*) strtok_r); + set_handler("free", (void*) 
free); + set_handler("calloc", (void*) calloc); + set_handler("argp_parse", (void*) argp_parse); + set_handler("gettimeofday", (void*) gettimeofday); + // set_handler("register_printf_specifier", (void*) register_printf_specifier); + set_handler("infHandler", (void*) _vfc_inf_handler); + set_handler("nanHandler", (void*) _vfc_nan_handler); + set_handler("cancellationHandler", (void*) _vfc_cancellation_handler); + set_handler("denormalHandler", (void*) _vfc_denormal_handler); + set_handler("maxHandler", (void*) _vfc_floatmax_handler); +} + +/* Print msg on stderr and terminate the process with exit status 1 */ +void _vfc_panic(const char *msg) { + fprintf(stderr, "%s", msg); + exit(1); +} + +#include "pin_utils/symbol_filters.h" +/* Identifiers for ADD, SUB, MUL and DIV, each with the suffixes 1, 4, 8 and 16. + * NOTE(review): the suffix is presumably a lane count or operand width -- + * confirm against the wrapper headers included below. */ +typedef enum +{ + ADD_1=0, + ADD_4, + ADD_8, + ADD_16, + SUB_1, + SUB_4, + SUB_8, + SUB_16, + MUL_1, + MUL_4, + MUL_8, + MUL_16, + DIV_1, + DIV_4, + DIV_8, + DIV_16 +} op_t; + +#include "replace/wrappers/vfc_sse.h" +#include "replace/wrappers/vfc_wrapper_sse.h" +#include "replace/wrappers/vfc_avx.h" +#include "replace/wrappers/vfc_wrapper_avx.h" + +namespace pene { + using namespace pin_utils; + + + namespace replace_module_internals + { + /* element_instrumenter whose instrument() dispatches on the instruction + * category to the vfc_wrappers SSE / AVX routines */ + template + class dynamic_backend_instrumenters final : public element_instrumenter + { + REG tmp_reg1; + REG tmp_reg2; + REG tmp_reg_output; + + public: + //~ int loaded_backends; + //~ interflop_backend_interface_t backends[MAX_BACKENDS]; + //~ void * contexts[MAX_BACKENDS]; + //~ void* backend_ctx; + /* Claims three Pin tool registers; exits the application with status 1 + * when any of the claims is not valid */ + dynamic_backend_instrumenters() + : element_instrumenter() + , tmp_reg1(PIN_ClaimToolRegister()) + , tmp_reg2(PIN_ClaimToolRegister()) + , tmp_reg_output(PIN_ClaimToolRegister()) + //, backend_ctx(OPERATION_IMPL::init()) + { + //struct pene::replace::backend::verrou ifverrou=pene::replace::backend::init(&backend_ctx); + if (!REG_valid(tmp_reg1) || !REG_valid(tmp_reg2) || !REG_valid(tmp_reg_output)) + { + std::cerr << "Cannot allocate a scratch register.\n"; + std::cerr << std::flush; + PIN_ExitApplication(1); + } + } + + virtual void instrument(INS ins) override { + switch
(INS_Category(ins)) + { + case xed_category_enum_t::XED_CATEGORY_SSE: + replace::vfc_wrappers::devectorized_sse::instrument(loaded_backends, backends, contexts, ins); + break; + case xed_category_enum_t::XED_CATEGORY_AVX: + replace::vfc_wrappers::devectorized_avx::instrument(loaded_backends, backends, contexts, ins); + break; + // case xed_category_enum_t::XED_CATEGORY_AVX512: + // replace::wrappers::avx512::instrument(backend_ctx, ins); + // break; + // case xed_category_enum_t::XED_CATEGORY_VFMA: + // replace::wrappers::fma::instrument(backend_ctx, ins); + // break; + default: + break; + } + } + }; + + template<> + void dynamic_backend_instrumenters::instrument(INS ins) { + switch (INS_Category(ins)) + { + case xed_category_enum_t::XED_CATEGORY_SSE: + replace::vfc_wrappers::sse::instrument(loaded_backends, backends, contexts, ins); + break; + case xed_category_enum_t::XED_CATEGORY_AVX: + replace::vfc_wrappers::avx::instrument(loaded_backends, backends, contexts, ins); + break; + // case xed_category_enum_t::XED_CATEGORY_AVX512: + // replace::wrappers::avx512::instrument(backend_ctx, ins); + // break; + // case xed_category_enum_t::XED_CATEGORY_VFMA: + // replace::wrappers::fma::instrument(backend_ctx, ins); + // break; + default: + break; + } + } + } + + /* Declares the -interflop and -vector-mode knobs; data stays null until init() runs */ + interflop_module::interflop_module() : module(), + KnobInterflop(KNOB_MODE_WRITEONCE, "pintool", "interflop", "0", "use interflop dynamic backend (should not be used if using -fp-replace)"), + KnobVectorInterflop(KNOB_MODE_WRITEONCE, "pintool", "vector-mode", "0", "run the interflop backends in vector mode instead of scalar mode (only used with -interflop)"), + data(nullptr) + {} + + /* Reports the selected mode on stderr and returns immediately unless -interflop is set */ + void interflop_module::init() + { + std::cerr << "Initialization: interflop module." << std::endl; + std::cerr << " Interflop verificarlo's dynamic backends : " << (KnobInterflop.Value() ? "enabled" : "disabled") << std::endl; + std::cerr << " Backends working mode : " << (KnobVectorInterflop.Value() ?
"vector" : "scalar") << std::endl; + if (!KnobInterflop.Value()) + { + return; + } + //~ return; + /* function required by vfcwrapper.c */ + interflop_set_handler("getenv", (void *)getenv); + interflop_set_handler("sprintf", (void *)sprintf); + interflop_set_handler("strerror", (void *)strerror); + interflop_set_handler("gettid", (void*) get_tid); + interflop_set_handler("fopen", (void *)fopen); + interflop_set_handler("strcasecmp", (void *)strcasecmp); + interflop_set_handler("vwarnx", (void *)vwarnx); + interflop_set_handler("fprintf", (void *)fprintf); + interflop_set_handler("exit", (void *)exit); + interflop_set_handler("vfprintf", (void *)vfprintf); + interflop_set_handler("malloc", (void *)malloc); + interflop_set_handler("strcmp", (void *)strcmp); + /* each wrapper is registered under its own name, as in vfc_set_handlers */ + interflop_set_handler("strtol", (void *)_vfc_strtol); + interflop_set_handler("strtod", (void *)_vfc_strtod); + interflop_set_handler("strcpy", (void *)strcpy); + interflop_set_handler("fclose", (void *)fclose); + interflop_set_handler("fgets", (void *)fgets); + interflop_set_handler("strtok_r", (void *)strtok_r); + interflop_set_handler("free", (void *)free); + interflop_set_handler("calloc", (void *)calloc); + interflop_set_handler("gettimeofday", (void *)gettimeofday); + // interflop_set_handler("register_printf_specifier", (void *)register_printf_specifier); + + /* Initialize the logger */ + logger_init(&interflop_module::panic, stderr, "pene"); + char *vfc_backends = NULL, *vfc_backends_env = NULL; + parse_vfc_backends_env(&vfc_backends, &vfc_backends_env); + + if (vfc_backends == NULL) { + logger_error("At least one backend should be provided " + "by defining VFC_BACKENDS or VFC_BACKENDS_FROM_FILE " + "environment variables", + vfc_backends_env); + } + + /* Environment variable to disable loading message */ + char *silent_load_env = getenv("VFC_BACKENDS_SILENT_LOAD"); + bool silent_load = + ((silent_load_env == NULL) || (strcasecmp(silent_load_env, "True") != 0)) + ?
false + : true; + + /* For each backend, load and register the backend vtable interface + Backends .so are separated by semi-colons in the VFC_BACKENDS + env variable */ + char *semicolonptr; + char *token = strtok_r(vfc_backends, ";", &semicolonptr); + + //~ interflop_backend_interface_t * _backends = dyn_backends->get_backends_interface(); + //~ void ** _contexts = dyn_backends->get_backends_contexts(); + while (token) { + /* Parse each backend arguments, argv[0] is the backend name */ + int backend_argc = 0; + char *backend_argv[MAX_ARGS]; + char *spaceptr; + char *arg = strtok_r(token, " ", &spaceptr); + while (arg) { + if (backend_argc >= MAX_ARGS) { + logger_error("%s syntax error: too many arguments", vfc_backends_env); + } + backend_argv[backend_argc++] = arg; + arg = strtok_r(NULL, " ", &spaceptr); + } + /* load the backend .so */ + void *handle = dlopen(backend_argv[0], RTLD_NOW); + if (handle == NULL) { + logger_error("Cannot load backend %s: dlopen error\n%s", token, + dlerror()); + } + if (!silent_load) + logger_info("loaded backend %s\n", token); + + /* get the addresses of the interflop_init, interflop_pre_init, and + * interflop_cli functions */ + interflop_pre_init_t handle_pre_init = (interflop_pre_init_t)load_function( + token, handle, "interflop_pre_init"); + interflop_cli_t handle_cli = + (interflop_cli_t)load_function(token, handle, "interflop_cli"); + interflop_init_t handle_init = + (interflop_init_t)load_function(token, handle, "interflop_init"); + + + vfc_set_handlers(token, handle); + + /* Register backend */ + if (loaded_backends == MAX_BACKENDS) { + logger_error("No more than %d backends can be used simultaneously", + MAX_BACKENDS); + } + + handle_pre_init(&interflop_module::panic, stderr, &contexts[loaded_backends]); + handle_cli(backend_argc, backend_argv, contexts[loaded_backends]); + backends[loaded_backends] = handle_init(contexts[loaded_backends]); + loaded_backends++; + + /* parse next backend token */ + token = strtok_r(NULL, 
";", &semicolonptr); + } + //~ dyn_backends->set_loaded_backends(loaded_backends); + if (loaded_backends == 0) { + logger_error("%s syntax error: at least one backend should be provided", + vfc_backends_env); + } + + /* Check that at least one backend implements each required operation */ + check_backends_implements(float, add); + check_backends_implements(float, sub); + check_backends_implements(float, mul); + check_backends_implements(float, div); + check_backends_implements(double, add); + check_backends_implements(double, sub); + check_backends_implements(double, mul); + check_backends_implements(double, div); + + filter* filter = new null_filter(); + if (KnobVectorInterflop.Value()) + { + data = new instrumenter(new replace_module_internals::dynamic_backend_instrumenters(), filter); + } + else + { + data = new instrumenter(new replace_module_internals::dynamic_backend_instrumenters(), filter); + } + data->TRACE_AddInstrumentFunction(); + } + + void interflop_module::panic (const char *msg) + { + std::cerr << msg; + exit(1); + } + + + const std::string& interflop_module::name() + { + static const std::string name_("interflop_module"); + return name_; + } + +} + +#endif diff --git a/src/module.cpp b/src/module.cpp index 1c22c35..360451c 100644 --- a/src/module.cpp +++ b/src/module.cpp @@ -33,6 +33,16 @@ namespace pene { return false; } } + KNOB * interflop = static_cast*>(KNOB_BASE::FindKnob("interflop")); + KNOB * replace = static_cast*>(KNOB_BASE::FindKnob("fp-replace")); + if (interflop && replace) + { + if (interflop->Value() && replace->Value()) + { + std::cerr << "error : Only one mode between -interflop or -fp-replace should be used" << std::endl; + return false; + } + } return true; } void module::init_all() diff --git a/src/pene.cpp b/src/pene.cpp index 7d9ef2b..5566b0e 100644 --- a/src/pene.cpp +++ b/src/pene.cpp @@ -7,6 +7,7 @@ #include "symbol_list_generator_module.h" #include "replace_module.h" #include "extern_file.h" +#include "interflop_module.h" 
using namespace pene; std::ofstream OutFile; @@ -54,6 +55,7 @@ int main(int argc, char* argv[]) counters_module countersModule{}; symbol_list_generator_module symlistgenModule{}; replace_module replacemodule{}; + interflop_module interflopmodule{}; OutFile.open(KnobOutputFile.Value().c_str());