{ lib }: rec { # gcc.arch to its features (as in /proc/cpuinfo) features = { # x86_64 Generic # Spec: https://gitlab.com/x86-psABIs/x86-64-ABI/ default = [ ]; x86-64 = [ ]; x86-64-v2 = [ "sse3" "ssse3" "sse4_1" "sse4_2" ]; x86-64-v3 = [ "sse3" "ssse3" "sse4_1" "sse4_2" "avx" "avx2" "fma" ]; x86-64-v4 = [ "sse3" "ssse3" "sse4_1" "sse4_2" "avx" "avx2" "avx512" "fma" ]; # x86_64 Intel nehalem = [ "sse3" "ssse3" "sse4_1" "sse4_2" ]; westmere = [ "sse3" "ssse3" "sse4_1" "sse4_2" ]; silvermont = [ "sse3" "ssse3" "sse4_1" "sse4_2" ]; sandybridge = [ "sse3" "ssse3" "sse4_1" "sse4_2" "avx" ]; ivybridge = [ "sse3" "ssse3" "sse4_1" "sse4_2" "avx" ]; haswell = [ "sse3" "ssse3" "sse4_1" "sse4_2" "avx" "avx2" "fma" ]; broadwell = [ "sse3" "ssse3" "sse4_1" "sse4_2" "avx" "avx2" "fma" ]; skylake = [ "sse3" "ssse3" "sse4_1" "sse4_2" "aes" "avx" "avx2" "fma" ]; skylake-avx512 = [ "sse3" "ssse3" "sse4_1" "sse4_2" "aes" "avx" "avx2" "avx512" "fma" ]; cannonlake = [ "sse3" "ssse3" "sse4_1" "sse4_2" "aes" "avx" "avx2" "avx512" "fma" ]; icelake-client = [ "sse3" "ssse3" "sse4_1" "sse4_2" "aes" "avx" "avx2" "avx512" "fma" ]; icelake-server = [ "sse3" "ssse3" "sse4_1" "sse4_2" "aes" "avx" "avx2" "avx512" "fma" ]; cascadelake = [ "sse3" "ssse3" "sse4_1" "sse4_2" "aes" "avx" "avx2" "avx512" "fma" ]; cooperlake = [ "sse3" "ssse3" "sse4_1" "sse4_2" "aes" "avx" "avx2" "avx512" "fma" ]; tigerlake = [ "sse3" "ssse3" "sse4_1" "sse4_2" "aes" "avx" "avx2" "avx512" "fma" ]; alderlake = [ "sse3" "ssse3" "sse4_1" "sse4_2" "aes" "avx" "avx2" "fma" ]; sapphirerapids = [ "sse3" "ssse3" "sse4_1" "sse4_2" "aes" "avx" "avx2" "avx512" "fma" ]; emeraldrapids = [ "sse3" "ssse3" "sse4_1" "sse4_2" "aes" "avx" "avx2" "avx512" "fma" ]; sierraforest = [ "sse3" "ssse3" "sse4_1" "sse4_2" "aes" "avx" "avx2" "fma" ]; # x86_64 AMD btver1 = [ "sse3" "ssse3" "sse4_1" "sse4_2" ]; btver2 = [ "sse3" "ssse3" "sse4_1" "sse4_2" "aes" "avx" ]; bdver1 = [ "sse3" "ssse3" "sse4_1" "sse4_2" "sse4a" "aes" "avx" "fma" "fma4" ]; bdver2 = [ "sse3" "ssse3" "sse4_1" "sse4_2" "sse4a" "aes" "avx" "fma" "fma4" ]; bdver3 = [ "sse3" "ssse3" "sse4_1" "sse4_2" "sse4a" "aes" "avx" "fma" "fma4" ]; bdver4 = [ "sse3" "ssse3" "sse4_1" "sse4_2" "sse4a" "aes" "avx" "avx2" "fma" "fma4" ]; znver1 = [ "sse3" "ssse3" "sse4_1" "sse4_2" "sse4a" "aes" "avx" "avx2" "fma" ]; znver2 = [ "sse3" "ssse3" "sse4_1" "sse4_2" "sse4a" "aes" "avx" "avx2" "fma" ]; znver3 = [ "sse3" "ssse3" "sse4_1" "sse4_2" "sse4a" "aes" "avx" "avx2" "fma" ]; znver4 = [ "sse3" "ssse3" "sse4_1" "sse4_2" "sse4a" "aes" "avx" "avx2" "avx512" "fma" ]; znver5 = [ "sse3" "ssse3" "sse4_1" "sse4_2" "sse4a" "aes" "avx" "avx2" "avx512" "fma" ]; # LoongArch64 # https://github.com/loongson/la-toolchain-conventions loongarch64 = [ "fpu64" ]; la464 = [ "fpu64" "lsx" "lasx" ]; la664 = [ "fpu64" "lsx" "lasx" "div32" "frecipe" "lam-bh" "lamcas" "ld-seq-sa" ]; "la64v1.0" = [ "fpu64" "lsx" ]; "la64v1.1" = [ "fpu64" "lsx" "div32" "frecipe" "lam-bh" "lamcas" "ld-seq-sa" ]; # other armv5te = [ ]; armv6 = [ ]; armv7-a = [ ]; armv8-a = [ ]; mips32 = [ ]; loongson2f = [ ]; }; # a superior CPU has all the features of an inferior and is able to build and test code for it inferiors = let withInferiors = archs: lib.unique (archs ++ lib.flatten (lib.attrVals archs inferiors)); in { # x86_64 Generic default = [ ]; x86-64 = [ ]; x86-64-v2 = [ "x86-64" ]; x86-64-v3 = [ "x86-64-v2" ] ++ inferiors.x86-64-v2; x86-64-v4 = [ "x86-64-v3" ] ++ inferiors.x86-64-v3; # x86_64 Intel # https://gcc.gnu.org/onlinedocs/gcc/x86-Options.html nehalem = [ "x86-64-v2" ] ++ inferiors.x86-64-v2; westmere = [ "nehalem" ] ++ inferiors.nehalem; sandybridge = [ "westmere" ] ++ inferiors.westmere; ivybridge = [ "sandybridge" ] ++ inferiors.sandybridge; haswell = lib.unique ( [ "ivybridge" "x86-64-v3" ] ++ inferiors.ivybridge ++ inferiors.x86-64-v3 ); broadwell = [ "haswell" ] ++ inferiors.haswell; skylake = [ "broadwell" ] ++ inferiors.broadwell; skylake-avx512 = lib.unique ( [ "skylake" "x86-64-v4" ] ++ inferiors.skylake ++ inferiors.x86-64-v4 ); cannonlake = [ "skylake-avx512" ] ++ inferiors.skylake-avx512; icelake-client = [ "cannonlake" ] ++ inferiors.cannonlake; icelake-server = [ "icelake-client" ] ++ inferiors.icelake-client; cascadelake = [ "cannonlake" ] ++ inferiors.cannonlake; cooperlake = [ "cascadelake" ] ++ inferiors.cascadelake; tigerlake = [ "icelake-server" ] ++ inferiors.icelake-server; sapphirerapids = [ "tigerlake" ] ++ inferiors.tigerlake; emeraldrapids = [ "sapphirerapids" ] ++ inferiors.sapphirerapids; alderlake = [ "skylake" ] ++ inferiors.skylake; sierraforest = [ "alderlake" ] ++ inferiors.alderlake; # x86_64 AMD # TODO: fill in specific CPU architecture inferiors btver1 = [ "x86-64" ]; btver2 = [ "x86-64-v2" ] ++ inferiors.x86-64-v2; bdver1 = [ "x86-64-v2" ] ++ inferiors.x86-64-v2; bdver2 = [ "x86-64-v2" ] ++ inferiors.x86-64-v2; bdver3 = [ "x86-64-v2" ] ++ inferiors.x86-64-v2; bdver4 = [ "x86-64-v3" ] ++ inferiors.x86-64-v3; # Regarding `skylake` as inferior of `znver1`, there are reports of # successful usage by Gentoo users and Phoronix benchmarking of different # `-march` targets. # # The GCC documentation on extensions used and wikichip documentation # regarding supperted extensions on znver1 and skylake was used to create # this partial order. # # Note: # # - The successors of `skylake` (`cannonlake`, `icelake`, etc) use `avx512` # which no current AMD Zen michroarch support. # - `znver1` uses `ABM`, `CLZERO`, `CX16`, `MWAITX`, and `SSE4A` which no # current Intel microarch support. # # https://www.phoronix.com/scan.php?page=article&item=amd-znver3-gcc11&num=1 # https://gcc.gnu.org/onlinedocs/gcc/x86-Options.html # https://en.wikichip.org/wiki/amd/microarchitectures/zen # https://en.wikichip.org/wiki/intel/microarchitectures/skylake znver1 = [ "skylake" ] ++ inferiors.skylake; # Includes haswell and x86-64-v3 znver2 = [ "znver1" ] ++ inferiors.znver1; znver3 = [ "znver2" ] ++ inferiors.znver2; znver4 = lib.unique ( [ "znver3" "x86-64-v4" ] ++ inferiors.znver3 ++ inferiors.x86-64-v4 ); znver5 = [ "znver4" ] ++ inferiors.znver4; # ARM64 (AArch64) armv8-a = [ ]; "armv8.1-a" = [ "armv8-a" ]; "armv8.2-a" = [ "armv8.1-a" ] ++ inferiors."armv8.1-a"; "armv8.3-a" = [ "armv8.2-a" ] ++ inferiors."armv8.2-a"; "armv8.4-a" = [ "armv8.3-a" ] ++ inferiors."armv8.3-a"; "armv8.5-a" = [ "armv8.4-a" ] ++ inferiors."armv8.4-a"; "armv8.6-a" = [ "armv8.5-a" ] ++ inferiors."armv8.5-a"; "armv8.7-a" = [ "armv8.6-a" ] ++ inferiors."armv8.6-a"; "armv8.8-a" = [ "armv8.7-a" ] ++ inferiors."armv8.7-a"; "armv8.9-a" = [ "armv8.8-a" ] ++ inferiors."armv8.8-a"; armv9-a = [ "armv8.5-a" ] ++ inferiors."armv8.5-a"; "armv9.1-a" = [ "armv9-a" "armv8.6-a" ] ++ inferiors."armv8.6-a"; "armv9.2-a" = lib.unique ( [ "armv9.1-a" "armv8.7-a" ] ++ inferiors."armv9.1-a" ++ inferiors."armv8.7-a" ); "armv9.3-a" = lib.unique ( [ "armv9.2-a" "armv8.8-a" ] ++ inferiors."armv9.2-a" ++ inferiors."armv8.8-a" ); "armv9.4-a" = [ "armv9.3-a" ] ++ inferiors."armv9.3-a"; # ARM cortex-a53 = [ "armv8-a" ]; cortex-a72 = [ "armv8-a" ]; cortex-a55 = [ "armv8.2-a" "cortex-a53" "cortex-a72" ] ++ inferiors."armv8.2-a"; cortex-a76 = [ "armv8.2-a" "cortex-a53" "cortex-a72" ] ++ inferiors."armv8.2-a"; # Ampere ampere1 = withInferiors [ "armv8.6-a" "cortex-a55" "cortex-a76" ]; ampere1a = [ "ampere1" ] ++ inferiors.ampere1; ampere1b = [ "ampere1a" ] ++ inferiors.ampere1a; # LoongArch64 loongarch64 = [ ]; "la64v1.0" = [ "loongarch64" ]; la464 = [ "la64v1.0" ] ++ inferiors."la64v1.0"; "la64v1.1" = [ "la64v1.0" ] ++ inferiors."la64v1.0"; la664 = withInferiors [ "la464" "la64v1.1" ]; # other armv5te = [ ]; armv6 = [ ]; armv7-a = [ ]; mips32 = [ ]; loongson2f = [ ]; }; /** Check whether one GCC architecture has the the other inferior architecture. # Inputs `arch1` : GCC architecture in string `arch2` : GCC architecture in string # Type ``` hasInferior :: string -> string -> bool ``` # Examples ::: {.example} ## `lib.systems.architectures.hasInferior` usage example ```nix hasInferior "x86-64-v3" "x86-64" => true hasInferior "x86-64" "x86-64-v3" => false hasInferior "x86-64" "x86-64" => false ``` */ hasInferior = arch1: arch2: inferiors ? ${arch1} && lib.elem arch2 inferiors.${arch1}; /** Check whether one GCC architecture can execute the other. # Inputs `arch1` : GCC architecture in string `arch2` : GCC architecture in string # Type ``` canExecute :: string -> string -> bool ``` # Examples ::: {.example} ## `lib.systems.architectures.canExecute` usage example ```nix canExecute "x86-64" "x86-64-v3" => false canExecute "x86-64-v3" "x86-64" => true canExecute "x86-64" "x86-64" => true ``` */ canExecute = arch1: arch2: arch1 == arch2 || hasInferior arch1 arch2; predicates = let featureSupport = feature: x: builtins.elem feature features.${x} or [ ]; in { sse3Support = featureSupport "sse3"; ssse3Support = featureSupport "ssse3"; sse4_1Support = featureSupport "sse4_1"; sse4_2Support = featureSupport "sse4_2"; sse4_aSupport = featureSupport "sse4a"; avxSupport = featureSupport "avx"; avx2Support = featureSupport "avx2"; avx512Support = featureSupport "avx512"; aesSupport = featureSupport "aes"; fmaSupport = featureSupport "fma"; fma4Support = featureSupport "fma4"; lsxSupport = featureSupport "lsx"; lasxSupport = featureSupport "lasx"; }; }