Skip to content

Commit

Permalink
Added reinterpret primitives for neon (#107)
Browse files Browse the repository at this point in the history
  • Loading branch information
JPietrzykTUD authored Sep 4, 2024
1 parent 5aacdfa commit b3bf7ab
Showing 1 changed file with 27 additions and 1 deletion.
28 changes: 27 additions & 1 deletion primitive_data/primitives/convert.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -131,12 +131,38 @@ definitions:
additional_simd_template_base_type: ["int8_t", "uint8_t", "int16_t", "uint16_t", "int32_t", "uint32_t", "int64_t", "uint64_t"]
lscpu_flags: ["sse2"]
implementation: "return _mm_castpd_si128(data);"
#SCALAR
#SCALAR
- target_extension: "scalar"
ctype: ["int8_t", "uint8_t", "int16_t", "uint16_t", "int32_t", "uint32_t", "int64_t", "uint64_t", "float", "double"]
additional_simd_template_base_type: ["int8_t", "uint8_t", "int16_t", "uint16_t", "int32_t", "uint32_t", "int64_t", "uint64_t", "float", "double"]
lscpu_flags: []
implementation: "return data;"
#ARM - NEON
- target_extension: "neon"
ctype: ["int8_t", "uint8_t", "int16_t", "uint16_t", "int32_t", "uint32_t", "int64_t", "uint64_t", "float", "double"]
additional_simd_template_base_type: ["int8_t", "uint8_t", "int16_t", "uint16_t", "int32_t", "uint32_t", "int64_t", "uint64_t", "float", "double"]
lscpu_flags: ["neon"]
implementation: "return data;"
- target_extension: "neon"
ctype: ["int8_t", "uint8_t", "int16_t", "uint16_t", "int32_t", "uint32_t", "int64_t", "uint64_t"]
additional_simd_template_base_type: ["float"]
lscpu_flags: ["neon"]
implementation: "return vreinterpretq_{{ intrin_tp_full[additional_simd_template_base_type] }}_{{ intrin_tp_full[ctype] }}(data);"
- target_extension: "neon"
ctype: ["float"]
additional_simd_template_base_type: ["int8_t", "uint8_t", "int16_t", "uint16_t", "int32_t", "uint32_t", "int64_t", "uint64_t"]
lscpu_flags: ["neon"]
implementation: "return vreinterpretq_{{ intrin_tp_full[additional_simd_template_base_type] }}_{{ intrin_tp_full[ctype] }}(data);"
- target_extension: "neon"
ctype: ["int8_t", "uint8_t", "int16_t", "uint16_t", "int32_t", "uint32_t", "int64_t", "uint64_t"]
additional_simd_template_base_type: ["double"]
lscpu_flags: ["neon"]
implementation: "return vreinterpretq_{{ intrin_tp_full[additional_simd_template_base_type] }}_{{ intrin_tp_full[ctype] }}(data);"
- target_extension: "neon"
ctype: ["double"]
additional_simd_template_base_type: ["int8_t", "uint8_t", "int16_t", "uint16_t", "int32_t", "uint32_t", "int64_t", "uint64_t"]
lscpu_flags: ["neon"]
implementation: "return vreinterpretq_{{ intrin_tp_full[additional_simd_template_base_type] }}_{{ intrin_tp_full[ctype] }}(data);"
#INTEL - FPGA
- target_extension: ["oneAPIfpga", "oneAPIfpgaRTL"]
ctype: ["float", "double"]
Expand Down

0 comments on commit b3bf7ab

Please sign in to comment.