unary_element_wise_operation.hpp Source File
tensor_operation/gpu/element/unary_element_wise_operation.hpp
Go to the documentation of this file.
18 // https://github.com/NVIDIA/FasterTransformer/blob/main/src/fastertransformer/cutlass_extensions/include/cutlass_extensions/interleaved_numeric_conversion.h
1821 __host__ __device__ DynamicUnaryOp(const UnaryAbs&&) : unary_op_type_(UnaryOpType::UnaryAbs) {}
Definition ck.hpp:268
__device__ half2_t amd_assembly_pk_add_f16(half2_t a, half2_t b)
Definition amd_inline_asm.hpp:35
__device__ half4_t i4_to_half4(int q)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:20
__device__ f8x8_t amd_assembly_i4_to_fp8x8(int a)
Definition amd_inline_asm.hpp:59
__host__ __device__ constexpr Y bf16_convert_rtn(X x)
__device__ half4_t i4_to_half4_scale(int q, const ck::half2_t &scale)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:48
__host__ __device__ constexpr Y f8_convert_rne(X x)
__device__ f8x4_t amd_assembly_cvt_f8_to_f32(float b0, float b1, float b2, float b3)
Definition amd_inline_asm.hpp:49
__device__ int amd_assembly_and_b32(int a, int b)
Definition amd_inline_asm.hpp:14
__device__ half2_t amd_assembly_pk_fma_f16(half2_t a, half2_t b, half2_t c)
Definition amd_inline_asm.hpp:28
__host__ __device__ constexpr Y f8_convert_sr(X x)
__device__ f8x4_t i4_to_f8x4(int q)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:82
__host__ __device__ constexpr Y type_convert(X x)
Definition utility/type_convert.hpp:98
__device__ int amd_assembly_and_or_b32(int a, int b, int d)
Definition amd_inline_asm.hpp:21
__device__ float amd_assemble_cvt_f32_i4(int b)
Definition amd_inline_asm.hpp:42
__device__ bhalf4_t i4_to_bhalf4(int q)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:126
__device__ f8x8_t i4_to_fp8x8(int q)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:98
__host__ static __device__ constexpr T Infinity()
Definition numeric_limits.hpp:317
Definition data_type.hpp:42
Definition data_type.hpp:187
Definition functional2.hpp:33
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1223
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1227
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1224
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1127
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1128
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1131
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1191
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1195
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1192
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1367
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1368
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1371
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1255
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1259
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1256
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1159
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1160
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1163
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1287
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1291
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1288
Clamp(float floor=0.f, float ceil=NumericLimits< float >::Max())
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:814
__host__ __device__ constexpr void operator()(Y &y, const X &x) const
const float floor_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:881
const float ceil_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:882
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:812
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1496
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1502
__host__ __device__ constexpr void operator()(Y &y, const X &x) const
const float beta_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1523
const float alpha_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1522
ClippedRelu(float alpha=0.f, float beta=1.f)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1499
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1497
float scale_wei_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1635
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1616
float scale_out_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1636
float scale_in_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1634
__host__ __device__ void operator()(E &e, const C &c) const
__host__ __device__ ConvInvscale(float scale_in=1.f, float scale_wei=1.f, float scale_out=1.f)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1618
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1641
__host__ __device__ void operator()(E &e, const C &c) const
float scale_out_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1661
float scale_wei_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1660
float scale_in_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1659
__host__ __device__ ConvScale(float scale_in=1.f, float scale_wei=1.f, float scale_out=1.f)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1643
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1666
float scale_in_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1686
float scale_wei_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1687
__host__ __device__ void operator()(E &e, const C &c) const
__host__ __device__ ConvScaleRelu(float scale_in=1.f, float scale_wei=1.f, float scale_out=1.f)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1668
float scale_out_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1688
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:577
__host__ __device__ void operator()(Y &y, const X &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:582
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:578
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:616
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:617
__host__ __device__ void operator()(Y &y, const X &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:621
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:596
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:597
__host__ __device__ void operator()(Y &y, const X &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:601
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1319
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1323
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1320
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1207
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1208
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1211
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:269
constexpr static const bool is_pack8_invocable
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:303
__host__ __device__ void operator()(Y &y, const X &x, const Z &z) const
__host__ __device__ constexpr void operator()(ck::half8_t &y, const ck::pk_i4x4_t &x, const ck::half2_t &z) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:276
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:270
__host__ __device__ DynamicUnaryOp(const TanH &&)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1803
__host__ __device__ DynamicUnaryOp(const LeakyRelu &leakyrelu)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1845
__host__ __device__ DynamicUnaryOp(const Power &&pow)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1828
__host__ __device__ DynamicUnaryOp(const UnaryAbs &&)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1821
__host__ __device__ DynamicUnaryOp(const Swish &&swish)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1772
__host__ __device__ DynamicUnaryOp(const TanH &)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1801
__host__ __device__ DynamicUnaryOp(const DynamicUnaryOp &dynamic_op)=default
__host__ __device__ DynamicUnaryOp(const Sigmoid &&)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1779
__host__ __device__ DynamicUnaryOp(const Swish &swish)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1767
TanH tanh_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1923
__host__ __device__ DynamicUnaryOp(const Sigmoid &)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1777
__host__ __device__ DynamicUnaryOp(const SoftRelu &&softrelu)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1814
__host__ __device__ void operator()(Y &y, const X &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1870
__host__ __device__ DynamicUnaryOp(const UnaryAbs &)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1819
__host__ __device__ DynamicUnaryOp(const LeakyRelu &&leakyrelu)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1850
__host__ __device__ DynamicUnaryOp(const Relu &&)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1807
LeakyRelu leaky_relu_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1929
Logistic logistic_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1922
Swish swish_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1919
__host__ __device__ DynamicUnaryOp(const Elu &elu)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1855
UnaryOpType unary_op_type_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1917
__host__ __device__ DynamicUnaryOp()=delete
UnaryAbs unary_abs_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1926
__host__ __device__ ~DynamicUnaryOp()
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1867
__host__ __device__ DynamicUnaryOp(const PassThrough &)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1781
__host__ __device__ DynamicUnaryOp(const Power &pow)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1823
Relu relu_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1924
__host__ __device__ DynamicUnaryOp(const PassThrough &&)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1786
__host__ __device__ DynamicUnaryOp(const Logistic &logistic)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1791
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1763
SoftRelu soft_relu_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1925
__host__ __device__ DynamicUnaryOp(const SoftRelu &softrelu)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1809
__host__ __device__ DynamicUnaryOp(const ClippedRelu &clippedrelu)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1833
Power power_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1927
__host__ __device__ DynamicUnaryOp(const Elu &&elu)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1860
__host__ __device__ DynamicUnaryOp(const ClippedRelu &&clippedrelu)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1839
Elu elu_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1930
__host__ __device__ DynamicUnaryOp(const Relu &)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1805
Sigmoid sigmoid_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1920
__host__ __device__ DynamicUnaryOp(const Logistic &&logistic)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1796
ClippedRelu clipped_relu_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1928
PassThrough pass_through_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1921
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1556
const float alpha_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1581
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1562
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1557
Elu(float alpha=1.f)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1559
__host__ __device__ constexpr void operator()(Y &y, const X &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1303
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1307
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1304
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:924
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:925
__device__ void operator()(Y &y, const X &x) const
__host__ void operator()(Y &y, const X &x) const
vector_type< uint8_t, 4 > InputArray
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1701
vector_type< half_t, 4 > OutputArray
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1702
__device__ OutputArray operator()(InputArray const &Input)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1728
static __device__ OutputArray convert(InputArray const &Input)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1704
vector_type< uint8_t, N > InputArray
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1737
static constexpr int VEC_WIDTH
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1734
vector_type< half_t, N > OutputArray
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1738
static __device__ OutputArray convert(InputArray const &Input)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1740
__device__ OutputArray operator()(InputArray const &Input)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1758
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1695
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1335
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1339
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1336
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1041
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1042
__host__ __device__ void operator()(Y &y, const X &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1527
const float alpha_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1552
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1533
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1528
LeakyRelu(float alpha=0.01f)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1530
__host__ __device__ constexpr void operator()(Y &y, const X &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1351
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1352
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1355
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1585
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1586
Logistic(float alpha=1.f)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1588
const float alpha_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1611
__host__ __device__ constexpr void operator()(Y &y, const X &x) const
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1591
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1143
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1144
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1147
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:340
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:341
__host__ __device__ void operator()(Y &y, const X &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:307
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:308
constexpr static const bool is_pack2_invocable
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:336
__host__ __device__ constexpr void operator()(ck::half2_t &y, const ck::pk_i4_t &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:319
__host__ __device__ constexpr void operator()(half2_t &y, const f8x2_t &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:313
__host__ __device__ void operator()(Y &y, const X &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:159
__host__ __device__ constexpr void operator()(ck::f8x8_t &y, const ck::pk_i4x4_t &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:191
__host__ __device__ void operator()(Y &y, const X &x) const
__host__ __device__ constexpr void operator()(ck::bhalf8_t &y, const ck::pk_i4x4_t &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:240
constexpr static const bool is_pack8_invocable
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:265
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:160
__host__ __device__ constexpr void operator()(ck::half8_t &y, const ck::pk_i4x4_t &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:165
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1460
const float gamma_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1492
const float alpha_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1490
Power(float alpha=0.f, float beta=1.f, float gamma=2.f)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1463
__host__ __device__ constexpr void operator()(Y &y, const X &x) const
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1467
const float beta_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1491
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1461
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1383
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1384
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1387
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:886
__host__ __device__ void operator()(bhalf_t &y, const bhalf_t &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:903
__host__ __device__ constexpr void operator()(Y &y, const X &x) const
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:890
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:887
__host__ __device__ void operator()(Y &y, const X &x) const
float scale_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:697
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:684
ck::tensor_operation::element_wise::ScaleAndResetNaNToMinusInfinity::ScaleAndResetNaNToMinusInfinity
__host__ __device__ ScaleAndResetNaNToMinusInfinity(float scale)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:686
float scale_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:679
__host__ __device__ void operator()(Y &y, const X &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:642
__host__ __device__ Scale(float scale=1.f)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:639
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:637
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1061
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1062
__host__ __device__ constexpr void operator()(Y &y, const X &x) const
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1065
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1087
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1091
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1088
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1271
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1272
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1275
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1175
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1176
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1179
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1430
__host__ __device__ constexpr void operator()(Y &y, const X &x) const
const float alpha_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1456
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1431
SoftRelu(float alpha=1.f)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1433
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1436
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1399
__host__ __device__ void operator()(Y &y, const X &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1405
Swish(float beta=1.0f)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1402
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1400
const float beta_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1426
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1102
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1103
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1106
__host__ __device__ constexpr void operator()(Y &y, const X &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1239
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1240
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:1243
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:765
__host__ __device__ constexpr void operator()(Y &y, const X &x) const
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:769
__host__ __device__ void operator()(f8_t &y, const f8_t &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:781
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:766
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:566
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:567
__host__ __device__ void operator()(Y &y, const X &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:570
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:707
__host__ __device__ UnaryDivide(const int32_t divider=1)
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:704
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:702
int32_t divider_
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:743
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:797
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:801
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:798
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:747
__host__ __device__ void operator()(T &y, const T &x) const
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:751
static constexpr const char * name
Definition tensor_operation/gpu/element/unary_element_wise_operation.hpp:748
Definition dtype_vector.hpp:10