Skip to content

Commit

Permalink
Fix duplication of pk_add_f16 symbols (#1858)
Browse files (browse the repository at this point in the history)
  • Loading branch information
bartekxk authored Feb 4, 2025
1 parent 9ee69dd commit 11e4082
Showing 1 changed file with 2 additions and 2 deletions.
4 changes: 2 additions & 2 deletions include/ck_tile/core/numeric/vector_type.hpp
Original file line number Diff line number Diff line change
Expand Up @@ -200,7 +200,7 @@ using bf8x32_t = bf8_t __attribute((ext_vector_type(32)));
using bf8x64_t = bf8_t __attribute((ext_vector_type(64)));
#endif

-__host__ fp16x2_t pk_add_f16(const fp16x2_t& x, const fp16x2_t& y)
+CK_TILE_HOST fp16x2_t pk_add_f16(const fp16x2_t& x, const fp16x2_t& y)
{
fp16x2_t vector_res;

Expand All @@ -210,7 +210,7 @@ __host__ fp16x2_t pk_add_f16(const fp16x2_t& x, const fp16x2_t& y)
return vector_res;
}

-__device__ fp16x2_t pk_add_f16(const fp16x2_t& x, const fp16x2_t& y)
+CK_TILE_DEVICE fp16x2_t pk_add_f16(const fp16x2_t& x, const fp16x2_t& y)
{
fp16x2_t c;
asm volatile("v_pk_add_f16 %0, %1, %2" : "=v"(c) : "v"(x), "v"(y));
Expand Down

0 comments on commit 11e4082

Please sign in to comment.