Skip to content
This repository has been archived by the owner on Aug 30, 2024. It is now read-only.

Commit

Permalink
XeTLA Fix Global 1D Store
Browse files Browse the repository at this point in the history
  • Loading branch information
DDEle committed Jul 24, 2024
1 parent 1081543 commit f737f52
Showing 1 changed file with 4 additions and 5 deletions.
9 changes: 4 additions & 5 deletions include/subgroup/tile/impl/payload_xe.hpp
Original file line number Diff line number Diff line change
@@ -467,10 +467,9 @@ struct mem_payload_t<
uint32_t offset_y = surface_offset_y;
width_in_elems = surface_width;
height_in_elems = surface_height;
- payload_bytes = mem_transpose ? (surface_offset_x - 1) * pitch_in_bytes +
- surface_offset_y * sizeof(dtype)
- : (surface_offset_y - 1) * pitch_in_bytes +
- surface_offset_x * sizeof(dtype);
+ payload_bytes = mem_transpose
+ ? (surface_width - 1) * pitch_in_bytes + surface_height * sizeof(dtype)
+ : (surface_height - 1) * pitch_in_bytes + surface_width * sizeof(dtype);
base_offset = mem_transpose
? offset_x * pitch_in_bytes + offset_y * sizeof(dtype)
: offset_y * pitch_in_bytes + offset_x * sizeof(dtype);
@@ -2313,4 +2312,4 @@ struct prefetch_payload_t<
__XETLA_API void update_tdesc([[maybe_unused]] int offset) {}
};

- } // namespace gpu::xetla::subgroup
+ } // namespace gpu::xetla::subgroup

0 comments on commit f737f52

Please sign in to comment.