2024-08-14 16:32:53 +00:00
|
|
|
#version 450
|
|
|
|
|
|
|
|
#include "types.comp"
|
|
|
|
#include "generic_unary_head.comp"
|
|
|
|
|
2024-11-13 06:58:57 +00:00
|
|
|
layout(local_size_x = 512, local_size_y = 1, local_size_z = 1) in;
|
|
|
|
|
2024-08-14 16:32:53 +00:00
|
|
|
uint src0_idx_mod(uint idx) {
|
|
|
|
const uint i13 = idx / (p.ne12*p.ne11*p.ne10);
|
|
|
|
const uint i13_offset = i13 * p.ne12*p.ne11*p.ne10;
|
|
|
|
const uint i12 = (idx - i13_offset) / (p.ne11*p.ne10);
|
|
|
|
const uint i12_offset = i12*p.ne11*p.ne10;
|
|
|
|
const uint i11 = (idx - i13_offset - i12_offset) / p.ne10;
|
|
|
|
const uint i10 = idx - i13_offset - i12_offset - i11*p.ne10;
|
|
|
|
return (i13 % p.ne03)*p.nb03 + (i12 % p.ne02)*p.nb02 + (i11 % p.ne01)*p.nb01 + (i10 % p.ne00)*p.nb00;
|
|
|
|
}
|
|
|
|
|
|
|
|
void main() {
|
|
|
|
const uint idx = get_idx();
|
|
|
|
|
|
|
|
if (idx >= p.ne) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
|
|
|
|
data_d[p.d_offset + dst_idx(idx)] = D_TYPE(data_a[src0_idx_mod(idx)]);
|
|
|
|
}
|