#version 450 #include "types.comp" #include "generic_unary_head.comp" layout(local_size_x = 512, local_size_y = 1, local_size_z = 1) in; uint src0_idx_mod(uint idx) { const uint i13 = idx / (p.ne12*p.ne11*p.ne10); const uint i13_offset = i13 * p.ne12*p.ne11*p.ne10; const uint i12 = (idx - i13_offset) / (p.ne11*p.ne10); const uint i12_offset = i12*p.ne11*p.ne10; const uint i11 = (idx - i13_offset - i12_offset) / p.ne10; const uint i10 = idx - i13_offset - i12_offset - i11*p.ne10; return (i13 % p.ne03)*p.nb03 + (i12 % p.ne02)*p.nb02 + (i11 % p.ne01)*p.nb01 + (i10 % p.ne00)*p.nb00; } void main() { const uint idx = get_idx(); if (idx >= p.ne) { return; } data_d[p.d_offset + dst_idx(idx)] = D_TYPE(data_a[src0_idx_mod(idx)]); }