diff --git a/library/src/include/tree_node_3D.h b/library/src/include/tree_node_3D.h index 076749b6..dc0262f6 100644 --- a/library/src/include/tree_node_3D.h +++ b/library/src/include/tree_node_3D.h @@ -181,9 +181,11 @@ class SBRCTranspose3DNode : public LeafNode auto alignment_dimension = sbrc_3D_alignment_dimension(); if(alignment_dimension == 0) return NONE; - // NB: from the benchmark results, diagonal transpose benefits only gfx906 + // NB: from the benchmark results, diagonal transpose + // benefits only some architectures if(is_diagonal_sbrc_3D_length(length.front()) && is_cube_size(length) - && is_device_gcn_arch(deviceProp, "gfx906")) + && (is_device_gcn_arch(deviceProp, "gfx906") + || is_device_gcn_arch(deviceProp, "gfx1030"))) return DIAGONAL; if(alignment_dimension % blockWidth == 0) return TILE_ALIGNED;