Skip to content
Snippets Groups Projects
Commit 662253dd authored by René Heß's avatar René Heß
Browse files

Merge branch 'feature/random-future-work' into 'master'

Implement register transpose of 4 AVX512 register

See merge request !120
parents 73cfe31b a36a7ca1
No related branches found
No related tags found
No related merge requests found
......@@ -20,4 +20,21 @@ void transpose_reg(Vec4d& a0, Vec4d& a1, Vec4d& a2, Vec4d& a3)
a3 = blend4d<2,3,6,7>(b1,b3);
}
#if MAX_VECTOR_SIZE >= 512
/**
 * Transpose four registers of eight doubles each, in place.
 *
 * Writing a_i[j] for lane j of input register a_i, the registers hold on
 * return, for k = 0..3:
 *
 *   a_k = { a0[k], a0[k+4], a1[k], a1[k+4], a2[k], a2[k+4], a3[k], a3[k+4] }
 *
 * i.e. every input lane appears exactly once in the output.
 *
 * Relies on the vector class library convention that blend8d indices 0-7
 * select lanes of the first argument and 8-15 lanes of the second.
 *
 * NOTE(review): the target layout above is derived from the second blend
 * stage; confirm against the callers' expected lane ordering.
 */
void transpose_reg(Vec8d& a0, Vec8d& a1, Vec8d& a2, Vec8d& a3)
{
  // Stage 1: interleave register pairs. The even temporaries collect lanes
  // {0,4} and {1,5}; the odd temporaries must collect the remaining lanes
  // {2,6} and {3,7}. Reusing {1,5} here would drop lanes 2 and 6 and make
  // the result a non-permutation (a1 and a2 would come out identical).
  const Vec8d b0 = blend8d<0,4,8,12,1,5,9,13>(a0, a1);
  const Vec8d b1 = blend8d<2,6,10,14,3,7,11,15>(a0, a1);
  const Vec8d b2 = blend8d<0,4,8,12,1,5,9,13>(a2, a3);
  const Vec8d b3 = blend8d<2,6,10,14,3,7,11,15>(a2, a3);

  // Stage 2: glue the matching halves of the (a0,a1) and (a2,a3)
  // temporaries together to form the output registers.
  a0 = blend8d<0,1,2,3,8,9,10,11>(b0, b2);
  a1 = blend8d<4,5,6,7,12,13,14,15>(b0, b2);
  a2 = blend8d<0,1,2,3,8,9,10,11>(b1, b3);
  a3 = blend8d<4,5,6,7,12,13,14,15>(b1, b3);
}
#endif
#endif
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment