mirror of https://github.com/xemu-project/xemu.git
target-tilegx: Tidy simd_helper.c
Use the V1 macro when we want to replicate a byte across the 8 elements of the word. Use deposit and extract for manipulating specific elements. Signed-off-by: Richard Henderson <rth@twiddle.net>
This commit is contained in:
parent
5fdb4671b0
commit
0551301076
|
@ -23,12 +23,16 @@
|
||||||
#include "exec/helper-proto.h"
|
#include "exec/helper-proto.h"
|
||||||
|
|
||||||
|
|
||||||
|
/* Broadcast a value to all elements of a vector. */
|
||||||
|
#define V1(X) (((X) & 0xff) * 0x0101010101010101ull)
|
||||||
|
|
||||||
|
|
||||||
uint64_t helper_v1shl(uint64_t a, uint64_t b)
|
uint64_t helper_v1shl(uint64_t a, uint64_t b)
|
||||||
{
|
{
|
||||||
uint64_t m;
|
uint64_t m;
|
||||||
|
|
||||||
b &= 7;
|
b &= 7;
|
||||||
m = 0x0101010101010101ULL * (0xff >> b);
|
m = V1(0xff >> b);
|
||||||
return (a & m) << b;
|
return (a & m) << b;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -37,7 +41,7 @@ uint64_t helper_v1shru(uint64_t a, uint64_t b)
|
||||||
uint64_t m;
|
uint64_t m;
|
||||||
|
|
||||||
b &= 7;
|
b &= 7;
|
||||||
m = 0x0101010101010101ULL * ((0xff << b) & 0xff);
|
m = V1(0xff << b);
|
||||||
return (a & m) >> b;
|
return (a & m) >> b;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -48,8 +52,7 @@ uint64_t helper_v1shrs(uint64_t a, uint64_t b)
|
||||||
|
|
||||||
b &= 7;
|
b &= 7;
|
||||||
for (i = 0; i < 64; i += 8) {
|
for (i = 0; i < 64; i += 8) {
|
||||||
int64_t ae = (int8_t)(a >> i);
|
r = deposit64(r, i, 8, sextract64(a, i + b, 8 - b));
|
||||||
r |= ((ae >> b) & 0xff) << i;
|
|
||||||
}
|
}
|
||||||
return r;
|
return r;
|
||||||
}
|
}
|
||||||
|
|
Loading…
Reference in New Issue