src/wasm/simd-shuffle.cc - v8/v8 - Git at Google

 // Copyright 2020 the V8 project authors. All rights reserved.
 // Use of this source code is governed by a BSD-style license that can be
 // found in the LICENSE file.

 #include "src/wasm/simd-shuffle.h"

 #include <algorithm>

 #include "src/common/globals.h"

 namespace v8 {
 namespace internal {
 namespace wasm {

 bool SimdShuffle::TryMatchIdentity(const uint8_t* shuffle) {
   for (int i = 0; i < kSimd128Size; ++i) {
     if (shuffle[i] != i) return false;
   }
   return true;
 }

 bool SimdShuffle::TryMatch32x4Rotate(const uint8_t* shuffle,
                                      uint8_t* shuffle32x4, bool is_swizzle) {
   uint8_t offset;
   bool is_concat = TryMatchConcat(shuffle, &offset);
   DCHECK_NE(offset, 0);  // 0 is identity, it should not be matched.
   // Since we already have a concat shuffle, we know that the indices goes from:
   // [ offset, ..., 15, 0, ... ], it suffices to check that the offset points
   // to the low byte of a 32x4 element.
   if (!is_concat || !is_swizzle || offset % 4 != 0) {
     return false;
   }

   uint8_t offset_32 = offset / 4;
   for (int i = 0; i < 4; i++) {
     shuffle32x4[i] = (offset_32 + i) % 4;
   }
   return true;
 }

 bool SimdShuffle::TryMatch32x4Reverse(const uint8_t* shuffle32x4) {
   return shuffle32x4[0] == 3 && shuffle32x4[1] == 2 && shuffle32x4[2] == 1 &&
          shuffle32x4[3] == 0;
 }

 bool SimdShuffle::TryMatch32x4OneLaneSwizzle(const uint8_t* shuffle32x4,
                                              uint8_t* from_lane,
                                              uint8_t* to_lane) {
   constexpr uint32_t patterns[12]{
       0x30200000,  // 0 -> 1
       0x30000100,  // 0 -> 2
       0x00020100,  // 0 -> 3
       0x03020101,  // 1 -> 0
       0x03010100,  // 1 -> 2
       0x01020100,  // 1 -> 3
       0x03020102,  // 2 -> 0
       0x03020200,  // 2 -> 1
       0x02020100,  // 2 -> 3
       0x03020103,  // 3 -> 0
       0x03020300,  // 3 -> 1
       0x03030100   // 3 -> 2
   };

   unsigned pattern_idx = 0;
   uint32_t shuffle = *reinterpret_cast<const uint32_t*>(shuffle32x4);
 #ifdef V8_TARGET_BIG_ENDIAN
   shuffle = base::bits::ReverseBytes(shuffle);
 #endif
   for (unsigned from = 0; from < 4; ++from) {
     for (unsigned to = 0; to < 4; ++to) {
       if (from == to) {
         continue;
       }
       if (shuffle == patterns[pattern_idx]) {
         *from_lane = from;
         *to_lane = to;
         return true;
       }
       ++pattern_idx;
     }
   }
   return false;
 }

 bool SimdShuffle::TryMatch32x4Shuffle(const uint8_t* shuffle,
                                       uint8_t* shuffle32x4) {
   for (int i = 0; i < 4; ++i) {
     if (shuffle[i * 4] % 4 != 0) return false;
     for (int j = 1; j < 4; ++j) {
       if (shuffle[i * 4 + j] - shuffle[i * 4 + j - 1] != 1) return false;
     }
     shuffle32x4[i] = shuffle[i * 4] / 4;
   }
   return true;
 }

 bool SimdShuffle::TryMatch32x8Shuffle(const uint8_t* shuffle,
                                       uint8_t* shuffle32x8) {
   for (int i = 0; i < 8; ++i) {
     if (shuffle[i * 4] % 4 != 0) return false;
     for (int j = 1; j < 4; ++j) {
       if (shuffle[i * 4 + j] - shuffle[i * 4 + j - 1] != 1) return false;
     }
     shuffle32x8[i] = shuffle[i * 4] / 4;
   }
   return true;
 }

 bool SimdShuffle::TryMatch16x8Shuffle(const uint8_t* shuffle,
                                       uint8_t* shuffle16x8) {
   for (int i = 0; i < 8; ++i) {
     if (shuffle[i * 2] % 2 != 0) return false;
     for (int j = 1; j < 2; ++j) {
       if (shuffle[i * 2 + j] - shuffle[i * 2 + j - 1] != 1) return false;
     }
     shuffle16x8[i] = shuffle[i * 2] / 2;
   }
   return true;
 }

 bool SimdShuffle::TryMatchConcat(const uint8_t* shuffle, uint8_t* offset) {
   // Don't match the identity shuffle (e.g. [0 1 2 ... 15]).
   uint8_t start = shuffle[0];
   if (start == 0) return false;
   DCHECK_GT(kSimd128Size, start);  // The shuffle should be canonicalized.
   // A concatenation is a series of consecutive indices, with at most one jump
   // in the middle from the last lane to the first.
   for (int i = 1; i < kSimd128Size; ++i) {
     if ((shuffle[i]) != ((shuffle[i - 1] + 1))) {
       if (shuffle[i - 1] != 15) return false;
       if (shuffle[i] % kSimd128Size != 0) return false;
     }
   }
   *offset = start;
   return true;
 }

 bool SimdShuffle::TryMatchBlend(const uint8_t* shuffle) {
   for (int i = 0; i < 16; ++i) {
     if ((shuffle[i] & 0xF) != i) return false;
   }
   return true;
 }

 bool SimdShuffle::TryMatchByteToDwordZeroExtend(const uint8_t* shuffle) {
   for (int i = 0; i < 16; ++i) {
     if ((i % 4 != 0) && (shuffle[i] < 16)) return false;
     if ((i % 4 == 0) && (shuffle[i] > 15 || (shuffle[i] != shuffle[0] + i / 4)))
       return false;
   }
   return true;
 }

 uint8_t SimdShuffle::PackShuffle4(uint8_t* shuffle) {
   return (shuffle[0] & 3) | ((shuffle[1] & 3) << 2) | ((shuffle[2] & 3) << 4) |
          ((shuffle[3] & 3) << 6);
 }

 uint8_t SimdShuffle::PackBlend8(const uint8_t* shuffle16x8) {
   int8_t result = 0;
   for (int i = 0; i < 8; ++i) {
     result |= (shuffle16x8[i] >= 8 ? 1 : 0) << i;
   }
   return result;
 }

 uint8_t SimdShuffle::PackBlend4(const uint8_t* shuffle32x4) {
   int8_t result = 0;
   for (int i = 0; i < 4; ++i) {
     result |= (shuffle32x4[i] >= 4 ? 0x3 : 0) << (i * 2);
   }
   return result;
 }

 int32_t SimdShuffle::Pack4Lanes(const uint8_t* shuffle) {
   int32_t result = 0;
   for (int i = 3; i >= 0; --i) {
     result <<= 8;
     result |= shuffle[i];
   }
   return result;
 }

 void SimdShuffle::Pack16Lanes(uint32_t* dst, const uint8_t* shuffle) {
   for (int i = 0; i < 4; i++) {
     dst[i] = wasm::SimdShuffle::Pack4Lanes(shuffle + (i * 4));
   }
 }

 #ifdef V8_TARGET_ARCH_X64
 // static
 bool SimdShuffle::TryMatchVpshufd(const uint8_t* shuffle32x8,
                                   uint8_t* control) {
   *control = 0;
   for (int i = 0; i < 4; ++i) {
     uint8_t mask;
     if (shuffle32x8[i] < 4 && shuffle32x8[i + 4] - shuffle32x8[i] == 4) {
       mask = shuffle32x8[i];
       *control |= mask << (2 * i);
       continue;
     }
     return false;
   }
   return true;
 }

 // static
 bool SimdShuffle::TryMatchShufps256(const uint8_t* shuffle32x8,
                                     uint8_t* control) {
   *control = 0;
   for (int i = 0; i < 4; ++i) {
     // low 128-bits and high 128-bits should have the same shuffle order.
     if (shuffle32x8[i + 4] - shuffle32x8[i] == 4) {
       // [63:0]   bits select from SRC1,
       // [127:64] bits select from SRC2
       if ((i < 2 && shuffle32x8[i] < 4) ||
           (i >= 2 && shuffle32x8[i] >= 8 && shuffle32x8[i] < 12)) {
         *control |= (shuffle32x8[i] % 4) << (2 * i);
         continue;
       }
       return false;
     }
     return false;
   }
   return true;
 }
 #endif  // V8_TARGET_ARCH_X64

 bool SimdSwizzle::AllInRangeOrTopBitSet(
     std::array<uint8_t, kSimd128Size> shuffle) {
   return std::all_of(shuffle.begin(), shuffle.end(),
                      [](auto i) { return (i < kSimd128Size) || (i & 0x80); });
 }

 }  // namespace wasm
 }  // namespace internal
 }  // namespace v8
	// Copyright 2020 the V8 project authors. All rights reserved.
	// Use of this source code is governed by a BSD-style license that can be
	// found in the LICENSE file.

	#include "src/wasm/simd-shuffle.h"

	#include <algorithm>

	#include "src/common/globals.h"

	namespace v8 {
	namespace internal {
	namespace wasm {

	bool SimdShuffle::TryMatchIdentity(const uint8_t* shuffle) {
	for (int i = 0; i < kSimd128Size; ++i) {
	if (shuffle[i] != i) return false;
	}
	return true;
	}

	bool SimdShuffle::TryMatch32x4Rotate(const uint8_t* shuffle,
	uint8_t* shuffle32x4, bool is_swizzle) {
	uint8_t offset;
	bool is_concat = TryMatchConcat(shuffle, &offset);
	DCHECK_NE(offset, 0); // 0 is identity, it should not be matched.
	// Since we already have a concat shuffle, we know that the indices goes from:
	// [ offset, ..., 15, 0, ... ], it suffices to check that the offset points
	// to the low byte of a 32x4 element.
	if (!is_concat \|\| !is_swizzle \|\| offset % 4 != 0) {
	return false;
	}

	uint8_t offset_32 = offset / 4;
	for (int i = 0; i < 4; i++) {
	shuffle32x4[i] = (offset_32 + i) % 4;
	}
	return true;
	}

	bool SimdShuffle::TryMatch32x4Reverse(const uint8_t* shuffle32x4) {
	return shuffle32x4[0] == 3 && shuffle32x4[1] == 2 && shuffle32x4[2] == 1 &&
	shuffle32x4[3] == 0;
	}

	bool SimdShuffle::TryMatch32x4OneLaneSwizzle(const uint8_t* shuffle32x4,
	uint8_t* from_lane,
	uint8_t* to_lane) {
	constexpr uint32_t patterns[12]{
	0x30200000, // 0 -> 1
	0x30000100, // 0 -> 2
	0x00020100, // 0 -> 3
	0x03020101, // 1 -> 0
	0x03010100, // 1 -> 2
	0x01020100, // 1 -> 3
	0x03020102, // 2 -> 0
	0x03020200, // 2 -> 1
	0x02020100, // 2 -> 3
	0x03020103, // 3 -> 0
	0x03020300, // 3 -> 1
	0x03030100 // 3 -> 2
	};

	unsigned pattern_idx = 0;
	uint32_t shuffle = reinterpret_cast<const uint32_t>(shuffle32x4);
	#ifdef V8_TARGET_BIG_ENDIAN
	shuffle = base::bits::ReverseBytes(shuffle);
	#endif
	for (unsigned from = 0; from < 4; ++from) {
	for (unsigned to = 0; to < 4; ++to) {
	if (from == to) {
	continue;
	}
	if (shuffle == patterns[pattern_idx]) {
	*from_lane = from;
	*to_lane = to;
	return true;
	}
	++pattern_idx;
	}
	}
	return false;
	}

	bool SimdShuffle::TryMatch32x4Shuffle(const uint8_t* shuffle,
	uint8_t* shuffle32x4) {
	for (int i = 0; i < 4; ++i) {
	if (shuffle[i * 4] % 4 != 0) return false;
	for (int j = 1; j < 4; ++j) {
	if (shuffle[i * 4 + j] - shuffle[i * 4 + j - 1] != 1) return false;
	}
	shuffle32x4[i] = shuffle[i * 4] / 4;
	}
	return true;
	}

	bool SimdShuffle::TryMatch32x8Shuffle(const uint8_t* shuffle,
	uint8_t* shuffle32x8) {
	for (int i = 0; i < 8; ++i) {
	if (shuffle[i * 4] % 4 != 0) return false;
	for (int j = 1; j < 4; ++j) {
	if (shuffle[i * 4 + j] - shuffle[i * 4 + j - 1] != 1) return false;
	}
	shuffle32x8[i] = shuffle[i * 4] / 4;
	}
	return true;
	}

	bool SimdShuffle::TryMatch16x8Shuffle(const uint8_t* shuffle,
	uint8_t* shuffle16x8) {
	for (int i = 0; i < 8; ++i) {
	if (shuffle[i * 2] % 2 != 0) return false;
	for (int j = 1; j < 2; ++j) {
	if (shuffle[i * 2 + j] - shuffle[i * 2 + j - 1] != 1) return false;
	}
	shuffle16x8[i] = shuffle[i * 2] / 2;
	}
	return true;
	}

	bool SimdShuffle::TryMatchConcat(const uint8_t* shuffle, uint8_t* offset) {
	// Don't match the identity shuffle (e.g. [0 1 2 ... 15]).
	uint8_t start = shuffle[0];
	if (start == 0) return false;
	DCHECK_GT(kSimd128Size, start); // The shuffle should be canonicalized.
	// A concatenation is a series of consecutive indices, with at most one jump
	// in the middle from the last lane to the first.
	for (int i = 1; i < kSimd128Size; ++i) {
	if ((shuffle[i]) != ((shuffle[i - 1] + 1))) {
	if (shuffle[i - 1] != 15) return false;
	if (shuffle[i] % kSimd128Size != 0) return false;
	}
	}
	*offset = start;
	return true;
	}

	bool SimdShuffle::TryMatchBlend(const uint8_t* shuffle) {
	for (int i = 0; i < 16; ++i) {
	if ((shuffle[i] & 0xF) != i) return false;
	}
	return true;
	}

	bool SimdShuffle::TryMatchByteToDwordZeroExtend(const uint8_t* shuffle) {
	for (int i = 0; i < 16; ++i) {
	if ((i % 4 != 0) && (shuffle[i] < 16)) return false;
	if ((i % 4 == 0) && (shuffle[i] > 15 \|\| (shuffle[i] != shuffle[0] + i / 4)))
	return false;
	}
	return true;
	}

	uint8_t SimdShuffle::PackShuffle4(uint8_t* shuffle) {
	return (shuffle[0] & 3) \| ((shuffle[1] & 3) << 2) \| ((shuffle[2] & 3) << 4) \|
	((shuffle[3] & 3) << 6);
	}

	uint8_t SimdShuffle::PackBlend8(const uint8_t* shuffle16x8) {
	int8_t result = 0;
	for (int i = 0; i < 8; ++i) {
	result \|= (shuffle16x8[i] >= 8 ? 1 : 0) << i;
	}
	return result;
	}

	uint8_t SimdShuffle::PackBlend4(const uint8_t* shuffle32x4) {
	int8_t result = 0;
	for (int i = 0; i < 4; ++i) {
	result \|= (shuffle32x4[i] >= 4 ? 0x3 : 0) << (i * 2);
	}
	return result;
	}

	int32_t SimdShuffle::Pack4Lanes(const uint8_t* shuffle) {
	int32_t result = 0;
	for (int i = 3; i >= 0; --i) {
	result <<= 8;
	result \|= shuffle[i];
	}
	return result;
	}

	void SimdShuffle::Pack16Lanes(uint32_t* dst, const uint8_t* shuffle) {
	for (int i = 0; i < 4; i++) {
	dst[i] = wasm::SimdShuffle::Pack4Lanes(shuffle + (i * 4));
	}
	}

	#ifdef V8_TARGET_ARCH_X64
	// static
	bool SimdShuffle::TryMatchVpshufd(const uint8_t* shuffle32x8,
	uint8_t* control) {
	*control = 0;
	for (int i = 0; i < 4; ++i) {
	uint8_t mask;
	if (shuffle32x8[i] < 4 && shuffle32x8[i + 4] - shuffle32x8[i] == 4) {
	mask = shuffle32x8[i];
	control \|= mask << (2 i);
	continue;
	}
	return false;
	}
	return true;
	}

	// static
	bool SimdShuffle::TryMatchShufps256(const uint8_t* shuffle32x8,
	uint8_t* control) {
	*control = 0;
	for (int i = 0; i < 4; ++i) {
	// low 128-bits and high 128-bits should have the same shuffle order.
	if (shuffle32x8[i + 4] - shuffle32x8[i] == 4) {
	// [63:0] bits select from SRC1,
	// [127:64] bits select from SRC2
	if ((i < 2 && shuffle32x8[i] < 4) \|\|
	(i >= 2 && shuffle32x8[i] >= 8 && shuffle32x8[i] < 12)) {
	control \|= (shuffle32x8[i] % 4) << (2 i);
	continue;
	}
	return false;
	}
	return false;
	}
	return true;
	}
	#endif // V8_TARGET_ARCH_X64

	bool SimdSwizzle::AllInRangeOrTopBitSet(
	std::array<uint8_t, kSimd128Size> shuffle) {
	return std::all_of(shuffle.begin(), shuffle.end(),
	[](auto i) { return (i < kSimd128Size) \|\| (i & 0x80); });
	}

	} // namespace wasm
	} // namespace internal
	} // namespace v8