v8
V8 is Google’s open source high-performance JavaScript and WebAssembly engine, written in C++.
wasm-revec-reducer.h
1// Copyright 2023 the V8 project authors. All rights reserved.
2// Use of this source code is governed by a BSD-style license that can be
3// found in the LICENSE file.
4
5#ifndef V8_COMPILER_TURBOSHAFT_WASM_REVEC_REDUCER_H_
6#define V8_COMPILER_TURBOSHAFT_WASM_REVEC_REDUCER_H_
7
8#if !V8_ENABLE_WEBASSEMBLY
9#error This header should only be included if WebAssembly is enabled.
10#endif // !V8_ENABLE_WEBASSEMBLY
11
12#include <algorithm>
13
20
22
23#define SIMD256_LOADTRANSFORM_OP(V) \
24 V(8x8S, 8x16S) \
25 V(8x8U, 8x16U) \
26 V(16x4S, 16x8S) \
27 V(16x4U, 16x8U) \
28 V(32x2S, 32x4S) \
29 V(32x2U, 32x4U) \
30 V(8Splat, 8Splat) \
31 V(16Splat, 16Splat) \
32 V(32Splat, 32Splat) \
33 V(64Splat, 64Splat)
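// The lists above and below follow the X-macro pattern: each list applies a
// caller-supplied macro V to every (Simd128 kind, Simd256 kind) pair. As an
// illustrative sketch, the kind-mapping helpers near the end of this header
// consume them like this:
//
//   #define TRANSFORM_KIND_MAPPING(from, to)                 \
//     case Simd128LoadTransformOp::TransformKind::k##from:   \
//       return Simd256LoadTransformOp::TransformKind::k##to;
//     SIMD256_LOADTRANSFORM_OP(TRANSFORM_KIND_MAPPING)
//   #undef TRANSFORM_KIND_MAPPING
//
// which expands to one "case k8x8S: return k8x16S;" style case per entry.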
34
35#define SIMD256_UNARY_SIMPLE_OP(V) \
36 V(S128Not, S256Not) \
37 V(I8x16Abs, I8x32Abs) \
38 V(I8x16Neg, I8x32Neg) \
39 V(I16x8ExtAddPairwiseI8x16S, I16x16ExtAddPairwiseI8x32S) \
40 V(I16x8ExtAddPairwiseI8x16U, I16x16ExtAddPairwiseI8x32U) \
41 V(I32x4ExtAddPairwiseI16x8S, I32x8ExtAddPairwiseI16x16S) \
42 V(I32x4ExtAddPairwiseI16x8U, I32x8ExtAddPairwiseI16x16U) \
43 V(I16x8Abs, I16x16Abs) \
44 V(I16x8Neg, I16x16Neg) \
45 V(I32x4Abs, I32x8Abs) \
46 V(I32x4Neg, I32x8Neg) \
47 V(F32x4Abs, F32x8Abs) \
48 V(F32x4Neg, F32x8Neg) \
49 V(F32x4Sqrt, F32x8Sqrt) \
50 V(F64x2Abs, F64x4Abs) \
51 V(F64x2Neg, F64x4Neg) \
52 V(F64x2Sqrt, F64x4Sqrt) \
53 V(I32x4UConvertF32x4, I32x8UConvertF32x8) \
54 V(I32x4SConvertF32x4, I32x8SConvertF32x8) \
55 V(F32x4UConvertI32x4, F32x8UConvertI32x8) \
56 V(F32x4SConvertI32x4, F32x8SConvertI32x8) \
57 V(I32x4RelaxedTruncF32x4S, I32x8RelaxedTruncF32x8S) \
58 V(I32x4RelaxedTruncF32x4U, I32x8RelaxedTruncF32x8U)
59
60#define SIMD256_UNARY_SIGN_EXTENSION_OP(V) \
61 V(I64x2SConvertI32x4Low, I64x4SConvertI32x4, I64x2SConvertI32x4High) \
62 V(I64x2UConvertI32x4Low, I64x4UConvertI32x4, I64x2UConvertI32x4High) \
63 V(I32x4SConvertI16x8Low, I32x8SConvertI16x8, I32x4SConvertI16x8High) \
64 V(I32x4UConvertI16x8Low, I32x8UConvertI16x8, I32x4UConvertI16x8High) \
65 V(I16x8SConvertI8x16Low, I16x16SConvertI8x16, I16x8SConvertI8x16High) \
66 V(I16x8UConvertI8x16Low, I16x16UConvertI8x16, I16x8UConvertI8x16High)
67
68#define SIMD256_BINOP_SIMPLE_OP(V) \
69 V(I8x16Eq, I8x32Eq) \
70 V(I8x16Ne, I8x32Ne) \
71 V(I8x16GtS, I8x32GtS) \
72 V(I8x16GtU, I8x32GtU) \
73 V(I8x16GeS, I8x32GeS) \
74 V(I8x16GeU, I8x32GeU) \
75 V(I16x8Eq, I16x16Eq) \
76 V(I16x8Ne, I16x16Ne) \
77 V(I16x8GtS, I16x16GtS) \
78 V(I16x8GtU, I16x16GtU) \
79 V(I16x8GeS, I16x16GeS) \
80 V(I16x8GeU, I16x16GeU) \
81 V(I32x4Eq, I32x8Eq) \
82 V(I32x4Ne, I32x8Ne) \
83 V(I32x4GtS, I32x8GtS) \
84 V(I32x4GtU, I32x8GtU) \
85 V(I32x4GeS, I32x8GeS) \
86 V(I32x4GeU, I32x8GeU) \
87 V(F32x4Eq, F32x8Eq) \
88 V(F32x4Ne, F32x8Ne) \
89 V(F32x4Lt, F32x8Lt) \
90 V(F32x4Le, F32x8Le) \
91 V(F64x2Eq, F64x4Eq) \
92 V(F64x2Ne, F64x4Ne) \
93 V(F64x2Lt, F64x4Lt) \
94 V(F64x2Le, F64x4Le) \
95 V(S128And, S256And) \
96 V(S128AndNot, S256AndNot) \
97 V(S128Or, S256Or) \
98 V(S128Xor, S256Xor) \
99 V(I8x16SConvertI16x8, I8x32SConvertI16x16) \
100 V(I8x16UConvertI16x8, I8x32UConvertI16x16) \
101 V(I8x16Add, I8x32Add) \
102 V(I8x16AddSatS, I8x32AddSatS) \
103 V(I8x16AddSatU, I8x32AddSatU) \
104 V(I8x16Sub, I8x32Sub) \
105 V(I8x16SubSatS, I8x32SubSatS) \
106 V(I8x16SubSatU, I8x32SubSatU) \
107 V(I8x16MinS, I8x32MinS) \
108 V(I8x16MinU, I8x32MinU) \
109 V(I8x16MaxS, I8x32MaxS) \
110 V(I8x16MaxU, I8x32MaxU) \
111 V(I8x16RoundingAverageU, I8x32RoundingAverageU) \
112 V(I16x8SConvertI32x4, I16x16SConvertI32x8) \
113 V(I16x8UConvertI32x4, I16x16UConvertI32x8) \
114 V(I16x8Add, I16x16Add) \
115 V(I16x8AddSatS, I16x16AddSatS) \
116 V(I16x8AddSatU, I16x16AddSatU) \
117 V(I16x8Sub, I16x16Sub) \
118 V(I16x8SubSatS, I16x16SubSatS) \
119 V(I16x8SubSatU, I16x16SubSatU) \
120 V(I16x8Mul, I16x16Mul) \
121 V(I16x8MinS, I16x16MinS) \
122 V(I16x8MinU, I16x16MinU) \
123 V(I16x8MaxS, I16x16MaxS) \
124 V(I16x8MaxU, I16x16MaxU) \
125 V(I16x8RoundingAverageU, I16x16RoundingAverageU) \
126 V(I32x4Add, I32x8Add) \
127 V(I32x4Sub, I32x8Sub) \
128 V(I32x4Mul, I32x8Mul) \
129 V(I32x4MinS, I32x8MinS) \
130 V(I32x4MinU, I32x8MinU) \
131 V(I32x4MaxS, I32x8MaxS) \
132 V(I32x4MaxU, I32x8MaxU) \
133 V(I32x4DotI16x8S, I32x8DotI16x16S) \
134 V(I64x2Add, I64x4Add) \
135 V(I64x2Sub, I64x4Sub) \
136 V(I64x2Mul, I64x4Mul) \
137 V(I64x2Eq, I64x4Eq) \
138 V(I64x2Ne, I64x4Ne) \
139 V(I64x2GtS, I64x4GtS) \
140 V(I64x2GeS, I64x4GeS) \
141 V(F32x4Add, F32x8Add) \
142 V(F32x4Sub, F32x8Sub) \
143 V(F32x4Mul, F32x8Mul) \
144 V(F32x4Div, F32x8Div) \
145 V(F32x4Min, F32x8Min) \
146 V(F32x4Max, F32x8Max) \
147 V(F32x4Pmin, F32x8Pmin) \
148 V(F32x4Pmax, F32x8Pmax) \
149 V(F64x2Add, F64x4Add) \
150 V(F64x2Sub, F64x4Sub) \
151 V(F64x2Mul, F64x4Mul) \
152 V(F64x2Div, F64x4Div) \
153 V(F64x2Min, F64x4Min) \
154 V(F64x2Max, F64x4Max) \
155 V(F64x2Pmin, F64x4Pmin) \
156 V(F64x2Pmax, F64x4Pmax) \
157 V(F32x4RelaxedMin, F32x8RelaxedMin) \
158 V(F32x4RelaxedMax, F32x8RelaxedMax) \
159 V(F64x2RelaxedMin, F64x4RelaxedMin) \
160 V(F64x2RelaxedMax, F64x4RelaxedMax) \
161 V(I16x8DotI8x16I7x16S, I16x16DotI8x32I7x32S)
162
163#define SIMD256_BINOP_SIGN_EXTENSION_OP(V) \
164 V(I16x8ExtMulLowI8x16S, I16x16ExtMulI8x16S, I16x8ExtMulHighI8x16S) \
165 V(I16x8ExtMulLowI8x16U, I16x16ExtMulI8x16U, I16x8ExtMulHighI8x16U) \
166 V(I32x4ExtMulLowI16x8S, I32x8ExtMulI16x8S, I32x4ExtMulHighI16x8S) \
167 V(I32x4ExtMulLowI16x8U, I32x8ExtMulI16x8U, I32x4ExtMulHighI16x8U) \
168 V(I64x2ExtMulLowI32x4S, I64x4ExtMulI32x4S, I64x2ExtMulHighI32x4S) \
169 V(I64x2ExtMulLowI32x4U, I64x4ExtMulI32x4U, I64x2ExtMulHighI32x4U)
170
171#define SIMD256_SHIFT_OP(V) \
172 V(I16x8Shl, I16x16Shl) \
173 V(I16x8ShrS, I16x16ShrS) \
174 V(I16x8ShrU, I16x16ShrU) \
175 V(I32x4Shl, I32x8Shl) \
176 V(I32x4ShrS, I32x8ShrS) \
177 V(I32x4ShrU, I32x8ShrU) \
178 V(I64x2Shl, I64x4Shl) \
179 V(I64x2ShrU, I64x4ShrU)
180
181#define SIMD256_TERNARY_OP(V) \
182 V(S128Select, S256Select) \
183 V(F32x4Qfma, F32x8Qfma) \
184 V(F32x4Qfms, F32x8Qfms) \
185 V(F64x2Qfma, F64x4Qfma) \
186 V(F64x2Qfms, F64x4Qfms) \
187 V(I8x16RelaxedLaneSelect, I8x32RelaxedLaneSelect) \
188 V(I16x8RelaxedLaneSelect, I16x16RelaxedLaneSelect) \
189 V(I32x4RelaxedLaneSelect, I32x8RelaxedLaneSelect) \
190 V(I64x2RelaxedLaneSelect, I64x4RelaxedLaneSelect) \
191 V(I32x4DotI8x16I7x16AddS, I32x8DotI8x32I7x32AddS)
192
193#define SIMD256_SPLAT_OP(V) \
194 V(I8x16, I8x32) \
195 V(I16x8, I16x16) \
196 V(I32x4, I32x8) \
197 V(I64x2, I64x4) \
198 V(F32x4, F32x8) \
199 V(F64x2, F64x4)
200
201#define REDUCE_SEED_KIND(V) \
202 V(I64x2Add) \
203 V(I32x4Add) \
204 V(I8x16Add) \
205 V(I16x8AddSatS) \
206 V(I16x8AddSatU) \
207 V(I8x16AddSatS) \
208 V(I8x16AddSatU) \
209 V(I16x8SConvertI32x4) \
210 V(I16x8UConvertI32x4) \
211 V(I8x16SConvertI16x8) \
212 V(I8x16UConvertI16x8)
213
215
217 public:
218 // Currently we only support merging 2 Simd128 nodes into one Simd256.
219 static constexpr int kSize = kSimd256Size / kSimd128Size;
221 indexes_[0] = a;
222 indexes_[1] = b;
223 }
224 size_t size() const { return kSize; }
225 OpIndex operator[](int i) const { return indexes_[i]; }
226
227 bool operator==(const NodeGroup& other) const {
228 return indexes_[0] == other.indexes_[0] && indexes_[1] == other.indexes_[1];
229 }
230 bool operator!=(const NodeGroup& other) const {
231 return indexes_[0] != other.indexes_[0] || indexes_[1] != other.indexes_[1];
232 }
233
234 const OpIndex* begin() const { return indexes_; }
235 const OpIndex* end() const { return indexes_ + kSize; }
236
237 private:
239};
240
241class ForcePackNode;
242class ShufflePackNode;
243class BundlePackNode;
244
245// A PackNode consists of a fixed number of isomorphic simd128 nodes which can
246// execute in parallel and be converted to a 256-bit simd node later. The
247// nodes in a PackNode must be schedulable in the same basic block and must be
248// mutually independent.
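// Illustrative example: two isomorphic, mutually independent Simd128
// operations in the same block, e.g.
//   n0 = Simd128Binop(a0, b0, kI32x4Add)
//   n1 = Simd128Binop(a1, b1, kI32x4Add)
// can form one PackNode and later be emitted as a single
//   Simd256Binop(A, B, kI32x8Add)
// where A and B are the revectorized (256-bit) packs of (a0, a1) and (b0, b1).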
249class PackNode : public NON_EXPORTED_BASE(ZoneObject) {
250 public:
251 enum NodeType {
252 kDefault, // Nodes are naturally packed without special attributes.
253 kForcePackNode, // Nodes do not satisfy some packing rule, but can be
254 // forcibly coalesced with a Pack128To256 operation, e.g.
255 // non-consecutive loads. On x64, we can use the vinsertf128
256 // instruction to forcibly coalesce two 128-bit values.
257 kShufflePackNode, // Nodes are Simd128Shuffle operations with specific
258 // info.
259 kBundlePackNode, // Nodes representing a i8x16/i16x8 to f32x4 conversion.
260 kIntersectPackNode, // One or more nodes already packed by an existing
261 // PackNode.
262 };
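// For force-packed (and intersect) nodes the reducer below reduces both
// 128-bit nodes individually and then coalesces them explicitly, roughly
// (see ReduceForceOrIntersectPackNode):
//   v0 = <reduced 128-bit node 0>
//   v1 = <reduced 128-bit node 1>
//   packed = __ SimdPack128To256(v0, v1)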
263
264 explicit PackNode(Zone* zone, const NodeGroup& node_group,
265 NodeType node_type = kDefault)
266 : nodes_(node_group),
268 operands_(zone),
269 node_type_(node_type) {}
270 const NodeGroup& nodes() const { return nodes_; }
271 bool IsSame(const NodeGroup& node_group) const {
272 return nodes_ == node_group;
273 }
274 bool IsSame(const PackNode& other) const { return nodes_ == other.nodes_; }
277
278 bool IsDefaultPackNode() const { return node_type_ == kDefault; }
279 bool IsForcePackNode() const { return node_type_ == kForcePackNode; }
281 bool IsBundlePackNode() const { return node_type_ == kBundlePackNode; }
282 // We will force-pack nodes for both ForcePackNode and IntersectPackNode.
283 bool is_force_packing() const {
285 }
286
289 return reinterpret_cast<ForcePackNode*>(this);
290 }
293 return reinterpret_cast<ShufflePackNode*>(this);
294 }
297 return reinterpret_cast<BundlePackNode*>(this);
298 }
299
300 PackNode* GetOperand(int index) const {
301 DCHECK_LT(index, operands_.size());
302 DCHECK(operands_[index]);
303 return operands_[index];
304 }
305
306 void SetOperand(int index, PackNode* pnode) {
307 DCHECK_GE(index, 0);
308 if (operands_.size() < static_cast<size_t>(index + 1)) {
309 operands_.resize(index + 1);
310 }
311 operands_[index] = pnode;
312 }
313
317
318 void Print(Graph* graph) const;
319
320 private:
321 friend class ForcePackNode;
326};
327
328class ForcePackNode : public PackNode {
329 public:
331 kSplat, // force pack 2 identical nodes or 2 loads at the same address
332 kGeneral, // force pack 2 different nodes
333 };
334 explicit ForcePackNode(Zone* zone, const NodeGroup& node_group,
335 ForcePackType type)
336 : PackNode(zone, node_group, kForcePackNode), force_pack_type_(type) {}
337
339
340 private:
342};
343
344class ShufflePackNode : public PackNode {
345 public:
347 public:
348 enum class Kind {
352#ifdef V8_TARGET_ARCH_X64
353 kShufd,
354 kShufps,
355 kS32x8UnpackLow,
356 kS32x8UnpackHigh,
357#endif // V8_TARGET_ARCH_X64
358 };
359 union Param {
360 int splat_index = 0;
361#ifdef V8_TARGET_ARCH_X64
362 uint8_t shufd_control;
363 uint8_t shufps_control;
364#endif // V8_TARGET_ARCH_X64
365 };
366
367 Kind kind() { return kind_; }
369
380
381#ifdef V8_TARGET_ARCH_X64
382 void set_shufd_control(uint8_t control) {
383 DCHECK_EQ(kind_, Kind::kShufd);
384 param_.shufd_control = control;
385 }
386 uint8_t shufd_control() const {
387 DCHECK_EQ(kind_, Kind::kShufd);
388 return param_.shufd_control;
389 }
390
391 void set_shufps_control(uint8_t control) {
392 DCHECK_EQ(kind_, Kind::kShufps);
393 param_.shufps_control = control;
394 }
395 uint8_t shufps_control() const {
396 DCHECK_EQ(kind_, Kind::kShufps);
397 return param_.shufps_control;
398 }
399#endif // V8_TARGET_ARCH_X64
400
401 private:
404 };
405
406 ShufflePackNode(Zone* zone, const NodeGroup& node_group,
408 : PackNode(zone, node_group, kShufflePackNode) {
410 }
411
412 SpecificInfo& info() { return info_; }
413
414 private:
416};
417
418// BundlePackNode is used to represent an i8x16/i16x8 to f32x4 conversion.
419// The conversion extracts 4 lanes of the i8x16/i16x8 input (base), starting at
420// lane index (offset), sign- or zero-extends (is_sign_extract) the extracted
421// lanes to i32x4, then converts the i32x4/u32x4 (is_sign_convert) to f32x4.
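// Illustrative lowering (see the Simd128ReplaceLane reduction below) for an
// i8x16 base with offset 0, signed extract and signed convert:
//   t0 = Simd128Unary(base, kI16x8SConvertI8x16Low)
//   t1 = Simd256Unary(t0, kI32x8SConvertI16x8)
//   result = Simd256Unary(t1, kF32x8SConvertI32x8)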
422class BundlePackNode : public PackNode {
423 public:
424 BundlePackNode(Zone* zone, const NodeGroup& node_group, OpIndex base,
425 int8_t offset, uint8_t lane_size, bool is_sign_extract,
426 bool is_sign_convert)
427 : PackNode(zone, node_group, kBundlePackNode) {
428 base_ = base;
429 offset_ = offset;
433 }
434
435 OpIndex base() const { return base_; }
436 uint8_t offset() const { return offset_; }
437 uint8_t lane_size() const { return lane_size_; }
438 bool is_sign_extract() const { return is_sign_extract_; }
439 bool is_sign_convert() const { return is_sign_convert_; }
440
441 private:
443 uint8_t offset_;
444 uint8_t lane_size_;
447};
448
449// An auxiliary tree structure with a set of PackNodes based on the Superword
450// Level Parallelism (SLP) vectorization technique. The BuildTree method will
451// start from a selected root, e.g. a group of consecutive stores, and extend
452// through value inputs to create new PackNodes if the inputs are valid, or
453// conclude that the current PackNode is a leaf and terminate the tree.
454// Below is an example of an SLPTree where the loads and stores in each
455// PackNode are all consecutive.
456// [Load0, Load1] [Load2, Load3]
457// \ /
458// [Add0, Add1]
459// |
460// [Store0, Store1]
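// Minimal usage sketch (names are illustrative; WasmRevecAnalyzer drives this
// from its store/reduce seeds):
//   SLPTree tree(graph, &analyzer, zone);
//   NodeGroup roots(store0, store1);  // two consecutive Simd128 stores
//   PackNode* root = tree.BuildTree(roots);
//   if (root == nullptr) { /* this group cannot be revectorized */ }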
461class SLPTree : public NON_EXPORTED_BASE(ZoneObject) {
462 public:
463 explicit SLPTree(Graph& graph, WasmRevecAnalyzer* analyzer, Zone* zone)
464 : graph_(graph),
465 analyzer_(analyzer),
467 root_(nullptr),
470
471 // Information for extending i8x16/i16x8 to f32x4
474 uint8_t start_lane; // 0 or 8
475 uint8_t lane_size; // 1(i8) or 2(i16)
476 bool is_sign_extract; // extract_lane_s or extract_lane_u
477 bool is_sign_convert; // f32x4.convert_i32x4_s or f32x4.convert_i32x4_u
478 };
479
480 // Per-lane information for extending i8x16/i16x8 to f32x4
488
489 PackNode* BuildTree(const NodeGroup& roots);
491
500
501 void Print(const char* info);
502
503 private:
504 // This is the recursive part of BuildTree.
505 PackNode* BuildTreeRec(const NodeGroup& node_group, unsigned depth);
506
507 // Baseline: create a new PackNode, and return.
508 PackNode* NewPackNode(const NodeGroup& node_group);
509
510 // Baseline: create a new IntersectPackNode that contains nodes existing in
511 // another PackNode, and return.
512 PackNode* NewIntersectPackNode(const NodeGroup& node_group);
513
514 PackNode* NewForcePackNode(const NodeGroup& node_group,
516 const Graph& graph);
517 BundlePackNode* NewBundlePackNode(const NodeGroup& node_group, OpIndex base,
518 int8_t offset, uint8_t lane_size,
519 bool is_sign_extract, bool is_sign_convert);
520
521 // Recursion: create a new PackNode and call BuildTreeRec recursively
522 PackNode* NewPackNodeAndRecurs(const NodeGroup& node_group, int start_index,
523 int count, unsigned depth);
524
526 unsigned depth);
527
530
531 // Try to match the following pattern:
532 // 1. simd128_load64zero(memargs)
533 // 2. simd128_const[0,0,0,0]
534 // 3. simd128_shuffle(1, 2, shuffle_arg0)
535 // 4. simd128_shuffle(1, 2, shuffle_arg1)
536 // To:
537 // 1. simd256_load8x8u(memargs)
539 const uint8_t* shuffle0,
540 const uint8_t* shuffle1);
541
542#ifdef V8_TARGET_ARCH_X64
543 // The Simd Shuffle in wasm is a high-level representation that can map to
544 // different x64 instructions based on its shuffle array, and the performance
545 // of those instructions varies greatly.
546 // For example, if the shuffle array is totally random, we most likely have to
547 // use a general shuffle. On x64, a general shuffle may consist of a series of
548 // mov instructions, a vpinsrq and a vpshufb, which is expensive. However, if
549 // the shuffle array follows a particular pattern, for
550 // example: [0, 1, 2, 3, 32, 33, 34, 35, 4, 5, 6, 7, 36, 37, 38, 39,
551 // 16, 17, 18, 19, 48, 49, 50, 51, 20, 21, 22, 23, 52, 53, 54, 55]
552 // we can use a single vpunpckldq instruction, whose cost is much
553 // lower than a general shuffle's.
554 //
555 // This function tries to match the shuffle array to the x64 instructions
556 // with the best performance.
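// The pattern above, for instance, would presumably be matched as
// kS32x8UnpackLow and emitted as Simd256Unpack(left, right, k32x8Low) by the
// reducer below, which an x64 backend can select as a single vpunpckldq.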
557 ShufflePackNode* X64TryMatch256Shuffle(const NodeGroup& node_group,
558 const uint8_t* shuffle0,
559 const uint8_t* shuffle1);
560#endif // V8_TARGET_ARCH_X64
561
562 bool TryMatchExtendIntToF32x4(const NodeGroup& node_group,
563 ExtendIntToF32x4Info* info);
564 std::optional<ExtendIntToF32x4Info> TryGetExtendIntToF32x4Info(OpIndex index);
565
567 bool CanBePacked(const NodeGroup& node_group);
568 bool IsEqual(const OpIndex node0, const OpIndex node1);
569 // Check if any node in the node_group depends on the result of another.
570 bool HasInputDependencies(const NodeGroup& node_group);
571
572 Graph& graph() const { return graph_; }
573 Zone* zone() const { return phase_zone_; }
574
579 // Maps a specific node to PackNode.
581 // Maps a node to multiple IntersectPackNodes.
583 static constexpr size_t RecursionMaxDepth = 1000;
584};
585
587 public:
589 : data_(data),
590 graph_(graph),
591 phase_zone_(zone),
592 store_seeds_(zone),
593 reduce_seeds_(zone),
596 should_reduce_(false),
597 use_map_(nullptr) {
598 Run();
599 }
600
601 void Run();
602
603 void MergeSLPTree(SLPTree& slp_tree);
604 bool ShouldReduce() const { return should_reduce_; }
605
606 PackNode* GetPackNode(const OpIndex ig_index) {
607 auto itr = revectorizable_node_.find(ig_index);
608 if (itr != revectorizable_node_.end()) {
609 return itr->second;
610 }
611 return nullptr;
612 }
613
615 auto I = revectorizable_intersect_node_.find(node);
616 if (I != revectorizable_intersect_node_.end()) {
617 return &(I->second);
618 }
619 return nullptr;
620 }
621
622 const OpIndex GetReducedInput(const PackNode* pnode, const int index = 0) {
623 if (index >= static_cast<int>(pnode->GetOperandsSize())) {
624 return OpIndex::Invalid();
625 }
626 return pnode->GetOperand(index)->RevectorizedNode();
627 }
628
629 const Operation& GetStartOperation(const PackNode* pnode, const OpIndex node,
630 const Operation& op) {
631 DCHECK(pnode);
632 const OpIndex start = pnode->nodes()[0];
633 return (start == node) ? op : graph_.Get(start);
634 }
635
637 return use_map_->uses(node);
638 }
639
640 private:
641 bool IsSupportedReduceSeed(const Operation& op);
642 void ProcessBlock(const Block& block);
643 bool DecideVectorize();
644 void Print(const char* info);
645
651 const wasm::WasmModule* module_ = data_->wasm_module();
657};
658
659template <class Next>
660class WasmRevecReducer : public UniformReducerAdapter<WasmRevecReducer, Next> {
661 public:
664
666 OpIndex og_index) {
667 const auto lane = base::checked_cast<uint8_t>(
668 std::find(pnode->nodes().begin(), pnode->nodes().end(), ig_index) -
669 pnode->nodes().begin());
670
671 // A force-packed node has a dedicated use in a SimdPack128To256Op.
672 if (pnode->is_force_packing()) {
673 SimdPack128To256Op& op = __ output_graph()
674 .Get(pnode -> RevectorizedNode())
675 .template Cast<SimdPack128To256Op>();
676 return lane == 0 ? op.left() : op.right();
677 }
678
679 for (auto use : analyzer_.uses(ig_index)) {
680 // Extract128 is needed for the additional Simd128 store emitted before
681 // the Simd256 store, in case an OOB trap occurs at the higher 128-bit
682 // address.
683 auto use_pnode = analyzer_.GetPackNode(use);
684 if (use_pnode != nullptr && !use_pnode->is_force_packing()) {
685 DCHECK_GE(use_pnode->nodes().size(), 2);
686 if (__ input_graph().Get(use).opcode != Opcode::kStore ||
687 use_pnode->nodes()[0] != use ||
688 use_pnode->nodes()[0] > use_pnode->nodes()[1])
689 continue;
690 }
691
692 return __ Simd256Extract128Lane(og_index, lane);
693 }
694
695 return OpIndex::Invalid();
696 }
697
699 V<Simd128> ig_index, const Simd128ConstantOp& constant_op) {
700 PackNode* pnode = analyzer_.GetPackNode(ig_index);
701 if (!pnode) {
702 return Adapter::ReduceInputGraphSimd128Constant(ig_index, constant_op);
703 }
704
705 V<Simd256> og_index = pnode->RevectorizedNode();
706 // Skip revectorized node.
707 if (!og_index.valid()) {
708 NodeGroup inputs = pnode->nodes();
709 const Simd128ConstantOp& op0 =
710 __ input_graph().Get(inputs[0]).template Cast<Simd128ConstantOp>();
711 const Simd128ConstantOp& op1 =
712 __ input_graph().Get(inputs[1]).template Cast<Simd128ConstantOp>();
713 uint8_t value[kSimd256Size] = {};
714 memcpy(value, op0.value, kSimd128Size);
715 memcpy(value + kSimd128Size, op1.value, kSimd128Size);
716
717 og_index = __ Simd256Constant(value);
718
719 pnode->SetRevectorizedNode(og_index);
720 }
721 return GetExtractOpIfNeeded(pnode, ig_index, og_index);
722 }
723
725 V<Simd128> ig_index, const Simd128LoadTransformOp& load_transform) {
726 PackNode* pnode = analyzer_.GetPackNode(ig_index);
727 if (!pnode || !pnode->IsDefaultPackNode()) {
728 return Adapter::ReduceInputGraphSimd128LoadTransform(ig_index,
729 load_transform);
730 }
731
732 V<Simd256> og_index = pnode->RevectorizedNode();
733 // Skip revectorized node.
734 if (!og_index.valid()) {
735 auto base = __ MapToNewGraph(load_transform.base());
736 auto index = __ MapToNewGraph(load_transform.index());
737 auto offset = load_transform.offset;
738 DCHECK_EQ(load_transform.offset, 0);
739
740 og_index = __ Simd256LoadTransform(
741 base, index, load_transform.load_kind,
742 Get256LoadTransformKindFrom128(load_transform.transform_kind),
743 offset);
744 pnode->SetRevectorizedNode(og_index);
745 }
746 return GetExtractOpIfNeeded(pnode, ig_index, og_index);
747 }
748
749 OpIndex REDUCE_INPUT_GRAPH(Load)(OpIndex ig_index, const LoadOp& load) {
750 PackNode* pnode = analyzer_.GetPackNode(ig_index);
751 if (!pnode || !pnode->IsDefaultPackNode()) {
752 return Adapter::ReduceInputGraphLoad(ig_index, load);
753 }
754
755 OpIndex og_index = pnode->RevectorizedNode();
756 // Skip revectorized node.
757 if (!og_index.valid()) {
758 const LoadOp& start = analyzer_.GetStartOperation(pnode, ig_index, load)
759 .template Cast<LoadOp>();
760 DCHECK_EQ(start.base(), load.base());
761
762 auto base = __ MapToNewGraph(load.base());
763 // We need to use load's index here because there may be different
764 // ChangeOps derived from the same index. If start is not this load, it is
765 // possible that the ChangeOp of start's index has not been visited yet.
766 auto index = __ MapToNewGraph(load.index());
767 og_index = __ Load(base, index, load.kind,
769 pnode->SetRevectorizedNode(og_index);
770 }
771
772 // Emit extract op if needed.
773 return GetExtractOpIfNeeded(pnode, ig_index, og_index);
774 }
775
777 PackNode* pnode = analyzer_.GetPackNode(ig_index);
778 if (!pnode) {
779 return Adapter::ReduceInputGraphStore(ig_index, store);
780 }
781
782 OpIndex og_index = pnode->RevectorizedNode();
783 // Skip revectorized node.
784 if (!og_index.valid()) {
785 const StoreOp& start =
786 (analyzer_.GetStartOperation(pnode, ig_index, store))
787 .template Cast<StoreOp>();
788 DCHECK_EQ(start.base(), store.base());
789
790 // It's possible that an OOB trap occurs at the higher 128-bit address
791 // after the lower 128-bit store is executed. To ensure a consistent
792 // memory state before and after revectorization, emit the first 128-bit
793 // store before the 256-bit revectorized store.
794 if (ig_index == pnode->nodes()[0]) {
795 Adapter::ReduceInputGraphStore(ig_index, store);
796 }
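// E.g. for two consecutive 16-byte stores at offsets 0 and 16 where the
// store at offset 16 is out of bounds: keeping the lower 128-bit store
// ensures bytes [0, 16) are written exactly as in the unvectorized code
// before the 256-bit store traps.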
797
798 auto base = __ MapToNewGraph(store.base());
799 // We need to use store's index here because there may be different
800 // ChangeOps derived from the same index. If start is not this store, it is
801 // possible that the ChangeOp of start's index has not been visited yet.
802 auto index = __ MapToNewGraph(store.index());
803 V<Simd256> value = analyzer_.GetReducedInput(pnode);
804 DCHECK(value.valid());
805
806 __ Store(base, index, value, store.kind, MemoryRepresentation::Simd256(),
807 store.write_barrier, start.offset);
808
809 // Set an arbitrary valid OpIndex here to skip reducing this node later.
810 pnode->SetRevectorizedNode(ig_index);
811 }
812
813 // No extract op needed for Store.
814 return OpIndex::Invalid();
815 }
816
817 OpIndex REDUCE_INPUT_GRAPH(Phi)(OpIndex ig_index, const PhiOp& phi) {
818 if (phi.rep == RegisterRepresentation::Simd128()) {
819 if (auto pnode = analyzer_.GetPackNode(ig_index)) {
820 OpIndex og_index = pnode->RevectorizedNode();
821
822 // Don't reduce revectorized node.
823 if (!og_index.valid()) {
825 og_index = __ ResolvePhi(
826 phi,
827 [&](OpIndex ind, int block_id, int old_block_id = 0) {
828 return analyzer_.GetReducedInput(pnode, old_block_id);
829 },
831 pnode->SetRevectorizedNode(og_index);
832 }
833
834 OpIndex extract_op_index =
835 GetExtractOpIfNeeded(pnode, ig_index, og_index);
836 // If phis are not mapped to anything in the new graph,
837 // they will be skipped in FixLoopPhis in the copying phase.
838 // Return og_index to create the mapping.
839 if (extract_op_index == OpIndex::Invalid()) {
840 return og_index;
841 } else {
842 return extract_op_index;
843 }
844 }
845 }
846
847 return Adapter::ReduceInputGraphPhi(ig_index, phi);
848 }
849
850 void FixLoopPhi(const PhiOp& input_phi, OpIndex output_index,
851 Block* output_graph_loop) {
852 if (input_phi.rep == RegisterRepresentation::Simd128()) {
853 OpIndex phi_index = __ input_graph().Index(input_phi);
854 DCHECK(phi_index.valid());
855 if (auto* pnode = analyzer_.GetPackNode(phi_index)) {
856 auto pending_index = pnode->RevectorizedNode();
857 DCHECK(pending_index.valid());
858 if (pending_index.valid() &&
859 output_graph_loop->Contains(pending_index)) {
860 // Need to skip the already-replaced op.
861 if (auto* pending_phi = __ output_graph()
862 .Get(pending_index)
863 .template TryCast<PendingLoopPhiOp>()) {
864 __ output_graph().template Replace<PhiOp>(
865 pending_index,
866 base::VectorOf({pending_phi -> first(),
867 analyzer_.GetReducedInput(pnode, 1)}),
869 return;
870 }
871 }
872 }
873 }
874
875 return Adapter::FixLoopPhi(input_phi, output_index, output_graph_loop);
876 }
877
879 const Simd128UnaryOp& unary) {
880 PackNode* pnode = analyzer_.GetPackNode(ig_index);
881 if (!pnode || !pnode->IsDefaultPackNode()) {
882 return Adapter::ReduceInputGraphSimd128Unary(ig_index, unary);
883 }
884
885 V<Simd256> og_index = pnode->RevectorizedNode();
886 // Skip revectorized node.
887 if (!og_index.valid()) {
888 V<Simd256> input = analyzer_.GetReducedInput(pnode);
889 if (!input.valid()) {
890 V<Simd128> input_128 = __ MapToNewGraph(unary.input());
891 og_index = __ Simd256Unary(input_128, GetSimd256UnaryKind(unary.kind));
892 } else {
893 og_index = __ Simd256Unary(input, GetSimd256UnaryKind(unary.kind));
894 }
895 pnode->SetRevectorizedNode(og_index);
896 }
897 return GetExtractOpIfNeeded(pnode, ig_index, og_index);
898 }
899
901 const Simd128BinopOp& op) {
902 PackNode* pnode = analyzer_.GetPackNode(ig_index);
903 if (!pnode || !pnode->IsDefaultPackNode()) {
904 return Adapter::ReduceInputGraphSimd128Binop(ig_index, op);
905 }
906
907 V<Simd256> og_index = pnode->RevectorizedNode();
908 // Skip revectorized node.
909 if (!og_index.valid()) {
910 if (pnode->GetOperandsSize() < 2) {
911 V<Simd128> left = __ MapToNewGraph(op.left());
912 V<Simd128> right = __ MapToNewGraph(op.right());
913 og_index = __ Simd256Binop(left, right, GetSimd256BinOpKind(op.kind));
914 } else {
915 V<Simd256> left = analyzer_.GetReducedInput(pnode, 0);
916 V<Simd256> right = analyzer_.GetReducedInput(pnode, 1);
917 og_index = __ Simd256Binop(left, right, GetSimd256BinOpKind(op.kind));
918 }
919 pnode->SetRevectorizedNode(og_index);
920 }
921 return GetExtractOpIfNeeded(pnode, ig_index, og_index);
922 }
923
925 const Simd128ShiftOp& op) {
926 PackNode* pnode = analyzer_.GetPackNode(ig_index);
927 if (!pnode) {
928 return Adapter::ReduceInputGraphSimd128Shift(ig_index, op);
929 }
930
931 V<Simd256> og_index = pnode->RevectorizedNode();
932 // Skip revectorized node.
933 if (!og_index.valid()) {
934 V<Simd256> input = analyzer_.GetReducedInput(pnode);
935 DCHECK(input.valid());
936 V<Word32> shift = __ MapToNewGraph(op.shift());
937 og_index = __ Simd256Shift(input, shift, GetSimd256ShiftOpKind(op.kind));
938 pnode->SetRevectorizedNode(og_index);
939 }
940 return GetExtractOpIfNeeded(pnode, ig_index, og_index);
941 }
942
944 V<Simd128> ig_index, const Simd128TernaryOp& ternary) {
945 PackNode* pnode = analyzer_.GetPackNode(ig_index);
946 if (!pnode) {
947 return Adapter::ReduceInputGraphSimd128Ternary(ig_index, ternary);
948 }
949
950 V<Simd256> og_index = pnode->RevectorizedNode();
951 // Skip revectorized node.
952 if (!og_index.valid()) {
953 V<Simd256> first = analyzer_.GetReducedInput(pnode, 0);
955 V<Simd256> third = analyzer_.GetReducedInput(pnode, 2);
956
957 og_index = __ Simd256Ternary(first, second, third,
958 GetSimd256TernaryKind(ternary.kind));
959
960 pnode->SetRevectorizedNode(og_index);
961 }
962 return GetExtractOpIfNeeded(pnode, ig_index, og_index);
963 }
964
966 const Simd128SplatOp& op) {
967 PackNode* pnode = analyzer_.GetPackNode(ig_index);
968 if (!pnode) {
969 return Adapter::ReduceInputGraphSimd128Splat(ig_index, op);
970 }
971
972 V<Simd256> og_index = pnode->RevectorizedNode();
973 // Skip revectorized node.
974 if (!og_index.valid()) {
975 og_index = __ Simd256Splat(__ MapToNewGraph(op.input()),
976 Get256SplatOpKindFrom128(op.kind));
977
978 pnode->SetRevectorizedNode(og_index);
979 }
980 return GetExtractOpIfNeeded(pnode, ig_index, og_index);
981 }
982
984 const Simd128ShuffleOp& op) {
985 PackNode* p = analyzer_.GetPackNode(ig_index);
986 if (!p) {
987 return Adapter::ReduceInputGraphSimd128Shuffle(ig_index, op);
988 }
989 DCHECK_EQ(op.kind, Simd128ShuffleOp::Kind::kI8x16);
990
992 V<Simd256> og_index = pnode->RevectorizedNode();
993 // Skip revectorized node.
994 if (!og_index.valid()) {
996 switch (kind) {
999 const bool is_32 =
1001
1002 const OpIndex load_index =
1003 op.input(pnode->info().splat_index() >> (is_32 ? 2 : 1));
1004 const LoadOp& load =
1005 __ input_graph().Get(load_index).template Cast<LoadOp>();
1006
1007 const int bytes_per_lane = is_32 ? 4 : 8;
1008 const int splat_index = pnode->info().splat_index() * bytes_per_lane;
1009 const int offset = splat_index + load.offset;
1010
1011 V<WordPtr> base = __ WordPtrAdd(__ MapToNewGraph(load.base()),
1013
1014 V<WordPtr> index = load.index().has_value()
1015 ? __ MapToNewGraph(load.index().value())
1016 : __ IntPtrConstant(0);
1017
1018 const Simd256LoadTransformOp::TransformKind transform_kind =
1019 is_32 ? Simd256LoadTransformOp::TransformKind::k32Splat
1020 : Simd256LoadTransformOp::TransformKind::k64Splat;
1021 og_index = __ Simd256LoadTransform(base, index, load.kind,
1022 transform_kind, 0);
1023 pnode->SetRevectorizedNode(og_index);
1024 break;
1025 }
1027 const Simd128ShuffleOp& op0 = __ input_graph()
1028 .Get(pnode -> nodes()[0])
1029 .template Cast<Simd128ShuffleOp>();
1030
1031 V<Simd128> load_transform_idx =
1032 __ input_graph()
1033 .Get(op0.left())
1034 .template Is<Simd128LoadTransformOp>()
1035 ? op0.left()
1036 : op0.right();
1037 const Simd128LoadTransformOp& load_transform =
1038 __ input_graph()
1039 .Get(load_transform_idx)
1040 .template Cast<Simd128LoadTransformOp>();
1041 DCHECK_EQ(load_transform.transform_kind,
1042 Simd128LoadTransformOp::TransformKind::k64Zero);
1043 V<WordPtr> base = __ MapToNewGraph(load_transform.base());
1044 V<WordPtr> index = __ MapToNewGraph(load_transform.index());
1045 og_index = __ Simd256LoadTransform(
1046 base, index, load_transform.load_kind,
1047 Simd256LoadTransformOp::TransformKind::k8x8U,
1048 load_transform.offset);
1049 pnode->SetRevectorizedNode(og_index);
1050 break;
1051 }
1052#ifdef V8_TARGET_ARCH_X64
1053 case ShufflePackNode::SpecificInfo::Kind::kShufd: {
1054 V<Simd256> og_left = analyzer_.GetReducedInput(pnode, 0);
1055 DCHECK_EQ(og_left, analyzer_.GetReducedInput(pnode, 1));
1056 og_index = __ Simd256Shufd(og_left, pnode->info().shufd_control());
1057 pnode->SetRevectorizedNode(og_index);
1058 break;
1059 }
1060 case ShufflePackNode::SpecificInfo::Kind::kShufps: {
1061 V<Simd256> og_left = analyzer_.GetReducedInput(pnode, 0);
1062 V<Simd256> og_right = analyzer_.GetReducedInput(pnode, 1);
1063 og_index = __ Simd256Shufps(og_left, og_right,
1064 pnode->info().shufps_control());
1065 pnode->SetRevectorizedNode(og_index);
1066 break;
1067 }
1068 case ShufflePackNode::SpecificInfo::Kind::kS32x8UnpackLow: {
1069 V<Simd256> og_left = analyzer_.GetReducedInput(pnode, 0);
1070 V<Simd256> og_right = analyzer_.GetReducedInput(pnode, 1);
1071 og_index = __ Simd256Unpack(og_left, og_right,
1072 Simd256UnpackOp::Kind::k32x8Low);
1073 pnode->SetRevectorizedNode(og_index);
1074 break;
1075 }
1076 case ShufflePackNode::SpecificInfo::Kind::kS32x8UnpackHigh: {
1077 V<Simd256> og_left = analyzer_.GetReducedInput(pnode, 0);
1078 V<Simd256> og_right = analyzer_.GetReducedInput(pnode, 1);
1079 og_index = __ Simd256Unpack(og_left, og_right,
1080 Simd256UnpackOp::Kind::k32x8High);
1081 pnode->SetRevectorizedNode(og_index);
1082 break;
1083 }
1084#endif // V8_TARGET_ARCH_X64
1085 default:
1086 UNREACHABLE();
1087 }
1088 }
1089 return GetExtractOpIfNeeded(pnode, ig_index, og_index);
1090 }
1091
1093 OpIndex ig_index, const Simd128ReplaceLaneOp& replace) {
1094 PackNode* pnode = analyzer_.GetPackNode(ig_index);
1095 if (!pnode || !pnode->IsBundlePackNode()) {
1096 return Adapter::ReduceInputGraphSimd128ReplaceLane(ig_index, replace);
1097 }
1098
1099 V<Simd256> og_index = pnode->RevectorizedNode();
1100 // Don't reduce revectorized node.
1101 if (!og_index.valid()) {
1102 const BundlePackNode* bundle_pnode = pnode->AsBundlePackNode();
1103 V<Simd128> base_index = __ MapToNewGraph(bundle_pnode->base());
1104 V<Simd128> i16x8_index = base_index;
1105 V<Simd256> i32x8_index;
1106 if (bundle_pnode->is_sign_extract()) {
1107 if (bundle_pnode->lane_size() == 1) {
1108 if (bundle_pnode->offset() == 0) {
1109 i16x8_index = __ Simd128Unary(
1110 base_index, Simd128UnaryOp::Kind::kI16x8SConvertI8x16Low);
1111 } else {
1112 DCHECK_EQ(bundle_pnode->offset(), 8);
1113 i16x8_index = __ Simd128Unary(
1114 base_index, Simd128UnaryOp::Kind::kI16x8SConvertI8x16High);
1115 }
1116 }
1117 i32x8_index = __ Simd256Unary(
1118 i16x8_index, Simd256UnaryOp::Kind::kI32x8SConvertI16x8);
1119 } else {
1120 if (bundle_pnode->lane_size() == 1) {
1121 if (bundle_pnode->offset() == 0) {
1122 i16x8_index = __ Simd128Unary(
1123 base_index, Simd128UnaryOp::Kind::kI16x8UConvertI8x16Low);
1124 } else {
1125 DCHECK_EQ(bundle_pnode->offset(), 8);
1126 i16x8_index = __ Simd128Unary(
1127 base_index, Simd128UnaryOp::Kind::kI16x8UConvertI8x16High);
1128 }
1129 }
1130 i32x8_index = __ Simd256Unary(
1131 i16x8_index, Simd256UnaryOp::Kind::kI32x8UConvertI16x8);
1132 }
1133
1134 if (bundle_pnode->is_sign_convert()) {
1135 og_index = __ Simd256Unary(i32x8_index,
1136 Simd256UnaryOp::Kind::kF32x8SConvertI32x8);
1137 } else {
1138 og_index = __ Simd256Unary(i32x8_index,
1139 Simd256UnaryOp::Kind::kF32x8UConvertI32x8);
1140 }
1141
1142 pnode->SetRevectorizedNode(og_index);
1143 }
1144 return GetExtractOpIfNeeded(pnode, ig_index, og_index);
1145 }
1146
1147 void ReduceInputsOfOp(OpIndex cur_index, OpIndex op_index) {
1148 // Reduce all the operations in op_index's input tree whose indices are
1149 // bigger than cur_index. The traversal is done in a DFS manner
1150 // to make sure all inputs are emitted before their uses.
1151 const Block* current_input_block = Asm().current_input_block();
1152 std::stack<OpIndex> inputs;
1153 ZoneUnorderedSet<OpIndex> visited(Asm().phase_zone());
1154 inputs.push(op_index);
1155
1156 while (!inputs.empty()) {
1157 OpIndex idx = inputs.top();
1158 if (visited.find(idx) != visited.end()) {
1159 inputs.pop();
1160 continue;
1161 }
1162
1163 const Operation& op = __ input_graph().Get(idx);
1164 bool has_unvisited_inputs = false;
1165 for (OpIndex input : op.inputs()) {
1166 if (input > cur_index && visited.find(input) == visited.end()) {
1167 inputs.push(input);
1168 has_unvisited_inputs = true;
1169 }
1170 }
1171
1172 if (!has_unvisited_inputs) {
1173 inputs.pop();
1174 visited.insert(idx);
1175
1176 // op_index will be reduced later.
1177 if (idx == op_index) continue;
1178
1179 DCHECK(!Asm().input_graph().Get(idx).template Is<PhiOp>());
1180 Asm().template VisitOpAndUpdateMapping<false>(idx, current_input_block);
1181 }
1182 }
1183 }
1184
1185 template <typename Op, typename Continuation>
1187 OpIndex* og_index) {
1188 std::array<OpIndex, 2> v;
1189 DCHECK_EQ(pnode->nodes().size(), 2);
1190 // The operation order in pnode is determined by the store or reduce
1191 // seed when building the SLPTree. It is not guaranteed to align with
1192 // the visiting order in each basic block of the input graph. E.g. we
1193 // can have a block containing the operations {a1, a2, b1, b2}, and the
1194 // SLPTree can be pnode1: (a2, a1), pnode2: (b1, b2) if a2 is an input
1195 // of b1, and a1 is an input of b2.
1196 for (int i = 0; i < static_cast<int>(pnode->nodes().size()); i++) {
1197 OpIndex cur_index = pnode->nodes()[i];
1198 if ((*og_index).valid() && cur_index == ig_index) {
1199 v[i] = *og_index;
1200 } else {
1201 // The current index may already have been reduced by an IntersectPackNode.
1202 v[i] = __ template MapToNewGraph<true>(cur_index);
1203 }
1204
1205 if (v[i].valid()) continue;
1206
1207 if (cur_index != ig_index) {
1208 ReduceInputsOfOp(ig_index, cur_index);
1209 }
1210 const Op& op = Asm().input_graph().Get(cur_index).template Cast<Op>();
1211 v[i] = Continuation{this}.ReduceInputGraph(cur_index, op);
1212
1213 if (cur_index == ig_index) {
1214 *og_index = v[i];
1215 } else {
1216 // We have to create the mapping as cur_index may also exist in another
1217 // IntersectPackNode and be reduced again.
1218 __ CreateOldToNewMapping(cur_index, v[i]);
1219 }
1220 }
1221
1222 OpIndex revec_index = __ SimdPack128To256(v[0], v[1]);
1223 pnode->SetRevectorizedNode(revec_index);
1224 }
1225
1226 template <typename Op, typename Continuation>
1228 OpIndex og_index;
1229 // Reduce ForcePackNode
1230 if (PackNode* p = analyzer_.GetPackNode(ig_index);
1231 p && p->IsForcePackNode()) {
1232 // Handle force packing nodes.
1233 ForcePackNode* pnode = p->AsForcePackNode();
1234 if (!pnode->RevectorizedNode().valid()) {
1235 switch (pnode->force_pack_type()) {
1236 case ForcePackNode::kSplat: {
1237 // The og_index may already have been reduced by an IntersectPackNode.
1238 OpIndex reduced_index = __ template MapToNewGraph<true>(ig_index);
1239 if (!reduced_index.valid()) {
1240 og_index = reduced_index =
1241 Continuation{this}.ReduceInputGraph(ig_index, op);
1242 }
1243 OpIndex revec_index =
1244 __ SimdPack128To256(reduced_index, reduced_index);
1245 pnode->SetRevectorizedNode(revec_index);
1246 break;
1247 }
1250 &og_index);
1251 break;
1252 }
1253 }
1254 }
1255 }
1256
1257 // Reduce IntersectPackNode
1258 if (auto intersect_packnodes = analyzer_.GetIntersectPackNodes(ig_index)) {
1259 for (PackNode* pnode : *intersect_packnodes) {
1260 if (!(pnode->RevectorizedNode()).valid()) {
1262 &og_index);
1263 }
1264 }
1265 }
1266
1267 if (og_index.valid()) {
1268 return og_index;
1269 }
1270
1271 if (__ template MapToNewGraph<true>(ig_index).valid()) {
1272 // The op was already emitted while emitting the input trees of the
1273 // force-packed right node.
1274 return OpIndex::Invalid();
1275 }
1276
1277 return Continuation{this}.ReduceInputGraph(ig_index, op);
1278 }
1279
1280 private:
1281 static Simd256UnaryOp::Kind GetSimd256UnaryKind(
1282 Simd128UnaryOp::Kind simd128_kind) {
1283 switch (simd128_kind) {
1284#define UNOP_KIND_MAPPING(from, to) \
1285 case Simd128UnaryOp::Kind::k##from: \
1286 return Simd256UnaryOp::Kind::k##to;
1288#undef UNOP_KIND_MAPPING
1289
1290#define SIGN_EXTENSION_UNOP_KIND_MAPPING(from_1, to, from_2) \
1291 case Simd128UnaryOp::Kind::k##from_1: \
1292 return Simd256UnaryOp::Kind::k##to; \
1293 case Simd128UnaryOp::Kind::k##from_2: \
1294 return Simd256UnaryOp::Kind::k##to;
1296#undef SIGN_EXTENSION_UNOP_KIND_MAPPING
1297 default:
1298 UNIMPLEMENTED();
1299 }
1300 }
1301
1302 static Simd256BinopOp::Kind GetSimd256BinOpKind(Simd128BinopOp::Kind kind) {
1303 switch (kind) {
1304#define BINOP_KIND_MAPPING(from, to) \
1305 case Simd128BinopOp::Kind::k##from: \
1306 return Simd256BinopOp::Kind::k##to;
1308#undef BINOP_KIND_MAPPING
1309
1310#define SIGN_EXTENSION_BINOP_KIND_MAPPING(from_1, to, from_2) \
1311 case Simd128BinopOp::Kind::k##from_1: \
1312 return Simd256BinopOp::Kind::k##to; \
1313 case Simd128BinopOp::Kind::k##from_2: \
1314 return Simd256BinopOp::Kind::k##to;
1316#undef SIGN_EXTENSION_BINOP_KIND_MAPPING
1317 default:
1318 UNIMPLEMENTED();
1319 }
1320 }
1321
1322 static Simd256ShiftOp::Kind GetSimd256ShiftOpKind(Simd128ShiftOp::Kind kind) {
1323 switch (kind) {
1324#define SHIFT_KIND_MAPPING(from, to) \
1325 case Simd128ShiftOp::Kind::k##from: \
1326 return Simd256ShiftOp::Kind::k##to;
1328#undef SHIFT_KIND_MAPPING
1329 default:
1330 UNIMPLEMENTED();
1331 }
1332 }
1333
1334 static Simd256TernaryOp::Kind GetSimd256TernaryKind(
1335 Simd128TernaryOp::Kind simd128_kind) {
1336 switch (simd128_kind) {
1337#define TERNARY_KIND_MAPPING(from, to) \
1338 case Simd128TernaryOp::Kind::k##from: \
1339 return Simd256TernaryOp::Kind::k##to;
1341#undef TERNARY_KIND_MAPPING
1342 default:
1343 UNIMPLEMENTED();
1344 }
1345 }
1346
1347 static Simd256LoadTransformOp::TransformKind Get256LoadTransformKindFrom128(
1348 Simd128LoadTransformOp::TransformKind simd128_kind) {
1349 switch (simd128_kind) {
1350#define TRANSFORM_KIND_MAPPING(from, to) \
1351 case Simd128LoadTransformOp::TransformKind::k##from: \
1352 return Simd256LoadTransformOp::TransformKind::k##to;
1354#undef TRANSFORM_KIND_MAPPING
1355 default:
1356 UNREACHABLE();
1357 }
1358 }
1359
1360 static Simd256SplatOp::Kind Get256SplatOpKindFrom128(
1361 Simd128SplatOp::Kind kind) {
1362 switch (kind) {
1363#define SPLAT_KIND_MAPPING(from, to) \
1364 case Simd128SplatOp::Kind::k##from: \
1365 return Simd256SplatOp::Kind::k##to;
1367 default:
1368 UNREACHABLE();
1369 }
1370 }
1371
1372 const wasm::WasmModule* module_ = __ data() -> wasm_module();
1373 WasmRevecAnalyzer analyzer_ = *__ data() -> wasm_revec_analyzer();
1374};
1375
1377
1378} // namespace v8::internal::compiler::turboshaft
1379
1380#endif // V8_COMPILER_TURBOSHAFT_WASM_REVEC_REDUCER_H_