[midend]非全0初始化数组情况下，检查0初始值个数，达到阈值（目前为16）则生成memset指令，以减少大量store操作

2025-08-02 02:33:25 +08:00
parent e48cddab9f
commit bfe218be07
1 changed files with 98 additions and 27 deletions
--- a/src/midend/SysYIRGenerator.cpp
+++ b/src/midend/SysYIRGenerator.cpp
@ -653,7 +653,44 @@ std::any SysYIRGenerator::visitConstDecl(SysYParser::ConstDeclContext *ctx) {
          Value *currentValue = counterValues[k];
          unsigned currentRepeatNum = counterNumbers[k];
          // 检查是否是0，并且重复次数足够大（例如 >16），才用 memset
          if (ConstantInteger *constInt = dynamic_cast<ConstantInteger *>(currentValue)) {
            if (constInt->getInt() == 0 && currentRepeatNum >= 16) { // 阈值可调整（如16、32等）
              // 计算 memset 的起始地址（基于当前线性偏移量）
              std::vector<Value *> memsetStartIndices;
              int tempLinearIndex = linearIndexOffset;
              // 将线性索引转换为多维索引
              for (int dimIdx = dimSizes.size() - 1; dimIdx >= 0; --dimIdx) {
                memsetStartIndices.insert(memsetStartIndices.begin(),
                                          ConstantInteger::get(static_cast<int>(tempLinearIndex % dimSizes[dimIdx])));
                tempLinearIndex /= dimSizes[dimIdx];
              }
              // 构造 GEP 计算 memset 的起始地址
              std::vector<Value *> gepIndicesForMemset;
              gepIndicesForMemset.push_back(ConstantInteger::get(0)); // 跳过 alloca 类型
              gepIndicesForMemset.insert(gepIndicesForMemset.end(), memsetStartIndices.begin(),
                                         memsetStartIndices.end());
              Value *memsetPtr = builder.createGetElementPtrInst(alloca, gepIndicesForMemset);
              // 计算 memset 的字节数 = 元素个数 × 元素大小
              Type *elementType = type;;
              uint64_t elementSize = elementType->getSize();
              Value *size = ConstantInteger::get(currentRepeatNum * elementSize);
              // 生成 memset 指令（假设你的 IRBuilder 有 createMemset 方法）
              builder.createMemsetInst(memsetPtr, ConstantInteger::get(0), size, ConstantInteger::get(0));
              // 跳过这些已处理的0
              linearIndexOffset += currentRepeatNum;
              continue; // 直接进入下一次循环
            }
          }
          for (unsigned i = 0; i < currentRepeatNum; ++i) {
            // 对于非零值，生成对应的 store 指令
            std::vector<Value *> currentIndices;
            int tempLinearIndex = linearIndexOffset + i; // 使用偏移量和当前重复次数内的索引
@ -761,39 +798,73 @@ std::any SysYIRGenerator::visitVarDecl(SysYParser::VarDeclContext *ctx) {
              ConstantInteger::get(0));
        }
        else {
-          
+
          int linearIndexOffset = 0; // 用于追踪当前处理的线性索引的偏移量
          for (int k = 0; k < counterValues.size(); ++k) {
-              // 当前 Value 的值和重复次数
+            // 当前 Value 的值和重复次数
-              Value* currentValue = counterValues[k];
+            Value *currentValue = counterValues[k];
-              unsigned currentRepeatNum = counterNumbers[k];
+            unsigned currentRepeatNum = counterNumbers[k];
            // 检查是否是0，并且重复次数足够大（例如 >16），才用 memset
            if (ConstantInteger *constInt = dynamic_cast<ConstantInteger *>(currentValue)) {
              if (constInt->getInt() == 0 && currentRepeatNum >= 16) { // 阈值可调整（如16、32等）
                // 计算 memset 的起始地址（基于当前线性偏移量）
                std::vector<Value *> memsetStartIndices;
                int tempLinearIndex = linearIndexOffset;
-              for (unsigned i = 0; i < currentRepeatNum; ++i) {
+                // 将线性索引转换为多维索引
-                  std::vector<Value *> currentIndices;
+                for (int dimIdx = dimSizes.size() - 1; dimIdx >= 0; --dimIdx) {
-                  int tempLinearIndex = linearIndexOffset + i; // 使用偏移量和当前重复次数内的索引
+                  memsetStartIndices.insert(memsetStartIndices.begin(),
                                            ConstantInteger::get(static_cast<int>(tempLinearIndex % dimSizes[dimIdx])));
                  tempLinearIndex /= dimSizes[dimIdx];
                }
-                  // 将线性索引转换为多维索引
+                // 构造 GEP 计算 memset 的起始地址
-                  for (int dimIdx = dimSizes.size() - 1; dimIdx >= 0; --dimIdx) {
+                std::vector<Value *> gepIndicesForMemset;
-                      currentIndices.insert(currentIndices.begin(),
+                gepIndicesForMemset.push_back(ConstantInteger::get(0)); // 跳过 alloca 类型
-                                          ConstantInteger::get(static_cast<int>(tempLinearIndex % dimSizes[dimIdx])));
+                gepIndicesForMemset.insert(gepIndicesForMemset.end(), memsetStartIndices.begin(),
-                      tempLinearIndex /= dimSizes[dimIdx];
+                                           memsetStartIndices.end());
-                  }
+
-                  
+                Value *memsetPtr = builder.createGetElementPtrInst(alloca, gepIndicesForMemset);
-                  // 对于局部数组，alloca 本身就是 GEP 的基指针。
+
-                  // GEP 的第一个索引必须是 0，用于“步过”整个数组。
+                // 计算 memset 的字节数 = 元素个数 × 元素大小
-                  std::vector<Value*> gepIndicesForInit;
+                Type *elementType = type;
-                  gepIndicesForInit.push_back(ConstantInteger::get(0));
+                ;
-                  gepIndicesForInit.insert(gepIndicesForInit.end(), currentIndices.begin(), currentIndices.end());
+                uint64_t elementSize = elementType->getSize();
-                  
+                Value *size = ConstantInteger::get(currentRepeatNum * elementSize);
-                  // 计算元素的地址
+
-                  Value* elementAddress = getGEPAddressInst(alloca, gepIndicesForInit);
+                // 生成 memset 指令（假设你的 IRBuilder 有 createMemset 方法）
-                  // 生成 store 指令
+                builder.createMemsetInst(memsetPtr, ConstantInteger::get(0), size, ConstantInteger::get(0));
-                  builder.createStoreInst(currentValue, elementAddress);
+
                // 跳过这些已处理的0
                linearIndexOffset += currentRepeatNum;
                continue; // 直接进入下一次循环
              }
-              // 更新线性索引偏移量，以便下一次迭代从正确的位置开始
+            }
-              linearIndexOffset += currentRepeatNum;
+            for (unsigned i = 0; i < currentRepeatNum; ++i) {
-          }
+              std::vector<Value *> currentIndices;
              int tempLinearIndex = linearIndexOffset + i; // 使用偏移量和当前重复次数内的索引
              // 将线性索引转换为多维索引
              for (int dimIdx = dimSizes.size() - 1; dimIdx >= 0; --dimIdx) {
                currentIndices.insert(currentIndices.begin(),
                                      ConstantInteger::get(static_cast<int>(tempLinearIndex % dimSizes[dimIdx])));
                tempLinearIndex /= dimSizes[dimIdx];
              }
              // 对于局部数组，alloca 本身就是 GEP 的基指针。
              // GEP 的第一个索引必须是 0，用于“步过”整个数组。
              std::vector<Value *> gepIndicesForInit;
              gepIndicesForInit.push_back(ConstantInteger::get(0));
              gepIndicesForInit.insert(gepIndicesForInit.end(), currentIndices.begin(), currentIndices.end());
              // 计算元素的地址
              Value *elementAddress = getGEPAddressInst(alloca, gepIndicesForInit);
              // 生成 store 指令
              builder.createStoreInst(currentValue, elementAddress);
            }
            // 更新线性索引偏移量，以便下一次迭代从正确的位置开始
            linearIndexOffset += currentRepeatNum;
          }
        }
      }
    }