#include "RISCv64Backend.h" #include "RISCv64ISel.h" #include "RISCv64RegAlloc.h" #include "RISCv64AsmPrinter.h" #include "RISCv64Passes.h" #include namespace sysy { // 顶层入口 std::string RISCv64CodeGen::code_gen() { return module_gen(); } unsigned RISCv64CodeGen::getTypeSizeInBytes(Type* type) { if (!type) { assert(false && "Cannot get size of a null type."); return 0; } switch (type->getKind()) { // 对于SysY语言,基本类型int和float都占用4字节 case Type::kInt: case Type::kFloat: return 4; // 指针类型在RISC-V 64位架构下占用8字节 // 虽然SysY没有'int*'语法,但数组变量在IR层面本身就是指针类型 case Type::kPointer: return 8; // 数组类型的总大小 = 元素数量 * 单个元素的大小 case Type::kArray: { auto arrayType = type->as(); // 递归调用以计算元素大小 return arrayType->getNumElements() * getTypeSizeInBytes(arrayType->getElementType()); } // 其他类型,如Void, Label等不占用栈空间,或者不应该出现在这里 default: // 如果遇到未处理的类型,触发断言,方便调试 // assert(false && "Unsupported type for size calculation."); return 0; // 对于像Label或Void这样的类型,返回0是合理的 } } void printInitializer(std::stringstream& ss, const ValueCounter& init_values) { for (size_t i = 0; i < init_values.getValues().size(); ++i) { auto val = init_values.getValues()[i]; auto count = init_values.getNumbers()[i]; if (auto constant = dynamic_cast(val)) { for (unsigned j = 0; j < count; ++j) { if (constant->isInt()) { ss << " .word " << constant->getInt() << "\n"; } else { float f = constant->getFloat(); uint32_t float_bits = *(uint32_t*)&f; ss << " .word " << float_bits << "\n"; } } } } } std::string RISCv64CodeGen::module_gen() { std::stringstream ss; // --- 步骤1:将全局变量(GlobalValue)分为.data和.bss两组 --- std::vector data_globals; std::vector bss_globals; for (const auto& global_ptr : module->getGlobals()) { GlobalValue* global = global_ptr.get(); // 使用更健壮的逻辑来判断是否为大型零初始化数组 bool is_all_zeros = true; const auto& init_values = global->getInitValues(); // 检查初始化值是否全部为0 if (init_values.getValues().empty()) { // 如果 ValueCounter 为空,GlobalValue 的构造函数会确保它是零初始化的 is_all_zeros = true; } else { for (auto val : init_values.getValues()) { if (auto const_val = dynamic_cast(val)) { if (!const_val->isZero()) { is_all_zeros = false; break; } } else { // 如果初始值包含非常量(例如,另一个全局变量的地址),则不认为是纯零初始化 is_all_zeros = false; break; } } } // 使用 getTypeSizeInBytes 检查总大小是否超过阈值 (16个整数 = 64字节) Type* allocated_type = global->getType()->as()->getBaseType(); unsigned total_size = getTypeSizeInBytes(allocated_type); bool is_large_zero_array = is_all_zeros && (total_size > 64); if (is_large_zero_array) { bss_globals.push_back(global); } else { data_globals.push_back(global); } } // --- 步骤2:生成 .bss 段的代码 --- if (!bss_globals.empty()) { ss << ".bss\n"; for (GlobalValue* global : bss_globals) { Type* allocated_type = global->getType()->as()->getBaseType(); unsigned total_size = getTypeSizeInBytes(allocated_type); ss << " .align 3\n"; ss << ".globl " << global->getName() << "\n"; ss << ".type " << global->getName() << ", @object\n"; ss << ".size " << global->getName() << ", " << total_size << "\n"; ss << global->getName() << ":\n"; ss << " .space " << total_size << "\n"; } } // --- 步骤3:生成 .data 段的代码 --- if (!data_globals.empty() || !module->getConsts().empty()) { ss << ".data\n"; // a. 处理普通的全局变量 (GlobalValue) for (GlobalValue* global : data_globals) { Type* allocated_type = global->getType()->as()->getBaseType(); unsigned total_size = getTypeSizeInBytes(allocated_type); ss << " .align 3\n"; ss << ".globl " << global->getName() << "\n"; ss << ".type " << global->getName() << ", @object\n"; ss << ".size " << global->getName() << ", " << total_size << "\n"; ss << global->getName() << ":\n"; bool is_all_zeros = true; const auto& init_values = global->getInitValues(); if (init_values.getValues().empty()) { is_all_zeros = true; } else { for (auto val : init_values.getValues()) { if (auto const_val = dynamic_cast(val)) { if (!const_val->isZero()) { is_all_zeros = false; break; } } else { is_all_zeros = false; break; } } } if (is_all_zeros) { ss << " .zero " << total_size << "\n"; } else { // 对于有非零初始值的变量,保持原有的打印逻辑。 printInitializer(ss, global->getInitValues()); } } // b. 处理全局常量 (ConstantVariable) for (const auto& const_ptr : module->getConsts()) { ConstantVariable* cnst = const_ptr.get(); Type* allocated_type = cnst->getType()->as()->getBaseType(); unsigned total_size = getTypeSizeInBytes(allocated_type); ss << " .align 3\n"; ss << ".globl " << cnst->getName() << "\n"; ss << ".type " << cnst->getName() << ", @object\n"; ss << ".size " << cnst->getName() << ", " << total_size << "\n"; ss << cnst->getName() << ":\n"; printInitializer(ss, cnst->getInitValues()); } } // --- 步骤4:处理函数 (.text段) 的逻辑 --- if (!module->getFunctions().empty()) { ss << ".text\n"; for (const auto& func_pair : module->getFunctions()) { if (func_pair.second.get() && !func_pair.second->getBasicBlocks().empty()) { ss << function_gen(func_pair.second.get()); if (DEBUG) std::cerr << "Function: " << func_pair.first << " generated.\n"; } } } return ss.str(); } std::string RISCv64CodeGen::function_gen(Function* func) { // === 完整的后端处理流水线 === // 阶段 1: 指令选择 (sysy::IR -> LLIR with virtual registers) DEBUG = 0; DEEPDEBUG = 0; RISCv64ISel isel; std::unique_ptr mfunc = isel.runOnFunction(func); // 第一次调试打印输出 std::stringstream ss_after_isel; RISCv64AsmPrinter printer_isel(mfunc.get()); printer_isel.run(ss_after_isel, true); if (DEBUG) { std::cout << ss_after_isel.str(); } if (DEBUG) { std::cerr << "====== Intermediate Representation after Instruction Selection ======\n" << ss_after_isel.str(); } // 阶段 2: 消除帧索引 (展开伪指令,计算局部变量偏移) // 这个Pass必须在寄存器分配之前运行 EliminateFrameIndicesPass efi_pass; efi_pass.runOnMachineFunction(mfunc.get()); if (DEBUG) { std::cerr << "====== stack info after eliminate frame indices ======\n"; mfunc->dumpStackFrameInfo(std::cerr); std::stringstream ss_after_eli; printer_isel.run(ss_after_eli, true); std::cerr << "====== LLIR after eliminate frame indices ======\n" << ss_after_eli.str(); } // 阶段 2: 除法强度削弱优化 (Division Strength Reduction) DivStrengthReduction div_strength_reduction; div_strength_reduction.runOnMachineFunction(mfunc.get()); // 阶段 2.1: 指令调度 (Instruction Scheduling) PreRA_Scheduler scheduler; scheduler.runOnMachineFunction(mfunc.get()); // 阶段 3: 物理寄存器分配 (Register Allocation) RISCv64RegAlloc reg_alloc(mfunc.get()); reg_alloc.run(); if (DEBUG) { std::cerr << "====== stack info after reg alloc ======\n"; mfunc->dumpStackFrameInfo(std::cerr); } // 阶段 3.1: 处理被调用者保存寄存器 CalleeSavedHandler callee_handler; callee_handler.runOnMachineFunction(mfunc.get()); if (DEBUG) { std::cerr << "====== stack info after callee handler ======\n"; mfunc->dumpStackFrameInfo(std::cerr); } // 阶段 4: 窥孔优化 (Peephole Optimization) PeepholeOptimizer peephole; peephole.runOnMachineFunction(mfunc.get()); // 阶段 5: 局部指令调度 (Local Scheduling) PostRA_Scheduler local_scheduler; local_scheduler.runOnMachineFunction(mfunc.get()); // 阶段 3.2: 插入序言和尾声 PrologueEpilogueInsertionPass pei_pass; pei_pass.runOnMachineFunction(mfunc.get()); // 阶段 3.3: 大立即数合法化 LegalizeImmediatesPass legalizer; legalizer.runOnMachineFunction(mfunc.get()); // 阶段 6: 代码发射 (Code Emission) std::stringstream ss; RISCv64AsmPrinter printer(mfunc.get()); printer.run(ss); return ss.str(); } } // namespace sysy