Files
SAPFOR/src/Transformations/SwapOperators/swap_operators.cpp

299 lines
11 KiB
C++
Raw Normal View History

2025-03-25 15:18:49 +03:00
#include <algorithm>
#include <climits>
#include <cstdlib>
#include <cstring>
#include <iostream>
#include <map>
#include <queue>
#include <set>
#include <string>
#include <unordered_set>
#include <utility>
#include <vector>
2025-03-25 15:18:49 +03:00
2025-06-02 08:54:45 +03:00
#include "../../Utils/errors.h"
#include "../../Utils/SgUtils.h"
#include "../../GraphCall/graph_calls.h"
#include "../../GraphCall/graph_calls_func.h"
#include "../../CFGraph/CFGraph.h"
#include "../../CFGraph/IR.h"
#include "../../GraphLoop/graph_loops.h"
#include "swap_operators.h"
2025-03-25 15:18:49 +03:00
2025-05-13 00:46:32 +03:00
using namespace std;
2025-03-25 15:18:49 +03:00
2025-10-23 14:54:43 +03:00
// Forward declarations; no definition of either function is visible in this file.
// getNameByArg: this file treats an empty returned string as "no name for this argument".
string getNameByArg(SAPFOR::Argument* arg);
// NOTE(review): getSybolByArg is not called anywhere in the visible part of this file.
SgSymbol* getSybolByArg(SAPFOR::Argument* arg);
2025-05-13 00:46:32 +03:00
2025-10-23 14:54:43 +03:00
// Collects the IR blocks whose instruction originates from the source statement `st`.
//
// An IR block is selected when the statement attached to its instruction reports the
// same line number as `st`. Only the line number is compared (not the file name).
//
// Parameters:
//   st     - source statement to look up; a null pointer yields an empty result.
//   Blocks - basic blocks to search; null entries are skipped.
// Returns the matching IR blocks in the order they are encountered.
static vector<SAPFOR::IR_Block*> findInstructionsFromOperator(SgStatement* st, const vector<SAPFOR::BasicBlock*>& Blocks) {
    vector<SAPFOR::IR_Block*> result;
    if (!st)
        return result;

    const int targetLine = st->lineNumber();
    for (SAPFOR::BasicBlock* block : Blocks) {
        if (!block)
            continue;

        // Bind by reference so the instruction list is not copied for every block.
        const auto& instructionsInBlock = block->getInstructions();
        for (SAPFOR::IR_Block* instruction : instructionsInBlock) {
            if (!instruction)
                continue;

            SAPFOR::Instruction* instr = instruction->getInstruction();
            SgStatement* curOperator = instr ? instr->getOperator() : nullptr;
            // Skip instructions that carry no source statement instead of dereferencing null.
            if (!curOperator)
                continue;

            if (curOperator->lineNumber() == targetLine)
                result.push_back(instruction);
        }
    }
    return result;
}
2025-10-23 14:54:43 +03:00
// Statement variants that this file treats as loop heads.
unordered_set<int> loop_tags{FOR_NODE};

// Statement variants that this file treats as control-flow statements.
unordered_set<int> control_tags{IF_NODE, ELSEIF_NODE, DO_WHILE_NODE, WHILE_NODE};

// Presumably the variant that closes a control construct - TODO confirm against the Sage++ tag list.
unordered_set<int> control_end_tags{CONTROL_END};
2025-05-13 00:46:32 +03:00
2025-10-23 14:54:43 +03:00
// Per-statement record built while analyzing a loop body.
struct OperatorInfo {
    SgStatement* stmt;          // the statement this record describes
    set<string> usedVars;       // names taken from the first/second IR arguments of the statement
    set<string> definedVars;    // names taken from the IR results of the statement
    int lineNumber;             // line number reported by the statement at construction time
    bool isMovable = true;      // every statement starts out movable

    // Binds the record to `s` and caches its line number; `s` must not be null.
    OperatorInfo(SgStatement* s)
        : stmt(s),
          lineNumber(s->lineNumber())
    {}
};
2025-05-13 00:46:32 +03:00
2025-10-23 14:54:43 +03:00
// Builds one OperatorInfo per executable statement found between the loop head and the
// loop's last node (walking with lexNext()).
//
// For every statement the IR instructions attributed to it are inspected: names of the
// first and second arguments go to `usedVars`, names of results go to `definedVars`.
// Statements whose variant is listed in `control_tags` are marked as not movable.
//
// Parameters:
//   loop   - loop to analyze; a null pointer yields an empty result.
//   blocks - basic blocks searched for the statements' IR instructions.
//   FullIR - not used by this function.
// Returns the records in lexical order.
static vector<OperatorInfo> analyzeOperatorsInLoop(SgForStmt* loop, const vector<SAPFOR::BasicBlock*>& blocks, map<FuncInfo*, vector<SAPFOR::BasicBlock*>>& FullIR) {
    vector<OperatorInfo> operators;
    if (!loop)
        return operators;

    // Adds the name of `arg` to `names`; absent arguments and empty names are ignored.
    auto recordName = [](SAPFOR::Argument* arg, set<string>& names) {
        if (!arg)
            return;
        string varName = getNameByArg(arg);
        if (!varName.empty())
            names.insert(std::move(varName));
    };

    SgStatement* loopEnd = loop->lastNodeOfStmt();
    for (SgStatement* current = loop->lexNext(); current && current != loopEnd; current = current->lexNext()) {
        if (!isSgExecutableStatement(current))
            continue;

        OperatorInfo opInfo(current);
        for (SAPFOR::IR_Block* irBlock : findInstructionsFromOperator(current, blocks)) {
            SAPFOR::Instruction* instr = irBlock ? irBlock->getInstruction() : nullptr;
            if (!instr)
                continue;

            recordName(instr->getArg1(), opInfo.usedVars);
            recordName(instr->getArg2(), opInfo.usedVars);
            recordName(instr->getResult(), opInfo.definedVars);
        }

        if (control_tags.find(current->variant()) != control_tags.end())
            opInfo.isMovable = false;

        // Move the record: it owns two string sets that would otherwise be copied.
        operators.push_back(std::move(opInfo));
    }
    return operators;
}
2025-10-23 14:54:43 +03:00
// Indexes the analyzed statements by the names they define.
//
// For every record in `operators`, its statement is appended to the list of each name in
// its `definedVars`. Lists keep the order of `operators`. `loop` is not used.
static map<string, vector<SgStatement*>> findVariableDefinitions(SgForStmt* loop, vector<OperatorInfo>& operators) {
    map<string, vector<SgStatement*>> definitionsByName;
    for (size_t idx = 0; idx < operators.size(); ++idx) {
        OperatorInfo& info = operators[idx];
        for (auto nameIt = info.definedVars.begin(); nameIt != info.definedVars.end(); ++nameIt) {
            definitionsByName[*nameIt].push_back(info.stmt);
        }
    }
    return definitionsByName;
}
2025-10-23 14:54:43 +03:00
// Absolute difference between the line numbers of two statements.
// Returns INT_MAX when either pointer is null.
static int calculateDistance(SgStatement* from, SgStatement* to) {
    if (from == nullptr || to == nullptr) {
        return INT_MAX;
    }
    const int delta = to->lineNumber() - from->lineNumber();
    return abs(delta);
}
2025-05-24 19:56:15 +03:00
2025-10-23 14:54:43 +03:00
// Chooses the statement after which `operatorStmt` should be placed.
//
// Candidates are the statements that define a name used by `operatorStmt`. Only
// definitions located on an earlier line are considered, and among them the one with the
// smallest line distance wins. A later definition is never an anchor, because placing a
// read after a later write would make it observe a different value. The statement itself
// is also excluded, since it appears among its own definitions when it both reads and
// writes the same name.
//
// Parameters:
//   operatorStmt   - statement to place.
//   operators      - analysis records; must contain a record for `operatorStmt`.
//   varDefinitions - name -> defining statements index.
// Returns the chosen anchor, or nullptr when `operatorStmt` has no record, is not movable,
// or has no earlier definition of any name it uses.
static SgStatement* findBestPosition(SgStatement* operatorStmt, vector<OperatorInfo>& operators, map<string, vector<SgStatement*>>& varDefinitions) {
    if (!operatorStmt)
        return nullptr;

    auto opIt = std::find_if(operators.begin(), operators.end(),
                             [operatorStmt](const OperatorInfo& op) { return op.stmt == operatorStmt; });
    if (opIt == operators.end() || !opIt->isMovable)
        return nullptr;

    const int ownLine = operatorStmt->lineNumber();
    SgStatement* bestPos = nullptr;
    int minDistance = INT_MAX;
    for (const string& usedVar : opIt->usedVars) {
        // Single lookup; find() also avoids inserting empty entries into the index.
        auto defIt = varDefinitions.find(usedVar);
        if (defIt == varDefinitions.end())
            continue;

        for (SgStatement* defStmt : defIt->second) {
            if (!defStmt || defStmt == operatorStmt || defStmt->lineNumber() >= ownLine)
                continue;

            const int distance = calculateDistance(operatorStmt, defStmt);
            if (distance < minDistance) {
                minDistance = distance;
                bestPos = defStmt;
            }
        }
    }
    return bestPos;
}
2025-10-23 14:54:43 +03:00
// Decides whether statement `from` may be relocated next to statement `to` inside `loop`.
//
// The move is rejected when:
//   - any pointer is null or both statements are the same;
//   - the line number of `to` lies outside the line range of the loop body;
//   - any statement between the two (both ends included) has a variant listed in
//     control_tags, control_end_tags or loop_tags;
//   - the later statement is not reached before the end of the loop.
//
// The scan always runs from the lexically earlier statement (smaller line number) to the
// later one, so the statements that the move actually jumps over are the ones inspected,
// whichever direction the move goes. Construct ends and loop heads are checked as well so
// that a statement is never moved into or out of a nested construct.
static bool canMoveTo(SgStatement* from, SgStatement* to, SgForStmt* loop) {
    if (!from || !to || !loop || from == to)
        return false;

    SgStatement* loopStart = loop->lexNext();
    SgStatement* loopEnd = loop->lastNodeOfStmt();
    if (!loopStart || !loopEnd)
        return false;

    if (to->lineNumber() < loopStart->lineNumber() || to->lineNumber() > loopEnd->lineNumber())
        return false;

    auto isBoundary = [](int variant) {
        return control_tags.count(variant) != 0
            || control_end_tags.count(variant) != 0
            || loop_tags.count(variant) != 0;
    };

    SgStatement* first = from;
    SgStatement* last = to;
    if (to->lineNumber() < from->lineNumber()) {
        first = to;
        last = from;
    }

    for (SgStatement* current = first; current && current != loopEnd; current = current->lexNext()) {
        if (isBoundary(current->variant()))
            return false;
        if (current == last)
            return true;
    }
    // The later statement was not found inside the loop body.
    return false;
}
2025-10-08 23:14:19 +03:00
2025-10-23 14:54:43 +03:00
// Computes a new order for the statements described by `operators`.
//
// Statements are processed in their current order. A movable statement that has an anchor
// (findBestPosition) which is already present in the new order, and for which canMoveTo
// allows the move, is placed after that anchor. Every other statement is appended.
//
// When several statements are placed after the same anchor they keep their original
// relative order: the insertion point is advanced past statements previously placed by
// this rule. Inserting directly after the anchor each time would reverse them.
//
// Returns the statements of `operators` in the new order (same elements, same count).
static vector<SgStatement*> optimizeOperatorOrder(SgForStmt* loop, vector<OperatorInfo>& operators, map<string, vector<SgStatement*>>& varDefinitions) {
    vector<SgStatement*> newOrder;
    newOrder.reserve(operators.size());
    unordered_set<SgStatement*> anchored;   // statements that were placed after an anchor

    for (OperatorInfo& op : operators) {
        SgStatement* stmt = op.stmt;
        SgStatement* anchor = op.isMovable ? findBestPosition(stmt, operators, varDefinitions) : nullptr;

        auto anchorIt = newOrder.end();
        if (anchor && canMoveTo(stmt, anchor, loop))
            anchorIt = std::find(newOrder.begin(), newOrder.end(), anchor);

        if (anchorIt == newOrder.end()) {
            // No usable anchor: the statement keeps its place relative to the ones before it.
            newOrder.push_back(stmt);
            continue;
        }

        auto insertAt = anchorIt + 1;
        while (insertAt != newOrder.end() && anchored.count(*insertAt) != 0)
            ++insertAt;

        newOrder.insert(insertAt, stmt);
        anchored.insert(stmt);
    }
    return newOrder;
}
2025-05-27 15:55:02 +03:00
2025-10-23 14:54:43 +03:00
// Rewrites the body of `loop` so that its statements follow `newOrder`.
//
// Every statement of `newOrder` (except null entries, the loop head and the loop's last
// node) is extracted from the tree and then re-inserted after the loop head in the given
// order, with `loop` passed as the second argument of insertStmtAfter. Comments read
// before extraction are set again on the statement, and line numbers are reassigned
// consecutively starting at the loop head's line + 1.
//
// Each extracted statement is stored together with its own comment, so a failed
// extraction (null result) cannot shift comments onto other statements.
//
// Returns false when `loop` is null or `newOrder` is empty, true otherwise.
static bool applyOperatorReordering(SgForStmt* loop, vector<SgStatement*>& newOrder) {
    if (!loop || newOrder.empty())
        return false;

    SgStatement* loopEnd = loop->lastNodeOfStmt();

    struct Detached {
        SgStatement* stmt;
        bool hasComment;   // distinguishes "no comment" from an empty comment
        string comment;
    };
    vector<Detached> detached;
    detached.reserve(newOrder.size());

    for (SgStatement* stmt : newOrder) {
        if (!stmt || stmt == loop || stmt == loopEnd)
            continue;

        // Read the comment before extraction, as the statement is about to leave the tree.
        const char* text = stmt->comments();
        Detached entry{nullptr, text != nullptr, text ? string(text) : string()};
        entry.stmt = stmt->extractStmt();
        if (entry.stmt)
            detached.push_back(std::move(entry));
    }

    SgStatement* currentPos = loop;
    int lineCounter = loop->lineNumber() + 1;
    for (Detached& entry : detached) {
        // NOTE(review): assumes setComments copies the text, as the previous
        // strdup/setComments/free sequence already relied on - confirm.
        if (entry.hasComment)
            entry.stmt->setComments(&entry.comment[0]);

        entry.stmt->setlineNumber(lineCounter++);
        currentPos->insertStmtAfter(*entry.stmt, *loop);
        currentPos = entry.stmt;
    }

    // Make sure the last re-inserted statement is followed by the loop's last node.
    if (currentPos && currentPos->lexNext() != loopEnd)
        currentPos->setLexNext(*loopEnd);

    return true;
}
2025-10-23 14:54:43 +03:00
// Looks up the basic blocks of the function whose header statement is `st`.
//
// An entry of `FullIR` matches when its function pointer reports the same current process
// file and the same line number as `st`. If several entries match, the blocks of the last
// one in map order are returned; if none matches, the result is empty.
vector<SAPFOR::BasicBlock*> findFuncBlocksByFuncStatement(SgStatement *st, map<FuncInfo*, vector<SAPFOR::BasicBlock*>>& FullIR) {
    Statement* target = (Statement*)st;
    vector<SAPFOR::BasicBlock*> found;

    for (auto it = FullIR.begin(); it != FullIR.end(); ++it) {
        FuncInfo* info = it->first;

        // The file is compared first; the line number is only read for a matching file.
        if (!(info->funcPointer->getCurrProcessFile() == target->getCurrProcessFile()))
            continue;
        if (!(info->funcPointer->lineNumber() == target->lineNumber()))
            continue;

        found = it->second;
    }
    return found;
}
// Finds every loop (variant listed in `loop_tags`) between `st` and its last node and
// maps it to the basic blocks that hold the IR of its body statements.
//
// For each body statement only the first IR block attributed to it is considered; its
// basic block is recorded once per loop. Statements without any IR block are skipped
// rather than calling front() on an empty vector. The blocks of each loop are sorted by
// block number so the result does not depend on pointer addresses.
//
// Parameters:
//   st     - statement to start from (the caller in this file passes a function
//            statement); a null pointer yields an empty map.
//   blocks - basic blocks searched for IR instructions.
// Returns a map with one entry per loop found; the entry may be an empty vector.
map<SgForStmt*, vector<SAPFOR::BasicBlock*>> findAndAnalyzeLoops(SgStatement *st, vector<SAPFOR::BasicBlock*> blocks) {
    map<SgForStmt*, vector<SAPFOR::BasicBlock*>> result;
    if (!st)
        return result;

    SgStatement *lastNode = st->lastNodeOfStmt();
    for (; st && st != lastNode; st = st->lexNext()) {
        if (loop_tags.find(st->variant()) == loop_tags.end())
            continue;

        SgForStmt *forSt = static_cast<SgForStmt*>(st);
        vector<SAPFOR::BasicBlock*>& loopBlocks = result[forSt];
        unordered_set<int> blocks_nums;

        SgStatement *lastLoopNode = st->lastNodeOfStmt();
        for (SgStatement *bodySt = forSt->body(); bodySt && bodySt != lastLoopNode; bodySt = bodySt->lexNext()) {
            const vector<SAPFOR::IR_Block*> irBlocks = findInstructionsFromOperator(bodySt, blocks);
            if (irBlocks.empty() || !irBlocks.front())
                continue;

            SAPFOR::BasicBlock* owner = irBlocks.front()->getBasicBlock();
            if (!owner)
                continue;

            // insert() reports whether the number is new, so one lookup is enough.
            if (blocks_nums.insert(owner->getNumber()).second)
                loopBlocks.push_back(owner);
        }

        std::sort(loopBlocks.begin(), loopBlocks.end(),
                  [](SAPFOR::BasicBlock* lhs, SAPFOR::BasicBlock* rhs) {
                      return lhs->getNumber() < rhs->getNumber();
                  });
    }
    return result;
}
2025-05-22 22:41:09 +03:00
2025-10-23 14:54:43 +03:00
// Entry point of the pass: reorders statements inside the loops of every function of `file`.
//
// For each function its basic blocks are looked up in `FullIR`, its loops are collected,
// and for each loop the statements are analyzed, a new order is computed and applied.
// Functions without a statement or without IR blocks are skipped, because nothing can be
// analyzed for them.
//
// Parameters:
//   file             - file to process; a null pointer makes the call a no-op apart from
//                      the counter update.
//   loopGraph        - not used by this function.
//   FullIR           - per-function basic blocks.
//   countOfTransform - incremented by one on every call.
void runSwapOperators(SgFile *file, std::map<std::string, std::vector<LoopGraph*>>& loopGraph, std::map<FuncInfo*, std::vector<SAPFOR::BasicBlock*>>& FullIR, int& countOfTransform) {
    countOfTransform += 1;
    if (!file)
        return;

    const int funcNum = file->numberOfFunctions();
    for (int i = 0; i < funcNum; ++i) {
        SgStatement *st = file->functions(i);
        if (!st)
            continue;

        vector<SAPFOR::BasicBlock*> blocks = findFuncBlocksByFuncStatement(st, FullIR);
        if (blocks.empty())
            continue;

        map<SgForStmt*, vector<SAPFOR::BasicBlock*>> loopsMapping = findAndAnalyzeLoops(st, blocks);
        // Iterate by reference: copying an entry would copy its whole block vector.
        for (const auto& loopForAnalyze : loopsMapping) {
            SgForStmt* loop = loopForAnalyze.first;
            vector<OperatorInfo> operators = analyzeOperatorsInLoop(loop, loopForAnalyze.second, FullIR);
            map<string, vector<SgStatement*>> varDefinitions = findVariableDefinitions(loop, operators);
            vector<SgStatement*> newOrder = optimizeOperatorOrder(loop, operators, varDefinitions);
            applyOperatorReordering(loop, newOrder);
        }
    }
}