Compare commits
15 Commits
libpredict
...
a8f8f44ac1
| Author | SHA1 | Date | |
|---|---|---|---|
|
|
a8f8f44ac1 | ||
| 1c39001e28 | |||
| 7802f538e8 | |||
| 93fa183b63 | |||
| a07a701826 | |||
|
|
e99855cdff | ||
| f07bea4980 | |||
|
|
3de06d9261 | ||
| 678c2cf351 | |||
| 40cfd83de5 | |||
|
|
a0cea2df91 | ||
|
|
4b7df86b8a | ||
| 836894fef1 | |||
| 9ac15eec79 | |||
| 03f565f50b |
@@ -163,6 +163,10 @@ set(PARALLEL_REG src/ParallelizationRegions/ParRegions.cpp
|
||||
src/ParallelizationRegions/resolve_par_reg_conflicts.cpp
|
||||
src/ParallelizationRegions/resolve_par_reg_conflicts.h)
|
||||
|
||||
set(ARRAY_PROP src/ArrayConstantPropagation/propagation.cpp
|
||||
src/ArrayConstantPropagation/propagation.h
|
||||
)
|
||||
|
||||
set(TR_DEAD_CODE src/Transformations/DeadCodeRemoving/dead_code.cpp
|
||||
src/Transformations/DeadCodeRemoving/dead_code.h)
|
||||
set(TR_CP src/Transformations/CheckPoints/checkpoints.cpp
|
||||
@@ -331,9 +335,7 @@ set(MAIN src/Sapfor.cpp
|
||||
src/Utils/PassManager.h)
|
||||
|
||||
set(PREDICTOR src/Predictor/PredictScheme.cpp
|
||||
src/Predictor/PredictScheme.h
|
||||
src/Predictor/PredictSchemeWithLibrary.cpp
|
||||
src/Predictor/PredictSchemeWithLibrary.h)
|
||||
src/Predictor/PredictScheme.h)
|
||||
|
||||
set(LIBPREDICTOR ${libpred_sources}/cluster.cpp
|
||||
${libpred_sources}/predictor.cpp
|
||||
@@ -422,6 +424,7 @@ set(SOURCE_EXE
|
||||
${TRANSFORMS}
|
||||
${PARALLEL_REG}
|
||||
${PRIV}
|
||||
${ARRAY_PROP}
|
||||
${FDVM}
|
||||
${OMEGA}
|
||||
${UTILS}
|
||||
@@ -473,6 +476,7 @@ source_group (GraphLoop FILES ${GR_LOOP})
|
||||
source_group (LoopAnalyzer FILES ${LOOP_ANALYZER})
|
||||
source_group (ParallelizationRegions FILES ${PARALLEL_REG})
|
||||
source_group (PrivateAnalyzer FILES ${PRIV})
|
||||
source_group (ArrayConstantPropagation FILES ${ARRAY_PROP})
|
||||
source_group (FDVM_Compiler FILES ${FDVM})
|
||||
source_group (SageExtension FILES ${OMEGA})
|
||||
source_group (Utils FILES ${UTILS})
|
||||
|
||||
Submodule projects/dvm updated: 4b7ef11871...4d4041a081
Submodule projects/libpredictor updated: e6e805a390...d0772cdb57
301
src/ArrayConstantPropagation/propagation.cpp
Normal file
301
src/ArrayConstantPropagation/propagation.cpp
Normal file
@@ -0,0 +1,301 @@
|
||||
#include "propagation.h"

#include "../Utils/SgUtils.h"

#include <algorithm>
#include <iostream>
#include <string>
#include <unordered_map>
#include <unordered_set>
#include <vector>
|
||||
|
||||
using namespace std;
|
||||
|
||||
static SgStatement* declPlace = NULL;
|
||||
|
||||
// Checks whether every subscript of an index list is an integer literal.
//
// exp - head of the subscript list: each node carries one subscript in lhs()
//       and the next list node in rhs().
//
// Returns true when exp is NULL or when every subscript has variant INT_VAL.
// Returns false as soon as a subscript is missing or is not an INT_VAL.
//
// Every node of the list is inspected, including the last one; the previous
// do/while form stopped before testing the final subscript of a list with
// more than one element.
static bool CheckConstIndexes(SgExpression* exp)
{
    for (SgExpression* node = exp; node; node = node->rhs())
    {
        SgExpression* index = node->lhs();
        if (!index || index->variant() != INT_VAL)
            return false;
    }
    return true;
}
|
||||
|
||||
// Creates a fresh scalar symbol named "__tmp_prop_var<N>__" and registers it in the
// common block "__propagation_common__" of the program unit that owns declPlace.
//
// variableNumber - running counter used to build the name; incremented by one.
// type           - type given to the new symbol and to the returned reference.
//
// If the unit already has a COMM_LIST with that block name, its members are re-read and
// the new variable is added to them. Otherwise a new COMM_LIST is created and either
// chained to the end of the first COMM_STAT found in the unit or placed into a new
// COMM_STAT inserted before declPlace.
//
// Returns a new VAR_REF expression for the created symbol.
static SgExpression* CreateVar(int& variableNumber, SgType* type)
{
    const string commonBlockName = "__propagation_common__";

    const string symbolName = string("__tmp_prop_var") + std::to_string(variableNumber) + "__";
    ++variableNumber;

    SgStatement* unit = declPlace->controlParent();
    SgSymbol* newSymbol = new SgSymbol(VARIABLE_NAME, symbolName.c_str(), *type, *unit);

    SgStatement* commonStat = NULL;   // statement that holds (or will hold) our block
    SgExpression* commonList = NULL;  // COMM_LIST node of our block
    SgStatement* firstCommon = NULL;  // first COMM_STAT of the unit, fallback host for a new block

    // Single walk over the unit: look for our named block and remember the first COMMON statement.
    SgStatement* unitEnd = unit->lastNodeOfStmt();
    for (SgStatement* cur = unit->lexNext(); cur != unitEnd && cur; cur = cur->lexNext())
    {
        if (cur->variant() != COMM_STAT)
            continue;

        if (!firstCommon)
            firstCommon = cur;

        for (SgExpression* item = cur->expr(0); item; item = item->rhs())
        {
            if (item->variant() != COMM_LIST)
                continue;

            const string blockName = item->symbol() ? string(item->symbol()->identifier())
                                                    : string("spf_unnamed");
            if (blockName == commonBlockName)
            {
                commonStat = cur;
                commonList = item;
                break;
            }
        }

        if (commonStat)
            break;
    }

    vector<SgExpression*> members;
    if (commonList)
    {
        // The block exists: rebuild references to the variables it already lists.
        if (SgExpression* declared = commonList->lhs())
        {
            // Members are either wrapped in EXPR_LIST nodes or chained directly through rhs().
            const bool wrapped = declared->variant() == EXPR_LIST;
            for (SgExpression* node = declared; node; node = node->rhs())
            {
                SgExpression* member = wrapped ? node->lhs() : node;

                SgSymbol* memberSymbol = NULL;
                if (member)
                {
                    if (member->symbol())
                        memberSymbol = member->symbol();
                    else if (member->lhs() && member->lhs()->symbol())
                        memberSymbol = member->lhs()->symbol();
                }

                if (memberSymbol)
                    members.push_back(new SgVarRefExp(memberSymbol));
            }
        }
    }
    else
    {
        // No such block yet: create it and attach it to the unit.
        commonStat = firstCommon;

        SgSymbol* blockSymbol = new SgSymbol(COMMON_NAME, commonBlockName.c_str());
        commonList = new SgExpression(COMM_LIST, NULL, NULL, blockSymbol);

        if (commonStat)
        {
            SgExpression* tail = commonStat->expr(0);
            if (tail)
            {
                // Append after the last block already declared by this statement.
                while (tail->rhs())
                    tail = tail->rhs();
                tail->setRhs(commonList);
            }
            else
                commonStat->setExpression(0, commonList);
        }
        else
        {
            commonStat = new SgStatement(COMM_STAT);
            commonStat->setFileName(declPlace->fileName());
            commonStat->setFileId(declPlace->getFileId());
            commonStat->setProject(declPlace->getProject());
            commonStat->setlineNumber(getNextNegativeLineNumber());
            commonStat->setExpression(0, commonList);

            declPlace->insertStmtBefore(*commonStat, *declPlace->controlParent());
        }
    }

    members.push_back(new SgVarRefExp(newSymbol));

    // The vector is reversed before being handed to makeExprList, exactly as before.
    std::reverse(members.begin(), members.end());
    commonList->setLhs(makeExprList(members, false));

    return new SgExpression(VAR_REF, NULL, NULL, newSymbol, type->copyPtr());
}
|
||||
|
||||
// Replaces array element references with integer-literal subscripts on the right-hand
// side of a statement by generated scalar variables.
//
// st              - statement that owns the expression; its expression 1 is replaced when
//                   the whole expression is such an array element.
// exp             - (sub)expression to process; NULL is ignored.
// arrayToVariable - cache from the unparsed text of an array element to the scalar that
//                   stands for it; new entries are added through CreateVar.
// variableNumber  - counter forwarded to CreateVar.
//
// Elements whose symbol type has no baseType() are left untouched.
static void TransformRightPart(SgStatement* st, SgExpression* exp, unordered_map<string, SgExpression*>& arrayToVariable, int& variableNumber)
{
    if (!exp)
        return;

    if (exp->variant() == ARRAY_REF && CheckConstIndexes(exp->lhs()))
    {
        // NOTE(review): this print looks like leftover debug output; kept so that the
        // program's console output does not change.
        cout << st->unparse() << endl;

        // Key the cache by the element's own text. The key used to be an empty string
        // here, which made every such reference share a single temporary.
        const string expUnparsed = exp->unparse();
        auto known = arrayToVariable.find(expUnparsed);
        if (known == arrayToVariable.end())
        {
            SgType* elemType = exp->symbol()->type()->baseType();
            if (!elemType)
                return; // nothing to substitute; avoids inserting and dereferencing a NULL entry
            known = arrayToVariable.emplace(expUnparsed, CreateVar(variableNumber, elemType)).first;
        }
        st->setExpression(1, known->second->copyPtr());
        return;
    }

    SgExpression* subnodes[2] = { exp->lhs(), exp->rhs() };
    for (int i = 0; i < 2; i++)
    {
        SgExpression* sub = subnodes[i];
        SgType* elemType = (sub && sub->variant() == ARRAY_REF) ? sub->symbol()->type()->baseType() : NULL;

        if (elemType && CheckConstIndexes(sub->lhs()))
        {
            const string expUnparsed = sub->unparse();
            auto known = arrayToVariable.find(expUnparsed);
            if (known == arrayToVariable.end())
                known = arrayToVariable.emplace(expUnparsed, CreateVar(variableNumber, elemType)).first;

            SgExpression* toAdd = known->second->copyPtr();
            if (toAdd)
            {
                if (i == 0)
                    exp->setLhs(toAdd);
                else
                    exp->setRhs(toAdd);
            }
        }
        else
        {
            // Not a replaceable element: keep looking inside the operand.
            TransformRightPart(st, sub, arrayToVariable, variableNumber);
        }
    }
}
|
||||
|
||||
// Handles an assignment whose target is an array element with integer-literal subscripts:
// inserts, before st, a new assignment of st's right-hand side to the scalar variable that
// stands for that element.
//
// st              - the original assignment statement.
// exp             - its left-hand side (the array element reference).
// arrayToVariable - cache from the unparsed text of an array element to its scalar;
//                   a new entry is created through CreateVar when needed.
// variableNumber  - counter forwarded to CreateVar.
//
// Nothing is done for T_STRING symbols, when st has no right-hand side, or when no scalar
// exists yet and the symbol type has no baseType() to create one from.
static void TransformLeftPart(SgStatement* st, SgExpression* exp, unordered_map<string, SgExpression*>& arrayToVariable, int& variableNumber)
{
    if (exp->symbol()->type()->variant() == T_STRING)
        return;

    SgExpression* rightPart = st->expr(1);
    if (!rightPart)
        return;

    const string expUnparsed = exp->unparse();
    auto known = arrayToVariable.find(expUnparsed);
    if (known == arrayToVariable.end())
    {
        SgType* elemType = exp->symbol()->type()->baseType();
        if (!elemType)
            return; // previously a NULL entry was inserted here and then dereferenced
        known = arrayToVariable.emplace(expUnparsed, CreateVar(variableNumber, elemType)).first;
    }

    SgStatement* newStatement = new SgStatement(ASSIGN_STAT, NULL, NULL, known->second->copyPtr(), rightPart->copyPtr(), NULL);

    newStatement->setFileId(st->getFileId());
    newStatement->setProject(st->getProject());

    newStatement->setlineNumber(getNextNegativeLineNumber());
    newStatement->setLocalLineNumber(st->lineNumber());
    st->insertStmtBefore(*newStatement, *st->controlParent());
}
|
||||
|
||||
// Entry point of the pass. Walks every statement of every function in every file of the
// project and substitutes generated scalar variables for array elements addressed by
// integer literals:
//   - ASSIGN_STAT: the right-hand side is rewritten by TransformRightPart and a matching
//     left-hand side is handled by TransformLeftPart;
//   - FOR_NODE: the two bounds stored in expression 0 are replaced directly.
// One element-to-scalar cache and one name counter are shared across the whole project.
void ArrayConstantPropagation(SgProject& project)
{
    unordered_map<string, SgExpression*> arrayToVariable;
    int variableNumber = 0;

    // A loop bound qualifies when it is an array element with a base type and literal subscripts.
    auto isConstElement = [](SgExpression* bound) -> bool {
        return bound->variant() == ARRAY_REF
            && bound->symbol()->type()->baseType()
            && CheckConstIndexes(bound->lhs());
    };

    // Returns a fresh copy of the scalar standing for `bound`, creating it on first use.
    auto scalarCopyFor = [&](SgExpression* bound, const string& key) -> SgExpression* {
        if (arrayToVariable.find(key) == arrayToVariable.end())
            arrayToVariable[key] = CreateVar(variableNumber, bound->symbol()->type()->baseType());
        return arrayToVariable[key]->copyPtr();
    };

    for (int fileIdx = 0; fileIdx < project.numberOfFiles(); fileIdx++)
    {
        SgFile* file = &(project.file(fileIdx));
        if (!file)
            continue;

        const int funcNum = file->numberOfFunctions();
        for (int funcIdx = 0; funcIdx < funcNum; ++funcIdx)
        {
            SgStatement* st = file->functions(funcIdx);
            // New declarations produced by CreateVar are placed relative to this statement.
            declPlace = st->lexNext();
            SgStatement* lastNode = st->lastNodeOfStmt();

            while (st != lastNode)
            {
                const int kind = st->variant();
                if (kind == ASSIGN_STAT)
                {
                    if (st->expr(1))
                        TransformRightPart(st, st->expr(1), arrayToVariable, variableNumber);

                    SgExpression* target = st->expr(0);
                    if (target && target->variant() == ARRAY_REF && CheckConstIndexes(target->lhs()))
                        TransformLeftPart(st, target, arrayToVariable, variableNumber);
                }
                else if (kind == FOR_NODE)
                {
                    SgExpression* range = st->expr(0);
                    SgExpression* lowerBound = range->lhs();
                    SgExpression* upperBound = range->rhs();

                    // Both texts are taken before either bound is replaced.
                    const string lowerKey = lowerBound->unparse();
                    const string upperKey = upperBound->unparse();

                    if (isConstElement(upperBound))
                        range->setRhs(scalarCopyFor(upperBound, upperKey));

                    if (isConstElement(lowerBound))
                        range->setLhs(scalarCopyFor(lowerBound, lowerKey));
                }

                st = st->lexNext();
            }
        }
    }
}
|
||||
4
src/ArrayConstantPropagation/propagation.h
Normal file
4
src/ArrayConstantPropagation/propagation.h
Normal file
@@ -0,0 +1,4 @@
|
||||
#pragma once
|
||||
#include "../Utils/SgUtils.h"
|
||||
|
||||
// Runs the array-constant propagation pass over every function of every file in `project`:
// array elements addressed only by integer-literal subscripts, found in assignments and in
// FOR_NODE bounds, are replaced by generated scalar variables (see propagation.cpp).
void ArrayConstantPropagation(SgProject& project);
|
||||
@@ -122,7 +122,6 @@ static LoopGraph* createDirectiveForLoop(LoopGraph *currentLoop, MapToArray &mai
|
||||
if (found == false)
|
||||
{
|
||||
directive->shadowRenew.push_back(make_pair(key, vector<pair<int, int>>()));
|
||||
directive->shadowRenewCorner.push_back(false);
|
||||
|
||||
const DIST::Array *arrayRef = read;
|
||||
for (int i = 0; i < arrayRef->GetDimSize(); ++i)
|
||||
|
||||
@@ -274,7 +274,7 @@ static void convertTrees(const map<DIST::Array*, int> &treesIn, map<int, vector<
|
||||
static DIST::Array* findBestInEqual(vector<DIST::Array*> &arrays, DIST::GraphCSR<int, double, attrType> &reducedG, DIST::Arrays<int> &allArrays)
|
||||
{
|
||||
DIST::Array *retVal = NULL;
|
||||
vector<vector<attrType>> coefsByDims;
|
||||
vector<vector<attrType>> coeffsByDims;
|
||||
for (auto &array : arrays)
|
||||
{
|
||||
vector<int> verts;
|
||||
@@ -285,7 +285,7 @@ static DIST::Array* findBestInEqual(vector<DIST::Array*> &arrays, DIST::GraphCSR
|
||||
{
|
||||
retVal = array;
|
||||
for (auto &V : verts)
|
||||
coefsByDims.push_back(reducedG.GetAllAttributes(V));
|
||||
coeffsByDims.push_back(reducedG.GetAllAttributes(V));
|
||||
}
|
||||
else
|
||||
{
|
||||
@@ -294,11 +294,11 @@ static DIST::Array* findBestInEqual(vector<DIST::Array*> &arrays, DIST::GraphCSR
|
||||
toCmp.push_back(reducedG.GetAllAttributes(V));
|
||||
for (int z = 0; z < toCmp.size(); ++z)
|
||||
{
|
||||
if (toCmp[z].size() && coefsByDims[z].size())
|
||||
if (toCmp[z].size() && coeffsByDims[z].size())
|
||||
{
|
||||
if (toCmp[z].back().first.first > coefsByDims[z].back().first.first)
|
||||
if (toCmp[z].back().first.first > coeffsByDims[z].back().first.first)
|
||||
{
|
||||
coefsByDims = toCmp;
|
||||
coeffsByDims = toCmp;
|
||||
retVal = array;
|
||||
break;
|
||||
}
|
||||
|
||||
@@ -45,10 +45,10 @@ static bool findArrayRefAndCheck(SgExpression *ex, const DIST::Array* currArray,
|
||||
int countOfShadows = 0;
|
||||
for (int i = 0; i < ref->numberOfSubscripts(); ++i)
|
||||
{
|
||||
const vector<int*> &coefs = getAttributes<SgExpression*, int*>(ref->subscript(i), set<int>{ INT_VAL });
|
||||
if (coefs.size() == 1)
|
||||
const vector<int*> &coeffs = getAttributes<SgExpression*, int*>(ref->subscript(i), set<int>{ INT_VAL });
|
||||
if (coeffs.size() == 1)
|
||||
{
|
||||
const pair<int, int> coef(coefs[0][0], coefs[0][1]);
|
||||
const pair<int, int> coef(coeffs[0][0], coeffs[0][1]);
|
||||
auto it = shiftsByAccess[i].find(coef);
|
||||
if (it != shiftsByAccess[i].end())
|
||||
if (it->second != 0)
|
||||
@@ -857,11 +857,6 @@ ParallelDirective::genDirective(File* file, const vector<pair<DIST::Array*, cons
|
||||
shadowRenewShifts[i].resize(shadowRenew[i].second.size());
|
||||
}
|
||||
|
||||
if (shadowRenewCorner.size() == 0)
|
||||
{
|
||||
shadowRenewCorner.resize(shadowRenew.size(), false);
|
||||
}
|
||||
|
||||
string shadowAdd = ", SHADOW_RENEW(";
|
||||
int inserted = 0;
|
||||
|
||||
@@ -904,10 +899,7 @@ ParallelDirective::genDirective(File* file, const vector<pair<DIST::Array*, cons
|
||||
for (auto& elem : genSubscripts(shadowRenew[i1].second, shadowRenewShifts[i1]))
|
||||
newArrayRef->addSubscript(*elem);
|
||||
|
||||
bool needCornerFlag = shadowRenew[i1].second.size() > 1 && needCorner(shadowArray, shiftsByAccess, loop);
|
||||
shadowRenewCorner[i1] = needCornerFlag;
|
||||
|
||||
if (needCornerFlag)
|
||||
if (shadowRenew[i1].second.size() > 1 && needCorner(shadowArray, shiftsByAccess, loop))
|
||||
{
|
||||
SgExpression* tmp = new SgExpression(ARRAY_OP, newArrayRef, NULL, NULL);
|
||||
p->setLhs(*tmp);
|
||||
|
||||
@@ -102,7 +102,6 @@ public:
|
||||
// origin_Name uniqName bounds
|
||||
std::vector<std::pair<std::pair<std::string, std::string>, std::vector<std::pair<int, int>>>> shadowRenew;
|
||||
std::vector<std::vector<std::pair<int, int>>> shadowRenewShifts;
|
||||
std::vector<bool> shadowRenewCorner;
|
||||
|
||||
// origin_Name uniqName bounds
|
||||
std::vector<std::pair<std::pair<std::string, std::string>, std::vector<std::pair<int, int>>>> across;
|
||||
@@ -126,7 +125,6 @@ public:
|
||||
privates = copyFrom.privates;
|
||||
shadowRenew = copyFrom.shadowRenew;
|
||||
shadowRenewShifts = copyFrom.shadowRenewShifts;
|
||||
shadowRenewCorner = copyFrom.shadowRenewCorner;
|
||||
across = copyFrom.across;
|
||||
acrossShifts = copyFrom.acrossShifts;
|
||||
remoteAccess = copyFrom.remoteAccess;
|
||||
@@ -153,7 +151,6 @@ public:
|
||||
on.clear();
|
||||
privates.clear();
|
||||
shadowRenew.clear();
|
||||
shadowRenewCorner.clear();
|
||||
across.clear();
|
||||
acrossShifts.clear();
|
||||
reduction.clear();
|
||||
|
||||
@@ -364,11 +364,11 @@ static inline string calculateShifts(DIST::GraphCSR<int, double, attrType> &redu
|
||||
{
|
||||
if (sharedMemoryParallelization)
|
||||
{
|
||||
for (auto& coefs : currReadOp->first[k].coefficients)
|
||||
for (auto& coeffs : currReadOp->first[k].coefficients)
|
||||
{
|
||||
auto currAccess = coefs.first;
|
||||
auto currAccess = coeffs.first;
|
||||
|
||||
const int currShift = coefs.first.second;
|
||||
const int currShift = coeffs.first.second;
|
||||
|
||||
auto itFound = shiftsByAccess[k].find(currAccess);
|
||||
if (itFound == shiftsByAccess[k].end())
|
||||
@@ -393,9 +393,9 @@ static inline string calculateShifts(DIST::GraphCSR<int, double, attrType> &redu
|
||||
int minShift = 9999999;
|
||||
int maxShift = -9999999;
|
||||
|
||||
for (auto &coefs : currReadOp->first[k].coefficients)
|
||||
for (auto &coeffs : currReadOp->first[k].coefficients)
|
||||
{
|
||||
auto currAccess = coefs.first;
|
||||
auto currAccess = coeffs.first;
|
||||
auto result = DIST::Fx(currAccess, currRuleShadow);
|
||||
|
||||
if (result.first == loopRule.first)
|
||||
@@ -417,7 +417,7 @@ static inline string calculateShifts(DIST::GraphCSR<int, double, attrType> &redu
|
||||
auto it = remoteRegularReads.find(calcForArray);
|
||||
if (it == remoteRegularReads.end())
|
||||
it = remoteRegularReads.insert(it, make_pair(calcForArray, vector<ArrayOp>(calcForArray->GetDimSize())));
|
||||
it->second[k].coefficients.insert(coefs);
|
||||
it->second[k].coefficients.insert(coeffs);
|
||||
}
|
||||
}
|
||||
|
||||
|
||||
@@ -1137,9 +1137,9 @@ static bool isMapped(const vector<ArrayOp> &allOps)
|
||||
bool mapped = false;
|
||||
for (auto &ops : allOps)
|
||||
{
|
||||
for (auto &coefs : ops.coefficients)
|
||||
for (auto &coeffs : ops.coefficients)
|
||||
{
|
||||
if (coefs.first.first != 0)
|
||||
if (coeffs.first.first != 0)
|
||||
{
|
||||
mapped = true;
|
||||
break;
|
||||
|
||||
@@ -247,7 +247,7 @@ static vector<int> matchSubscriptToLoopSymbols(const vector<SgForStmt*> &parentL
|
||||
}
|
||||
}
|
||||
|
||||
pair<int, int> coefs = pair<int, int>(0, 0);
|
||||
pair<int, int> coeffs = pair<int, int>(0, 0);
|
||||
// more than one loop symbol in subscription
|
||||
if (countOfSymbols > 1)
|
||||
{
|
||||
@@ -326,16 +326,16 @@ static vector<int> matchSubscriptToLoopSymbols(const vector<SgForStmt*> &parentL
|
||||
{
|
||||
if (subscr->symbol()->id() == (parentLoops[position]->doName())->id())
|
||||
{
|
||||
coefs.first = 1;
|
||||
coeffs.first = 1;
|
||||
needToCacl = false;
|
||||
}
|
||||
}
|
||||
|
||||
if (needToCacl)
|
||||
getCoefsOfSubscript(coefs, subscr, parentLoops[position]->doName());
|
||||
__spf_print(PRINT_ARRAY_ARCS, " <%d %d> ", coefs.first, coefs.second);
|
||||
getCoefsOfSubscript(coeffs, subscr, parentLoops[position]->doName());
|
||||
__spf_print(PRINT_ARRAY_ARCS, " <%d %d> ", coeffs.first, coeffs.second);
|
||||
|
||||
if (coefs.first == 0) // && coefs.second == 0)
|
||||
if (coeffs.first == 0) // && coeffs.second == 0)
|
||||
{
|
||||
if (currRegime == REMOTE_ACC)
|
||||
{
|
||||
@@ -346,7 +346,7 @@ static vector<int> matchSubscriptToLoopSymbols(const vector<SgForStmt*> &parentL
|
||||
{
|
||||
const pair<bool, string> &arrayRefString = constructArrayRefForPrint(arrayRef, dimNum, origSubscr);
|
||||
__spf_print(1, "WARN: can not calculate index expression for array ref '%s' at line %d\n", arrayRefString.second.c_str(), currLine);
|
||||
addInfoToVectors(loopInfo, parentLoops[position], currOrigArrayS, dimNum, coefs, UNREC_OP, numOfSubscriptions, currentW);
|
||||
addInfoToVectors(loopInfo, parentLoops[position], currOrigArrayS, dimNum, coeffs, UNREC_OP, numOfSubscriptions, currentW);
|
||||
if (side == LEFT)
|
||||
allPositions.clear();
|
||||
|
||||
@@ -371,19 +371,19 @@ static vector<int> matchSubscriptToLoopSymbols(const vector<SgForStmt*> &parentL
|
||||
currOp.resize(numOfSubscriptions);
|
||||
|
||||
//add only uniq
|
||||
auto itAdd = currOp[dimNum].coefficients.find(coefs);
|
||||
auto itAdd = currOp[dimNum].coefficients.find(coeffs);
|
||||
if (itAdd == currOp[dimNum].coefficients.end())
|
||||
itAdd = currOp[dimNum].coefficients.insert(itAdd, make_pair(coefs, currentW));
|
||||
itAdd = currOp[dimNum].coefficients.insert(itAdd, make_pair(coeffs, currentW));
|
||||
}
|
||||
|
||||
if (coefs.first < 0)
|
||||
if (coeffs.first < 0)
|
||||
addInfoToMap(loopInfo, parentLoops[position], currOrigArrayS, arrayRef, dimNum, REMOTE_TRUE, currLine, numOfSubscriptions);
|
||||
else
|
||||
//if we found regular access to array - set it false
|
||||
addInfoToMap(loopInfo, parentLoops[position], currOrigArrayS, arrayRef, dimNum, REMOTE_FALSE, currLine, numOfSubscriptions);
|
||||
}
|
||||
|
||||
if (coefs.first < 0 && sharedMemoryParallelization == 0)
|
||||
if (coeffs.first < 0 && sharedMemoryParallelization == 0)
|
||||
{
|
||||
if (currRegime == DATA_DISTR)
|
||||
{
|
||||
@@ -402,15 +402,15 @@ static vector<int> matchSubscriptToLoopSymbols(const vector<SgForStmt*> &parentL
|
||||
if (side == LEFT)
|
||||
allPositions.clear();
|
||||
else
|
||||
addInfoToVectors(loopInfo, parentLoops[position], currOrigArrayS, dimNum, coefs, UNREC_OP, numOfSubscriptions, currentW);
|
||||
addInfoToVectors(loopInfo, parentLoops[position], currOrigArrayS, dimNum, coeffs, UNREC_OP, numOfSubscriptions, currentW);
|
||||
}
|
||||
}
|
||||
else
|
||||
{
|
||||
if (side == LEFT)
|
||||
addInfoToVectors(loopInfo, parentLoops[position], currOrigArrayS, dimNum, coefs, WRITE_OP, numOfSubscriptions, currentW);
|
||||
addInfoToVectors(loopInfo, parentLoops[position], currOrigArrayS, dimNum, coeffs, WRITE_OP, numOfSubscriptions, currentW);
|
||||
else
|
||||
addInfoToVectors(loopInfo, parentLoops[position], currOrigArrayS, dimNum, coefs, READ_OP, numOfSubscriptions, currentW);
|
||||
addInfoToVectors(loopInfo, parentLoops[position], currOrigArrayS, dimNum, coeffs, READ_OP, numOfSubscriptions, currentW);
|
||||
}
|
||||
}
|
||||
}
|
||||
@@ -418,13 +418,13 @@ static vector<int> matchSubscriptToLoopSymbols(const vector<SgForStmt*> &parentL
|
||||
if (currRegime == ARRAY_ACC_CORNER)
|
||||
{
|
||||
int *valueSubs = new int[2];
|
||||
valueSubs[0] = coefs.first;
|
||||
valueSubs[1] = coefs.second;
|
||||
valueSubs[0] = coeffs.first;
|
||||
valueSubs[1] = coeffs.second;
|
||||
#ifdef __SPF
|
||||
addToCollection(__LINE__, __FILE__, valueSubs, 2);
|
||||
#endif
|
||||
const vector<int*> &coefs = getAttributes<SgExpression*, int*>(subscr, set<int>{ INT_VAL });
|
||||
if (coefs.size() == 0)
|
||||
const vector<int*> &coeffs = getAttributes<SgExpression*, int*>(subscr, set<int>{ INT_VAL });
|
||||
if (coeffs.size() == 0)
|
||||
{
|
||||
subscr->addAttribute(INT_VAL, valueSubs, sizeof(int*));
|
||||
if (position != -1 && allPositions.size() == 1 && position < parentLoops.size())
|
||||
|
||||
@@ -23,7 +23,6 @@
|
||||
#include "expr_transform.h"
|
||||
#include "../LoopAnalyzer/loop_analyzer.h"
|
||||
#include "CFGraph/CFGraph.h"
|
||||
#include "../Utils/utils.h"
|
||||
|
||||
#include "json.hpp"
|
||||
|
||||
@@ -37,109 +36,6 @@ using std::tuple;
|
||||
|
||||
using json = nlohmann::json;
|
||||
|
||||
void runPredictSchemeOld(SgProject &project,
|
||||
vector<vector<size_t>> &topologies,
|
||||
vector<ParallelRegion*> ¶llelRegions,
|
||||
map<string, vector<LoopGraph*>> &loopGraph,
|
||||
map<string, vector<SpfInterval*>> &intervals,
|
||||
map<string, vector<Messages>> &SPF_messages)
|
||||
{
|
||||
int maxSizeDist = 0;
|
||||
for (int z = 0; z < parallelRegions.size(); ++z)
|
||||
{
|
||||
const DataDirective &dataDirectives = parallelRegions[z]->GetDataDir();
|
||||
const vector<int> ¤tVariant = parallelRegions[z]->GetCurrentVariant();
|
||||
|
||||
auto &tmp = dataDirectives.distrRules;
|
||||
vector<pair<DIST::Array*, const DistrVariant*>> currentVar;
|
||||
for (int z1 = 0; z1 < currentVariant.size(); ++z1)
|
||||
currentVar.push_back(std::make_pair(tmp[z1].first, &tmp[z1].second[currentVariant[z1]]));
|
||||
|
||||
for (auto &elem : currentVar)
|
||||
{
|
||||
DIST::Array *array = elem.first;
|
||||
const DistrVariant *var = elem.second;
|
||||
|
||||
int countBlock = 0;
|
||||
for (int z = 0; z < var->distRule.size(); ++z)
|
||||
if (var->distRule[z] == dist::BLOCK)
|
||||
++countBlock;
|
||||
maxSizeDist = std::max(maxSizeDist, countBlock);
|
||||
}
|
||||
}
|
||||
|
||||
SpfInterval *mainIterval = getMainInterval(&project, intervals, SPF_messages);
|
||||
topologies.clear();
|
||||
if (maxSizeDist)
|
||||
{
|
||||
const int procNum = 8;
|
||||
//TODO:
|
||||
//topologies = getTopologies(procNum, maxSizeDist);
|
||||
throw -10;
|
||||
|
||||
const int countOfTop = topologies.size();
|
||||
if (countOfTop < 0)
|
||||
printInternalError(convertFileName(__FILE__).c_str(), __LINE__);
|
||||
|
||||
for (auto &inter : intervals)
|
||||
initTimeForIntervalTree(countOfTop, inter.second);
|
||||
|
||||
for (int z = 0; z < parallelRegions.size(); ++z)
|
||||
{
|
||||
const DataDirective &dataDirectives = parallelRegions[z]->GetDataDir();
|
||||
const vector<int> ¤tVariant = parallelRegions[z]->GetCurrentVariant();
|
||||
DIST::Arrays<int> &allArrays = parallelRegions[z]->GetAllArraysToModify();
|
||||
|
||||
auto &tmp = dataDirectives.distrRules;
|
||||
vector<pair<DIST::Array*, const DistrVariant*>> currentVar;
|
||||
for (int z1 = 0; z1 < currentVariant.size(); ++z1)
|
||||
currentVar.push_back(std::make_pair(tmp[z1].first, &tmp[z1].second[currentVariant[z1]]));
|
||||
|
||||
map<LoopGraph*, ParallelDirective*> parallelDirs;
|
||||
vector<std::tuple<DIST::Array*, vector<long>, pair<string, int>>> allSingleRemotes;
|
||||
for (int i = project.numberOfFiles() - 1; i >= 0; --i)
|
||||
{
|
||||
SgFile *file = &(project.file(i));
|
||||
auto fountInfo = findAllDirectives(file, getObjectForFileFromMap(file->filename(), loopGraph), parallelRegions[z]->GetId());
|
||||
parallelDirs.insert(fountInfo.begin(), fountInfo.end());
|
||||
|
||||
auto fountRem = findAllSingleRemotes(file, parallelRegions[z]->GetId(), parallelRegions);
|
||||
allSingleRemotes.insert(allSingleRemotes.end(), fountRem.begin(), fountRem.end());
|
||||
}
|
||||
//TODO!
|
||||
//int err = predictScheme(parallelRegions[z], currentVar, allArrays.GetArrays(), parallelDirs, intervals, SPF_messages, allSingleRemotes, maxSizeDist, procNum);
|
||||
/*if (err != 0)
|
||||
internalExit = err;*/
|
||||
}
|
||||
|
||||
vector<SpfInterval*> tmp = { mainIterval };
|
||||
aggregatePredictedTimes(tmp);
|
||||
|
||||
int idx = 0;
|
||||
int best = -1;
|
||||
double bestSpeedUp = 0;
|
||||
for (auto &top : topologies)
|
||||
{
|
||||
string outStr = "";
|
||||
for (auto &elem : top)
|
||||
outStr += std::to_string(elem) + " ";
|
||||
double currS = mainIterval->exec_time / mainIterval->predictedTimes[idx];
|
||||
__spf_print(1, "%d: speed up %f for top. %s\n", idx, currS, outStr.c_str());
|
||||
|
||||
if (best == -1 || bestSpeedUp < currS)
|
||||
{
|
||||
bestSpeedUp = currS;
|
||||
best = idx;
|
||||
}
|
||||
++idx;
|
||||
}
|
||||
__spf_print(1, "best topology %d with speed up %f\n", best, bestSpeedUp);
|
||||
}
|
||||
else
|
||||
for (auto &inter : intervals)
|
||||
initTimeForIntervalTree(0, inter.second);
|
||||
}
|
||||
|
||||
static void fillParallel(SgExpression *exp, ParallelStats &parStats, int &totalScoreComm)
|
||||
{
|
||||
if (exp)
|
||||
@@ -430,7 +326,7 @@ static json parseAlign(const map<DIST::Array*, int>& byPos, SgSymbol* srcArr, Sg
|
||||
list = list->rhs();
|
||||
}
|
||||
|
||||
vector<pair<int, int>> coefs(srcSymbs.size());
|
||||
vector<pair<int, int>> coeffs(srcSymbs.size());
|
||||
list = listTgt;
|
||||
while (list)
|
||||
{
|
||||
@@ -441,8 +337,8 @@ static json parseAlign(const map<DIST::Array*, int>& byPos, SgSymbol* srcArr, Sg
|
||||
has = recSymbolFind(exp, srcSymbs[z].first, VAR_REF);
|
||||
if (has)
|
||||
{
|
||||
getCoefsOfSubscript(coefs[z], exp, srcSymbs[z].second);
|
||||
if (coefs[z].first == 0)
|
||||
getCoefsOfSubscript(coeffs[z], exp, srcSymbs[z].second);
|
||||
if (coeffs[z].first == 0)
|
||||
printInternalError(convertFileName(__FILE__).c_str(), __LINE__);
|
||||
break;
|
||||
}
|
||||
@@ -450,14 +346,14 @@ static json parseAlign(const map<DIST::Array*, int>& byPos, SgSymbol* srcArr, Sg
|
||||
list = list->rhs();
|
||||
}
|
||||
|
||||
for (int z = 0; z < coefs.size(); ++z)
|
||||
for (int z = 0; z < coeffs.size(); ++z)
|
||||
{
|
||||
if (coefs[z].first == 0)
|
||||
if (coeffs[z].first == 0)
|
||||
continue;
|
||||
if (coefs[z].second)
|
||||
align["rules"].push_back({ z, coefs[z].first });
|
||||
if (coeffs[z].second)
|
||||
align["rules"].push_back({ z, coeffs[z].first });
|
||||
else
|
||||
align["rules"].push_back({ z, coefs[z].first, coefs[z].second });
|
||||
align["rules"].push_back({ z, coeffs[z].first, coeffs[z].second });
|
||||
}
|
||||
return align;
|
||||
}
|
||||
|
||||
@@ -60,6 +60,4 @@ public:
|
||||
void processFileToPredict(SgFile *file, PredictorStats &predictorCounts);
|
||||
|
||||
void calculateStatsForPredictor(const std::map<std::string, std::vector<FuncInfo*>>& allFuncInfo, const std::map<std::string, std::map<int, Gcov_info>>& gCovInfo);
|
||||
void parseDvmDirForPredictor(const std::map<std::tuple<int, std::string, std::string>, std::pair<DIST::Array*, DIST::ArrayAccessInfo*>>& declaredArrays, const std::map<std::string, CommonBlock*>& commonBlocks, const std::map<std::string, std::vector<FuncInfo*>>& allFuncInfo, const std::map<std::string, std::map<int, Gcov_info>>& gCovInfo);
|
||||
|
||||
void runPredictSchemeOld(SgProject &project, std::vector<std::vector<size_t>> &topologies, std::vector<ParallelRegion*> ¶llelRegions, std::map<std::string, std::vector<LoopGraph*>> &loopGraph, std::map<std::string, std::vector<SpfInterval*>> &intervals, std::map<std::string, std::vector<Messages>> &SPF_messages);
|
||||
void parseDvmDirForPredictor(const std::map<std::tuple<int, std::string, std::string>, std::pair<DIST::Array*, DIST::ArrayAccessInfo*>>& declaredArrays, const std::map<std::string, CommonBlock*>& commonBlocks, const std::map<std::string, std::vector<FuncInfo*>>& allFuncInfo, const std::map<std::string, std::map<int, Gcov_info>>& gCovInfo);
|
||||
@@ -1,439 +0,0 @@
|
||||
#include "leak_detector.h"
|
||||
|
||||
#include <limits>
|
||||
#include <map>
|
||||
#include <vector>
|
||||
#include <string>
|
||||
#include <tuple>
|
||||
|
||||
#include "dvm.h"
|
||||
#include "PredictSchemeWithLibrary.h"
|
||||
#include "../../projects/libpredictor/include/libpredict/predictor.h"
|
||||
#include "../DirectiveProcessing/directive_parser.h"
|
||||
#include "../Distribution/DvmhDirective.h"
|
||||
#include "../ParallelizationRegions/ParRegions.h"
|
||||
#include "../GraphLoop/graph_loops_func.h"
|
||||
#include "../Utils/errors.h"
|
||||
#include "../Utils/utils.h"
|
||||
|
||||
using std::map;
|
||||
using std::pair;
|
||||
using std::string;
|
||||
using std::tuple;
|
||||
using std::vector;
|
||||
|
||||
// Builds a map from the original id of every template array to a new id.
//
// Pass 1 finds the largest id among non-template arrays that appear as the array of a
// distribution rule or as the aligned array of an align rule.
// Pass 2 hands out consecutive ids, starting right after that maximum, to templates in the
// order they are first met: per region, distribution rules first, then the `alignWith`
// side of align rules.
//
// parallelRegions - regions whose data directives are inspected.
// Returns the original-id -> new-id map (empty when no template is met).
map<size_t, size_t> createTemplateIdMapping(const vector<ParallelRegion*>& parallelRegions)
{
    size_t largestArrayId = 0;
    for (ParallelRegion* region : parallelRegions)
    {
        const DataDirective& directives = region->GetDataDir();

        for (const auto& rule : directives.distrRules)
        {
            if (rule.first && !rule.first->IsTemplate())
                largestArrayId = std::max(largestArrayId, (size_t)rule.first->GetId());
        }

        for (const auto& rule : directives.alignRules)
        {
            if (rule.alignArray && !rule.alignArray->IsTemplate())
                largestArrayId = std::max(largestArrayId, (size_t)rule.alignArray->GetId());
        }
    }

    map<size_t, size_t> remapped;
    size_t nextFreeId = largestArrayId + 1;

    // Gives `originalId` the next free id unless it already has one.
    auto assignIfNew = [&remapped, &nextFreeId](size_t originalId) {
        if (remapped.find(originalId) == remapped.end())
            remapped[originalId] = nextFreeId++;
    };

    for (ParallelRegion* region : parallelRegions)
    {
        const DataDirective& directives = region->GetDataDir();

        for (const auto& rule : directives.distrRules)
        {
            if (rule.first && rule.first->IsTemplate())
                assignIfNew(rule.first->GetId());
        }

        for (const auto& rule : directives.alignRules)
        {
            if (rule.alignWith && rule.alignWith->IsTemplate())
                assignIfNew(rule.alignWith->GetId());
        }
    }

    return remapped;
}
|
||||
|
||||
/**
 * Gathers, once, all arguments that are later handed to the libpredict Distribute, Align and
 * ShadowRenew calls, so the same data can be replayed for every candidate topology.
 *
 * For each region the function records:
 *  - one distribute entry per distributed array of the currently selected variant;
 *  - one align entry per alignment rule whose aligned array is distributed;
 *  - one shadow-renew entry per shadow_renew item of the parallel directives found in the
 *    project files for that region.
 *
 * @param project            project whose files are searched for parallel directives
 * @param parallelRegions    regions providing data directives, variants and arrays
 * @param loopGraph          per-file loop graphs passed on to findAllDirectives
 * @param templateIdMapping  replacement ids for template arrays; ids without an entry are kept
 * @return the collected parameter sets
 */
PrecomputedLibpredictParams precomputeLibpredictParams(
    SgProject& project,
    const vector<ParallelRegion*>& parallelRegions,
    const map<string, vector<LoopGraph*>>& loopGraph,
    const map<size_t, size_t>& templateIdMapping)
{
    PrecomputedLibpredictParams collected;

    // Returns the remapped id when the mapping knows this id, the id itself otherwise.
    const auto remapTemplateId = [&templateIdMapping](size_t id)
    {
        const auto found = templateIdMapping.find(id);
        return found != templateIdMapping.end() ? found->second : id;
    };

    for (ParallelRegion* region : parallelRegions)
    {
        const DataDirective& dataDirectives = region->GetDataDir();
        const vector<int>& currentVariant = region->GetCurrentVariant();
        const DIST::Arrays<int>& allArrays = region->GetAllArrays();
        const auto& distrRules = dataDirectives.distrRules;

        // distribute: one entry per rule, using the variant selected for that rule
        for (int ruleIdx = 0; ruleIdx < currentVariant.size(); ++ruleIdx)
        {
            DIST::Array* array = distrRules[ruleIdx].first;
            const DistrVariant& variant = distrRules[ruleIdx].second[currentVariant[ruleIdx]];

            if (!array || array->IsNotDistribute())
                continue;

            const auto isBlockDim = [&variant](int dim)
            {
                return dim < variant.distRule.size() && variant.distRule[dim] == dist::BLOCK;
            };

            PrecomputedDistributeParams params;

            const size_t originalId = array->GetId();
            params.arrayId = array->IsTemplate() ? remapTemplateId(originalId) : originalId;
            params.elemSize = array->GetTypeSize();
            params.array = array;

            const auto& arraySizes = array->GetSizes();
            for (int dim = 0; dim < array->GetDimSize(); ++dim)
            {
                size_t dimSize = arraySizes[dim].second - arraySizes[dim].first + 1;
                params.axisDistributions.emplace_back(
                    dimSize,
                    isBlockDim(dim) ? libpredict::TypeDistribute::BLOCK : libpredict::TypeDistribute::NONE);
            }

            // Shadow edges are recorded only for dimensions that are BLOCK-distributed.
            const auto& shadowSpec = array->GetShadowSpec();
            for (int dim = 0; dim < shadowSpec.size() && dim < array->GetDimSize(); ++dim)
                if (isBlockDim(dim))
                    params.shadowEdges.emplace_back(shadowSpec[dim].first, shadowSpec[dim].second);

            collected.distributeParams.push_back(params);
        }

        // align
        for (const auto& alignRule : dataDirectives.alignRules)
        {
            DIST::Array* aligned = alignRule.alignArray;
            DIST::Array* target = alignRule.alignWith;

            if (!aligned || !target || aligned->IsNotDistribute())
                continue;

            PrecomputedAlignParams params;

            params.arrayId = aligned->GetId();
            const size_t targetId = target->GetId();
            params.distributedArrayId = target->IsTemplate() ? remapTemplateId(targetId) : targetId;
            params.elemSize = aligned->GetTypeSize();
            params.alignArray = aligned;
            params.alignWithArray = target;

            const auto& alignedSizes = aligned->GetSizes();
            for (int dim = 0; dim < aligned->GetDimSize(); ++dim)
            {
                size_t dimSize = alignedSizes[dim].second - alignedSizes[dim].first + 1;
                params.dimensions.push_back(dimSize);
            }

            // One expression per dimension of the target array: the first rule that refers
            // to the dimension wins, otherwise a default-constructed expression is stored.
            for (int dim = 0; dim < target->GetDimSize(); ++dim)
            {
                bool hasRule = false;
                for (int i = 0; i < alignRule.alignRuleWith.size(); ++i)
                {
                    const auto& ruleWith = alignRule.alignRuleWith[i];
                    if (ruleWith.first != dim)
                        continue;

                    const auto& coeffs = ruleWith.second;
                    if (coeffs.first == 0)
                        params.distributionExpressions.emplace_back(coeffs.second);                 // constant
                    else
                        params.distributionExpressions.emplace_back(i, coeffs.first, coeffs.second); // a * I + b

                    hasRule = true;
                    break;
                }

                if (!hasRule)
                    params.distributionExpressions.emplace_back(); // no rule for this dimension
            }

            const auto& alignedShadow = aligned->GetShadowSpec();
            for (int dim = 0; dim < alignedShadow.size() && dim < aligned->GetDimSize(); ++dim)
                params.shadowEdges.emplace_back(alignedShadow[dim].first, alignedShadow[dim].second);

            collected.alignParams.push_back(params);
        }

        // shadow_renew: gather the parallel directives of this region from every file
        map<LoopGraph*, ParallelDirective*> parallelDirs;
        for (int fileIdx = project.numberOfFiles() - 1; fileIdx >= 0; --fileIdx)
        {
            SgFile* file = &(project.file(fileIdx));
            auto foundInfo = findAllDirectives(
                file,
                getObjectForFileFromMap(file->filename(), const_cast<map<string, vector<LoopGraph*>>&>(loopGraph)),
                region->GetId());
            parallelDirs.insert(foundInfo.begin(), foundInfo.end());
        }

        for (auto& dirPair : parallelDirs)
        {
            LoopGraph* loopPtr = dirPair.first;
            ParallelDirective* directive = dirPair.second;
            if (!directive)
                continue;

            for (size_t shadowIdx = 0; shadowIdx < directive->shadowRenew.size(); ++shadowIdx)
            {
                const auto& renewItem = directive->shadowRenew[shadowIdx];
                const string& arrayName = renewItem.first.second; // uniqName
                const vector<pair<int, int>>& bounds = renewItem.second;

                DIST::Array* shadowArray = allArrays.GetArrayByName(arrayName);
                if (shadowArray == NULL || shadowArray->IsNotDistribute())
                    continue;

                PrecomputedShadowRenewParams params;
                params.arrayId = shadowArray->GetId();
                params.shadowArray = shadowArray;

                for (const auto& bound : bounds)
                    params.shadow_renew.emplace_back(static_cast<size_t>(bound.first),
                                                     static_cast<size_t>(bound.second));

                params.corner = directive->shadowRenewCorner[shadowIdx];
                params.number_loop_iterations = loopPtr ? static_cast<size_t>(loopPtr->countOfIters) : 1;

                collected.shadowRenewParams.push_back(params);
            }
        }
    }

    return collected;
}
|
||||
|
||||
double runLibpredictCalc(const vector<size_t>& topology,
|
||||
const string& clusterConfStr,
|
||||
const PrecomputedLibpredictParams& precomputedParams,
|
||||
map<string, vector<Messages>>& SPF_messages)
|
||||
{
|
||||
libpredict::RetInitGrid retInitGrid = libpredict::InitGrid(topology[0], topology[1], topology[2], topology[3]);
|
||||
|
||||
if (retInitGrid != libpredict::INIT_GRID_SUCCESS) {
|
||||
__spf_print(1, "ERROR: Failed to initialize libpredict grid with topology: %zu %zu %zu %zu, return code: %d\n",
|
||||
topology[0], topology[1], topology[2], topology[3], (int)retInitGrid);
|
||||
|
||||
std::wstring messageR, messageE;
|
||||
__spf_printToLongBuf(messageE, L"Failed to initialize libpredict grid with topology: %zu %zu %zu %zu, return code: %d",
|
||||
topology[0], topology[1], topology[2], topology[3], (int)retInitGrid);
|
||||
__spf_printToLongBuf(messageR, R207);
|
||||
getObjectForFileFromMap(clusterConfStr.c_str(), SPF_messages).push_back(Messages(ERROR, 1, messageR, messageE, 1064));
|
||||
return -1;
|
||||
}
|
||||
|
||||
// distribute
|
||||
for (const auto& params : precomputedParams.distributeParams) {
|
||||
libpredict::RetDistribute retDistribute = libpredict::Distribute(
|
||||
params.arrayId, params.elemSize, params.axisDistributions, params.shadowEdges);
|
||||
|
||||
if (retDistribute != libpredict::DISTRIBUTE_SUCCESS) {
|
||||
__spf_print(1, "ERROR: Failed to distribute array '%s' (id=%zu) with libpredict, return code: %d\n",
|
||||
params.array->GetShortName().c_str(), params.arrayId, (int)retDistribute);
|
||||
|
||||
std::wstring messageR, messageE;
|
||||
__spf_printToLongBuf(messageE, L"Failed to distribute array '%s' with libpredict, return code: %d",
|
||||
to_wstring(params.array->GetShortName()).c_str(), (int)retDistribute);
|
||||
__spf_printToLongBuf(messageR, R208);
|
||||
getObjectForFileFromMap(params.array->GetDeclInfo().begin()->first.c_str(), SPF_messages).push_back(Messages(ERROR, params.array->GetDeclInfo().begin()->second, messageR, messageE, 1065));
|
||||
}
|
||||
}
|
||||
|
||||
// align
|
||||
for (const auto& params : precomputedParams.alignParams) {
|
||||
libpredict::RetAlign retAlign = libpredict::Align(
|
||||
params.arrayId, params.distributedArrayId, params.elemSize,
|
||||
params.dimensions, params.distributionExpressions, params.shadowEdges);
|
||||
|
||||
if (retAlign != libpredict::ALIGN_SUCCESS) {
|
||||
__spf_print(1, "ERROR: Failed to align array '%s' (id=%zu) with array '%s' (id=%zu), return code: %d\n",
|
||||
params.alignArray->GetShortName().c_str(), params.arrayId,
|
||||
params.alignWithArray->GetShortName().c_str(), params.distributedArrayId, (int)retAlign);
|
||||
|
||||
std::wstring messageR, messageE;
|
||||
__spf_printToLongBuf(messageE, L"Failed to align array '%s' with array '%s' using libpredict, return code: %d",
|
||||
to_wstring(params.alignArray->GetShortName()).c_str(),
|
||||
to_wstring(params.alignWithArray->GetShortName()).c_str(), (int)retAlign);
|
||||
__spf_printToLongBuf(messageR, R209);
|
||||
getObjectForFileFromMap(params.alignArray->GetDeclInfo().begin()->first.c_str(), SPF_messages).push_back(Messages(ERROR, params.alignArray->GetDeclInfo().begin()->second, messageR, messageE, 1066));
|
||||
}
|
||||
}
|
||||
|
||||
// shadow_renew
|
||||
for (const auto& params : precomputedParams.shadowRenewParams) {
|
||||
libpredict::RetShadowRenew retShadowRenew = libpredict::ShadowRenew(
|
||||
params.arrayId, params.shadow_renew, params.corner, params.number_loop_iterations);
|
||||
|
||||
if (retShadowRenew != libpredict::SHADOW_RENEW_SUCCESS) {
|
||||
__spf_print(1, "ERROR: Failed to process shadow_renew for array '%s' (id=%zu), return code: %d\n",
|
||||
params.shadowArray->GetShortName().c_str(), params.arrayId, (int)retShadowRenew);
|
||||
|
||||
std::wstring messageR, messageE;
|
||||
__spf_printToLongBuf(messageE, L"Failed to process shadow_renew for array '%s' with libpredict, return code: %d",
|
||||
to_wstring(params.shadowArray->GetShortName()).c_str(), (int)retShadowRenew);
|
||||
__spf_printToLongBuf(messageR, R210);
|
||||
getObjectForFileFromMap(params.shadowArray->GetDeclInfo().begin()->first.c_str(), SPF_messages).push_back(Messages(ERROR, params.shadowArray->GetDeclInfo().begin()->second, messageR, messageE, 1067));
|
||||
}
|
||||
}
|
||||
|
||||
return libpredict::GetTime();
|
||||
}
|
||||
|
||||
/**
 * Enumerates processor topologies for the cluster described by "cluster.conf" (looked up in
 * the directory of the first project file), asks libpredict for the predicted time of each
 * one and logs the fastest.
 *
 * The number of grid dimensions in use equals the largest count of BLOCK-distributed
 * dimensions among the currently selected distribution variants, capped at 4. Candidates are
 * the non-increasing tuples (n1 >= n2 >= n3 >= n4) with n1 >= 2 whose product does not exceed
 * the processor count reported by libpredict::InitCluster; dimensions beyond the ones in use
 * are fixed to 1 and dimensions in use must be greater than 1.
 *
 * @param project          project that supplies the file list
 * @param topologies       output: replaced by the list of all enumerated candidate topologies
 * @param parallelRegions  regions providing the distribution rules and selected variants
 * @param loopGraph        per-file loop graphs, forwarded to precomputeLibpredictParams
 * @param SPF_messages     per-file message lists that receive error records
 *
 * The function returns early, after logging, when the cluster cannot be initialised or when
 * a topology evaluation reports failure (-1).
 */
void runPredictScheme(SgProject& project,
                      vector<vector<size_t>>& topologies,
                      const vector<ParallelRegion*>& parallelRegions,
                      map<string, vector<LoopGraph*>>& loopGraph,
                      map<string, vector<Messages>>& SPF_messages)
{
    // calculating maximum dimension of distribution
    int maxSizeDist = 0;
    for (ParallelRegion* region : parallelRegions)
    {
        const DataDirective& dataDirectives = region->GetDataDir();
        const vector<int>& currentVariant = region->GetCurrentVariant();
        const auto& distrRules = dataDirectives.distrRules;

        for (size_t ruleIdx = 0; ruleIdx < currentVariant.size(); ++ruleIdx)
        {
            const DistrVariant& variant = distrRules[ruleIdx].second[currentVariant[ruleIdx]];

            int countBlock = 0;
            for (const auto& axisRule : variant.distRule)
                if (axisRule == dist::BLOCK)
                    ++countBlock;

            maxSizeDist = std::max(maxSizeDist, countBlock);
        }
    }

    // calculating name of a cluster configuration file
    string clusterConfStr;
    if (project.numberOfFiles() > 0)
    {
        string firstFilePath = project.fileName(0);

        // When the path has no separator find_last_of() yields npos and npos + 1 wraps to 0,
        // so the configuration file name is used without a directory prefix.
        size_t lastSlash = firstFilePath.find_last_of("/\\");
        clusterConfStr = firstFilePath.substr(0, lastSlash + 1) + "cluster.conf";
    }

    // creating template ID mapping to avoid conflicts
    map<size_t, size_t> templateIdMapping = createTemplateIdMapping(parallelRegions);

    // Precomputing parameters of directive functions from libpredict
    PrecomputedLibpredictParams precomputedParams = precomputeLibpredictParams(
        project, parallelRegions, loopGraph, templateIdMapping);

    topologies.clear();

    if (maxSizeDist == 0)
    {
        __spf_print(1, "impossible to calculate best topology: project does not contain distribution directives\n");
        return;
    }

    if (maxSizeDist > 4)
        maxSizeDist = 4;

    // Initialize cluster
    int procCount = 0;
    libpredict::RetInitCluster retInitCluster = libpredict::InitCluster(clusterConfStr, procCount);

    if (retInitCluster != libpredict::INIT_CLUSTER_SUCCESS)
    {
        __spf_print(1, "ERROR: Failed to initialize libpredict cluster with config: %s, return code: %d\n", clusterConfStr.c_str(), (int)retInitCluster);

        std::wstring messageR, messageE;
        __spf_printToLongBuf(messageE, L"Failed to initialize libpredict cluster with config: %s, return code: %d",
                             to_wstring(clusterConfStr).c_str(), (int)retInitCluster);
        __spf_printToLongBuf(messageR, R206);
        getObjectForFileFromMap(clusterConfStr.c_str(), SPF_messages).push_back(Messages(ERROR, 1, messageR, messageE, 1063));
        return;
    }

    // The loop counters are unsigned; convert the processor count explicitly so that a
    // non-positive value yields no candidates instead of wrapping to a huge bound.
    const size_t maxProcs = procCount > 0 ? static_cast<size_t>(procCount) : 0;

    // iterating through topologies to find most optimal one
    for (size_t n1 = 2; n1 <= maxProcs; ++n1)
    {
        for (size_t n2 = 1; n2 <= n1 && n1 * n2 <= maxProcs; ++n2)
        {
            if ((n2 != 1 && maxSizeDist < 2) || (n2 == 1 && maxSizeDist == 2))
                continue;

            for (size_t n3 = 1; n3 <= n2 && n1 * n2 * n3 <= maxProcs; ++n3)
            {
                if ((n3 != 1 && maxSizeDist < 3) || (n3 == 1 && maxSizeDist == 3))
                    continue;

                for (size_t n4 = 1; n4 <= n3 && n1 * n2 * n3 * n4 <= maxProcs; ++n4)
                {
                    if ((n4 != 1 && maxSizeDist < 4) || (n4 == 1 && maxSizeDist == 4))
                        continue;

                    topologies.push_back(vector<size_t>{n1, n2, n3, n4});
                }
            }
        }
    }

    if (topologies.empty())
    {
        // Nothing to evaluate: do not report an empty "best" topology with a placeholder time.
        __spf_print(1, "impossible to calculate best topology: no suitable topology for %d processors\n", procCount);
        return;
    }

    vector<size_t> best;
    double bestTime = std::numeric_limits<double>::max();
    for (auto& topology : topologies)
    {
        double currTime = runLibpredictCalc(topology, clusterConfStr, precomputedParams, SPF_messages);

        string outStr = "";
        for (const auto& elem : topology)
            outStr += std::to_string(elem) + " ";
        __spf_print(1, "topology %s has time %f\n", outStr.c_str(), currTime);

        // -1 is the failure value returned by runLibpredictCalc
        if (currTime == -1)
            return;

        if (currTime < bestTime)
        {
            bestTime = currTime;
            best = topology;
        }
    }

    string outStr;
    for (const auto& elem : best)
        outStr += std::to_string(elem) + " ";

    __spf_print(1, "best topology %s with time %f\n", outStr.c_str(), bestTime);
}
|
||||
@@ -1,57 +0,0 @@
|
||||
#pragma once
|
||||
#include <vector>
|
||||
#include <map>
|
||||
#include <string>
|
||||
#include "dvm.h"
|
||||
#include "graph_calls.h"
|
||||
#include "../../projects/libpredictor/include/libpredict/predictor.h"
|
||||
|
||||
struct PrecomputedDistributeParams {
|
||||
size_t arrayId;
|
||||
size_t elemSize;
|
||||
std::vector<libpredict::DistributeAxisRule> axisDistributions;
|
||||
std::vector<std::pair<size_t, size_t>> shadowEdges;
|
||||
DIST::Array* array;
|
||||
};
|
||||
|
||||
struct PrecomputedAlignParams {
|
||||
size_t arrayId;
|
||||
size_t distributedArrayId;
|
||||
size_t elemSize;
|
||||
std::vector<size_t> dimensions;
|
||||
std::vector<libpredict::AlignDisplay> distributionExpressions;
|
||||
std::vector<std::pair<size_t, size_t>> shadowEdges;
|
||||
DIST::Array* alignArray;
|
||||
DIST::Array* alignWithArray;
|
||||
};
|
||||
|
||||
struct PrecomputedShadowRenewParams {
|
||||
size_t arrayId;
|
||||
std::vector<std::pair<size_t, size_t>> shadow_renew;
|
||||
bool corner;
|
||||
size_t number_loop_iterations;
|
||||
DIST::Array* shadowArray;
|
||||
};
|
||||
|
||||
struct PrecomputedLibpredictParams {
|
||||
std::vector<PrecomputedDistributeParams> distributeParams;
|
||||
std::vector<PrecomputedAlignParams> alignParams;
|
||||
std::vector<PrecomputedShadowRenewParams> shadowRenewParams;
|
||||
};
|
||||
|
||||
/// Collects the arguments of all libpredict Distribute, Align and ShadowRenew calls for the
/// given regions so they can be replayed for each candidate topology.
///
/// @param project            project whose files are searched for parallel directives
/// @param parallelRegions    regions providing data directives, selected variants and arrays
/// @param loopGraph          per-file loop graphs used while searching for directives
/// @param templateIdMapping  replacement ids for template arrays
/// @return the collected argument sets
PrecomputedLibpredictParams precomputeLibpredictParams(SgProject& project,
                                                       const std::vector<ParallelRegion*>& parallelRegions,
                                                       const std::map<std::string, std::vector<LoopGraph*>>& loopGraph,
                                                       const std::map<size_t, size_t>& templateIdMapping);
|
||||
|
||||
/// Enumerates candidate processor topologies, evaluates each with libpredict and logs the
/// one with the smallest predicted time.
///
/// @param project          project that supplies the file list
/// @param topologies       output: replaced by the list of enumerated candidate topologies
/// @param parallelRegions  regions providing the distribution rules and selected variants
/// @param loopGraph        per-file loop graphs
/// @param SPF_messages     per-file message lists that receive error records
void runPredictScheme(
    SgProject& project,
    std::vector<std::vector<size_t>>& topologies,
    const std::vector<ParallelRegion*>& parallelRegions,
    std::map<std::string, std::vector<LoopGraph*>>& loopGraph,
    std::map<std::string, std::vector<Messages>>& SPF_messages);
|
||||
|
||||
double runLibpredictCalc(const std::vector<size_t>& topology,
|
||||
const std::string& clusterConfStr,
|
||||
const PrecomputedLibpredictParams& precomputedParams,
|
||||
std::map<std::string, std::vector<Messages>>& SPF_messages);
|
||||
@@ -12,9 +12,38 @@
|
||||
#include "SgUtils.h"
|
||||
#include "graph_loops.h"
|
||||
#include "CFGraph/CFGraph.h"
|
||||
#include "utils.h"
|
||||
|
||||
using namespace std;
|
||||
|
||||
/**
 * Removes empty access points from every accessing set stored in the container.
 *
 * An array left with no points (including one that had none to begin with) is erased from
 * the container. An array holding both empty and non-empty points keeps only the non-empty
 * ones. An array without empty points is left untouched.
 */
static void RemoveEmptyPoints(ArrayAccessingIndexes& container)
{
    // Changes are gathered first and applied afterwards, so the container is never modified
    // while it is being iterated.
    ArrayAccessingIndexes filtered;
    unordered_set<string> emptied;

    for (auto& [name, accesses] : container)
    {
        const auto& elements = accesses.GetElements();

        vector<vector<ArrayDimension>> kept;
        for (const auto& point : elements)
            if (!point.empty())
                kept.push_back(point);

        if (kept.empty())
            emptied.insert(name);
        else if (kept.size() < elements.size())
            filtered[name] = kept;
    }

    for (const string& name : emptied)
        container.erase(name);

    for (auto& [name, accesses] : filtered)
        container[name] = accesses;
}
|
||||
|
||||
static void Collapse(Region* region)
|
||||
{
|
||||
if (region->getBasickBlocks().empty())
|
||||
@@ -37,13 +66,13 @@ static void Collapse(Region* region)
|
||||
region->array_use[arrayName] = region->array_use[arrayName].Union(diff);
|
||||
}
|
||||
}
|
||||
|
||||
ArrayAccessingIndexes useUnion;
|
||||
for (auto& byBlock : region->getBasickBlocks())
|
||||
for (auto& [arrayName, arrayRanges] : byBlock->array_use)
|
||||
useUnion[arrayName] = useUnion[arrayName].Union(byBlock->array_use[arrayName]);
|
||||
|
||||
for (auto& [arrayName, arrayRanges] : useUnion)
|
||||
region->array_priv[arrayName] = useUnion[arrayName].Diff(region->array_use[arrayName]);
|
||||
region->array_priv = region->array_use;
|
||||
|
||||
for (Region* prevBlock : region->getHeader()->getPrevRegions())
|
||||
prevBlock->replaceInNextRegions(region, region->getHeader());
|
||||
@@ -74,6 +103,7 @@ static void SolveDataFlowIteratively(Region* DFG)
|
||||
newIn.clear();
|
||||
continue;
|
||||
}
|
||||
|
||||
for (const auto& [arrayName, accessSet] : prevBlock->array_out)
|
||||
{
|
||||
if (newIn.find(arrayName) != newIn.end())
|
||||
@@ -86,6 +116,7 @@ static void SolveDataFlowIteratively(Region* DFG)
|
||||
|
||||
b->array_in = move(newIn);
|
||||
ArrayAccessingIndexes newOut;
|
||||
|
||||
if (b->array_def.empty())
|
||||
newOut = b->array_in;
|
||||
else if (b->array_in.empty())
|
||||
@@ -121,21 +152,83 @@ static void SolveDataFlow(Region* DFG)
|
||||
Collapse(DFG);
|
||||
}
|
||||
|
||||
map<LoopGraph*, ArrayAccessingIndexes> FindPrivateArrays(map<string, vector<LoopGraph*>> &loopGraph, map<FuncInfo*, vector<SAPFOR::BasicBlock*>>& FullIR)
|
||||
{
|
||||
map<LoopGraph*, ArrayAccessingIndexes> result;
|
||||
for (const auto& [loopName, loops] : loopGraph)
|
||||
static void AddPrivateArraysToLoop(LoopGraph* loop, const ArrayAccessingIndexes& privates, set<SgStatement*>& insertedPrivates)
|
||||
{
|
||||
SgStatement* spfStat = new SgStatement(SPF_ANALYSIS_DIR);
|
||||
spfStat->setlineNumber(loop->loop->lineNumber());
|
||||
spfStat->setFileName(loop->loop->fileName());
|
||||
SgExpression* toAdd = new SgExpression(EXPR_LIST, new SgExpression(ACC_PRIVATE_OP), NULL, NULL);
|
||||
set<SgSymbol*> arraysToInsert;
|
||||
for (const auto& [_, accessingSet] : privates)
|
||||
{
|
||||
for (const auto& loop : loops)
|
||||
for (const auto& arrayElement : accessingSet.GetElements())
|
||||
{
|
||||
for (const auto& [funcInfo, blocks]: FullIR)
|
||||
{
|
||||
Region* loopRegion = new Region(loop, blocks);
|
||||
SolveDataFlow(loopRegion);
|
||||
result[loop] = loopRegion->array_priv;
|
||||
delete(loopRegion);
|
||||
}
|
||||
if (arrayElement.empty())
|
||||
continue;
|
||||
arraysToInsert.insert(arrayElement[0].array->symbol());
|
||||
}
|
||||
}
|
||||
|
||||
spfStat->setExpression(0, *toAdd);
|
||||
toAdd = toAdd->lhs();
|
||||
bool first = true;
|
||||
for (auto& elem : arraysToInsert)
|
||||
{
|
||||
if (first)
|
||||
{
|
||||
toAdd->setLhs(new SgExpression(EXPR_LIST));
|
||||
toAdd = toAdd->lhs();
|
||||
first = false;
|
||||
}
|
||||
else
|
||||
{
|
||||
toAdd->setRhs(new SgExpression(EXPR_LIST));
|
||||
toAdd = toAdd->rhs();
|
||||
}
|
||||
toAdd->setLhs(new SgVarRefExp(elem));
|
||||
}
|
||||
|
||||
if (arraysToInsert.size() == 0)
|
||||
printInternalError(convertFileName(__FILE__).c_str(), __LINE__);
|
||||
|
||||
loop->loop->insertStmtBefore(*spfStat, *loop->loop->controlParent());
|
||||
insertedPrivates.insert(spfStat);
|
||||
}
|
||||
|
||||
void FindPrivateArrays(map<string, vector<LoopGraph*>> &loopGraph, map<FuncInfo*, vector<SAPFOR::BasicBlock*>>& FullIR, set<SgStatement*> &insertedPrivates)
|
||||
{
|
||||
map<LoopGraph*, ArrayAccessingIndexes> result;
|
||||
for (const auto& [fileName, loops] : loopGraph)
|
||||
{
|
||||
SgFile::switchToFile(fileName);
|
||||
for (const auto& loop : loops)
|
||||
{
|
||||
if (!loop->isFor())
|
||||
continue;
|
||||
SgStatement* search_func = loop->loop->GetOriginal();
|
||||
|
||||
while (search_func && (!isSgProgHedrStmt(search_func)))
|
||||
search_func = search_func->controlParent();
|
||||
|
||||
for (const auto& [funcInfo, blocks]: FullIR)
|
||||
{
|
||||
if (funcInfo->fileName == fileName && funcInfo->funcPointer->GetOriginal() == search_func)
|
||||
{
|
||||
Region* loopRegion = new Region(loop, blocks);
|
||||
if (loopRegion->getBasickBlocks().size() <= 1)
|
||||
{
|
||||
delete(loopRegion);
|
||||
continue;
|
||||
}
|
||||
SolveDataFlow(loopRegion);
|
||||
RemoveEmptyPoints(loopRegion->array_priv);
|
||||
result[loop] = loopRegion->array_priv;
|
||||
delete(loopRegion);
|
||||
}
|
||||
}
|
||||
|
||||
if (result.find(loop) != result.end() && !result[loop].empty())
|
||||
AddPrivateArraysToLoop(loop, result[loop], insertedPrivates);
|
||||
}
|
||||
}
|
||||
return result;
|
||||
}
|
||||
|
||||
@@ -2,11 +2,12 @@
|
||||
|
||||
#include <vector>
|
||||
#include <map>
|
||||
#include <set>
|
||||
#include <unordered_set>
|
||||
|
||||
#include "range_structures.h"
|
||||
#include "graph_loops.h"
|
||||
#include "CFGraph/CFGraph.h"
|
||||
|
||||
std::map<LoopGraph*, ArrayAccessingIndexes> FindPrivateArrays(std::map<std::string, std::vector<LoopGraph*>>& loopGraph, std::map<FuncInfo*, std::vector<SAPFOR::BasicBlock*>>& FullIR);
|
||||
void FindPrivateArrays(std::map<std::string, std::vector<LoopGraph*>>& loopGraph, std::map<FuncInfo*, std::vector<SAPFOR::BasicBlock*>>& FullIR, std::set<SgStatement*>& insertedPrivates);
|
||||
std::pair<SAPFOR::BasicBlock*, std::unordered_set<SAPFOR::BasicBlock*>> GetBasicBlocksForLoop(const LoopGraph* loop, const std::vector<SAPFOR::BasicBlock*> blocks);
|
||||
|
||||
@@ -47,7 +47,7 @@ static ArrayDimension* DimensionIntersection(const ArrayDimension& dim1, const A
|
||||
|
||||
uint64_t start3 = dim1.start + x0 * dim1.step;
|
||||
uint64_t step3 = c * dim1.step;
|
||||
ArrayDimension* result = new(ArrayDimension){ start3, step3, tMax + 1 };
|
||||
ArrayDimension* result = new(ArrayDimension){ start3, step3, tMax + 1 , dim1.array};
|
||||
return result;
|
||||
}
|
||||
|
||||
@@ -61,21 +61,16 @@ static vector<ArrayDimension> DimensionDifference(const ArrayDimension& dim1, co
|
||||
vector<ArrayDimension> result;
|
||||
/* add the part before intersection */
|
||||
if (dim1.start < intersection->start)
|
||||
result.push_back({ dim1.start, dim1.step, (intersection->start - dim1.start) / dim1.step });
|
||||
result.push_back({ dim1.start, dim1.step, (intersection->start - dim1.start) / dim1.step, dim1.array});
|
||||
|
||||
/* add the parts between intersection steps */
|
||||
uint64_t start = (intersection->start - dim1.start) / dim1.step;
|
||||
uint64_t interValue = intersection->start;
|
||||
for (int64_t i = start; dim1.start + i * dim1.step <= intersection->start + intersection->step * (intersection->tripCount - 1); i++)
|
||||
if (intersection->step > dim1.step)
|
||||
{
|
||||
uint64_t centerValue = dim1.start + i * dim1.step;
|
||||
if (centerValue == interValue)
|
||||
uint64_t start = (intersection->start - dim1.start) / dim1.step;
|
||||
uint64_t interValue = intersection->start;
|
||||
for (int64_t i = start; interValue <= intersection->start + intersection->step * (intersection->tripCount - 1); i++)
|
||||
{
|
||||
if (i - start > 1)
|
||||
{
|
||||
result.push_back({ dim1.start + (start + 1) * dim1.step, dim1.step, i - start - 1 });
|
||||
start = i;
|
||||
}
|
||||
result.push_back({interValue + dim1.step, dim1.step, intersection->step / dim1.step, dim1.array});
|
||||
interValue += intersection->step;
|
||||
}
|
||||
}
|
||||
@@ -85,7 +80,7 @@ static vector<ArrayDimension> DimensionDifference(const ArrayDimension& dim1, co
|
||||
/* first value after intersection */
|
||||
uint64_t right_start = intersection->start + intersection->step * (intersection->tripCount - 1) + dim1.step;
|
||||
uint64_t tripCount = (dim1.start + dim1.step * dim1.tripCount - right_start) / dim1.step;
|
||||
result.push_back({ right_start, dim1.step, tripCount });
|
||||
result.push_back({ right_start, dim1.step, tripCount, dim1.array });
|
||||
}
|
||||
delete(intersection);
|
||||
return result;
|
||||
@@ -216,6 +211,10 @@ void AccessingSet::Insert(const vector<ArrayDimension>& element)
|
||||
}
|
||||
|
||||
AccessingSet AccessingSet::Union(const AccessingSet& source) {
|
||||
if (source.GetElements().empty())
|
||||
return *this;
|
||||
if (allElements.empty())
|
||||
return source;
|
||||
AccessingSet result;
|
||||
for (auto& element : source.GetElements())
|
||||
result.Insert(element);
|
||||
|
||||
@@ -6,9 +6,12 @@
|
||||
#include <string>
|
||||
#include <cstdint>
|
||||
|
||||
#include "SgUtils.h"
|
||||
|
||||
struct ArrayDimension
|
||||
{
|
||||
uint64_t start, step, tripCount;
|
||||
SgArrayRefExp* array;
|
||||
};
|
||||
|
||||
class AccessingSet {
|
||||
|
||||
@@ -4,6 +4,7 @@
|
||||
#include<unordered_map>
|
||||
#include<string>
|
||||
#include <numeric>
|
||||
#include <iostream>
|
||||
|
||||
#include "range_structures.h"
|
||||
#include "region.h"
|
||||
@@ -104,15 +105,33 @@ static int GetDefUseArray(SAPFOR::BasicBlock* block, LoopGraph* loop, ArrayAcces
|
||||
|
||||
auto operation = instruction->getInstruction()->getOperation();
|
||||
auto type = instruction->getInstruction()->getArg1()->getType();
|
||||
if (operation == SAPFOR::CFG_OP::ASSIGN && instruction->getInstruction()->getResult()->getType() == SAPFOR::CFG_ARG_TYPE::ARRAY)
|
||||
{
|
||||
SgStatement* op = instruction->getInstruction()->getOperator();
|
||||
if (op && op->expr(0) && isArrayRef(op->expr(0)) && op->expr(0)->symbol() && op->expr(0)->type())
|
||||
{
|
||||
if (isSgArrayType(op->expr(0)->symbol()->type()))
|
||||
{
|
||||
SgArrayType* arrayType = (SgArrayType*)op->expr(0)->symbol()->type();
|
||||
int dimCount = ((SgArrayType*)op->expr(0)->symbol()->type())->dimension();
|
||||
vector<ArrayDimension> point;
|
||||
for (int i = 0; i < dimCount; i++)
|
||||
{
|
||||
string strDimLength = arrayType->sizeInDim(i)->unparse();
|
||||
if (arrayType->sizeInDim(i)->variant() == INT_VAL && strDimLength != "0")
|
||||
point.push_back({ 1ULL, 1ULL, (uint64_t)stoi(strDimLength), (SgArrayRefExp*)op->expr(0) });
|
||||
}
|
||||
|
||||
if (point.size() == dimCount)
|
||||
def[instruction->getInstruction()->getResult()->getValue()] = AccessingSet({point});
|
||||
}
|
||||
}
|
||||
}
|
||||
if ((operation == SAPFOR::CFG_OP::STORE || operation == SAPFOR::CFG_OP::LOAD) && type == SAPFOR::CFG_ARG_TYPE::ARRAY)
|
||||
{
|
||||
vector<SAPFOR::Argument*> index_vars;
|
||||
vector<int> refPos;
|
||||
string array_name;
|
||||
if (operation == SAPFOR::CFG_OP::STORE)
|
||||
array_name = instruction->getInstruction()->getArg1()->getValue();
|
||||
else
|
||||
array_name = instruction->getInstruction()->getArg2()->getValue();
|
||||
string array_name = instruction->getInstruction()->getArg1()->getValue();
|
||||
|
||||
int j = i - 1;
|
||||
while (j >= 0 && instructions[j]->getInstruction()->getOperation() == SAPFOR::CFG_OP::REF)
|
||||
@@ -127,29 +146,15 @@ static int GetDefUseArray(SAPFOR::BasicBlock* block, LoopGraph* loop, ArrayAcces
|
||||
vector<ArrayDimension> accessPoint(n);
|
||||
|
||||
auto* ref = isSgArrayRefExp(instruction->getInstruction()->getExpression());
|
||||
vector<pair<int, int>> coefsForDims;
|
||||
for (int i = 0; ref && i < ref->numberOfSubscripts(); ++i)
|
||||
{
|
||||
const vector<int*>& coefs = getAttributes<SgExpression*, int*>(ref->subscript(i), set<int>{ INT_VAL });
|
||||
if (coefs.size() == 1)
|
||||
{
|
||||
const pair<int, int> coef(coefs[0][0], coefs[0][1]);
|
||||
coefsForDims.push_back(coef);
|
||||
}
|
||||
int fillCount = 0;
|
||||
|
||||
}
|
||||
|
||||
if(coefsForDims.empty())
|
||||
printInternalError(convertFileName(__FILE__).c_str(), __LINE__);
|
||||
|
||||
while (!index_vars.empty())
|
||||
while (!index_vars.empty() && !refPos.empty())
|
||||
{
|
||||
auto var = index_vars.back();
|
||||
int currentVarPos = refPos.back();
|
||||
pair<int, int> currentCoefs = coefsForDims.back();
|
||||
ArrayDimension current_dim;
|
||||
if (var->getType() == SAPFOR::CFG_ARG_TYPE::CONST)
|
||||
current_dim = { stoul(var->getValue()), 1, 1 };
|
||||
current_dim = { stoul(var->getValue()), 1, 1, ref};
|
||||
else
|
||||
{
|
||||
string name, full_name = var->getValue();
|
||||
@@ -175,21 +180,28 @@ static int GetDefUseArray(SAPFOR::BasicBlock* block, LoopGraph* loop, ArrayAcces
|
||||
return -1;
|
||||
}
|
||||
|
||||
uint64_t start = currentLoop->startVal * currentCoefs.first + currentCoefs.second;
|
||||
uint64_t step = currentCoefs.first;
|
||||
current_dim = { start, step, (uint64_t)currentLoop->calculatedCountOfIters };
|
||||
uint64_t start = currentLoop->startVal;
|
||||
uint64_t step = currentLoop->stepVal;
|
||||
uint64_t iters = currentLoop->calculatedCountOfIters;
|
||||
current_dim = { start, step, iters, ref };
|
||||
}
|
||||
|
||||
accessPoint[n - index_vars.size()] = current_dim;
|
||||
if (current_dim.start != 0 && current_dim.step != 0 && current_dim.tripCount != 0)
|
||||
{
|
||||
accessPoint[n - index_vars.size()] = current_dim;
|
||||
fillCount++;
|
||||
}
|
||||
index_vars.pop_back();
|
||||
refPos.pop_back();
|
||||
coefsForDims.pop_back();
|
||||
}
|
||||
|
||||
if (operation == SAPFOR::CFG_OP::STORE)
|
||||
def[array_name].Insert(accessPoint);
|
||||
else
|
||||
use[array_name].Insert(accessPoint);
|
||||
if (fillCount == accessPoint.size())
|
||||
{
|
||||
if (operation == SAPFOR::CFG_OP::STORE)
|
||||
def[array_name].Insert(accessPoint);
|
||||
else
|
||||
use[array_name].Insert(accessPoint);
|
||||
}
|
||||
}
|
||||
}
|
||||
return 0;
|
||||
@@ -227,8 +239,11 @@ static Region* CreateSubRegion(LoopGraph* loop, const vector<SAPFOR::BasicBlock*
|
||||
region->addBasickBlocks(bbToRegion.at(block));
|
||||
|
||||
for (LoopGraph* childLoop : loop->children)
|
||||
{
|
||||
if (!childLoop->isFor())
|
||||
continue;
|
||||
region->addSubRegions(CreateSubRegion(childLoop, Blocks, bbToRegion));
|
||||
|
||||
}
|
||||
return region;
|
||||
}
|
||||
|
||||
@@ -247,5 +262,9 @@ Region::Region(LoopGraph* loop, const vector<SAPFOR::BasicBlock*>& Blocks)
|
||||
SetConnections(bbToRegion, blockSet);
|
||||
//create subRegions
|
||||
for (LoopGraph* childLoop : loop->children)
|
||||
{
|
||||
if (!childLoop->isFor())
|
||||
continue;
|
||||
subRegions.insert(CreateSubRegion(childLoop, Blocks, bbToRegion));
|
||||
}
|
||||
}
|
||||
|
||||
118
src/Sapfor.cpp
118
src/Sapfor.cpp
@@ -46,6 +46,7 @@
|
||||
#include "DynamicAnalysis/gCov_parser_func.h"
|
||||
#include "DynamicAnalysis/createParallelRegions.h"
|
||||
|
||||
#include "ArrayConstantPropagation/propagation.h"
|
||||
#include "DirectiveProcessing/directive_analyzer.h"
|
||||
#include "DirectiveProcessing/directive_creator.h"
|
||||
#include "DirectiveProcessing/insert_directive.h"
|
||||
@@ -57,7 +58,6 @@
|
||||
#include "expr_transform.h"
|
||||
|
||||
#include "Predictor/PredictScheme.h"
|
||||
#include "Predictor/PredictSchemeWithLibrary.h"
|
||||
#include "Predictor/PredictorModel.h"
|
||||
#include "SageAnalysisTool/depInterfaceExt.h"
|
||||
#include "DvmhRegions/DvmhRegionInserter.h"
|
||||
@@ -280,7 +280,8 @@ static string unparseProjectIfNeed(SgFile* file, const int curr_regime, const bo
|
||||
for (SgStatement* st = file->firstStatement(); st; st = st->lexNext())
|
||||
if (isSPF_stat(st)) // except sapfor parallel regions and if attributes dont move
|
||||
if (st->variant() != SPF_PARALLEL_REG_DIR && st->variant() != SPF_END_PARALLEL_REG_DIR)
|
||||
toDel.push_back(st);
|
||||
if (insertedPrivates.find(st) == insertedPrivates.end())
|
||||
toDel.push_back(st);
|
||||
|
||||
for (auto& elem : toDel)
|
||||
elem->deleteStmt();
|
||||
@@ -1020,8 +1021,6 @@ static bool runAnalysis(SgProject &project, const int curr_regime, const bool ne
|
||||
if(func->funcPointer->variant() != ENTRY_STAT)
|
||||
countOfTransform += removeDeadCode(func->funcPointer, allFuncInfo, commonBlocks);
|
||||
}
|
||||
else if (curr_regime == FIND_PRIVATE_ARRAYS)
|
||||
FindPrivateArrays(loopGraph, fullIR);
|
||||
else if (curr_regime == TEST_PASS)
|
||||
{
|
||||
//test pass
|
||||
@@ -1729,7 +1728,103 @@ static bool runAnalysis(SgProject &project, const int curr_regime, const bool ne
|
||||
}
|
||||
}
|
||||
else if (curr_regime == PREDICT_SCHEME)
|
||||
runPredictScheme(project, topologies, parallelRegions, loopGraph, SPF_messages);
|
||||
{
|
||||
int maxSizeDist = 0;
|
||||
for (int z = 0; z < parallelRegions.size(); ++z)
|
||||
{
|
||||
const DataDirective &dataDirectives = parallelRegions[z]->GetDataDir();
|
||||
const vector<int> &currentVariant = parallelRegions[z]->GetCurrentVariant();
|
||||
|
||||
auto &tmp = dataDirectives.distrRules;
|
||||
vector<pair<DIST::Array*, const DistrVariant*>> currentVar;
|
||||
for (int z1 = 0; z1 < currentVariant.size(); ++z1)
|
||||
currentVar.push_back(make_pair(tmp[z1].first, &tmp[z1].second[currentVariant[z1]]));
|
||||
|
||||
for (auto &elem : currentVar)
|
||||
{
|
||||
DIST::Array *array = elem.first;
|
||||
const DistrVariant *var = elem.second;
|
||||
|
||||
int countBlock = 0;
|
||||
for (int z = 0; z < var->distRule.size(); ++z)
|
||||
if (var->distRule[z] == dist::BLOCK)
|
||||
++countBlock;
|
||||
maxSizeDist = std::max(maxSizeDist, countBlock);
|
||||
}
|
||||
}
|
||||
|
||||
SpfInterval *mainIterval = getMainInterval(&project, intervals, SPF_messages);
|
||||
topologies.clear();
|
||||
if (maxSizeDist)
|
||||
{
|
||||
const int procNum = 8;
|
||||
//TODO:
|
||||
//topologies = getTopologies(procNum, maxSizeDist);
|
||||
throw -10;
|
||||
|
||||
const int countOfTop = topologies.size();
|
||||
if (countOfTop < 0)
|
||||
printInternalError(convertFileName(__FILE__).c_str(), __LINE__);
|
||||
|
||||
for (auto &inter : intervals)
|
||||
initTimeForIntervalTree(countOfTop, inter.second);
|
||||
|
||||
for (int z = 0; z < parallelRegions.size(); ++z)
|
||||
{
|
||||
const DataDirective &dataDirectives = parallelRegions[z]->GetDataDir();
|
||||
const vector<int> &currentVariant = parallelRegions[z]->GetCurrentVariant();
|
||||
DIST::Arrays<int> &allArrays = parallelRegions[z]->GetAllArraysToModify();
|
||||
|
||||
auto &tmp = dataDirectives.distrRules;
|
||||
vector<pair<DIST::Array*, const DistrVariant*>> currentVar;
|
||||
for (int z1 = 0; z1 < currentVariant.size(); ++z1)
|
||||
currentVar.push_back(make_pair(tmp[z1].first, &tmp[z1].second[currentVariant[z1]]));
|
||||
|
||||
map<LoopGraph*, ParallelDirective*> parallelDirs;
|
||||
vector<std::tuple<DIST::Array*, vector<long>, pair<string, int>>> allSingleRemotes;
|
||||
for (int i = n - 1; i >= 0; --i)
|
||||
{
|
||||
SgFile *file = &(project.file(i));
|
||||
auto fountInfo = findAllDirectives(file, getObjectForFileFromMap(file->filename(), loopGraph), parallelRegions[z]->GetId());
|
||||
parallelDirs.insert(fountInfo.begin(), fountInfo.end());
|
||||
|
||||
auto fountRem = findAllSingleRemotes(file, parallelRegions[z]->GetId(), parallelRegions);
|
||||
allSingleRemotes.insert(allSingleRemotes.end(), fountRem.begin(), fountRem.end());
|
||||
}
|
||||
//TODO!
|
||||
//int err = predictScheme(parallelRegions[z], currentVar, allArrays.GetArrays(), parallelDirs, intervals, SPF_messages, allSingleRemotes, maxSizeDist, procNum);
|
||||
/*if (err != 0)
|
||||
internalExit = err;*/
|
||||
}
|
||||
|
||||
vector<SpfInterval*> tmp = { mainIterval };
|
||||
aggregatePredictedTimes(tmp);
|
||||
|
||||
int idx = 0;
|
||||
int best = -1;
|
||||
double bestSpeedUp = 0;
|
||||
for (auto &top : topologies)
|
||||
{
|
||||
string outStr = "";
|
||||
for (auto &elem : top)
|
||||
outStr += std::to_string(elem) + " ";
|
||||
double currS = mainIterval->exec_time / mainIterval->predictedTimes[idx];
|
||||
__spf_print(1, "%d: speed up %f for top. %s\n", idx, currS, outStr.c_str());
|
||||
|
||||
if (best == -1 || bestSpeedUp < currS)
|
||||
{
|
||||
bestSpeedUp = currS;
|
||||
best = idx;
|
||||
}
|
||||
++idx;
|
||||
}
|
||||
__spf_print(1, "best topology %d with speed up %f\n", best, bestSpeedUp);
|
||||
}
|
||||
else
|
||||
for (auto &inter : intervals)
|
||||
initTimeForIntervalTree(0, inter.second);
|
||||
|
||||
}
|
||||
else if (curr_regime == CREATE_INTER_TREE)
|
||||
{
|
||||
if (keepFiles)
|
||||
@@ -1821,6 +1916,11 @@ static bool runAnalysis(SgProject &project, const int curr_regime, const bool ne
|
||||
}
|
||||
else if (curr_regime == TRANSFORM_ASSUMED_SIZE_PARAMETERS)
|
||||
transformAssumedSizeParameters(allFuncInfo);
|
||||
else if (curr_regime == FIND_PRIVATE_ARRAYS_ANALYSIS)
|
||||
FindPrivateArrays(loopGraph, fullIR, insertedPrivates);
|
||||
|
||||
else if (curr_regime == ARRAY_PROPAGATION)
|
||||
ArrayConstantPropagation(project);
|
||||
|
||||
const float elapsed = duration_cast<milliseconds>(high_resolution_clock::now() - timeForPass).count() / 1000.;
|
||||
const float elapsedGlobal = duration_cast<milliseconds>(high_resolution_clock::now() - globalTime).count() / 1000.;
|
||||
@@ -2125,8 +2225,9 @@ void runPass(const int curr_regime, const char *proj_name, const char *folderNam
|
||||
|
||||
runAnalysis(*project, CALCULATE_STATS_SCHEME, false);
|
||||
|
||||
if (!folderName && !consoleMode || predictOn)
|
||||
runAnalysis(*project, PREDICT_SCHEME, false);
|
||||
//TODO: need to rewrite this to new algo
|
||||
/*if (!folderName && !consoleMode || predictOn)
|
||||
runAnalysis(*project, PREDICT_SCHEME, false); */
|
||||
|
||||
runAnalysis(*project, REMOVE_COPIES, false);
|
||||
runAnalysis(*project, SWAP_LOOPS, false);
|
||||
@@ -2277,6 +2378,7 @@ void runPass(const int curr_regime, const char *proj_name, const char *folderNam
|
||||
case SUBST_EXPR_RD_AND_UNPARSE:
|
||||
case SUBST_EXPR_AND_UNPARSE:
|
||||
case REMOVE_DEAD_CODE_AND_UNPARSE:
|
||||
case FIND_PRIVATE_ARRAYS:
|
||||
if (folderName)
|
||||
runAnalysis(*project, UNPARSE_FILE, true, "", folderName);
|
||||
else
|
||||
@@ -2538,7 +2640,7 @@ int main(int argc, char **argv)
|
||||
}
|
||||
}
|
||||
|
||||
if (curr_regime == INSERT_PARALLEL_DIRS_NODIST)
|
||||
if (curr_regime == INSERT_PARALLEL_DIRS_NODIST || curr_regime == FIND_PRIVATE_ARRAYS)
|
||||
{
|
||||
ignoreArrayDistributeState = true;
|
||||
sharedMemoryParallelization = 1;
|
||||
|
||||
@@ -183,9 +183,11 @@ enum passes {
|
||||
SET_IMPLICIT_NONE,
|
||||
RENAME_INLCUDES,
|
||||
|
||||
FIND_PRIVATE_ARRAYS_ANALYSIS,
|
||||
FIND_PRIVATE_ARRAYS,
|
||||
|
||||
TRANSFORM_ASSUMED_SIZE_PARAMETERS,
|
||||
ARRAY_PROPAGATION,
|
||||
|
||||
TEST_PASS,
|
||||
EMPTY_PASS
|
||||
@@ -371,9 +373,11 @@ static void setPassValues()
|
||||
passNames[SET_IMPLICIT_NONE] = "SET_IMPLICIT_NONE";
|
||||
passNames[RENAME_INLCUDES] = "RENAME_INLCUDES";
|
||||
passNames[INSERT_NO_DISTR_FLAGS_FROM_GUI] = "INSERT_NO_DISTR_FLAGS_FROM_GUI";
|
||||
passNames[FIND_PRIVATE_ARRAYS_ANALYSIS] = "FIND_PRIVATE_ARRAYS_ANALYSIS";
|
||||
passNames[FIND_PRIVATE_ARRAYS] = "FIND_PRIVATE_ARRAYS";
|
||||
|
||||
passNames[TRANSFORM_ASSUMED_SIZE_PARAMETERS] = "TRANSFORM_ASSUMED_SIZE_PARAMETERS";
|
||||
passNames[ARRAY_PROPAGATION] = "ARRAY_PROPAGATION";
|
||||
|
||||
passNames[TEST_PASS] = "TEST_PASS";
|
||||
}
|
||||
|
||||
@@ -132,7 +132,7 @@ std::map<std::string, PredictorStats> allPredictorStats;
|
||||
|
||||
//for DVM INTERVALS
|
||||
std::map<std::string, std::vector<SpfInterval*>> intervals; // file -> intervals
|
||||
std::vector<std::vector<size_t>> topologies; // current topologies
|
||||
std::vector<std::vector<long>> topologies; // current topologies
|
||||
//
|
||||
|
||||
//for GCOV_PARSER
|
||||
@@ -175,6 +175,11 @@ std::set<std::tuple<std::string, int, std::string>> parametersOfProject; // [fil
|
||||
//for GET_MIN_MAX_BLOCK_DIST
|
||||
std::pair<int, int> min_max_block = std::make_pair(-1, -1);
|
||||
//
|
||||
|
||||
//for FIND_PRIVATE_ARRAYS
|
||||
std::set<SgStatement*> insertedPrivates;
|
||||
//
|
||||
|
||||
const char* passNames[EMPTY_PASS + 1];
|
||||
const char* optionNames[EMPTY_OPTION + 1];
|
||||
bool passNamesWasInit = false;
|
||||
|
||||
@@ -1123,7 +1123,7 @@ static bool hasDependenciesBetweenArrays(LoopGraph* firstLoop, LoopGraph* loop,
|
||||
for (int d = 0; d < dimensions; ++d)
|
||||
{
|
||||
//по измерениям массива отображение на цикл вложенности d
|
||||
vector<set<pair<int, int>>> coefsRead[2], coefsWrite[2];
|
||||
vector<set<pair<int, int>>> coeffsRead[2], coeffsWrite[2];
|
||||
|
||||
checkNull(currLoop[0], convertFileName(__FILE__).c_str(), __LINE__);
|
||||
checkNull(currLoop[1], convertFileName(__FILE__).c_str(), __LINE__);
|
||||
@@ -1133,31 +1133,31 @@ static bool hasDependenciesBetweenArrays(LoopGraph* firstLoop, LoopGraph* loop,
|
||||
auto it = currLoop[k]->readOpsForLoop.find(array);
|
||||
if (it != currLoop[k]->readOpsForLoop.end())
|
||||
{
|
||||
if (coefsRead[k].size() == 0)
|
||||
coefsRead[k].resize(it->second.size());
|
||||
if (coeffsRead[k].size() == 0)
|
||||
coeffsRead[k].resize(it->second.size());
|
||||
|
||||
for (int z = 0; z < it->second.size(); ++z)
|
||||
if (it->second[z].coefficients.size())
|
||||
for (auto& coef : it->second[z].coefficients)
|
||||
coefsRead[k][z].insert(coef.first);
|
||||
coeffsRead[k][z].insert(coef.first);
|
||||
}
|
||||
|
||||
auto itW = currLoop[k]->writeOpsForLoop.find(array);
|
||||
if (itW != currLoop[k]->writeOpsForLoop.end())
|
||||
{
|
||||
if (coefsWrite[k].size() == 0)
|
||||
coefsWrite[k].resize(itW->second.size());
|
||||
if (coeffsWrite[k].size() == 0)
|
||||
coeffsWrite[k].resize(itW->second.size());
|
||||
|
||||
for (int z = 0; z < itW->second.size(); ++z)
|
||||
if (itW->second[z].coefficients.size())
|
||||
for (auto& coef : itW->second[z].coefficients)
|
||||
coefsWrite[k][z].insert(coef.first);
|
||||
coeffsWrite[k][z].insert(coef.first);
|
||||
}
|
||||
}
|
||||
|
||||
//нет записей, значит нет зависимости
|
||||
bool nulWrite = true;
|
||||
for (auto& wr : coefsWrite)
|
||||
for (auto& wr : coeffsWrite)
|
||||
for (auto& elem : wr)
|
||||
if (elem.size() != 0)
|
||||
nulWrite = false;
|
||||
@@ -1168,62 +1168,62 @@ static bool hasDependenciesBetweenArrays(LoopGraph* firstLoop, LoopGraph* loop,
|
||||
// если чтение в одном цикле и запись (и наоборот) в другом идут по разным правилам, то пока что это зависимость.
|
||||
// здесь можно уточнить.
|
||||
|
||||
const int len = std::max(coefsWrite[0].size(), coefsRead[0].size());
|
||||
const int len = std::max(coeffsWrite[0].size(), coeffsRead[0].size());
|
||||
int countW[2] = { 0, 0 };
|
||||
int countR[2] = { 0, 0 };
|
||||
|
||||
for (int L = 0; L < 2; ++L)
|
||||
for (int z = 0; z < coefsWrite[L].size(); ++z)
|
||||
countW[L] += (coefsWrite[L][z].size() ? 1 : 0);
|
||||
for (int z = 0; z < coeffsWrite[L].size(); ++z)
|
||||
countW[L] += (coeffsWrite[L][z].size() ? 1 : 0);
|
||||
|
||||
for (int L = 0; L < 2; ++L)
|
||||
for (int z = 0; z < coefsRead[L].size(); ++z)
|
||||
countR[L] += (coefsRead[L][z].size() ? 1 : 0);
|
||||
for (int z = 0; z < coeffsRead[L].size(); ++z)
|
||||
countR[L] += (coeffsRead[L][z].size() ? 1 : 0);
|
||||
|
||||
for (int p = 0; p < len; ++p)
|
||||
{
|
||||
if (coefsWrite[1].size() && coefsWrite[0].size())
|
||||
if (coefsWrite[0][p].size() != 0 && coefsWrite[1][p].size() != 0)
|
||||
if (coefsWrite[0][p] != coefsWrite[1][p])
|
||||
if (coeffsWrite[1].size() && coeffsWrite[0].size())
|
||||
if (coeffsWrite[0][p].size() != 0 && coeffsWrite[1][p].size() != 0)
|
||||
if (coeffsWrite[0][p] != coeffsWrite[1][p])
|
||||
return true;
|
||||
|
||||
if (coefsRead[1].size() && coefsWrite[0].size())
|
||||
if (coefsWrite[0][p].size() != 0 && coefsRead[1][p].size() != 0)
|
||||
if (coefsWrite[0][p] != coefsRead[1][p])
|
||||
if (coeffsRead[1].size() && coeffsWrite[0].size())
|
||||
if (coeffsWrite[0][p].size() != 0 && coeffsRead[1][p].size() != 0)
|
||||
if (coeffsWrite[0][p] != coeffsRead[1][p])
|
||||
return true;
|
||||
|
||||
if (coefsWrite[1].size() && coefsRead[0].size())
|
||||
if (coefsWrite[1][p].size() != 0 && coefsRead[0][p].size() != 0)
|
||||
if (coefsWrite[1][p] != coefsRead[0][p])
|
||||
if (coeffsWrite[1].size() && coeffsRead[0].size())
|
||||
if (coeffsWrite[1][p].size() != 0 && coeffsRead[0][p].size() != 0)
|
||||
if (coeffsWrite[1][p] != coeffsRead[0][p])
|
||||
return true;
|
||||
|
||||
|
||||
//отображение на разные измерения
|
||||
if (coefsWrite[1].size() && coefsWrite[0].size())
|
||||
if (coeffsWrite[1].size() && coeffsWrite[0].size())
|
||||
{
|
||||
if (coefsWrite[0][p].size() != 0 && coefsWrite[1][p].size() == 0 && countW[1] ||
|
||||
coefsWrite[0][p].size() == 0 && coefsWrite[1][p].size() != 0 && countW[0])
|
||||
if (coeffsWrite[0][p].size() != 0 && coeffsWrite[1][p].size() == 0 && countW[1] ||
|
||||
coeffsWrite[0][p].size() == 0 && coeffsWrite[1][p].size() != 0 && countW[0])
|
||||
return true;
|
||||
}
|
||||
|
||||
if (coefsRead[1].size() && coefsWrite[0].size())
|
||||
if (coeffsRead[1].size() && coeffsWrite[0].size())
|
||||
{
|
||||
if (coefsWrite[0][p].size() != 0 && coefsRead[1][p].size() == 0 && countR[1] ||
|
||||
coefsWrite[0][p].size() == 0 && coefsRead[1][p].size() != 0 && countW[0])
|
||||
if (coeffsWrite[0][p].size() != 0 && coeffsRead[1][p].size() == 0 && countR[1] ||
|
||||
coeffsWrite[0][p].size() == 0 && coeffsRead[1][p].size() != 0 && countW[0])
|
||||
return true;
|
||||
}
|
||||
|
||||
if (coefsWrite[1].size() && coefsRead[1].size())
|
||||
if (coeffsWrite[1].size() && coeffsRead[1].size())
|
||||
{
|
||||
if (coefsWrite[1][p].size() != 0 && coefsRead[0][p].size() == 0 && countR[0] ||
|
||||
coefsWrite[1][p].size() == 0 && coefsRead[0][p].size() != 0 && countW[1])
|
||||
if (coeffsWrite[1][p].size() != 0 && coeffsRead[0][p].size() == 0 && countR[0] ||
|
||||
coeffsWrite[1][p].size() == 0 && coeffsRead[0][p].size() != 0 && countW[1])
|
||||
return true;
|
||||
}
|
||||
|
||||
//где то нет правил отображения вообще, но есть факт его наличия.
|
||||
if ( ((coefsWrite[0].size() == 0 && coefsRead[0].size() == 0) && (countW[0] == 0 && countR[0] == 0))
|
||||
if ( ((coeffsWrite[0].size() == 0 && coeffsRead[0].size() == 0) && (countW[0] == 0 && countR[0] == 0))
|
||||
||
|
||||
((coefsWrite[1].size() == 0 && coefsRead[1].size() == 0) && (countW[1] == 0 && countR[1] == 0)) )
|
||||
((coeffsWrite[1].size() == 0 && coeffsRead[1].size() == 0) && (countW[1] == 0 && countR[1] == 0)) )
|
||||
return true;
|
||||
}
|
||||
|
||||
|
||||
@@ -316,7 +316,8 @@ void InitPassesDependencies(map<passes, vector<passes>> &passDepsIn, set<passes>
|
||||
|
||||
list({ VERIFY_INCLUDES, CORRECT_VAR_DECL }) <= Pass(SET_IMPLICIT_NONE);
|
||||
|
||||
list({ CALL_GRAPH2, CALL_GRAPH, BUILD_IR, LOOP_GRAPH, LOOP_ANALYZER_DATA_DIST_S2 }) <= Pass(FIND_PRIVATE_ARRAYS);
|
||||
list({ CALL_GRAPH2, CALL_GRAPH, BUILD_IR, LOOP_GRAPH, LOOP_ANALYZER_DATA_DIST_S2 }) <= Pass(FIND_PRIVATE_ARRAYS_ANALYSIS);
|
||||
list({ FIND_PRIVATE_ARRAYS_ANALYSIS, CONVERT_LOOP_TO_ASSIGN, RESTORE_LOOP_FROM_ASSIGN, REVERT_SUBST_EXPR_RD }) <= Pass(FIND_PRIVATE_ARRAYS);
|
||||
|
||||
passesIgnoreStateDone.insert({ CREATE_PARALLEL_DIRS, INSERT_PARALLEL_DIRS, INSERT_SHADOW_DIRS, EXTRACT_PARALLEL_DIRS,
|
||||
EXTRACT_SHADOW_DIRS, CREATE_REMOTES, UNPARSE_FILE, REMOVE_AND_CALC_SHADOW,
|
||||
|
||||
@@ -78,12 +78,7 @@ enum typeMessage { WARR, ERROR, NOTE };
|
||||
// 60 "Format misplaced"
|
||||
// 61 "Array has declaration area conflict"
|
||||
// 62 "need to move common declaration to main for DECLARE"
|
||||
// 63 "Failed to initialize libpredict cluster"
|
||||
// 64 "Failed to initialize libpredict grid"
|
||||
// 65 "Failed to distribute array with libpredict"
|
||||
// 66 "Failed to align array with libpredict"
|
||||
// 67 "Failed to process shadow_renew with libpredict"
|
||||
//
|
||||
//
|
||||
// 20xx TRANSFORM GROUP
|
||||
// 01 "can not convert array assign to loop"
|
||||
// 02 "converted arithmetic IF to simple IF"
|
||||
@@ -310,7 +305,7 @@ static void printStackTrace() { };
|
||||
} \
|
||||
} while (0)
|
||||
|
||||
// Свободный - R210
|
||||
// Свободный - R206
|
||||
// Гайд по русификации сообщений: При добавлении нового сообщения, меняется последний свободный идентификатор.
|
||||
// В этом файле остаются только спецификаторы, для которых будет заполнен текст. Полный текст пишется в файле
|
||||
// russian_errors_text.txt. Спецификаторы там тоже сохраняются, по ним в визуализаторе будет восстановлен
|
||||
@@ -509,16 +504,6 @@ static const wchar_t *R183 = L"R183:";
|
||||
static const wchar_t *R184 = L"R184:%s";
|
||||
//1062
|
||||
static const wchar_t* R205 = L"R205:%s#%s";
|
||||
//1063
|
||||
static const wchar_t* R206 = L"R206:";
|
||||
//1064
|
||||
static const wchar_t* R207 = L"R207:";
|
||||
//1065
|
||||
static const wchar_t* R208 = L"R208:";
|
||||
//1066
|
||||
static const wchar_t* R209 = L"R209:";
|
||||
//1067
|
||||
static const wchar_t* R210 = L"R210:";
|
||||
|
||||
//2001
|
||||
static const wchar_t *R94 = L"R94:";
|
||||
|
||||
@@ -184,18 +184,8 @@ R182 = "Редукционная операция по элементу масс
|
||||
R183 = "Расположение операторов FORMAT не поддерживается, попробуйте применить проход Коррекция стиля кода".
|
||||
//1061
|
||||
R184 = "Область объявления массива '%s' конфликтует с предыдущей областью. Возможно, это вызвано использованием include-файлов. Попробуйте применить проход 'Подстановка заголовочных файлов'".
|
||||
//1062
|
||||
//1042
|
||||
R205 = "Массив '%s' состоящий в common блоке '%s' должен иметь описание в главной программной единице для объявления в директиве DECLARE"
|
||||
//1063
|
||||
R206 = "Ошибка инициализации библиотеки libpredict с конфигурацией кластера: %s, код возврата: %d"
|
||||
//1064
|
||||
R207 = "Ошибка инициализации сетки libpredict с топологией: %zu %zu %zu %zu, код возврата: %d"
|
||||
//1065
|
||||
R208 = "Ошибка распределения массива '%s' с помощью libpredict, код возврата: %d"
|
||||
//1066
|
||||
R209 = "Ошибка выравнивания массива '%s' с массивом '%s' с помощью libpredict, код возврата: %d"
|
||||
//1067
|
||||
R210 = "Ошибка обработки shadow_renew для массива '%s' с помощью libpredict, код возврата: %d"
|
||||
|
||||
//2001
|
||||
R94 = "Невозможно автоматически преобразовать данное присваивание к циклу"
|
||||
|
||||
@@ -1,3 +1,3 @@
|
||||
#pragma once
|
||||
|
||||
#define VERSION_SPF "2446"
|
||||
#define VERSION_SPF "2450"
|
||||
|
||||
@@ -950,7 +950,7 @@ int SPF_ModifyArrayDistribution(void*& context, int winHandler, short *options,
|
||||
|
||||
extern map<string, PredictorStats> allPredictorStats;
|
||||
extern map<string, vector<SpfInterval*>> intervals;
|
||||
extern vector<vector<size_t>> topologies;
|
||||
extern vector<vector<long>> topologies;
|
||||
|
||||
int SPF_CreateParallelVariant(void*& context, int winHandler, short *options, short *projName, short *folderName, int64_t *variants, int *varLen,
|
||||
string &output, string &outputMessage, string &predictorStats)
|
||||
@@ -1793,6 +1793,15 @@ int SPF_RenameIncludes(void*& context, int winHandler, short* options, short* pr
|
||||
return simpleTransformPass(RENAME_INLCUDES, options, projName, folderName, output, outputMessage);
|
||||
}
|
||||
|
||||
int SPF_InsertPrivateArrayDirectives(void*& context, int winHandler, short* options, short* projName, short* folderName, string& output, string& outputMessage)
|
||||
{
|
||||
MessageManager::clearCache();
|
||||
MessageManager::setWinHandler(winHandler);
|
||||
ignoreArrayDistributeState = true;
|
||||
sharedMemoryParallelization = 1;
|
||||
return simpleTransformPass(FIND_PRIVATE_ARRAYS, options, projName, folderName, output, outputMessage);
|
||||
}
|
||||
|
||||
static inline void convertBackSlash(char *str, int strL)
|
||||
{
|
||||
for (int z = 0; z < strL; ++z)
|
||||
@@ -1807,7 +1816,7 @@ static int inline runModificationPass(passes passName, short* projName, short* f
|
||||
runPassesForVisualizer(projName, { passName }, folderName);
|
||||
|
||||
//fill data
|
||||
// newFiles: <<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD> <20><><EFBFBD><EFBFBD><EFBFBD><EFBFBD> <20><><EFBFBD> <20><><EFBFBD>, <20><><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD> <20><><EFBFBD><EFBFBD><EFBFBD>>
|
||||
// newFiles: <имена файлов для мод, содержимое файла>
|
||||
string newFile;
|
||||
|
||||
if (SgFile::switchToFile(outFileName.c_str()) == -1)
|
||||
@@ -2376,7 +2385,7 @@ const wstring Sapfor_RunAnalysis(const char* analysisName_c, const char* options
|
||||
retCode = SPF_GetArrayLinks(context, winHandler, optSh, projSh, result, output, outputMessage);
|
||||
else if (whichRun == "SPF_GetMaxMinBlockDistribution")
|
||||
retCode = SPF_GetMaxMinBlockDistribution(context, winHandler, optSh, projSh, result, output, outputMessage);
|
||||
else if (whichRun == "SPF_<EFBFBD>hangeDirectory") // russian C
|
||||
else if (whichRun == "SPF_ÑhangeDirectory") // russian C
|
||||
{
|
||||
if (options_c == NULL)
|
||||
printInternalError(convertFileName(__FILE__).c_str(), __LINE__);
|
||||
@@ -2499,6 +2508,8 @@ const wstring Sapfor_RunTransformation(const char* transformName_c, const char*
|
||||
retCode = SPF_InsertImplicitNone(context, winHandler, optSh, projSh, fold, output, outputMessage);
|
||||
else if (whichRun == "SPF_RenameIncludes")
|
||||
retCode = SPF_RenameIncludes(context, winHandler, optSh, projSh, fold, output, outputMessage);
|
||||
else if (whichRun == "SPF_InsertPrivateArrayDirectives")
|
||||
retCode = SPF_InsertPrivateArrayDirectives(context, winHandler, optSh, projSh, fold, output, outputMessage);
|
||||
else if (whichRun == "SPF_CreateParallelVariant")
|
||||
{
|
||||
vector<string> splited;
|
||||
|
||||
Reference in New Issue
Block a user