Compare commits
10 Commits
private_ar
...
libpredict
| Author | SHA1 | Date | |
|---|---|---|---|
| 9c3fa362ec | |||
| d51a5e0301 | |||
| 59af017e0b | |||
| 611cd8014c | |||
| 2caaf1ce07 | |||
| 02d471b90f | |||
| ea0ee153ae | |||
| c9134ddddd | |||
| 704646c1a5 | |||
| 4cb9f5070b |
@@ -338,7 +338,9 @@ set(MAIN src/Sapfor.cpp
|
||||
src/Utils/PassManager.h)
|
||||
|
||||
set(PREDICTOR src/Predictor/PredictScheme.cpp
|
||||
src/Predictor/PredictScheme.h)
|
||||
src/Predictor/PredictScheme.h
|
||||
src/Predictor/PredictSchemeWithLibrary.cpp
|
||||
src/Predictor/PredictSchemeWithLibrary.h)
|
||||
|
||||
set(LIBPREDICTOR ${libpred_sources}/cluster.cpp
|
||||
${libpred_sources}/predictor.cpp
|
||||
|
||||
Submodule projects/dvm updated: cdda71deab...7d374b7cc1
Submodule projects/libpredictor updated: d08cb25cc6...7e57477dfa
@@ -122,6 +122,7 @@ static LoopGraph* createDirectiveForLoop(LoopGraph *currentLoop, MapToArray &mai
|
||||
if (found == false)
|
||||
{
|
||||
directive->shadowRenew.push_back(make_pair(key, vector<pair<int, int>>()));
|
||||
directive->shadowRenewCorner.push_back(false);
|
||||
|
||||
const DIST::Array *arrayRef = read;
|
||||
for (int i = 0; i < arrayRef->GetDimSize(); ++i)
|
||||
|
||||
@@ -857,6 +857,11 @@ ParallelDirective::genDirective(File* file, const vector<pair<DIST::Array*, cons
|
||||
shadowRenewShifts[i].resize(shadowRenew[i].second.size());
|
||||
}
|
||||
|
||||
if (shadowRenewCorner.size() == 0)
|
||||
{
|
||||
shadowRenewCorner.resize(shadowRenew.size(), false);
|
||||
}
|
||||
|
||||
string shadowAdd = ", SHADOW_RENEW(";
|
||||
int inserted = 0;
|
||||
|
||||
@@ -899,7 +904,10 @@ ParallelDirective::genDirective(File* file, const vector<pair<DIST::Array*, cons
|
||||
for (auto& elem : genSubscripts(shadowRenew[i1].second, shadowRenewShifts[i1]))
|
||||
newArrayRef->addSubscript(*elem);
|
||||
|
||||
if (shadowRenew[i1].second.size() > 1 && needCorner(shadowArray, shiftsByAccess, loop))
|
||||
bool needCornerFlag = shadowRenew[i1].second.size() > 1 && needCorner(shadowArray, shiftsByAccess, loop);
|
||||
shadowRenewCorner[i1] = needCornerFlag;
|
||||
|
||||
if (needCornerFlag)
|
||||
{
|
||||
SgExpression* tmp = new SgExpression(ARRAY_OP, newArrayRef, NULL, NULL);
|
||||
p->setLhs(*tmp);
|
||||
|
||||
@@ -102,6 +102,7 @@ public:
|
||||
// origin_Name uniqName bounds
|
||||
std::vector<std::pair<std::pair<std::string, std::string>, std::vector<std::pair<int, int>>>> shadowRenew;
|
||||
std::vector<std::vector<std::pair<int, int>>> shadowRenewShifts;
|
||||
std::vector<bool> shadowRenewCorner;
|
||||
|
||||
// origin_Name uniqName bounds
|
||||
std::vector<std::pair<std::pair<std::string, std::string>, std::vector<std::pair<int, int>>>> across;
|
||||
@@ -125,6 +126,7 @@ public:
|
||||
privates = copyFrom.privates;
|
||||
shadowRenew = copyFrom.shadowRenew;
|
||||
shadowRenewShifts = copyFrom.shadowRenewShifts;
|
||||
shadowRenewCorner = copyFrom.shadowRenewCorner;
|
||||
across = copyFrom.across;
|
||||
acrossShifts = copyFrom.acrossShifts;
|
||||
remoteAccess = copyFrom.remoteAccess;
|
||||
@@ -151,6 +153,7 @@ public:
|
||||
on.clear();
|
||||
privates.clear();
|
||||
shadowRenew.clear();
|
||||
shadowRenewCorner.clear();
|
||||
across.clear();
|
||||
acrossShifts.clear();
|
||||
reduction.clear();
|
||||
|
||||
@@ -23,6 +23,7 @@
|
||||
#include "expr_transform.h"
|
||||
#include "../LoopAnalyzer/loop_analyzer.h"
|
||||
#include "CFGraph/CFGraph.h"
|
||||
#include "../Utils/utils.h"
|
||||
|
||||
#include "json.hpp"
|
||||
|
||||
@@ -37,6 +38,109 @@ using SAPFOR::CFG_Settings;
|
||||
|
||||
using json = nlohmann::json;
|
||||
|
||||
void runPredictSchemeOld(SgProject &project,
|
||||
vector<vector<size_t>> &topologies,
|
||||
vector<ParallelRegion*> ¶llelRegions,
|
||||
map<string, vector<LoopGraph*>> &loopGraph,
|
||||
map<string, vector<SpfInterval*>> &intervals,
|
||||
map<string, vector<Messages>> &SPF_messages)
|
||||
{
|
||||
int maxSizeDist = 0;
|
||||
for (int z = 0; z < parallelRegions.size(); ++z)
|
||||
{
|
||||
const DataDirective &dataDirectives = parallelRegions[z]->GetDataDir();
|
||||
const vector<int> ¤tVariant = parallelRegions[z]->GetCurrentVariant();
|
||||
|
||||
auto &tmp = dataDirectives.distrRules;
|
||||
vector<pair<DIST::Array*, const DistrVariant*>> currentVar;
|
||||
for (int z1 = 0; z1 < currentVariant.size(); ++z1)
|
||||
currentVar.push_back(std::make_pair(tmp[z1].first, &tmp[z1].second[currentVariant[z1]]));
|
||||
|
||||
for (auto &elem : currentVar)
|
||||
{
|
||||
DIST::Array *array = elem.first;
|
||||
const DistrVariant *var = elem.second;
|
||||
|
||||
int countBlock = 0;
|
||||
for (int z = 0; z < var->distRule.size(); ++z)
|
||||
if (var->distRule[z] == dist::BLOCK)
|
||||
++countBlock;
|
||||
maxSizeDist = std::max(maxSizeDist, countBlock);
|
||||
}
|
||||
}
|
||||
|
||||
SpfInterval *mainIterval = getMainInterval(&project, intervals, SPF_messages);
|
||||
topologies.clear();
|
||||
if (maxSizeDist)
|
||||
{
|
||||
const int procNum = 8;
|
||||
//TODO:
|
||||
//topologies = getTopologies(procNum, maxSizeDist);
|
||||
throw -10;
|
||||
|
||||
const int countOfTop = topologies.size();
|
||||
if (countOfTop < 0)
|
||||
printInternalError(convertFileName(__FILE__).c_str(), __LINE__);
|
||||
|
||||
for (auto &inter : intervals)
|
||||
initTimeForIntervalTree(countOfTop, inter.second);
|
||||
|
||||
for (int z = 0; z < parallelRegions.size(); ++z)
|
||||
{
|
||||
const DataDirective &dataDirectives = parallelRegions[z]->GetDataDir();
|
||||
const vector<int> ¤tVariant = parallelRegions[z]->GetCurrentVariant();
|
||||
DIST::Arrays<int> &allArrays = parallelRegions[z]->GetAllArraysToModify();
|
||||
|
||||
auto &tmp = dataDirectives.distrRules;
|
||||
vector<pair<DIST::Array*, const DistrVariant*>> currentVar;
|
||||
for (int z1 = 0; z1 < currentVariant.size(); ++z1)
|
||||
currentVar.push_back(std::make_pair(tmp[z1].first, &tmp[z1].second[currentVariant[z1]]));
|
||||
|
||||
map<LoopGraph*, ParallelDirective*> parallelDirs;
|
||||
vector<std::tuple<DIST::Array*, vector<long>, pair<string, int>>> allSingleRemotes;
|
||||
for (int i = project.numberOfFiles() - 1; i >= 0; --i)
|
||||
{
|
||||
SgFile *file = &(project.file(i));
|
||||
auto fountInfo = findAllDirectives(file, getObjectForFileFromMap(file->filename(), loopGraph), parallelRegions[z]->GetId());
|
||||
parallelDirs.insert(fountInfo.begin(), fountInfo.end());
|
||||
|
||||
auto fountRem = findAllSingleRemotes(file, parallelRegions[z]->GetId(), parallelRegions);
|
||||
allSingleRemotes.insert(allSingleRemotes.end(), fountRem.begin(), fountRem.end());
|
||||
}
|
||||
//TODO!
|
||||
//int err = predictScheme(parallelRegions[z], currentVar, allArrays.GetArrays(), parallelDirs, intervals, SPF_messages, allSingleRemotes, maxSizeDist, procNum);
|
||||
/*if (err != 0)
|
||||
internalExit = err;*/
|
||||
}
|
||||
|
||||
vector<SpfInterval*> tmp = { mainIterval };
|
||||
aggregatePredictedTimes(tmp);
|
||||
|
||||
int idx = 0;
|
||||
int best = -1;
|
||||
double bestSpeedUp = 0;
|
||||
for (auto &top : topologies)
|
||||
{
|
||||
string outStr = "";
|
||||
for (auto &elem : top)
|
||||
outStr += std::to_string(elem) + " ";
|
||||
double currS = mainIterval->exec_time / mainIterval->predictedTimes[idx];
|
||||
__spf_print(1, "%d: speed up %f for top. %s\n", idx, currS, outStr.c_str());
|
||||
|
||||
if (best == -1 || bestSpeedUp < currS)
|
||||
{
|
||||
bestSpeedUp = currS;
|
||||
best = idx;
|
||||
}
|
||||
++idx;
|
||||
}
|
||||
__spf_print(1, "best topology %d with speed up %f\n", best, bestSpeedUp);
|
||||
}
|
||||
else
|
||||
for (auto &inter : intervals)
|
||||
initTimeForIntervalTree(0, inter.second);
|
||||
}
|
||||
|
||||
static void fillParallel(SgExpression *exp, ParallelStats &parStats, int &totalScoreComm)
|
||||
{
|
||||
if (exp)
|
||||
|
||||
@@ -60,4 +60,6 @@ public:
|
||||
void processFileToPredict(SgFile *file, PredictorStats &predictorCounts);
|
||||
|
||||
void calculateStatsForPredictor(const std::map<std::string, std::vector<FuncInfo*>>& allFuncInfo, const std::map<std::string, std::map<int, Gcov_info>>& gCovInfo);
|
||||
void parseDvmDirForPredictor(const std::map<std::tuple<int, std::string, std::string>, std::pair<DIST::Array*, DIST::ArrayAccessInfo*>>& declaredArrays, const std::map<std::string, CommonBlock*>& commonBlocks, const std::map<std::string, std::vector<FuncInfo*>>& allFuncInfo, const std::map<std::string, std::map<int, Gcov_info>>& gCovInfo);
|
||||
void parseDvmDirForPredictor(const std::map<std::tuple<int, std::string, std::string>, std::pair<DIST::Array*, DIST::ArrayAccessInfo*>>& declaredArrays, const std::map<std::string, CommonBlock*>& commonBlocks, const std::map<std::string, std::vector<FuncInfo*>>& allFuncInfo, const std::map<std::string, std::map<int, Gcov_info>>& gCovInfo);
|
||||
|
||||
void runPredictSchemeOld(SgProject &project, std::vector<std::vector<size_t>> &topologies, std::vector<ParallelRegion*> ¶llelRegions, std::map<std::string, std::vector<LoopGraph*>> &loopGraph, std::map<std::string, std::vector<SpfInterval*>> &intervals, std::map<std::string, std::vector<Messages>> &SPF_messages);
|
||||
|
||||
470
src/Predictor/PredictSchemeWithLibrary.cpp
Normal file
470
src/Predictor/PredictSchemeWithLibrary.cpp
Normal file
@@ -0,0 +1,470 @@
|
||||
#include "leak_detector.h"
|
||||
|
||||
#include <limits>
|
||||
#include <map>
|
||||
#include <vector>
|
||||
#include <string>
|
||||
#include <tuple>
|
||||
|
||||
#include "dvm.h"
|
||||
#include "PredictSchemeWithLibrary.h"
|
||||
#include "../../projects/libpredictor/include/libpredict/predictor.h"
|
||||
#include "../DirectiveProcessing/directive_parser.h"
|
||||
#include "../Distribution/DvmhDirective.h"
|
||||
#include "../ParallelizationRegions/ParRegions.h"
|
||||
#include "../GraphLoop/graph_loops_func.h"
|
||||
#include "../Utils/errors.h"
|
||||
#include "../Utils/utils.h"
|
||||
|
||||
using std::map;
|
||||
using std::pair;
|
||||
using std::string;
|
||||
using std::tuple;
|
||||
using std::vector;
|
||||
|
||||
map<size_t, size_t> createTemplateIdMapping(const vector<ParallelRegion*>& parallelRegions)
|
||||
{
|
||||
size_t maxArrayId = 0;
|
||||
for (int z = 0; z < parallelRegions.size(); ++z) {
|
||||
const DataDirective& dataDirectives = parallelRegions[z]->GetDataDir();
|
||||
|
||||
for (const auto& distrRule : dataDirectives.distrRules) {
|
||||
if (distrRule.first && !distrRule.first->IsTemplate()) {
|
||||
maxArrayId = std::max(maxArrayId, (size_t)distrRule.first->GetId());
|
||||
}
|
||||
}
|
||||
|
||||
for (const auto& alignRule : dataDirectives.alignRules) {
|
||||
if (alignRule.alignArray && !alignRule.alignArray->IsTemplate()) {
|
||||
maxArrayId = std::max(maxArrayId, (size_t)alignRule.alignArray->GetId());
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
map<size_t, size_t> templateIdMapping;
|
||||
size_t nextTemplateId = maxArrayId + 1;
|
||||
for (int z = 0; z < parallelRegions.size(); ++z) {
|
||||
const DataDirective& dataDirectives = parallelRegions[z]->GetDataDir();
|
||||
|
||||
for (const auto& distrRule : dataDirectives.distrRules) {
|
||||
if (distrRule.first && distrRule.first->IsTemplate()) {
|
||||
size_t originalId = distrRule.first->GetId();
|
||||
if (templateIdMapping.find(originalId) == templateIdMapping.end()) {
|
||||
templateIdMapping[originalId] = nextTemplateId++;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
for (const auto& alignRule : dataDirectives.alignRules) {
|
||||
if (alignRule.alignWith && alignRule.alignWith->IsTemplate()) {
|
||||
size_t originalId = alignRule.alignWith->GetId();
|
||||
if (templateIdMapping.find(originalId) == templateIdMapping.end()) {
|
||||
templateIdMapping[originalId] = nextTemplateId++;
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
return templateIdMapping;
|
||||
}
|
||||
|
||||
PrecomputedLibpredictParams precomputeLibpredictParams(
|
||||
SgProject& project,
|
||||
const vector<ParallelRegion*>& parallelRegions,
|
||||
const map<string, vector<LoopGraph*>>& loopGraph,
|
||||
const map<size_t, size_t>& templateIdMapping)
|
||||
{
|
||||
PrecomputedLibpredictParams result;
|
||||
|
||||
// distribute and align from parallelRegions
|
||||
for (int z = 0; z < parallelRegions.size(); ++z) {
|
||||
const DataDirective& dataDirectives = parallelRegions[z]->GetDataDir();
|
||||
const vector<int>& currentVariant = parallelRegions[z]->GetCurrentVariant();
|
||||
const DIST::Arrays<int>& allArrays = parallelRegions[z]->GetAllArrays();
|
||||
|
||||
auto& tmp = dataDirectives.distrRules;
|
||||
vector<pair<DIST::Array*, const DistrVariant*>> currentVar;
|
||||
for (int z1 = 0; z1 < currentVariant.size(); ++z1) {
|
||||
currentVar.push_back(std::make_pair(tmp[z1].first, &tmp[z1].second[currentVariant[z1]]));
|
||||
}
|
||||
|
||||
// distribute
|
||||
for (const auto& distrRule : currentVar) {
|
||||
DIST::Array* array = distrRule.first;
|
||||
const DistrVariant* variant = distrRule.second;
|
||||
|
||||
if (array && variant && !array->IsNotDistribute()) {
|
||||
PrecomputedDistributeParams params;
|
||||
|
||||
size_t originalId = array->GetId();
|
||||
params.arrayId = originalId;
|
||||
|
||||
if (array->IsTemplate()) {
|
||||
auto it = templateIdMapping.find(originalId);
|
||||
if (it != templateIdMapping.end()) {
|
||||
params.arrayId = it->second;
|
||||
}
|
||||
}
|
||||
|
||||
params.elemSize = array->GetTypeSize();
|
||||
params.array = array;
|
||||
|
||||
const auto& arraySizes = array->GetSizes();
|
||||
for (int dim = 0; dim < array->GetDimSize(); ++dim) {
|
||||
size_t dimSize = arraySizes[dim].second - arraySizes[dim].first + 1;
|
||||
|
||||
if (dim < variant->distRule.size() && variant->distRule[dim] == dist::BLOCK) {
|
||||
params.axisDistributions.emplace_back(dimSize, libpredict::TypeDistribute::BLOCK);
|
||||
} else {
|
||||
params.axisDistributions.emplace_back(dimSize, libpredict::TypeDistribute::NONE);
|
||||
}
|
||||
}
|
||||
|
||||
const auto& shadowSpec = array->GetShadowSpec();
|
||||
for (int dim = 0; dim < shadowSpec.size() && dim < array->GetDimSize(); ++dim) {
|
||||
if (dim < variant->distRule.size() && variant->distRule[dim] == dist::BLOCK) {
|
||||
params.shadowEdges.emplace_back(shadowSpec[dim].first, shadowSpec[dim].second);
|
||||
}
|
||||
}
|
||||
|
||||
result.distributeParams.push_back(params);
|
||||
}
|
||||
}
|
||||
|
||||
// align
|
||||
for (const auto& alignRule : dataDirectives.alignRules) {
|
||||
DIST::Array* alignArray = alignRule.alignArray;
|
||||
DIST::Array* alignWithArray = alignRule.alignWith;
|
||||
|
||||
if (alignArray && alignWithArray && !alignArray->IsNotDistribute()) {
|
||||
PrecomputedAlignParams params;
|
||||
|
||||
params.arrayId = alignArray->GetId();
|
||||
size_t originalDistributedArrayId = alignWithArray->GetId();
|
||||
params.distributedArrayId = originalDistributedArrayId;
|
||||
|
||||
if (alignWithArray->IsTemplate()) {
|
||||
auto it = templateIdMapping.find(originalDistributedArrayId);
|
||||
if (it != templateIdMapping.end()) {
|
||||
params.distributedArrayId = it->second;
|
||||
}
|
||||
}
|
||||
|
||||
params.elemSize = alignArray->GetTypeSize();
|
||||
params.alignArray = alignArray;
|
||||
params.alignWithArray = alignWithArray;
|
||||
|
||||
const auto& arraySizes = alignArray->GetSizes();
|
||||
for (int dim = 0; dim < alignArray->GetDimSize(); ++dim) {
|
||||
size_t dimSize = arraySizes[dim].second - arraySizes[dim].first + 1;
|
||||
params.dimensions.push_back(dimSize);
|
||||
}
|
||||
|
||||
for (int dim = 0; dim < alignWithArray->GetDimSize(); ++dim) {
|
||||
bool found = false;
|
||||
for (int i = 0; i < alignRule.alignRuleWith.size(); ++i) {
|
||||
const auto& ruleWith = alignRule.alignRuleWith[i];
|
||||
if (ruleWith.first == dim) {
|
||||
const auto& rule = ruleWith.second;
|
||||
if (rule.first == 0) {
|
||||
// constant
|
||||
params.distributionExpressions.emplace_back(rule.second);
|
||||
} else {
|
||||
// linear expression a * I + b
|
||||
params.distributionExpressions.emplace_back(i, rule.first, rule.second);
|
||||
}
|
||||
found = true;
|
||||
break;
|
||||
}
|
||||
}
|
||||
if (!found) {
|
||||
// There is no rule for this measurement
|
||||
params.distributionExpressions.emplace_back();
|
||||
}
|
||||
}
|
||||
|
||||
const auto& shadowSpec = alignArray->GetShadowSpec();
|
||||
for (int dim = 0; dim < shadowSpec.size() && dim < alignArray->GetDimSize(); ++dim) {
|
||||
params.shadowEdges.emplace_back(shadowSpec[dim].first, shadowSpec[dim].second);
|
||||
}
|
||||
|
||||
result.alignParams.push_back(params);
|
||||
}
|
||||
}
|
||||
|
||||
// shadow_renew
|
||||
map<LoopGraph*, ParallelDirective*> parallelDirs;
|
||||
for (int i = project.numberOfFiles() - 1; i >= 0; --i) {
|
||||
SgFile* file = &(project.file(i));
|
||||
auto fountInfo = findAllDirectives(
|
||||
file,
|
||||
getObjectForFileFromMap(file->filename(), const_cast<map<string, vector<LoopGraph*>>&>(loopGraph)),
|
||||
parallelRegions[z]->GetId());
|
||||
parallelDirs.insert(fountInfo.begin(), fountInfo.end());
|
||||
}
|
||||
|
||||
for (auto& dirPair : parallelDirs) {
|
||||
LoopGraph* loopPtr = dirPair.first;
|
||||
ParallelDirective* directive = dirPair.second;
|
||||
|
||||
if (directive && !directive->shadowRenew.empty()) {
|
||||
for (size_t shadowIdx = 0; shadowIdx < directive->shadowRenew.size(); ++shadowIdx) {
|
||||
const auto& shadowRenewItem = directive->shadowRenew[shadowIdx];
|
||||
const string& arrayName = shadowRenewItem.first.second; // uniqName
|
||||
const vector<pair<int, int>>& bounds = shadowRenewItem.second;
|
||||
|
||||
DIST::Array* shadowArray = allArrays.GetArrayByName(arrayName);
|
||||
if (shadowArray == NULL) {
|
||||
continue;
|
||||
}
|
||||
|
||||
if (shadowArray && !shadowArray->IsNotDistribute()) {
|
||||
PrecomputedShadowRenewParams params;
|
||||
|
||||
params.arrayId = shadowArray->GetId();
|
||||
params.shadowArray = shadowArray;
|
||||
|
||||
for (const auto& bound : bounds) {
|
||||
params.shadow_renew.emplace_back(static_cast<size_t>(bound.first),
|
||||
static_cast<size_t>(bound.second));
|
||||
}
|
||||
|
||||
params.corner = directive->shadowRenewCorner[shadowIdx];
|
||||
params.number_loop_iterations = loopPtr ? static_cast<size_t>(loopPtr->countOfIters) : 1;
|
||||
|
||||
result.shadowRenewParams.push_back(params);
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
return result;
|
||||
}
|
||||
|
||||
double runLibpredictCalc(const vector<size_t>& topology,
|
||||
const string& clusterConfStr,
|
||||
const PrecomputedLibpredictParams& precomputedParams,
|
||||
map<string, vector<Messages>>& SPF_messages)
|
||||
{
|
||||
libpredict::RetInitGrid retInitGrid = libpredict::InitGrid(topology[0], topology[1], topology[2], topology[3]);
|
||||
|
||||
if (retInitGrid != libpredict::INIT_GRID_SUCCESS) {
|
||||
__spf_print(1, "ERROR: Failed to initialize libpredict grid with topology: %zu %zu %zu %zu, return code: %d\n",
|
||||
topology[0], topology[1], topology[2], topology[3], (int)retInitGrid);
|
||||
|
||||
std::wstring messageR, messageE;
|
||||
__spf_printToLongBuf(messageE, L"Failed to initialize libpredict grid with topology: %zu %zu %zu %zu, return code: %d",
|
||||
topology[0], topology[1], topology[2], topology[3], (int)retInitGrid);
|
||||
__spf_printToLongBuf(messageR, R207);
|
||||
getObjectForFileFromMap(clusterConfStr.c_str(), SPF_messages).push_back(Messages(ERROR, 1, messageR, messageE, 1064));
|
||||
return -1;
|
||||
}
|
||||
|
||||
// distribute
|
||||
for (const auto& params : precomputedParams.distributeParams) {
|
||||
libpredict::RetDistribute retDistribute = libpredict::Distribute(
|
||||
params.arrayId, params.elemSize, params.axisDistributions, params.shadowEdges);
|
||||
|
||||
if (retDistribute != libpredict::DISTRIBUTE_SUCCESS) {
|
||||
__spf_print(1, "ERROR: Failed to distribute array '%s' (id=%zu) with libpredict, return code: %d\n",
|
||||
params.array->GetShortName().c_str(), params.arrayId, (int)retDistribute);
|
||||
|
||||
std::wstring messageR, messageE;
|
||||
__spf_printToLongBuf(messageE, L"Failed to distribute array '%s' with libpredict, return code: %d",
|
||||
to_wstring(params.array->GetShortName()).c_str(), (int)retDistribute);
|
||||
__spf_printToLongBuf(messageR, R208);
|
||||
getObjectForFileFromMap(params.array->GetDeclInfo().begin()->first.c_str(), SPF_messages).push_back(Messages(ERROR, params.array->GetDeclInfo().begin()->second, messageR, messageE, 1065));
|
||||
}
|
||||
}
|
||||
|
||||
// align
|
||||
for (const auto& params : precomputedParams.alignParams) {
|
||||
libpredict::RetAlign retAlign = libpredict::Align(
|
||||
params.arrayId, params.distributedArrayId, params.elemSize,
|
||||
params.dimensions, params.distributionExpressions, params.shadowEdges);
|
||||
|
||||
if (retAlign != libpredict::ALIGN_SUCCESS) {
|
||||
__spf_print(1, "ERROR: Failed to align array '%s' (id=%zu) with array '%s' (id=%zu), return code: %d\n",
|
||||
params.alignArray->GetShortName().c_str(), params.arrayId,
|
||||
params.alignWithArray->GetShortName().c_str(), params.distributedArrayId, (int)retAlign);
|
||||
|
||||
std::wstring messageR, messageE;
|
||||
__spf_printToLongBuf(messageE, L"Failed to align array '%s' with array '%s' using libpredict, return code: %d",
|
||||
to_wstring(params.alignArray->GetShortName()).c_str(),
|
||||
to_wstring(params.alignWithArray->GetShortName()).c_str(), (int)retAlign);
|
||||
__spf_printToLongBuf(messageR, R209);
|
||||
getObjectForFileFromMap(params.alignArray->GetDeclInfo().begin()->first.c_str(), SPF_messages).push_back(Messages(ERROR, params.alignArray->GetDeclInfo().begin()->second, messageR, messageE, 1066));
|
||||
}
|
||||
}
|
||||
|
||||
// shadow_renew
|
||||
for (const auto& params : precomputedParams.shadowRenewParams) {
|
||||
libpredict::RetShadowRenew retShadowRenew = libpredict::ShadowRenew(
|
||||
params.arrayId, params.shadow_renew, params.corner, params.number_loop_iterations);
|
||||
|
||||
if (retShadowRenew != libpredict::SHADOW_RENEW_SUCCESS) {
|
||||
__spf_print(1, "ERROR: Failed to process shadow_renew for array '%s' (id=%zu), return code: %d\n",
|
||||
params.shadowArray->GetShortName().c_str(), params.arrayId, (int)retShadowRenew);
|
||||
|
||||
std::wstring messageR, messageE;
|
||||
__spf_printToLongBuf(messageE, L"Failed to process shadow_renew for array '%s' with libpredict, return code: %d",
|
||||
to_wstring(params.shadowArray->GetShortName()).c_str(), (int)retShadowRenew);
|
||||
__spf_printToLongBuf(messageR, R210);
|
||||
getObjectForFileFromMap(params.shadowArray->GetDeclInfo().begin()->first.c_str(), SPF_messages).push_back(Messages(ERROR, params.shadowArray->GetDeclInfo().begin()->second, messageR, messageE, 1067));
|
||||
}
|
||||
}
|
||||
|
||||
return libpredict::GetTime();
|
||||
}
|
||||
|
||||
void runPredictScheme(SgProject& project,
|
||||
const vector<ParallelRegion*>& parallelRegions,
|
||||
map<string, vector<LoopGraph*>>& loopGraph,
|
||||
map<string, vector<Messages>>& SPF_messages)
|
||||
{
|
||||
// calculating maximum dimension of distribution
|
||||
int maxSizeDist = 0;
|
||||
for (int z = 0; z < parallelRegions.size(); ++z) {
|
||||
const DataDirective& dataDirectives = parallelRegions[z]->GetDataDir();
|
||||
const vector<int>& currentVariant = parallelRegions[z]->GetCurrentVariant();
|
||||
|
||||
auto& tmp = dataDirectives.distrRules;
|
||||
vector<const DistrVariant*> currentVar;
|
||||
for (int z1 = 0; z1 < currentVariant.size(); ++z1) {
|
||||
currentVar.push_back(&tmp[z1].second[currentVariant[z1]]);
|
||||
}
|
||||
|
||||
for (auto var : currentVar) {
|
||||
int countBlock = 0;
|
||||
for (int z = 0; z < var->distRule.size(); ++z) {
|
||||
if (var->distRule[z] == dist::BLOCK) {
|
||||
++countBlock;
|
||||
}
|
||||
}
|
||||
maxSizeDist = std::max(maxSizeDist, countBlock);
|
||||
}
|
||||
}
|
||||
|
||||
// calculating name of a cluster configuration file
|
||||
string clusterConfStr;
|
||||
if (project.numberOfFiles() > 0) {
|
||||
string firstFilePath = project.fileName(0);
|
||||
|
||||
size_t lastSlash = firstFilePath.find_last_of("/\\");
|
||||
clusterConfStr = firstFilePath.substr(0, lastSlash + 1) + "cluster.conf";
|
||||
}
|
||||
|
||||
// creating template ID display to avoid conflicts
|
||||
map<size_t, size_t> templateIdMapping = createTemplateIdMapping(parallelRegions);
|
||||
|
||||
// Precomputing parameters of directive functions from libpredict
|
||||
PrecomputedLibpredictParams precomputedParams = precomputeLibpredictParams(
|
||||
project, parallelRegions, loopGraph, templateIdMapping);
|
||||
|
||||
// iterating through topologies and processes_per_processor to find most optimal one
|
||||
if (maxSizeDist) {
|
||||
if (maxSizeDist > 4) {
|
||||
maxSizeDist = 4;
|
||||
}
|
||||
|
||||
// Initialize cluster
|
||||
int maxCoresCount = 0;
|
||||
libpredict::RetInitCluster retInitCluster = libpredict::InitCluster(clusterConfStr, maxCoresCount);
|
||||
|
||||
if (retInitCluster != libpredict::INIT_CLUSTER_SUCCESS) {
|
||||
__spf_print(1, "ERROR: Failed to initialize libpredict cluster with config: %s, return code: %d\n", clusterConfStr.c_str(), (int)retInitCluster);
|
||||
|
||||
std::wstring messageR, messageE;
|
||||
__spf_printToLongBuf(messageE, L"Failed to initialize libpredict cluster with config: %s, return code: %d",
|
||||
to_wstring(clusterConfStr).c_str(), (int)retInitCluster);
|
||||
__spf_printToLongBuf(messageR, R206);
|
||||
getObjectForFileFromMap(clusterConfStr.c_str(), SPF_messages).push_back(Messages(ERROR, 1, messageR, messageE, 1063));
|
||||
return;
|
||||
}
|
||||
|
||||
vector<size_t> bestTopology;
|
||||
double bestTime = std::numeric_limits<double>::max();
|
||||
size_t bestProcessesPerProcessor = 0;
|
||||
int prevProcCount = -1;
|
||||
|
||||
for (size_t processes_per_processor = 1; processes_per_processor <= maxCoresCount; ++processes_per_processor) {
|
||||
int procCount = 0;
|
||||
libpredict::RetInitMapping retInitMapping = libpredict::InitMapping(processes_per_processor, procCount);
|
||||
|
||||
if (retInitMapping != libpredict::INIT_MAPPING_SUCCESS) {
|
||||
__spf_print(1, "ERROR: Failed to initialize libpredict mapping with processes_per_processor: %zu, return code: %d\n",
|
||||
processes_per_processor, (int)retInitMapping);
|
||||
|
||||
std::wstring messageR, messageE;
|
||||
__spf_printToLongBuf(messageE, L"Failed to initialize libpredict mapping with processes_per_processor: %zu, return code: %d",
|
||||
processes_per_processor, (int)retInitMapping);
|
||||
__spf_printToLongBuf(messageR, R211);
|
||||
getObjectForFileFromMap(clusterConfStr.c_str(), SPF_messages).push_back(Messages(ERROR, 1, messageR, messageE, 1068));
|
||||
continue;
|
||||
}
|
||||
|
||||
if (procCount == 0) {
|
||||
break; // No more processors available
|
||||
}
|
||||
|
||||
if (procCount == prevProcCount) {
|
||||
continue; // Skip with procCount value unchanged for different processes_per_processor
|
||||
}
|
||||
|
||||
prevProcCount = procCount;
|
||||
__spf_print(1, "Calculate with processes_per_processor=%zu, procCount=%d\n", processes_per_processor, procCount);
|
||||
|
||||
for (size_t n1 = 2; n1 <= procCount; ++n1) {
|
||||
for (size_t n2 = 1; n2 <= n1 && n1 * n2 <= procCount; ++n2) {
|
||||
if (n2 != 1 && maxSizeDist < 2 || n2 == 1 && maxSizeDist == 2) {
|
||||
continue;
|
||||
}
|
||||
|
||||
for (size_t n3 = 1; n3 <= n2 && n1 * n2 * n3 <= procCount; ++n3) {
|
||||
if (n3 != 1 && maxSizeDist < 3 || n3 == 1 && maxSizeDist == 3) {
|
||||
continue;
|
||||
}
|
||||
|
||||
for (size_t n4 = 1; n4 <= n3 && n1 * n2 * n3 * n4 <= procCount; ++n4) {
|
||||
if (n4 != 1 && maxSizeDist < 4 || n4 == 1 && maxSizeDist == 4) {
|
||||
continue;
|
||||
}
|
||||
|
||||
vector<size_t> topology = {n1, n2, n3, n4};
|
||||
double currTime = runLibpredictCalc(topology, clusterConfStr, precomputedParams, SPF_messages);
|
||||
|
||||
string outStr = "";
|
||||
for (const auto& elem : topology) {
|
||||
outStr += std::to_string(elem) + " ";
|
||||
}
|
||||
__spf_print(1, "topology %s has time %f\n", outStr.c_str(), currTime);
|
||||
|
||||
if (currTime == -1) {
|
||||
continue;
|
||||
}
|
||||
|
||||
if (currTime < bestTime) {
|
||||
bestTime = currTime;
|
||||
bestTopology = topology;
|
||||
bestProcessesPerProcessor = processes_per_processor;
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
if (!bestTopology.empty()) {
|
||||
string outStr;
|
||||
for (const auto& elem : bestTopology) {
|
||||
outStr += std::to_string(elem) + " ";
|
||||
}
|
||||
|
||||
__spf_print(1, "best topology %s with time %f (processes_per_processor=%zu)\n",
|
||||
outStr.c_str(), bestTime, bestProcessesPerProcessor);
|
||||
}
|
||||
} else {
|
||||
__spf_print(1, "impossible to calculate best topology: project does not contain distribution directives\n");
|
||||
}
|
||||
}
|
||||
56
src/Predictor/PredictSchemeWithLibrary.h
Normal file
56
src/Predictor/PredictSchemeWithLibrary.h
Normal file
@@ -0,0 +1,56 @@
|
||||
#pragma once
|
||||
#include <vector>
|
||||
#include <map>
|
||||
#include <string>
|
||||
#include "dvm.h"
|
||||
#include "graph_calls.h"
|
||||
#include "../../projects/libpredictor/include/libpredict/predictor.h"
|
||||
|
||||
struct PrecomputedDistributeParams {
|
||||
size_t arrayId;
|
||||
size_t elemSize;
|
||||
std::vector<libpredict::DistributeAxisRule> axisDistributions;
|
||||
std::vector<std::pair<size_t, size_t>> shadowEdges;
|
||||
DIST::Array* array;
|
||||
};
|
||||
|
||||
struct PrecomputedAlignParams {
|
||||
size_t arrayId;
|
||||
size_t distributedArrayId;
|
||||
size_t elemSize;
|
||||
std::vector<size_t> dimensions;
|
||||
std::vector<libpredict::AlignDisplay> distributionExpressions;
|
||||
std::vector<std::pair<size_t, size_t>> shadowEdges;
|
||||
DIST::Array* alignArray;
|
||||
DIST::Array* alignWithArray;
|
||||
};
|
||||
|
||||
struct PrecomputedShadowRenewParams {
|
||||
size_t arrayId;
|
||||
std::vector<std::pair<size_t, size_t>> shadow_renew;
|
||||
bool corner;
|
||||
size_t number_loop_iterations;
|
||||
DIST::Array* shadowArray;
|
||||
};
|
||||
|
||||
struct PrecomputedLibpredictParams {
|
||||
std::vector<PrecomputedDistributeParams> distributeParams;
|
||||
std::vector<PrecomputedAlignParams> alignParams;
|
||||
std::vector<PrecomputedShadowRenewParams> shadowRenewParams;
|
||||
};
|
||||
|
||||
PrecomputedLibpredictParams precomputeLibpredictParams(
|
||||
SgProject& project,
|
||||
const std::vector<ParallelRegion*>& parallelRegions,
|
||||
const std::map<std::string, std::vector<LoopGraph*>>& loopGraph,
|
||||
const std::map<size_t, size_t>& templateIdMapping);
|
||||
|
||||
void runPredictScheme(SgProject& project,
|
||||
const std::vector<ParallelRegion*>& parallelRegions,
|
||||
std::map<std::string, std::vector<LoopGraph*>>& loopGraph,
|
||||
std::map<std::string, std::vector<Messages>>& SPF_messages);
|
||||
|
||||
double runLibpredictCalc(const std::vector<size_t>& topology,
|
||||
const std::string& clusterConfStr,
|
||||
const PrecomputedLibpredictParams& precomputedParams,
|
||||
std::map<std::string, std::vector<Messages>>& SPF_messages);
|
||||
@@ -1,4 +1,3 @@
|
||||
#include <algorithm>
|
||||
#include <map>
|
||||
#include <unordered_set>
|
||||
#include <unordered_map>
|
||||
@@ -17,8 +16,6 @@
|
||||
|
||||
using namespace std;
|
||||
|
||||
static unordered_set<Region*> collapsed;
|
||||
|
||||
static void RemoveEmptyPoints(ArrayAccessingIndexes& container)
|
||||
{
|
||||
ArrayAccessingIndexes resultContainer;
|
||||
@@ -52,81 +49,41 @@ static void Collapse(Region* region)
|
||||
if (region->getBasickBlocks().empty())
|
||||
return;
|
||||
|
||||
bool firstRegion = true;
|
||||
for (Region* basickBlock : region->getBasickBlocks())
|
||||
for (auto& [arrayName, arrayRanges] : region->getHeader()->array_out)
|
||||
{
|
||||
if (basickBlock->getNextRegions().empty())
|
||||
for (Region* byBlock : region->getBasickBlocks())
|
||||
{
|
||||
if (firstRegion)
|
||||
{
|
||||
region->array_def = basickBlock->array_out;
|
||||
firstRegion = false;
|
||||
}
|
||||
else
|
||||
{
|
||||
unordered_set<string> toErease;
|
||||
for (auto& [arrayName, arrayRanges] : region->array_def)
|
||||
{
|
||||
if (basickBlock->array_out.find(arrayName) != basickBlock->array_out.end())
|
||||
arrayRanges = arrayRanges.Intersect(basickBlock->array_out[arrayName]);
|
||||
else
|
||||
{
|
||||
arrayRanges = AccessingSet();
|
||||
toErease.insert(arrayName);
|
||||
}
|
||||
}
|
||||
for (string arrayName : toErease)
|
||||
region->array_def.erase(arrayName);
|
||||
}
|
||||
AccessingSet intersection = byBlock->array_def[arrayName].Intersect(arrayRanges);
|
||||
region->array_def[arrayName] = region->array_def[arrayName].Union(intersection);
|
||||
}
|
||||
}
|
||||
|
||||
RegionInstruction instruction;
|
||||
instruction.def = move(region->array_def);
|
||||
|
||||
|
||||
for (auto& byBlock : region->getBasickBlocks())
|
||||
for (auto& byBlock : region->getBasickBlocks())
|
||||
{
|
||||
for (auto& instruction : byBlock->instructions)
|
||||
for (auto& [arrayName, arrayRanges] : byBlock->array_use)
|
||||
{
|
||||
for (auto& [arrayName, _] : instruction.use)
|
||||
{
|
||||
AccessingSet diff = instruction.use[arrayName].Diff(instruction.in[arrayName]);
|
||||
region->array_use[arrayName] = region->array_use[arrayName].Union(diff);
|
||||
}
|
||||
AccessingSet diff = byBlock->array_use[arrayName].Diff(byBlock->array_in[arrayName]);
|
||||
region->array_use[arrayName] = region->array_use[arrayName].Union(diff);
|
||||
}
|
||||
}
|
||||
|
||||
ArrayAccessingIndexes useUnionB;
|
||||
ArrayAccessingIndexes useUnion;
|
||||
for (auto& byBlock : region->getBasickBlocks())
|
||||
for (auto& instruction : byBlock->instructions)
|
||||
for (auto& [arrayName, _] : instruction.use)
|
||||
useUnionB[arrayName] = useUnionB[arrayName].Union(instruction.use[arrayName]);
|
||||
for (auto& [arrayName, arrayRanges] : byBlock->array_use)
|
||||
useUnion[arrayName] = useUnion[arrayName].Union(byBlock->array_use[arrayName]);
|
||||
|
||||
for (auto& [arrayName, _] : useUnionB)
|
||||
region->array_priv[arrayName] = useUnionB[arrayName].Diff(region->array_use[arrayName]);
|
||||
|
||||
instruction.use = move(region->array_use);
|
||||
|
||||
for (Region* prevBlock : region->getHeader()->getPrevRegions())
|
||||
{
|
||||
region->array_priv = region->array_use;
|
||||
|
||||
for (Region* prevBlock : region->getHeader()->getPrevRegions())
|
||||
prevBlock->replaceInNextRegions(region, region->getHeader());
|
||||
region->addPrevRegion(prevBlock);
|
||||
}
|
||||
|
||||
|
||||
for (Region* nextBlock : region->getHeader()->getNextRegions())
|
||||
{
|
||||
nextBlock->replaceInPrevRegions(region, region->getHeader());
|
||||
region->addNextRegion(nextBlock);
|
||||
}
|
||||
region->instructions.push_back(instruction);
|
||||
|
||||
}
|
||||
|
||||
static void SolveDataFlowIteratively(Region* DFG)
|
||||
static void SolveDataFlowIteratively(Region* DFG)
|
||||
{
|
||||
auto blocks = DFG->getBasickBlocks();
|
||||
std::unordered_set<Region*> worklist(blocks.begin(), blocks.end());
|
||||
unordered_set<Region*> worklist(DFG->getBasickBlocks());
|
||||
do
|
||||
{
|
||||
Region* b = *worklist.begin();
|
||||
@@ -144,13 +101,13 @@ static void SolveDataFlowIteratively(Region* DFG)
|
||||
if (prevBlock->array_out.empty())
|
||||
{
|
||||
newIn.clear();
|
||||
break;
|
||||
continue;
|
||||
}
|
||||
|
||||
for (const auto& [arrayName, accessSet] : prevBlock->array_out)
|
||||
{
|
||||
if (newIn.find(arrayName) != newIn.end())
|
||||
newIn[arrayName] = newIn[arrayName].Intersect(accessSet);
|
||||
newIn[arrayName] = newIn[arrayName].Intersect(accessSet);
|
||||
else
|
||||
newIn[arrayName] = AccessingSet();
|
||||
}
|
||||
@@ -160,7 +117,7 @@ static void SolveDataFlowIteratively(Region* DFG)
|
||||
b->array_in = move(newIn);
|
||||
ArrayAccessingIndexes newOut;
|
||||
|
||||
if (b->array_def.empty())
|
||||
if (b->array_def.empty())
|
||||
newOut = b->array_in;
|
||||
else if (b->array_in.empty())
|
||||
newOut = b->array_def;
|
||||
@@ -176,157 +133,25 @@ static void SolveDataFlowIteratively(Region* DFG)
|
||||
}
|
||||
|
||||
/* can not differ */
|
||||
if (newOut != b->array_out)
|
||||
if (newOut != b->array_out)
|
||||
b->array_out = newOut;
|
||||
else
|
||||
worklist.erase(b);
|
||||
} while (!worklist.empty());
|
||||
}
|
||||
|
||||
static void SolveForBasickBlock(Region* block)
|
||||
{
|
||||
ArrayAccessingIndexes newIn;
|
||||
bool flagFirst = true;
|
||||
for (Region* prevBlock : block->getPrevRegions())
|
||||
{
|
||||
if (flagFirst)
|
||||
{
|
||||
newIn = prevBlock->array_out;
|
||||
flagFirst = false;
|
||||
}
|
||||
else
|
||||
{
|
||||
if (prevBlock->array_out.empty())
|
||||
{
|
||||
newIn.clear();
|
||||
break;
|
||||
}
|
||||
|
||||
for (const auto& [arrayName, accessSet] : prevBlock->array_out)
|
||||
{
|
||||
if (newIn.find(arrayName) != newIn.end())
|
||||
newIn[arrayName] = newIn[arrayName].Intersect(accessSet);
|
||||
else
|
||||
newIn[arrayName] = AccessingSet();
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
if (block->instructions.empty())
|
||||
block->instructions.push_back(RegionInstruction());
|
||||
|
||||
block->instructions[0].in = move(newIn);
|
||||
|
||||
for (int i = 0; i < block->instructions.size(); i++)
|
||||
{
|
||||
auto& instruction = block->instructions[i];
|
||||
|
||||
if (i > 0)
|
||||
instruction.in = block->instructions[i - 1].out;
|
||||
|
||||
ArrayAccessingIndexes newOut;
|
||||
if (instruction.def.empty())
|
||||
newOut = instruction.in;
|
||||
else if (instruction.in.empty())
|
||||
newOut = instruction.def;
|
||||
else
|
||||
{
|
||||
for (auto& [arrayName, accessSet] : instruction.def)
|
||||
{
|
||||
if (instruction.in.find(arrayName) != instruction.in.end())
|
||||
newOut[arrayName] = instruction.def[arrayName].Union(instruction.in[arrayName]);
|
||||
else
|
||||
newOut[arrayName] = accessSet;
|
||||
}
|
||||
for (auto& [arrayName, accessSet] : instruction.in)
|
||||
{
|
||||
if (newOut.find(arrayName) == newOut.end())
|
||||
{
|
||||
newOut[arrayName] = accessSet;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
instruction.out = move(newOut);
|
||||
}
|
||||
if (!block->instructions.empty())
|
||||
block->array_out = block->instructions.back().out;
|
||||
}
|
||||
|
||||
static void SolveDataFlowTopologically(Region* DFG)
|
||||
{
|
||||
for (Region* b : DFG->getBasickBlocks())
|
||||
{
|
||||
collapsed.insert(b);
|
||||
SolveForBasickBlock(b);
|
||||
}
|
||||
}
|
||||
while (!worklist.empty());
|
||||
}
|
||||
|
||||
static void SolveDataFlow(Region* DFG)
|
||||
{
|
||||
if (!DFG)
|
||||
return;
|
||||
|
||||
SolveDataFlowIteratively(DFG);
|
||||
for (Region* subRegion : DFG->getSubRegions())
|
||||
{
|
||||
SolveDataFlow(subRegion);
|
||||
DFG->addBasickBlocks(subRegion);
|
||||
}
|
||||
vector<Region*>& blocks = DFG->getBasickBlocks();
|
||||
auto pos = remove_if(blocks.begin(), blocks.end(), [](Region* r) { return collapsed.find(r) != collapsed.end(); });
|
||||
blocks.erase(pos, blocks.end());
|
||||
TopologySort(DFG->getBasickBlocks(), DFG->getHeader());
|
||||
SolveDataFlowTopologically(DFG);
|
||||
Collapse(DFG);
|
||||
}
|
||||
|
||||
static bool getArrayDeclaredDimensions(SgArrayRefExp* arrayRef, vector<uint64_t>& declaredDims)
|
||||
{
|
||||
declaredDims.clear();
|
||||
if (!arrayRef || !arrayRef->symbol() || !isSgArrayType(arrayRef->symbol()->type()))
|
||||
return false;
|
||||
SgArrayType* arrayType = (SgArrayType*)arrayRef->symbol()->type();
|
||||
int dimCount = arrayType->dimension();
|
||||
for (int i = 0; i < dimCount; i++)
|
||||
{
|
||||
SgExpression* sizeExpr = arrayType->sizeInDim(i);
|
||||
SgConstantSymb* constValSymb = isSgConstantSymb(sizeExpr->symbol());
|
||||
string strDimLength;
|
||||
if (sizeExpr && sizeExpr->variant() == INT_VAL)
|
||||
strDimLength = sizeExpr->unparse();
|
||||
else if (constValSymb)
|
||||
strDimLength = constValSymb->constantValue()->unparse();
|
||||
else
|
||||
return false;
|
||||
|
||||
if (strDimLength == "0")
|
||||
return false;
|
||||
declaredDims.push_back((uint64_t)stoi(strDimLength));
|
||||
}
|
||||
return true;
|
||||
}
|
||||
|
||||
static bool CheckDimensionLength(const AccessingSet& array)
|
||||
{
|
||||
if (array.GetElements().empty())
|
||||
return false;
|
||||
size_t dimCount = array.GetElements()[0].size();
|
||||
SgArrayRefExp* arrayRef = array.GetElements()[0][0].array;
|
||||
if (!arrayRef)
|
||||
return false;
|
||||
vector<uint64_t> declaredDims(dimCount);
|
||||
if (!getArrayDeclaredDimensions(arrayRef, declaredDims))
|
||||
return false;
|
||||
vector<ArrayDimension> testArray(dimCount);
|
||||
for (size_t i = 0; i < dimCount; i++)
|
||||
{
|
||||
testArray[i] = { 1, 1, declaredDims[i], nullptr };
|
||||
}
|
||||
AccessingSet diff = AccessingSet({ testArray }).Diff(array);
|
||||
|
||||
return diff.GetElements().empty();
|
||||
}
|
||||
|
||||
|
||||
static void AddPrivateArraysToLoop(LoopGraph* loop, const ArrayAccessingIndexes& privates, set<SgStatement*>& insertedPrivates)
|
||||
{
|
||||
SgStatement* spfStat = new SgStatement(SPF_ANALYSIS_DIR);
|
||||
@@ -336,8 +161,6 @@ static void AddPrivateArraysToLoop(LoopGraph* loop, const ArrayAccessingIndexes&
|
||||
set<SgSymbol*> arraysToInsert;
|
||||
for (const auto& [_, accessingSet] : privates)
|
||||
{
|
||||
if (!CheckDimensionLength(accessingSet))
|
||||
continue;
|
||||
for (const auto& arrayElement : accessingSet.GetElements())
|
||||
{
|
||||
if (arrayElement.empty())
|
||||
@@ -364,16 +187,16 @@ static void AddPrivateArraysToLoop(LoopGraph* loop, const ArrayAccessingIndexes&
|
||||
}
|
||||
toAdd->setLhs(new SgVarRefExp(elem));
|
||||
}
|
||||
|
||||
if (arraysToInsert.size() == 0)
|
||||
printInternalError(convertFileName(__FILE__).c_str(), __LINE__);
|
||||
|
||||
if (arraysToInsert.size() != 0)
|
||||
{
|
||||
loop->loop->insertStmtBefore(*spfStat, *loop->loop->controlParent());
|
||||
insertedPrivates.insert(spfStat);
|
||||
}
|
||||
loop->loop->insertStmtBefore(*spfStat, *loop->loop->controlParent());
|
||||
insertedPrivates.insert(spfStat);
|
||||
}
|
||||
|
||||
void FindPrivateArrays(map<string, vector<LoopGraph*>>& loopGraph, map<FuncInfo*, vector<SAPFOR::BasicBlock*>>& FullIR, set<SgStatement*>& insertedPrivates)
|
||||
{
|
||||
void FindPrivateArrays(map<string, vector<LoopGraph*>> &loopGraph, map<FuncInfo*, vector<SAPFOR::BasicBlock*>>& FullIR, set<SgStatement*> &insertedPrivates)
|
||||
{
|
||||
map<LoopGraph*, ArrayAccessingIndexes> result;
|
||||
for (const auto& [fileName, loops] : loopGraph)
|
||||
{
|
||||
@@ -387,8 +210,8 @@ void FindPrivateArrays(map<string, vector<LoopGraph*>>& loopGraph, map<FuncInfo*
|
||||
while (search_func && (!isSgProgHedrStmt(search_func)))
|
||||
search_func = search_func->controlParent();
|
||||
|
||||
for (const auto& [funcInfo, blocks] : FullIR)
|
||||
{
|
||||
for (const auto& [funcInfo, blocks]: FullIR)
|
||||
{
|
||||
if (funcInfo->fileName == fileName && funcInfo->funcPointer->GetOriginal() == search_func)
|
||||
{
|
||||
Region* loopRegion = new Region(loop, blocks);
|
||||
@@ -408,4 +231,4 @@ void FindPrivateArrays(map<string, vector<LoopGraph*>>& loopGraph, map<FuncInfo*
|
||||
AddPrivateArraysToLoop(loop, result[loop], insertedPrivates);
|
||||
}
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
@@ -29,7 +29,7 @@ static ArrayDimension* DimensionIntersection(const ArrayDimension& dim1, const A
|
||||
vector<uint64_t> partSolution = FindParticularSolution(dim1, dim2);
|
||||
if (partSolution.empty())
|
||||
return NULL;
|
||||
|
||||
|
||||
int64_t x0 = partSolution[0], y0 = partSolution[1];
|
||||
/* x = x_0 + c * t */
|
||||
/* y = y_0 + d * t */
|
||||
@@ -44,10 +44,10 @@ static ArrayDimension* DimensionIntersection(const ArrayDimension& dim1, const A
|
||||
uint64_t tMax = min(tXMax, tYMax);
|
||||
if (tMin > tMax)
|
||||
return NULL;
|
||||
|
||||
|
||||
uint64_t start3 = dim1.start + x0 * dim1.step;
|
||||
uint64_t step3 = c * dim1.step;
|
||||
ArrayDimension* result = new(ArrayDimension){ start3, step3, tMax + 1 , dim1.array };
|
||||
ArrayDimension* result = new(ArrayDimension){ start3, step3, tMax + 1 , dim1.array};
|
||||
return result;
|
||||
}
|
||||
|
||||
@@ -57,12 +57,12 @@ static vector<ArrayDimension> DimensionDifference(const ArrayDimension& dim1, co
|
||||
ArrayDimension* intersection = DimensionIntersection(dim1, dim2);
|
||||
if (!intersection)
|
||||
return { dim1 };
|
||||
|
||||
|
||||
vector<ArrayDimension> result;
|
||||
/* add the part before intersection */
|
||||
if (dim1.start < intersection->start)
|
||||
result.push_back({ dim1.start, dim1.step, (intersection->start - dim1.start) / dim1.step, dim1.array });
|
||||
|
||||
if (dim1.start < intersection->start)
|
||||
result.push_back({ dim1.start, dim1.step, (intersection->start - dim1.start) / dim1.step, dim1.array});
|
||||
|
||||
/* add the parts between intersection steps */
|
||||
if (intersection->step > dim1.step)
|
||||
{
|
||||
@@ -70,7 +70,7 @@ static vector<ArrayDimension> DimensionDifference(const ArrayDimension& dim1, co
|
||||
uint64_t interValue = intersection->start;
|
||||
for (int64_t i = start; interValue <= intersection->start + intersection->step * (intersection->tripCount - 1); i++)
|
||||
{
|
||||
result.push_back({ interValue + dim1.step, dim1.step, intersection->step / dim1.step, dim1.array });
|
||||
result.push_back({interValue + dim1.step, dim1.step, intersection->step / dim1.step, dim1.array});
|
||||
interValue += intersection->step;
|
||||
}
|
||||
}
|
||||
@@ -109,7 +109,7 @@ static vector<ArrayDimension> ElementsIntersection(const vector<ArrayDimension>&
|
||||
{
|
||||
if (firstElement.empty() || secondElement.empty())
|
||||
return {};
|
||||
|
||||
|
||||
size_t dimAmount = firstElement.size();
|
||||
/* check if there is no intersecction */
|
||||
for (size_t i = 0; i < dimAmount; i++)
|
||||
@@ -132,16 +132,14 @@ static vector<ArrayDimension> ElementsIntersection(const vector<ArrayDimension>&
|
||||
static vector<vector<ArrayDimension>> ElementsDifference(const vector<ArrayDimension>& firstElement,
|
||||
const vector<ArrayDimension>& secondElement)
|
||||
{
|
||||
if (firstElement.empty())
|
||||
if (firstElement.empty() || secondElement.empty())
|
||||
return {};
|
||||
if (secondElement.empty())
|
||||
return { firstElement };
|
||||
|
||||
|
||||
vector<ArrayDimension> intersection = ElementsIntersection(firstElement, secondElement);
|
||||
vector<vector<ArrayDimension>> result;
|
||||
if (intersection.empty())
|
||||
return { firstElement };
|
||||
|
||||
|
||||
for (int i = 0; i < firstElement.size(); i++)
|
||||
{
|
||||
auto dimDiff = DimensionDifference(firstElement[i], secondElement[i]);
|
||||
@@ -190,7 +188,7 @@ bool AccessingSet::ContainsElement(const vector<ArrayDimension>& element) const
|
||||
{
|
||||
vector<vector<ArrayDimension>> tails;
|
||||
FindUncovered(element, tails);
|
||||
return tails.empty();
|
||||
return !tails.empty();
|
||||
}
|
||||
|
||||
void AccessingSet::FindCoveredBy(const vector<ArrayDimension>& element, vector<vector<ArrayDimension>>& result) const
|
||||
@@ -254,15 +252,13 @@ AccessingSet AccessingSet::Diff(const AccessingSet& secondSet) const
|
||||
return *this;
|
||||
|
||||
AccessingSet intersection = this->Intersect(secondSet);
|
||||
vector<vector<ArrayDimension>> uncovered;
|
||||
for (const auto& element : allElements)
|
||||
AccessingSet uncovered = *this;
|
||||
vector<vector<ArrayDimension>> result;
|
||||
for (const auto& element : intersection.GetElements())
|
||||
{
|
||||
vector<vector<ArrayDimension>> current_uncovered;
|
||||
intersection.FindUncovered(element, current_uncovered);
|
||||
uncovered.insert(uncovered.end(),
|
||||
std::move_iterator(current_uncovered.begin()),
|
||||
std::move_iterator(current_uncovered.end())
|
||||
);
|
||||
uncovered.FindUncovered(element, current_uncovered);
|
||||
uncovered = AccessingSet(current_uncovered);
|
||||
}
|
||||
return uncovered;
|
||||
}
|
||||
@@ -293,4 +289,4 @@ bool operator!=(const ArrayAccessingIndexes& lhs, const ArrayAccessingIndexes& r
|
||||
return true;
|
||||
|
||||
return false;
|
||||
}
|
||||
}
|
||||
|
||||
@@ -1,16 +1,14 @@
|
||||
#include <algorithm>
|
||||
#include <vector>
|
||||
#include <map>
|
||||
#include <unordered_set>
|
||||
#include <unordered_map>
|
||||
#include <string>
|
||||
#include<vector>
|
||||
#include<map>
|
||||
#include<unordered_set>
|
||||
#include<unordered_map>
|
||||
#include<string>
|
||||
#include <numeric>
|
||||
#include <iostream>
|
||||
|
||||
#include "range_structures.h"
|
||||
#include "region.h"
|
||||
|
||||
#include "..\Transformations\ExpressionSubstitution\expr_transform.h"
|
||||
#include "SgUtils.h"
|
||||
|
||||
using namespace std;
|
||||
@@ -64,14 +62,14 @@ static void BuildLoopIndex(map<string, LoopGraph*>& loopForIndex, LoopGraph* loo
|
||||
static string FindIndexName(int pos, SAPFOR::BasicBlock* block, map<string, LoopGraph*>& loopForIndex) {
|
||||
unordered_set<SAPFOR::Argument*> args = { block->getInstructions()[pos]->getInstruction()->getArg1() };
|
||||
|
||||
for (int i = pos - 1; i >= 0; i--)
|
||||
for (int i = pos - 1; i >= 0; i--)
|
||||
{
|
||||
SAPFOR::Argument* res = block->getInstructions()[i]->getInstruction()->getResult();
|
||||
if (res && args.find(res) != args.end())
|
||||
if (res && args.find(res) != args.end())
|
||||
{
|
||||
SAPFOR::Argument* arg1 = block->getInstructions()[i]->getInstruction()->getArg1();
|
||||
SAPFOR::Argument* arg2 = block->getInstructions()[i]->getInstruction()->getArg2();
|
||||
if (arg1)
|
||||
if (arg1)
|
||||
{
|
||||
string name = arg1->getValue();
|
||||
int idx = name.find('%');
|
||||
@@ -95,7 +93,7 @@ static string FindIndexName(int pos, SAPFOR::BasicBlock* block, map<string, Loop
|
||||
return "";
|
||||
}
|
||||
|
||||
static int GetDefUseArray(SAPFOR::BasicBlock* block, LoopGraph* loop, ArrayAccessingIndexes& def, ArrayAccessingIndexes& use, Region* region) {
|
||||
static int GetDefUseArray(SAPFOR::BasicBlock* block, LoopGraph* loop, ArrayAccessingIndexes& def, ArrayAccessingIndexes& use) {
|
||||
auto instructions = block->getInstructions();
|
||||
map<string, LoopGraph*> loopForIndex;
|
||||
BuildLoopIndex(loopForIndex, loop);
|
||||
@@ -125,11 +123,7 @@ static int GetDefUseArray(SAPFOR::BasicBlock* block, LoopGraph* loop, ArrayAcces
|
||||
}
|
||||
|
||||
if (point.size() == dimCount)
|
||||
{
|
||||
def[instruction->getInstruction()->getResult()->getValue()] = AccessingSet({ point });
|
||||
RegionInstruction regionInstruction;
|
||||
regionInstruction.def[instruction->getInstruction()->getResult()->getValue()] = AccessingSet({ point });
|
||||
}
|
||||
def[instruction->getInstruction()->getResult()->getValue()] = AccessingSet({point});
|
||||
}
|
||||
}
|
||||
}
|
||||
@@ -137,7 +131,7 @@ static int GetDefUseArray(SAPFOR::BasicBlock* block, LoopGraph* loop, ArrayAcces
|
||||
{
|
||||
vector<SAPFOR::Argument*> index_vars;
|
||||
vector<int> refPos;
|
||||
string array_name = instruction->getInstruction()->getArg1()->getValue();
|
||||
string array_name = instruction->getInstruction()->getArg1()->getValue();
|
||||
|
||||
int j = i - 1;
|
||||
while (j >= 0 && instructions[j]->getInstruction()->getOperation() == SAPFOR::CFG_OP::REF)
|
||||
@@ -154,53 +148,39 @@ static int GetDefUseArray(SAPFOR::BasicBlock* block, LoopGraph* loop, ArrayAcces
|
||||
auto* ref = isSgArrayRefExp(instruction->getInstruction()->getExpression());
|
||||
int fillCount = 0;
|
||||
|
||||
vector<pair<int, int>> coeffsForDims;
|
||||
int subs = ref->numberOfSubscripts();
|
||||
for (int i = 0; ref && i < ref->numberOfSubscripts(); ++i)
|
||||
{
|
||||
const vector<int*>& coeffs = getAttributes<SgExpression*, int*>(ref->subscript(i), set<int>{ INT_VAL });
|
||||
if (coeffs.size() == 1)
|
||||
{
|
||||
const pair<int, int> coef(coeffs[0][0], coeffs[0][1]);
|
||||
coeffsForDims.push_back(coef);
|
||||
}
|
||||
|
||||
}
|
||||
coeffsForDims = { coeffsForDims.rbegin(), coeffsForDims.rend() };
|
||||
|
||||
while (!index_vars.empty() && !refPos.empty() && !coeffsForDims.empty())
|
||||
while (!index_vars.empty() && !refPos.empty())
|
||||
{
|
||||
auto var = index_vars.back();
|
||||
int currentVarPos = refPos.back();
|
||||
ArrayDimension current_dim;
|
||||
if (var->getType() == SAPFOR::CFG_ARG_TYPE::CONST)
|
||||
current_dim = { stoul(var->getValue()), 1, 1, ref };
|
||||
current_dim = { stoul(var->getValue()), 1, 1, ref};
|
||||
else
|
||||
{
|
||||
string name, full_name = var->getValue();
|
||||
int pos = full_name.find('%');
|
||||
LoopGraph* currentLoop;
|
||||
if (pos != -1)
|
||||
if (pos != -1)
|
||||
{
|
||||
name = full_name.substr(pos + 1);
|
||||
if (loopForIndex.find(name) != loopForIndex.end())
|
||||
currentLoop = loopForIndex[name];
|
||||
currentLoop = loopForIndex[name];
|
||||
else
|
||||
return -1;
|
||||
}
|
||||
else
|
||||
else
|
||||
{
|
||||
name = FindIndexName(currentVarPos, block, loopForIndex);
|
||||
if (name == "")
|
||||
return -1;
|
||||
|
||||
if (loopForIndex.find(name) != loopForIndex.end())
|
||||
currentLoop = loopForIndex[name];
|
||||
currentLoop = loopForIndex[name];
|
||||
else
|
||||
return -1;
|
||||
}
|
||||
|
||||
uint64_t start = coeffsForDims.back().second * currentLoop->startVal + coeffsForDims.back().first;
|
||||
uint64_t start = currentLoop->startVal;
|
||||
uint64_t step = currentLoop->stepVal;
|
||||
uint64_t iters = currentLoop->calculatedCountOfIters;
|
||||
current_dim = { start, step, iters, ref };
|
||||
@@ -213,29 +193,14 @@ static int GetDefUseArray(SAPFOR::BasicBlock* block, LoopGraph* loop, ArrayAcces
|
||||
}
|
||||
index_vars.pop_back();
|
||||
refPos.pop_back();
|
||||
coeffsForDims.pop_back();
|
||||
}
|
||||
|
||||
if (fillCount == accessPoint.size())
|
||||
{
|
||||
RegionInstruction instruction;
|
||||
if (operation == SAPFOR::CFG_OP::STORE)
|
||||
{
|
||||
def[array_name].Insert(accessPoint);
|
||||
instruction.def[array_name] = { { accessPoint } };
|
||||
}
|
||||
else
|
||||
{
|
||||
instruction.use[array_name] = { { accessPoint } };
|
||||
if (def.find(array_name) == def.end())
|
||||
use[array_name].Insert(accessPoint);
|
||||
else
|
||||
{
|
||||
AccessingSet element({ accessPoint });
|
||||
use[array_name] = use[array_name].Union(element.Diff(def[array_name]));
|
||||
}
|
||||
}
|
||||
region->instructions.push_back(instruction);
|
||||
use[array_name].Insert(accessPoint);
|
||||
}
|
||||
}
|
||||
}
|
||||
@@ -243,41 +208,6 @@ static int GetDefUseArray(SAPFOR::BasicBlock* block, LoopGraph* loop, ArrayAcces
|
||||
|
||||
}
|
||||
|
||||
static void RemoveHeaderConnection(SAPFOR::BasicBlock* header, const unordered_set<SAPFOR::BasicBlock*>& blockSet, unordered_map<SAPFOR::BasicBlock*, Region*>& bbToRegion)
|
||||
{
|
||||
for (SAPFOR::BasicBlock* block : blockSet)
|
||||
{
|
||||
bool isCycleBlock = false;
|
||||
for (SAPFOR::BasicBlock* prevBlock : block->getPrev())
|
||||
isCycleBlock = isCycleBlock || (blockSet.find(prevBlock) != blockSet.end());
|
||||
|
||||
if (isCycleBlock)
|
||||
{
|
||||
bbToRegion[block]->removeNextRegion(bbToRegion[header]);
|
||||
bbToRegion[header]->removePrevRegion(bbToRegion[block]);
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
static void DFS(Region* block, vector<Region*>& result, unordered_set<Region*> cycleBlocks)
|
||||
{
|
||||
for (Region* nextBlock : block->getNextRegions())
|
||||
{
|
||||
if (cycleBlocks.find(nextBlock) != cycleBlocks.end())
|
||||
DFS(nextBlock, result, cycleBlocks);
|
||||
}
|
||||
result.push_back(block);
|
||||
}
|
||||
|
||||
void TopologySort(std::vector<Region*>& basikBlocks, Region* header)
|
||||
{
|
||||
vector<Region*> result;
|
||||
unordered_set<Region*> cycleBlocks(basikBlocks.begin(), basikBlocks.end());
|
||||
DFS(header, result, cycleBlocks);
|
||||
reverse(result.begin(), result.end());
|
||||
basikBlocks = result;
|
||||
}
|
||||
|
||||
static void SetConnections(unordered_map<SAPFOR::BasicBlock*, Region*>& bbToRegion, const unordered_set<SAPFOR::BasicBlock*>& blockSet)
|
||||
{
|
||||
for (SAPFOR::BasicBlock* block : blockSet)
|
||||
@@ -285,26 +215,25 @@ static void SetConnections(unordered_map<SAPFOR::BasicBlock*, Region*>& bbToRegi
|
||||
for (SAPFOR::BasicBlock* nextBlock : block->getNext())
|
||||
if (bbToRegion.find(nextBlock) != bbToRegion.end())
|
||||
bbToRegion[block]->addNextRegion(bbToRegion[nextBlock]);
|
||||
|
||||
|
||||
for (SAPFOR::BasicBlock* prevBlock : block->getPrev())
|
||||
if (bbToRegion.find(prevBlock) != bbToRegion.end())
|
||||
bbToRegion[block]->addPrevRegion(bbToRegion[prevBlock]);
|
||||
}
|
||||
}
|
||||
|
||||
static Region* CreateSubRegion(LoopGraph* loop, const vector<SAPFOR::BasicBlock*>& Blocks, unordered_map<SAPFOR::BasicBlock*, Region*>& bbToRegion)
|
||||
static Region* CreateSubRegion(LoopGraph* loop, const vector<SAPFOR::BasicBlock*>& Blocks, const unordered_map<SAPFOR::BasicBlock*, Region*>& bbToRegion)
|
||||
{
|
||||
Region* region = new Region;
|
||||
auto [header, blockSet] = GetBasicBlocksForLoop(loop, Blocks);
|
||||
RemoveHeaderConnection(header, blockSet, bbToRegion);
|
||||
if (bbToRegion.find(header) != bbToRegion.end())
|
||||
region->setHeader(bbToRegion.at(header));
|
||||
region->setHeader(bbToRegion.at(header));
|
||||
else
|
||||
{
|
||||
printInternalError(convertFileName(__FILE__).c_str(), __LINE__);
|
||||
return NULL;
|
||||
}
|
||||
|
||||
|
||||
for (SAPFOR::BasicBlock* block : blockSet)
|
||||
if (bbToRegion.find(block) != bbToRegion.end())
|
||||
region->addBasickBlocks(bbToRegion.at(block));
|
||||
@@ -315,7 +244,6 @@ static Region* CreateSubRegion(LoopGraph* loop, const vector<SAPFOR::BasicBlock*
|
||||
continue;
|
||||
region->addSubRegions(CreateSubRegion(childLoop, Blocks, bbToRegion));
|
||||
}
|
||||
TopologySort(region->getBasickBlocks(), region->getHeader());
|
||||
return region;
|
||||
}
|
||||
|
||||
@@ -326,13 +254,12 @@ Region::Region(LoopGraph* loop, const vector<SAPFOR::BasicBlock*>& Blocks)
|
||||
for (auto poiner : blockSet)
|
||||
{
|
||||
bbToRegion[poiner] = new Region(*poiner);
|
||||
this->basickBlocks.push_back(bbToRegion[poiner]);
|
||||
GetDefUseArray(poiner, loop, bbToRegion[poiner]->array_def, bbToRegion[poiner]->array_use, bbToRegion[poiner]);
|
||||
this->basickBlocks.insert(bbToRegion[poiner]);
|
||||
GetDefUseArray(poiner, loop, bbToRegion[poiner]->array_def, bbToRegion[poiner]->array_use);
|
||||
|
||||
}
|
||||
this->header = bbToRegion[header];
|
||||
SetConnections(bbToRegion, blockSet);
|
||||
RemoveHeaderConnection(header, blockSet, bbToRegion);
|
||||
//create subRegions
|
||||
for (LoopGraph* childLoop : loop->children)
|
||||
{
|
||||
@@ -340,5 +267,4 @@ Region::Region(LoopGraph* loop, const vector<SAPFOR::BasicBlock*>& Blocks)
|
||||
continue;
|
||||
subRegions.insert(CreateSubRegion(childLoop, Blocks, bbToRegion));
|
||||
}
|
||||
TopologySort(basickBlocks, this->header);
|
||||
}
|
||||
}
|
||||
|
||||
@@ -8,11 +8,6 @@
|
||||
#include "graph_loops.h"
|
||||
#include "CFGraph/CFGraph.h"
|
||||
|
||||
struct RegionInstruction
|
||||
{
|
||||
ArrayAccessingIndexes def, use, in, out;
|
||||
};
|
||||
|
||||
class Region : public SAPFOR::BasicBlock {
|
||||
public:
|
||||
Region() { header = nullptr; }
|
||||
@@ -25,25 +20,13 @@ public:
|
||||
|
||||
void setHeader(Region* region) { header = region; }
|
||||
|
||||
std::vector<Region*>& getBasickBlocks() { return basickBlocks; }
|
||||
std::unordered_set<Region*>& getBasickBlocks() { return basickBlocks; }
|
||||
|
||||
void addBasickBlocks(Region* region) { basickBlocks.push_back(region); }
|
||||
void addBasickBlocks(Region* region) { basickBlocks.insert(region); }
|
||||
|
||||
const std::unordered_set<Region*>& getPrevRegions() { return prevRegions; }
|
||||
|
||||
std::unordered_set<Region*>& getNextRegions() { return nextRegions; }
|
||||
|
||||
void removeNextRegion(Region* region)
|
||||
{
|
||||
if (nextRegions.find(region) != nextRegions.end())
|
||||
nextRegions.erase(region);
|
||||
}
|
||||
|
||||
void removePrevRegion(Region* region)
|
||||
{
|
||||
if (prevRegions.find(region) != prevRegions.end())
|
||||
prevRegions.erase(region);
|
||||
}
|
||||
std::unordered_set<Region*> getNextRegions() { return nextRegions; }
|
||||
|
||||
void addPrevRegion(Region* region) { prevRegions.insert(region); }
|
||||
|
||||
@@ -65,18 +48,13 @@ public:
|
||||
|
||||
void addSubRegions(Region* region) { subRegions.insert(region); }
|
||||
|
||||
std::vector<RegionInstruction> instructions;
|
||||
|
||||
ArrayAccessingIndexes array_def, array_use, array_out, array_in, array_priv;
|
||||
|
||||
private:
|
||||
std::vector<Region*> basickBlocks;
|
||||
std::unordered_set<Region*> subRegions;
|
||||
std::unordered_set<Region*> subRegions, basickBlocks;
|
||||
/*next Region which is BB for current BB Region*/
|
||||
std::unordered_set<Region*> nextRegions;
|
||||
/*prev Regions which is BBs for current BB Region*/
|
||||
std::unordered_set<Region*> prevRegions;
|
||||
Region* header;
|
||||
};
|
||||
|
||||
void TopologySort(std::vector<Region*>& basikBlocks, Region* header);
|
||||
104
src/Sapfor.cpp
104
src/Sapfor.cpp
@@ -58,6 +58,7 @@
|
||||
#include "expr_transform.h"
|
||||
|
||||
#include "Predictor/PredictScheme.h"
|
||||
#include "Predictor/PredictSchemeWithLibrary.h"
|
||||
#include "Predictor/PredictorModel.h"
|
||||
#include "SageAnalysisTool/depInterfaceExt.h"
|
||||
#include "DvmhRegions/DvmhRegionInserter.h"
|
||||
@@ -1732,103 +1733,7 @@ static bool runAnalysis(SgProject &project, const int curr_regime, const bool ne
|
||||
}
|
||||
}
|
||||
else if (curr_regime == PREDICT_SCHEME)
|
||||
{
|
||||
int maxSizeDist = 0;
|
||||
for (int z = 0; z < parallelRegions.size(); ++z)
|
||||
{
|
||||
const DataDirective &dataDirectives = parallelRegions[z]->GetDataDir();
|
||||
const vector<int> ¤tVariant = parallelRegions[z]->GetCurrentVariant();
|
||||
|
||||
auto &tmp = dataDirectives.distrRules;
|
||||
vector<pair<DIST::Array*, const DistrVariant*>> currentVar;
|
||||
for (int z1 = 0; z1 < currentVariant.size(); ++z1)
|
||||
currentVar.push_back(make_pair(tmp[z1].first, &tmp[z1].second[currentVariant[z1]]));
|
||||
|
||||
for (auto &elem : currentVar)
|
||||
{
|
||||
DIST::Array *array = elem.first;
|
||||
const DistrVariant *var = elem.second;
|
||||
|
||||
int countBlock = 0;
|
||||
for (int z = 0; z < var->distRule.size(); ++z)
|
||||
if (var->distRule[z] == dist::BLOCK)
|
||||
++countBlock;
|
||||
maxSizeDist = std::max(maxSizeDist, countBlock);
|
||||
}
|
||||
}
|
||||
|
||||
SpfInterval *mainIterval = getMainInterval(&project, intervals, SPF_messages);
|
||||
topologies.clear();
|
||||
if (maxSizeDist)
|
||||
{
|
||||
const int procNum = 8;
|
||||
//TODO:
|
||||
//topologies = getTopologies(procNum, maxSizeDist);
|
||||
throw -10;
|
||||
|
||||
const int countOfTop = topologies.size();
|
||||
if (countOfTop < 0)
|
||||
printInternalError(convertFileName(__FILE__).c_str(), __LINE__);
|
||||
|
||||
for (auto &inter : intervals)
|
||||
initTimeForIntervalTree(countOfTop, inter.second);
|
||||
|
||||
for (int z = 0; z < parallelRegions.size(); ++z)
|
||||
{
|
||||
const DataDirective &dataDirectives = parallelRegions[z]->GetDataDir();
|
||||
const vector<int> ¤tVariant = parallelRegions[z]->GetCurrentVariant();
|
||||
DIST::Arrays<int> &allArrays = parallelRegions[z]->GetAllArraysToModify();
|
||||
|
||||
auto &tmp = dataDirectives.distrRules;
|
||||
vector<pair<DIST::Array*, const DistrVariant*>> currentVar;
|
||||
for (int z1 = 0; z1 < currentVariant.size(); ++z1)
|
||||
currentVar.push_back(make_pair(tmp[z1].first, &tmp[z1].second[currentVariant[z1]]));
|
||||
|
||||
map<LoopGraph*, ParallelDirective*> parallelDirs;
|
||||
vector<std::tuple<DIST::Array*, vector<long>, pair<string, int>>> allSingleRemotes;
|
||||
for (int i = n - 1; i >= 0; --i)
|
||||
{
|
||||
SgFile *file = &(project.file(i));
|
||||
auto fountInfo = findAllDirectives(file, getObjectForFileFromMap(file->filename(), loopGraph), parallelRegions[z]->GetId());
|
||||
parallelDirs.insert(fountInfo.begin(), fountInfo.end());
|
||||
|
||||
auto fountRem = findAllSingleRemotes(file, parallelRegions[z]->GetId(), parallelRegions);
|
||||
allSingleRemotes.insert(allSingleRemotes.end(), fountRem.begin(), fountRem.end());
|
||||
}
|
||||
//TODO!
|
||||
//int err = predictScheme(parallelRegions[z], currentVar, allArrays.GetArrays(), parallelDirs, intervals, SPF_messages, allSingleRemotes, maxSizeDist, procNum);
|
||||
/*if (err != 0)
|
||||
internalExit = err;*/
|
||||
}
|
||||
|
||||
vector<SpfInterval*> tmp = { mainIterval };
|
||||
aggregatePredictedTimes(tmp);
|
||||
|
||||
int idx = 0;
|
||||
int best = -1;
|
||||
double bestSpeedUp = 0;
|
||||
for (auto &top : topologies)
|
||||
{
|
||||
string outStr = "";
|
||||
for (auto &elem : top)
|
||||
outStr += std::to_string(elem) + " ";
|
||||
double currS = mainIterval->exec_time / mainIterval->predictedTimes[idx];
|
||||
__spf_print(1, "%d: speed up %f for top. %s\n", idx, currS, outStr.c_str());
|
||||
|
||||
if (best == -1 || bestSpeedUp < currS)
|
||||
{
|
||||
bestSpeedUp = currS;
|
||||
best = idx;
|
||||
}
|
||||
++idx;
|
||||
}
|
||||
__spf_print(1, "best topology %d with speed up %f\n", best, bestSpeedUp);
|
||||
}
|
||||
else
|
||||
for (auto &inter : intervals)
|
||||
initTimeForIntervalTree(0, inter.second);
|
||||
|
||||
}
|
||||
runPredictScheme(project, parallelRegions, loopGraph, SPF_messages);
|
||||
else if (curr_regime == CREATE_INTER_TREE)
|
||||
{
|
||||
if (keepFiles)
|
||||
@@ -2229,9 +2134,8 @@ void runPass(const int curr_regime, const char *proj_name, const char *folderNam
|
||||
|
||||
runAnalysis(*project, CALCULATE_STATS_SCHEME, false);
|
||||
|
||||
//TODO: need to rewrite this to new algo
|
||||
/*if (!folderName && !consoleMode || predictOn)
|
||||
runAnalysis(*project, PREDICT_SCHEME, false); */
|
||||
if (!folderName && !consoleMode || predictOn)
|
||||
runAnalysis(*project, PREDICT_SCHEME, false);
|
||||
|
||||
runAnalysis(*project, REMOVE_COPIES, false);
|
||||
runAnalysis(*project, SWAP_LOOPS, false);
|
||||
|
||||
@@ -132,7 +132,7 @@ std::map<std::string, PredictorStats> allPredictorStats;
|
||||
|
||||
//for DVM INTERVALS
|
||||
std::map<std::string, std::vector<SpfInterval*>> intervals; // file -> intervals
|
||||
std::vector<std::vector<long>> topologies; // current topologies
|
||||
std::vector<std::vector<size_t>> topologies; // current topologies
|
||||
//
|
||||
|
||||
//for GCOV_PARSER
|
||||
|
||||
@@ -78,7 +78,12 @@ enum typeMessage { WARR, ERROR, NOTE };
|
||||
// 60 "Format misplaced"
|
||||
// 61 "Array has declaration area conflict"
|
||||
// 62 "need to move common declaration to main for DECLATE"
|
||||
//
|
||||
// 63 "Failed to initialize libpredict cluster"
|
||||
// 64 "Failed to initialize libpredict grid"
|
||||
// 65 "Failed to distribute array with libpredict"
|
||||
// 66 "Failed to align array with libpredict"
|
||||
// 67 "Failed to process shadow_renew with libpredict"
|
||||
//
|
||||
// 20xx TRANSFORM GROUP
|
||||
// 01 "can not convert array assign to loop"
|
||||
// 02 "converted arithmetic IF to simple IF"
|
||||
@@ -305,7 +310,7 @@ static void printStackTrace() { };
|
||||
} \
|
||||
} while (0)
|
||||
|
||||
// Свободный - R206
|
||||
// Свободный - R210
|
||||
// Гайд по русификации сообщений: При добавлении нового сообщения, меняется последний сводобный идентификатор.
|
||||
// В этом файле остаются только спецификаторы, для которых будет заполнен текст. Полный текст пишется в файле
|
||||
// russian_errors_text.txt. Спецификаторы там тоже сохраняются, по ним в визуализаторе будет восстановлен
|
||||
@@ -504,6 +509,18 @@ static const wchar_t *R183 = L"R183:";
|
||||
static const wchar_t *R184 = L"R184:%s";
|
||||
//1062
|
||||
static const wchar_t* R205 = L"R205:%s#%s";
|
||||
//1063
|
||||
static const wchar_t* R206 = L"R206:";
|
||||
//1064
|
||||
static const wchar_t* R207 = L"R207:";
|
||||
//1065
|
||||
static const wchar_t* R208 = L"R208:";
|
||||
//1066
|
||||
static const wchar_t* R209 = L"R209:";
|
||||
//1067
|
||||
static const wchar_t* R210 = L"R210:";
|
||||
//1068
|
||||
static const wchar_t* R211 = L"R211:";
|
||||
|
||||
//2001
|
||||
static const wchar_t *R94 = L"R94:";
|
||||
|
||||
@@ -184,8 +184,20 @@ R182 = "Редукционная операция по элементу масс
|
||||
R183 = "Расположение операторов FORMAT не поддерживается, попробуйте применить проход Коррекция стиля кода".
|
||||
//1061
|
||||
R184 = "Область объявления массива '%s' конфликтует с предыдущей областью. Возможно, это вызвано использованием include-файлов. Попробуйте применить проход 'Подстановка заголовочных файлов'".
|
||||
//1042
|
||||
//1062
|
||||
R205 = "Массив '%s' состоящий в common блоке '%s' должен иметь описание в главной программной единице для объявления в директиве DECLARE"
|
||||
//1063
|
||||
R206 = "Ошибка инициализации библиотеки libpredict с конфигурацией кластера: %s, код возврата: %d"
|
||||
//1064
|
||||
R207 = "Ошибка инициализации сетки libpredict с топологией: %zu %zu %zu %zu, код возврата: %d"
|
||||
//1065
|
||||
R208 = "Ошибка распределения массива '%s' с помощью libpredict, код возврата: %d"
|
||||
//1066
|
||||
R209 = "Ошибка выравнивания массива '%s' с массивом '%s' с помощью libpredict, код возврата: %d"
|
||||
//1067
|
||||
R210 = "Ошибка обработки shadow_renew для массива '%s' с помощью libpredict, код возврата: %d"
|
||||
//1068
|
||||
R211 = "Ошибка инициализации отображения libpredict с processes_per_processor: %zu, код возврата: %d"
|
||||
|
||||
//2001
|
||||
R94 = "Невозможно автоматически преобразовать данное присваивание к циклу"
|
||||
|
||||
@@ -950,7 +950,7 @@ int SPF_ModifyArrayDistribution(void*& context, int winHandler, short *options,
|
||||
|
||||
extern map<string, PredictorStats> allPredictorStats;
|
||||
extern map<string, vector<SpfInterval*>> intervals;
|
||||
extern vector<vector<long>> topologies;
|
||||
extern vector<vector<size_t>> topologies;
|
||||
|
||||
int SPF_CreateParallelVariant(void*& context, int winHandler, short *options, short *projName, short *folderName, int64_t *variants, int *varLen,
|
||||
string &output, string &outputMessage, string &predictorStats)
|
||||
@@ -1823,7 +1823,7 @@ static int inline runModificationPass(passes passName, short* projName, short* f
|
||||
runPassesForVisualizer(projName, { passName }, folderName);
|
||||
|
||||
//fill data
|
||||
// newFiles: <èìåíà ôàéëîâ äëÿ ìîä, ñîäåðæèìîå ôàéëà>
|
||||
// newFiles: <<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD> <20><><EFBFBD><EFBFBD><EFBFBD><EFBFBD> <20><><EFBFBD> <20><><EFBFBD>, <20><><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD> <20><><EFBFBD><EFBFBD><EFBFBD>>
|
||||
string newFile;
|
||||
|
||||
if (SgFile::switchToFile(outFileName.c_str()) == -1)
|
||||
@@ -2392,7 +2392,7 @@ const wstring Sapfor_RunAnalysis(const char* analysisName_c, const char* options
|
||||
retCode = SPF_GetArrayLinks(context, winHandler, optSh, projSh, result, output, outputMessage);
|
||||
else if (whichRun == "SPF_GetMaxMinBlockDistribution")
|
||||
retCode = SPF_GetMaxMinBlockDistribution(context, winHandler, optSh, projSh, result, output, outputMessage);
|
||||
else if (whichRun == "SPF_ÑhangeDirectory") // russian C
|
||||
else if (whichRun == "SPF_<EFBFBD>hangeDirectory") // russian C
|
||||
{
|
||||
if (options_c == NULL)
|
||||
printInternalError(convertFileName(__FILE__).c_str(), __LINE__);
|
||||
|
||||
Reference in New Issue
Block a user