Compare commits
38 Commits
libpredict
...
aa6608e7d3
| Author | SHA1 | Date | |
|---|---|---|---|
|
|
aa6608e7d3 | ||
|
|
3fa3299b06 | ||
| 641e68d748 | |||
| afc88bf056 | |||
| d6d16fed2d | |||
| 2f0fecd14d | |||
| f5b5aba32f | |||
| 50b4965354 | |||
|
|
864ef699b7 | ||
|
|
09c343a71f | ||
|
|
593c6e928c | ||
|
|
e9166d8c99 | ||
| 657175a728 | |||
| 99b884b221 | |||
| 55ccd825c7 | |||
| 93a9ccf902 | |||
| 3c119c884b | |||
|
|
dc7555c052 | ||
|
|
b7b17368a3 | ||
|
|
5998ca49b1 | ||
|
|
fff3467f56 | ||
|
|
d9a2fce7ab | ||
|
|
da51f8484c | ||
|
|
c61e18a044 | ||
|
|
27b7ea965e | ||
|
|
d110be6d01 | ||
|
|
c567cb0a42 | ||
| b298cc03bf | |||
|
|
8c6a55463c | ||
|
|
32a4a7fd0a | ||
|
|
507305ac3a | ||
|
|
a3939ed274 | ||
|
|
95ef954b6e | ||
|
|
243b1f5bdb | ||
|
|
5fb2bd79df | ||
|
|
d33659290e | ||
|
|
b8a6c92ca8 | ||
|
|
1028e20177 |
1
.gitignore
vendored
1
.gitignore
vendored
@@ -78,3 +78,4 @@ Sapfor/Sapc++/x64/
|
|||||||
|
|
||||||
Sapfor/out/
|
Sapfor/out/
|
||||||
Sapfor/_bin/*
|
Sapfor/_bin/*
|
||||||
|
_bin/*
|
||||||
|
|||||||
@@ -204,6 +204,8 @@ set(TR_INLINER src/Transformations/FunctionInlining/inliner.cpp
|
|||||||
src/Transformations/FunctionInlining/inliner.h)
|
src/Transformations/FunctionInlining/inliner.h)
|
||||||
set(TR_RENAME_SYMBOLS src/Transformations/RenameSymbols/rename_symbols.cpp
|
set(TR_RENAME_SYMBOLS src/Transformations/RenameSymbols/rename_symbols.cpp
|
||||||
src/Transformations/RenameSymbols/rename_symbols.h)
|
src/Transformations/RenameSymbols/rename_symbols.h)
|
||||||
|
SET(TR_SWAP_OPERATORS src/Transformations/SwapOperators/swap_operators.cpp
|
||||||
|
src/Transformations/SwapOperators/swap_operators.h)
|
||||||
|
|
||||||
set(TRANSFORMS
|
set(TRANSFORMS
|
||||||
${TR_DEAD_CODE}
|
${TR_DEAD_CODE}
|
||||||
@@ -226,7 +228,8 @@ set(TRANSFORMS
|
|||||||
${TR_REPLACE_ARRAYS_IN_IO}
|
${TR_REPLACE_ARRAYS_IN_IO}
|
||||||
${TR_EXPR_TRANSFORM}
|
${TR_EXPR_TRANSFORM}
|
||||||
${TR_INLINER}
|
${TR_INLINER}
|
||||||
${TR_RENAME_SYMBOLS})
|
${TR_RENAME_SYMBOLS}
|
||||||
|
${TR_SWAP_OPERATORS})
|
||||||
|
|
||||||
set(CFG src/CFGraph/IR.cpp
|
set(CFG src/CFGraph/IR.cpp
|
||||||
src/CFGraph/IR.h
|
src/CFGraph/IR.h
|
||||||
@@ -331,9 +334,7 @@ set(MAIN src/Sapfor.cpp
|
|||||||
src/Utils/PassManager.h)
|
src/Utils/PassManager.h)
|
||||||
|
|
||||||
set(PREDICTOR src/Predictor/PredictScheme.cpp
|
set(PREDICTOR src/Predictor/PredictScheme.cpp
|
||||||
src/Predictor/PredictScheme.h
|
src/Predictor/PredictScheme.h)
|
||||||
src/Predictor/PredictSchemeWithLibrary.cpp
|
|
||||||
src/Predictor/PredictSchemeWithLibrary.h)
|
|
||||||
|
|
||||||
set(LIBPREDICTOR ${libpred_sources}/cluster.cpp
|
set(LIBPREDICTOR ${libpred_sources}/cluster.cpp
|
||||||
${libpred_sources}/predictor.cpp
|
${libpred_sources}/predictor.cpp
|
||||||
@@ -461,6 +462,7 @@ source_group (Transformations\\GlobalVariables FILES ${TR_GV})
|
|||||||
source_group (Transformations\\ConvertToC FILES ${TR_CONV})
|
source_group (Transformations\\ConvertToC FILES ${TR_CONV})
|
||||||
source_group (Transformations\\SetImplicitNone FILES ${TR_IMPLICIT_NONE})
|
source_group (Transformations\\SetImplicitNone FILES ${TR_IMPLICIT_NONE})
|
||||||
source_group (Transformations\\ReplaceArraysInIO FILES ${TR_REPLACE_ARRAYS_IN_IO})
|
source_group (Transformations\\ReplaceArraysInIO FILES ${TR_REPLACE_ARRAYS_IN_IO})
|
||||||
|
source_group (Transformations\\SwapOperators FILES ${TR_SWAP_OPERATORS})
|
||||||
|
|
||||||
|
|
||||||
source_group (CreateIntervals FILES ${CREATE_INTER_T})
|
source_group (CreateIntervals FILES ${CREATE_INTER_T})
|
||||||
|
|||||||
Submodule projects/libpredictor updated: e6e805a390...d0772cdb57
@@ -122,7 +122,6 @@ static LoopGraph* createDirectiveForLoop(LoopGraph *currentLoop, MapToArray &mai
|
|||||||
if (found == false)
|
if (found == false)
|
||||||
{
|
{
|
||||||
directive->shadowRenew.push_back(make_pair(key, vector<pair<int, int>>()));
|
directive->shadowRenew.push_back(make_pair(key, vector<pair<int, int>>()));
|
||||||
directive->shadowRenewCorner.push_back(false);
|
|
||||||
|
|
||||||
const DIST::Array *arrayRef = read;
|
const DIST::Array *arrayRef = read;
|
||||||
for (int i = 0; i < arrayRef->GetDimSize(); ++i)
|
for (int i = 0; i < arrayRef->GetDimSize(); ++i)
|
||||||
|
|||||||
@@ -857,11 +857,6 @@ ParallelDirective::genDirective(File* file, const vector<pair<DIST::Array*, cons
|
|||||||
shadowRenewShifts[i].resize(shadowRenew[i].second.size());
|
shadowRenewShifts[i].resize(shadowRenew[i].second.size());
|
||||||
}
|
}
|
||||||
|
|
||||||
if (shadowRenewCorner.size() == 0)
|
|
||||||
{
|
|
||||||
shadowRenewCorner.resize(shadowRenew.size(), false);
|
|
||||||
}
|
|
||||||
|
|
||||||
string shadowAdd = ", SHADOW_RENEW(";
|
string shadowAdd = ", SHADOW_RENEW(";
|
||||||
int inserted = 0;
|
int inserted = 0;
|
||||||
|
|
||||||
@@ -904,10 +899,7 @@ ParallelDirective::genDirective(File* file, const vector<pair<DIST::Array*, cons
|
|||||||
for (auto& elem : genSubscripts(shadowRenew[i1].second, shadowRenewShifts[i1]))
|
for (auto& elem : genSubscripts(shadowRenew[i1].second, shadowRenewShifts[i1]))
|
||||||
newArrayRef->addSubscript(*elem);
|
newArrayRef->addSubscript(*elem);
|
||||||
|
|
||||||
bool needCornerFlag = shadowRenew[i1].second.size() > 1 && needCorner(shadowArray, shiftsByAccess, loop);
|
if (shadowRenew[i1].second.size() > 1 && needCorner(shadowArray, shiftsByAccess, loop))
|
||||||
shadowRenewCorner[i1] = needCornerFlag;
|
|
||||||
|
|
||||||
if (needCornerFlag)
|
|
||||||
{
|
{
|
||||||
SgExpression* tmp = new SgExpression(ARRAY_OP, newArrayRef, NULL, NULL);
|
SgExpression* tmp = new SgExpression(ARRAY_OP, newArrayRef, NULL, NULL);
|
||||||
p->setLhs(*tmp);
|
p->setLhs(*tmp);
|
||||||
|
|||||||
@@ -102,7 +102,6 @@ public:
|
|||||||
// origin_Name uniqName bounds
|
// origin_Name uniqName bounds
|
||||||
std::vector<std::pair<std::pair<std::string, std::string>, std::vector<std::pair<int, int>>>> shadowRenew;
|
std::vector<std::pair<std::pair<std::string, std::string>, std::vector<std::pair<int, int>>>> shadowRenew;
|
||||||
std::vector<std::vector<std::pair<int, int>>> shadowRenewShifts;
|
std::vector<std::vector<std::pair<int, int>>> shadowRenewShifts;
|
||||||
std::vector<bool> shadowRenewCorner;
|
|
||||||
|
|
||||||
// origin_Name uniqName bounds
|
// origin_Name uniqName bounds
|
||||||
std::vector<std::pair<std::pair<std::string, std::string>, std::vector<std::pair<int, int>>>> across;
|
std::vector<std::pair<std::pair<std::string, std::string>, std::vector<std::pair<int, int>>>> across;
|
||||||
@@ -126,7 +125,6 @@ public:
|
|||||||
privates = copyFrom.privates;
|
privates = copyFrom.privates;
|
||||||
shadowRenew = copyFrom.shadowRenew;
|
shadowRenew = copyFrom.shadowRenew;
|
||||||
shadowRenewShifts = copyFrom.shadowRenewShifts;
|
shadowRenewShifts = copyFrom.shadowRenewShifts;
|
||||||
shadowRenewCorner = copyFrom.shadowRenewCorner;
|
|
||||||
across = copyFrom.across;
|
across = copyFrom.across;
|
||||||
acrossShifts = copyFrom.acrossShifts;
|
acrossShifts = copyFrom.acrossShifts;
|
||||||
remoteAccess = copyFrom.remoteAccess;
|
remoteAccess = copyFrom.remoteAccess;
|
||||||
@@ -153,7 +151,6 @@ public:
|
|||||||
on.clear();
|
on.clear();
|
||||||
privates.clear();
|
privates.clear();
|
||||||
shadowRenew.clear();
|
shadowRenew.clear();
|
||||||
shadowRenewCorner.clear();
|
|
||||||
across.clear();
|
across.clear();
|
||||||
acrossShifts.clear();
|
acrossShifts.clear();
|
||||||
reduction.clear();
|
reduction.clear();
|
||||||
|
|||||||
@@ -23,7 +23,6 @@
|
|||||||
#include "expr_transform.h"
|
#include "expr_transform.h"
|
||||||
#include "../LoopAnalyzer/loop_analyzer.h"
|
#include "../LoopAnalyzer/loop_analyzer.h"
|
||||||
#include "CFGraph/CFGraph.h"
|
#include "CFGraph/CFGraph.h"
|
||||||
#include "../Utils/utils.h"
|
|
||||||
|
|
||||||
#include "json.hpp"
|
#include "json.hpp"
|
||||||
|
|
||||||
@@ -37,109 +36,6 @@ using std::tuple;
|
|||||||
|
|
||||||
using json = nlohmann::json;
|
using json = nlohmann::json;
|
||||||
|
|
||||||
void runPredictSchemeOld(SgProject &project,
|
|
||||||
vector<vector<size_t>> &topologies,
|
|
||||||
vector<ParallelRegion*> ¶llelRegions,
|
|
||||||
map<string, vector<LoopGraph*>> &loopGraph,
|
|
||||||
map<string, vector<SpfInterval*>> &intervals,
|
|
||||||
map<string, vector<Messages>> &SPF_messages)
|
|
||||||
{
|
|
||||||
int maxSizeDist = 0;
|
|
||||||
for (int z = 0; z < parallelRegions.size(); ++z)
|
|
||||||
{
|
|
||||||
const DataDirective &dataDirectives = parallelRegions[z]->GetDataDir();
|
|
||||||
const vector<int> ¤tVariant = parallelRegions[z]->GetCurrentVariant();
|
|
||||||
|
|
||||||
auto &tmp = dataDirectives.distrRules;
|
|
||||||
vector<pair<DIST::Array*, const DistrVariant*>> currentVar;
|
|
||||||
for (int z1 = 0; z1 < currentVariant.size(); ++z1)
|
|
||||||
currentVar.push_back(std::make_pair(tmp[z1].first, &tmp[z1].second[currentVariant[z1]]));
|
|
||||||
|
|
||||||
for (auto &elem : currentVar)
|
|
||||||
{
|
|
||||||
DIST::Array *array = elem.first;
|
|
||||||
const DistrVariant *var = elem.second;
|
|
||||||
|
|
||||||
int countBlock = 0;
|
|
||||||
for (int z = 0; z < var->distRule.size(); ++z)
|
|
||||||
if (var->distRule[z] == dist::BLOCK)
|
|
||||||
++countBlock;
|
|
||||||
maxSizeDist = std::max(maxSizeDist, countBlock);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
SpfInterval *mainIterval = getMainInterval(&project, intervals, SPF_messages);
|
|
||||||
topologies.clear();
|
|
||||||
if (maxSizeDist)
|
|
||||||
{
|
|
||||||
const int procNum = 8;
|
|
||||||
//TODO:
|
|
||||||
//topologies = getTopologies(procNum, maxSizeDist);
|
|
||||||
throw -10;
|
|
||||||
|
|
||||||
const int countOfTop = topologies.size();
|
|
||||||
if (countOfTop < 0)
|
|
||||||
printInternalError(convertFileName(__FILE__).c_str(), __LINE__);
|
|
||||||
|
|
||||||
for (auto &inter : intervals)
|
|
||||||
initTimeForIntervalTree(countOfTop, inter.second);
|
|
||||||
|
|
||||||
for (int z = 0; z < parallelRegions.size(); ++z)
|
|
||||||
{
|
|
||||||
const DataDirective &dataDirectives = parallelRegions[z]->GetDataDir();
|
|
||||||
const vector<int> ¤tVariant = parallelRegions[z]->GetCurrentVariant();
|
|
||||||
DIST::Arrays<int> &allArrays = parallelRegions[z]->GetAllArraysToModify();
|
|
||||||
|
|
||||||
auto &tmp = dataDirectives.distrRules;
|
|
||||||
vector<pair<DIST::Array*, const DistrVariant*>> currentVar;
|
|
||||||
for (int z1 = 0; z1 < currentVariant.size(); ++z1)
|
|
||||||
currentVar.push_back(std::make_pair(tmp[z1].first, &tmp[z1].second[currentVariant[z1]]));
|
|
||||||
|
|
||||||
map<LoopGraph*, ParallelDirective*> parallelDirs;
|
|
||||||
vector<std::tuple<DIST::Array*, vector<long>, pair<string, int>>> allSingleRemotes;
|
|
||||||
for (int i = project.numberOfFiles() - 1; i >= 0; --i)
|
|
||||||
{
|
|
||||||
SgFile *file = &(project.file(i));
|
|
||||||
auto fountInfo = findAllDirectives(file, getObjectForFileFromMap(file->filename(), loopGraph), parallelRegions[z]->GetId());
|
|
||||||
parallelDirs.insert(fountInfo.begin(), fountInfo.end());
|
|
||||||
|
|
||||||
auto fountRem = findAllSingleRemotes(file, parallelRegions[z]->GetId(), parallelRegions);
|
|
||||||
allSingleRemotes.insert(allSingleRemotes.end(), fountRem.begin(), fountRem.end());
|
|
||||||
}
|
|
||||||
//TODO!
|
|
||||||
//int err = predictScheme(parallelRegions[z], currentVar, allArrays.GetArrays(), parallelDirs, intervals, SPF_messages, allSingleRemotes, maxSizeDist, procNum);
|
|
||||||
/*if (err != 0)
|
|
||||||
internalExit = err;*/
|
|
||||||
}
|
|
||||||
|
|
||||||
vector<SpfInterval*> tmp = { mainIterval };
|
|
||||||
aggregatePredictedTimes(tmp);
|
|
||||||
|
|
||||||
int idx = 0;
|
|
||||||
int best = -1;
|
|
||||||
double bestSpeedUp = 0;
|
|
||||||
for (auto &top : topologies)
|
|
||||||
{
|
|
||||||
string outStr = "";
|
|
||||||
for (auto &elem : top)
|
|
||||||
outStr += std::to_string(elem) + " ";
|
|
||||||
double currS = mainIterval->exec_time / mainIterval->predictedTimes[idx];
|
|
||||||
__spf_print(1, "%d: speed up %f for top. %s\n", idx, currS, outStr.c_str());
|
|
||||||
|
|
||||||
if (best == -1 || bestSpeedUp < currS)
|
|
||||||
{
|
|
||||||
bestSpeedUp = currS;
|
|
||||||
best = idx;
|
|
||||||
}
|
|
||||||
++idx;
|
|
||||||
}
|
|
||||||
__spf_print(1, "best topology %d with speed up %f\n", best, bestSpeedUp);
|
|
||||||
}
|
|
||||||
else
|
|
||||||
for (auto &inter : intervals)
|
|
||||||
initTimeForIntervalTree(0, inter.second);
|
|
||||||
}
|
|
||||||
|
|
||||||
static void fillParallel(SgExpression *exp, ParallelStats &parStats, int &totalScoreComm)
|
static void fillParallel(SgExpression *exp, ParallelStats &parStats, int &totalScoreComm)
|
||||||
{
|
{
|
||||||
if (exp)
|
if (exp)
|
||||||
|
|||||||
@@ -61,5 +61,3 @@ void processFileToPredict(SgFile *file, PredictorStats &predictorCounts);
|
|||||||
|
|
||||||
void calculateStatsForPredictor(const std::map<std::string, std::vector<FuncInfo*>>& allFuncInfo, const std::map<std::string, std::map<int, Gcov_info>>& gCovInfo);
|
void calculateStatsForPredictor(const std::map<std::string, std::vector<FuncInfo*>>& allFuncInfo, const std::map<std::string, std::map<int, Gcov_info>>& gCovInfo);
|
||||||
void parseDvmDirForPredictor(const std::map<std::tuple<int, std::string, std::string>, std::pair<DIST::Array*, DIST::ArrayAccessInfo*>>& declaredArrays, const std::map<std::string, CommonBlock*>& commonBlocks, const std::map<std::string, std::vector<FuncInfo*>>& allFuncInfo, const std::map<std::string, std::map<int, Gcov_info>>& gCovInfo);
|
void parseDvmDirForPredictor(const std::map<std::tuple<int, std::string, std::string>, std::pair<DIST::Array*, DIST::ArrayAccessInfo*>>& declaredArrays, const std::map<std::string, CommonBlock*>& commonBlocks, const std::map<std::string, std::vector<FuncInfo*>>& allFuncInfo, const std::map<std::string, std::map<int, Gcov_info>>& gCovInfo);
|
||||||
|
|
||||||
void runPredictSchemeOld(SgProject &project, std::vector<std::vector<size_t>> &topologies, std::vector<ParallelRegion*> ¶llelRegions, std::map<std::string, std::vector<LoopGraph*>> &loopGraph, std::map<std::string, std::vector<SpfInterval*>> &intervals, std::map<std::string, std::vector<Messages>> &SPF_messages);
|
|
||||||
|
|||||||
@@ -1,439 +0,0 @@
|
|||||||
#include "leak_detector.h"
|
|
||||||
|
|
||||||
#include <limits>
|
|
||||||
#include <map>
|
|
||||||
#include <vector>
|
|
||||||
#include <string>
|
|
||||||
#include <tuple>
|
|
||||||
|
|
||||||
#include "dvm.h"
|
|
||||||
#include "PredictSchemeWithLibrary.h"
|
|
||||||
#include "../../projects/libpredictor/include/libpredict/predictor.h"
|
|
||||||
#include "../DirectiveProcessing/directive_parser.h"
|
|
||||||
#include "../Distribution/DvmhDirective.h"
|
|
||||||
#include "../ParallelizationRegions/ParRegions.h"
|
|
||||||
#include "../GraphLoop/graph_loops_func.h"
|
|
||||||
#include "../Utils/errors.h"
|
|
||||||
#include "../Utils/utils.h"
|
|
||||||
|
|
||||||
using std::map;
|
|
||||||
using std::pair;
|
|
||||||
using std::string;
|
|
||||||
using std::tuple;
|
|
||||||
using std::vector;
|
|
||||||
|
|
||||||
map<size_t, size_t> createTemplateIdMapping(const vector<ParallelRegion*>& parallelRegions)
|
|
||||||
{
|
|
||||||
size_t maxArrayId = 0;
|
|
||||||
for (int z = 0; z < parallelRegions.size(); ++z) {
|
|
||||||
const DataDirective& dataDirectives = parallelRegions[z]->GetDataDir();
|
|
||||||
|
|
||||||
for (const auto& distrRule : dataDirectives.distrRules) {
|
|
||||||
if (distrRule.first && !distrRule.first->IsTemplate()) {
|
|
||||||
maxArrayId = std::max(maxArrayId, (size_t)distrRule.first->GetId());
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
for (const auto& alignRule : dataDirectives.alignRules) {
|
|
||||||
if (alignRule.alignArray && !alignRule.alignArray->IsTemplate()) {
|
|
||||||
maxArrayId = std::max(maxArrayId, (size_t)alignRule.alignArray->GetId());
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
map<size_t, size_t> templateIdMapping;
|
|
||||||
size_t nextTemplateId = maxArrayId + 1;
|
|
||||||
for (int z = 0; z < parallelRegions.size(); ++z) {
|
|
||||||
const DataDirective& dataDirectives = parallelRegions[z]->GetDataDir();
|
|
||||||
|
|
||||||
for (const auto& distrRule : dataDirectives.distrRules) {
|
|
||||||
if (distrRule.first && distrRule.first->IsTemplate()) {
|
|
||||||
size_t originalId = distrRule.first->GetId();
|
|
||||||
if (templateIdMapping.find(originalId) == templateIdMapping.end()) {
|
|
||||||
templateIdMapping[originalId] = nextTemplateId++;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
for (const auto& alignRule : dataDirectives.alignRules) {
|
|
||||||
if (alignRule.alignWith && alignRule.alignWith->IsTemplate()) {
|
|
||||||
size_t originalId = alignRule.alignWith->GetId();
|
|
||||||
if (templateIdMapping.find(originalId) == templateIdMapping.end()) {
|
|
||||||
templateIdMapping[originalId] = nextTemplateId++;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
return templateIdMapping;
|
|
||||||
}
|
|
||||||
|
|
||||||
PrecomputedLibpredictParams precomputeLibpredictParams(
|
|
||||||
SgProject& project,
|
|
||||||
const vector<ParallelRegion*>& parallelRegions,
|
|
||||||
const map<string, vector<LoopGraph*>>& loopGraph,
|
|
||||||
const map<size_t, size_t>& templateIdMapping)
|
|
||||||
{
|
|
||||||
PrecomputedLibpredictParams result;
|
|
||||||
|
|
||||||
// distribute and align from parallelRegions
|
|
||||||
for (int z = 0; z < parallelRegions.size(); ++z) {
|
|
||||||
const DataDirective& dataDirectives = parallelRegions[z]->GetDataDir();
|
|
||||||
const vector<int>& currentVariant = parallelRegions[z]->GetCurrentVariant();
|
|
||||||
const DIST::Arrays<int>& allArrays = parallelRegions[z]->GetAllArrays();
|
|
||||||
|
|
||||||
auto& tmp = dataDirectives.distrRules;
|
|
||||||
vector<pair<DIST::Array*, const DistrVariant*>> currentVar;
|
|
||||||
for (int z1 = 0; z1 < currentVariant.size(); ++z1) {
|
|
||||||
currentVar.push_back(std::make_pair(tmp[z1].first, &tmp[z1].second[currentVariant[z1]]));
|
|
||||||
}
|
|
||||||
|
|
||||||
// distribute
|
|
||||||
for (const auto& distrRule : currentVar) {
|
|
||||||
DIST::Array* array = distrRule.first;
|
|
||||||
const DistrVariant* variant = distrRule.second;
|
|
||||||
|
|
||||||
if (array && variant && !array->IsNotDistribute()) {
|
|
||||||
PrecomputedDistributeParams params;
|
|
||||||
|
|
||||||
size_t originalId = array->GetId();
|
|
||||||
params.arrayId = originalId;
|
|
||||||
|
|
||||||
if (array->IsTemplate()) {
|
|
||||||
auto it = templateIdMapping.find(originalId);
|
|
||||||
if (it != templateIdMapping.end()) {
|
|
||||||
params.arrayId = it->second;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
params.elemSize = array->GetTypeSize();
|
|
||||||
params.array = array;
|
|
||||||
|
|
||||||
const auto& arraySizes = array->GetSizes();
|
|
||||||
for (int dim = 0; dim < array->GetDimSize(); ++dim) {
|
|
||||||
size_t dimSize = arraySizes[dim].second - arraySizes[dim].first + 1;
|
|
||||||
|
|
||||||
if (dim < variant->distRule.size() && variant->distRule[dim] == dist::BLOCK) {
|
|
||||||
params.axisDistributions.emplace_back(dimSize, libpredict::TypeDistribute::BLOCK);
|
|
||||||
} else {
|
|
||||||
params.axisDistributions.emplace_back(dimSize, libpredict::TypeDistribute::NONE);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
const auto& shadowSpec = array->GetShadowSpec();
|
|
||||||
for (int dim = 0; dim < shadowSpec.size() && dim < array->GetDimSize(); ++dim) {
|
|
||||||
if (dim < variant->distRule.size() && variant->distRule[dim] == dist::BLOCK) {
|
|
||||||
params.shadowEdges.emplace_back(shadowSpec[dim].first, shadowSpec[dim].second);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
result.distributeParams.push_back(params);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
// align
|
|
||||||
for (const auto& alignRule : dataDirectives.alignRules) {
|
|
||||||
DIST::Array* alignArray = alignRule.alignArray;
|
|
||||||
DIST::Array* alignWithArray = alignRule.alignWith;
|
|
||||||
|
|
||||||
if (alignArray && alignWithArray && !alignArray->IsNotDistribute()) {
|
|
||||||
PrecomputedAlignParams params;
|
|
||||||
|
|
||||||
params.arrayId = alignArray->GetId();
|
|
||||||
size_t originalDistributedArrayId = alignWithArray->GetId();
|
|
||||||
params.distributedArrayId = originalDistributedArrayId;
|
|
||||||
|
|
||||||
if (alignWithArray->IsTemplate()) {
|
|
||||||
auto it = templateIdMapping.find(originalDistributedArrayId);
|
|
||||||
if (it != templateIdMapping.end()) {
|
|
||||||
params.distributedArrayId = it->second;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
params.elemSize = alignArray->GetTypeSize();
|
|
||||||
params.alignArray = alignArray;
|
|
||||||
params.alignWithArray = alignWithArray;
|
|
||||||
|
|
||||||
const auto& arraySizes = alignArray->GetSizes();
|
|
||||||
for (int dim = 0; dim < alignArray->GetDimSize(); ++dim) {
|
|
||||||
size_t dimSize = arraySizes[dim].second - arraySizes[dim].first + 1;
|
|
||||||
params.dimensions.push_back(dimSize);
|
|
||||||
}
|
|
||||||
|
|
||||||
for (int dim = 0; dim < alignWithArray->GetDimSize(); ++dim) {
|
|
||||||
bool found = false;
|
|
||||||
for (int i = 0; i < alignRule.alignRuleWith.size(); ++i) {
|
|
||||||
const auto& ruleWith = alignRule.alignRuleWith[i];
|
|
||||||
if (ruleWith.first == dim) {
|
|
||||||
const auto& rule = ruleWith.second;
|
|
||||||
if (rule.first == 0) {
|
|
||||||
// constant
|
|
||||||
params.distributionExpressions.emplace_back(rule.second);
|
|
||||||
} else {
|
|
||||||
// linear expression a * I + b
|
|
||||||
params.distributionExpressions.emplace_back(i, rule.first, rule.second);
|
|
||||||
}
|
|
||||||
found = true;
|
|
||||||
break;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
if (!found) {
|
|
||||||
// There is no rule for this measurement
|
|
||||||
params.distributionExpressions.emplace_back();
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
const auto& shadowSpec = alignArray->GetShadowSpec();
|
|
||||||
for (int dim = 0; dim < shadowSpec.size() && dim < alignArray->GetDimSize(); ++dim) {
|
|
||||||
params.shadowEdges.emplace_back(shadowSpec[dim].first, shadowSpec[dim].second);
|
|
||||||
}
|
|
||||||
|
|
||||||
result.alignParams.push_back(params);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
// shadow_renew
|
|
||||||
map<LoopGraph*, ParallelDirective*> parallelDirs;
|
|
||||||
for (int i = project.numberOfFiles() - 1; i >= 0; --i) {
|
|
||||||
SgFile* file = &(project.file(i));
|
|
||||||
auto fountInfo = findAllDirectives(
|
|
||||||
file,
|
|
||||||
getObjectForFileFromMap(file->filename(), const_cast<map<string, vector<LoopGraph*>>&>(loopGraph)),
|
|
||||||
parallelRegions[z]->GetId());
|
|
||||||
parallelDirs.insert(fountInfo.begin(), fountInfo.end());
|
|
||||||
}
|
|
||||||
|
|
||||||
for (auto& dirPair : parallelDirs) {
|
|
||||||
LoopGraph* loopPtr = dirPair.first;
|
|
||||||
ParallelDirective* directive = dirPair.second;
|
|
||||||
|
|
||||||
if (directive && !directive->shadowRenew.empty()) {
|
|
||||||
for (size_t shadowIdx = 0; shadowIdx < directive->shadowRenew.size(); ++shadowIdx) {
|
|
||||||
const auto& shadowRenewItem = directive->shadowRenew[shadowIdx];
|
|
||||||
const string& arrayName = shadowRenewItem.first.second; // uniqName
|
|
||||||
const vector<pair<int, int>>& bounds = shadowRenewItem.second;
|
|
||||||
|
|
||||||
DIST::Array* shadowArray = allArrays.GetArrayByName(arrayName);
|
|
||||||
if (shadowArray == NULL) {
|
|
||||||
continue;
|
|
||||||
}
|
|
||||||
|
|
||||||
if (shadowArray && !shadowArray->IsNotDistribute()) {
|
|
||||||
PrecomputedShadowRenewParams params;
|
|
||||||
|
|
||||||
params.arrayId = shadowArray->GetId();
|
|
||||||
params.shadowArray = shadowArray;
|
|
||||||
|
|
||||||
for (const auto& bound : bounds) {
|
|
||||||
params.shadow_renew.emplace_back(static_cast<size_t>(bound.first),
|
|
||||||
static_cast<size_t>(bound.second));
|
|
||||||
}
|
|
||||||
|
|
||||||
params.corner = directive->shadowRenewCorner[shadowIdx];
|
|
||||||
params.number_loop_iterations = loopPtr ? static_cast<size_t>(loopPtr->countOfIters) : 1;
|
|
||||||
|
|
||||||
result.shadowRenewParams.push_back(params);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
return result;
|
|
||||||
}
|
|
||||||
|
|
||||||
double runLibpredictCalc(const vector<size_t>& topology,
|
|
||||||
const string& clusterConfStr,
|
|
||||||
const PrecomputedLibpredictParams& precomputedParams,
|
|
||||||
map<string, vector<Messages>>& SPF_messages)
|
|
||||||
{
|
|
||||||
libpredict::RetInitGrid retInitGrid = libpredict::InitGrid(topology[0], topology[1], topology[2], topology[3]);
|
|
||||||
|
|
||||||
if (retInitGrid != libpredict::INIT_GRID_SUCCESS) {
|
|
||||||
__spf_print(1, "ERROR: Failed to initialize libpredict grid with topology: %zu %zu %zu %zu, return code: %d\n",
|
|
||||||
topology[0], topology[1], topology[2], topology[3], (int)retInitGrid);
|
|
||||||
|
|
||||||
std::wstring messageR, messageE;
|
|
||||||
__spf_printToLongBuf(messageE, L"Failed to initialize libpredict grid with topology: %zu %zu %zu %zu, return code: %d",
|
|
||||||
topology[0], topology[1], topology[2], topology[3], (int)retInitGrid);
|
|
||||||
__spf_printToLongBuf(messageR, R207);
|
|
||||||
getObjectForFileFromMap(clusterConfStr.c_str(), SPF_messages).push_back(Messages(ERROR, 1, messageR, messageE, 1064));
|
|
||||||
return -1;
|
|
||||||
}
|
|
||||||
|
|
||||||
// distribute
|
|
||||||
for (const auto& params : precomputedParams.distributeParams) {
|
|
||||||
libpredict::RetDistribute retDistribute = libpredict::Distribute(
|
|
||||||
params.arrayId, params.elemSize, params.axisDistributions, params.shadowEdges);
|
|
||||||
|
|
||||||
if (retDistribute != libpredict::DISTRIBUTE_SUCCESS) {
|
|
||||||
__spf_print(1, "ERROR: Failed to distribute array '%s' (id=%zu) with libpredict, return code: %d\n",
|
|
||||||
params.array->GetShortName().c_str(), params.arrayId, (int)retDistribute);
|
|
||||||
|
|
||||||
std::wstring messageR, messageE;
|
|
||||||
__spf_printToLongBuf(messageE, L"Failed to distribute array '%s' with libpredict, return code: %d",
|
|
||||||
to_wstring(params.array->GetShortName()).c_str(), (int)retDistribute);
|
|
||||||
__spf_printToLongBuf(messageR, R208);
|
|
||||||
getObjectForFileFromMap(params.array->GetDeclInfo().begin()->first.c_str(), SPF_messages).push_back(Messages(ERROR, params.array->GetDeclInfo().begin()->second, messageR, messageE, 1065));
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
// align
|
|
||||||
for (const auto& params : precomputedParams.alignParams) {
|
|
||||||
libpredict::RetAlign retAlign = libpredict::Align(
|
|
||||||
params.arrayId, params.distributedArrayId, params.elemSize,
|
|
||||||
params.dimensions, params.distributionExpressions, params.shadowEdges);
|
|
||||||
|
|
||||||
if (retAlign != libpredict::ALIGN_SUCCESS) {
|
|
||||||
__spf_print(1, "ERROR: Failed to align array '%s' (id=%zu) with array '%s' (id=%zu), return code: %d\n",
|
|
||||||
params.alignArray->GetShortName().c_str(), params.arrayId,
|
|
||||||
params.alignWithArray->GetShortName().c_str(), params.distributedArrayId, (int)retAlign);
|
|
||||||
|
|
||||||
std::wstring messageR, messageE;
|
|
||||||
__spf_printToLongBuf(messageE, L"Failed to align array '%s' with array '%s' using libpredict, return code: %d",
|
|
||||||
to_wstring(params.alignArray->GetShortName()).c_str(),
|
|
||||||
to_wstring(params.alignWithArray->GetShortName()).c_str(), (int)retAlign);
|
|
||||||
__spf_printToLongBuf(messageR, R209);
|
|
||||||
getObjectForFileFromMap(params.alignArray->GetDeclInfo().begin()->first.c_str(), SPF_messages).push_back(Messages(ERROR, params.alignArray->GetDeclInfo().begin()->second, messageR, messageE, 1066));
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
// shadow_renew
|
|
||||||
for (const auto& params : precomputedParams.shadowRenewParams) {
|
|
||||||
libpredict::RetShadowRenew retShadowRenew = libpredict::ShadowRenew(
|
|
||||||
params.arrayId, params.shadow_renew, params.corner, params.number_loop_iterations);
|
|
||||||
|
|
||||||
if (retShadowRenew != libpredict::SHADOW_RENEW_SUCCESS) {
|
|
||||||
__spf_print(1, "ERROR: Failed to process shadow_renew for array '%s' (id=%zu), return code: %d\n",
|
|
||||||
params.shadowArray->GetShortName().c_str(), params.arrayId, (int)retShadowRenew);
|
|
||||||
|
|
||||||
std::wstring messageR, messageE;
|
|
||||||
__spf_printToLongBuf(messageE, L"Failed to process shadow_renew for array '%s' with libpredict, return code: %d",
|
|
||||||
to_wstring(params.shadowArray->GetShortName()).c_str(), (int)retShadowRenew);
|
|
||||||
__spf_printToLongBuf(messageR, R210);
|
|
||||||
getObjectForFileFromMap(params.shadowArray->GetDeclInfo().begin()->first.c_str(), SPF_messages).push_back(Messages(ERROR, params.shadowArray->GetDeclInfo().begin()->second, messageR, messageE, 1067));
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
return libpredict::GetTime();
|
|
||||||
}
|
|
||||||
|
|
||||||
void runPredictScheme(SgProject& project,
|
|
||||||
vector<vector<size_t>>& topologies,
|
|
||||||
const vector<ParallelRegion*>& parallelRegions,
|
|
||||||
map<string, vector<LoopGraph*>>& loopGraph,
|
|
||||||
map<string, vector<Messages>>& SPF_messages)
|
|
||||||
{
|
|
||||||
// calculating maximum dimension of distribution
|
|
||||||
int maxSizeDist = 0;
|
|
||||||
for (int z = 0; z < parallelRegions.size(); ++z) {
|
|
||||||
const DataDirective& dataDirectives = parallelRegions[z]->GetDataDir();
|
|
||||||
const vector<int>& currentVariant = parallelRegions[z]->GetCurrentVariant();
|
|
||||||
|
|
||||||
auto& tmp = dataDirectives.distrRules;
|
|
||||||
vector<const DistrVariant*> currentVar;
|
|
||||||
for (int z1 = 0; z1 < currentVariant.size(); ++z1) {
|
|
||||||
currentVar.push_back(&tmp[z1].second[currentVariant[z1]]);
|
|
||||||
}
|
|
||||||
|
|
||||||
for (auto var : currentVar) {
|
|
||||||
int countBlock = 0;
|
|
||||||
for (int z = 0; z < var->distRule.size(); ++z) {
|
|
||||||
if (var->distRule[z] == dist::BLOCK) {
|
|
||||||
++countBlock;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
maxSizeDist = std::max(maxSizeDist, countBlock);
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
// calculating name of a cluster configuration file
|
|
||||||
string clusterConfStr;
|
|
||||||
if (project.numberOfFiles() > 0) {
|
|
||||||
string firstFilePath = project.fileName(0);
|
|
||||||
|
|
||||||
size_t lastSlash = firstFilePath.find_last_of("/\\");
|
|
||||||
clusterConfStr = firstFilePath.substr(0, lastSlash + 1) + "cluster.conf";
|
|
||||||
}
|
|
||||||
|
|
||||||
// creating template ID display to avoid conflicts
|
|
||||||
map<size_t, size_t> templateIdMapping = createTemplateIdMapping(parallelRegions);
|
|
||||||
|
|
||||||
// Precomputing parameters of directive functions from libpredict
|
|
||||||
PrecomputedLibpredictParams precomputedParams = precomputeLibpredictParams(
|
|
||||||
project, parallelRegions, loopGraph, templateIdMapping);
|
|
||||||
|
|
||||||
// iterating through topologies to find most optimal one
|
|
||||||
topologies = vector<vector<size_t>>();
|
|
||||||
if (maxSizeDist) {
|
|
||||||
if (maxSizeDist > 4) {
|
|
||||||
maxSizeDist = 4;
|
|
||||||
}
|
|
||||||
|
|
||||||
// Initialize cluster
|
|
||||||
int procCount = 0;
|
|
||||||
libpredict::RetInitCluster retInitCluster = libpredict::InitCluster(clusterConfStr, procCount);
|
|
||||||
|
|
||||||
if (retInitCluster != libpredict::INIT_CLUSTER_SUCCESS) {
|
|
||||||
__spf_print(1, "ERROR: Failed to initialize libpredict cluster with config: %s, return code: %d\n", clusterConfStr.c_str(), (int)retInitCluster);
|
|
||||||
|
|
||||||
std::wstring messageR, messageE;
|
|
||||||
__spf_printToLongBuf(messageE, L"Failed to initialize libpredict cluster with config: %s, return code: %d",
|
|
||||||
to_wstring(clusterConfStr).c_str(), (int)retInitCluster);
|
|
||||||
__spf_printToLongBuf(messageR, R206);
|
|
||||||
getObjectForFileFromMap(clusterConfStr.c_str(), SPF_messages).push_back(Messages(ERROR, 1, messageR, messageE, 1063));
|
|
||||||
return;
|
|
||||||
}
|
|
||||||
|
|
||||||
for (size_t n1 = 2; n1 <= procCount; ++n1) {
|
|
||||||
for (size_t n2 = 1; n2 <= n1 && n1 * n2 <= procCount; ++n2) {
|
|
||||||
if (n2 != 1 && maxSizeDist < 2 || n2 == 1 && maxSizeDist == 2) {
|
|
||||||
continue;
|
|
||||||
}
|
|
||||||
|
|
||||||
for (size_t n3 = 1; n3 <= n2 && n1 * n2 * n3 <= procCount; ++n3) {
|
|
||||||
if (n3 != 1 && maxSizeDist < 3 || n3 == 1 && maxSizeDist == 3) {
|
|
||||||
continue;
|
|
||||||
}
|
|
||||||
|
|
||||||
for (size_t n4 = 1; n4 <= n3 && n1 * n2 * n3 * n4 <= procCount; ++n4) {
|
|
||||||
if (n4 != 1 && maxSizeDist < 4 || n4 == 1 && maxSizeDist == 4) {
|
|
||||||
continue;
|
|
||||||
}
|
|
||||||
|
|
||||||
topologies.push_back(vector<size_t>{n1, n2, n3, n4});
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
vector<size_t> best;
|
|
||||||
double bestTime = std::numeric_limits<double>::max();
|
|
||||||
for (auto& topology : topologies) {
|
|
||||||
double currTime = runLibpredictCalc(topology, clusterConfStr, precomputedParams, SPF_messages);
|
|
||||||
|
|
||||||
string outStr = "";
|
|
||||||
for (const auto& elem : topology) {
|
|
||||||
outStr += std::to_string(elem) + " ";
|
|
||||||
}
|
|
||||||
__spf_print(1, "topology %s has time %f\n", outStr.c_str(), currTime);
|
|
||||||
|
|
||||||
if (currTime == -1) {
|
|
||||||
return;
|
|
||||||
}
|
|
||||||
|
|
||||||
if (currTime < bestTime) {
|
|
||||||
bestTime = currTime;
|
|
||||||
best = topology;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
string outStr;
|
|
||||||
for (const auto& elem : best) {
|
|
||||||
outStr += std::to_string(elem) + " ";
|
|
||||||
}
|
|
||||||
|
|
||||||
__spf_print(1, "best topology %s with time %f\n", outStr.c_str(), bestTime);
|
|
||||||
} else {
|
|
||||||
__spf_print(1, "impossible to calculate best topology: project does not contain distribution directives\n");
|
|
||||||
}
|
|
||||||
}
|
|
||||||
@@ -1,57 +0,0 @@
|
|||||||
#pragma once
|
|
||||||
#include <vector>
|
|
||||||
#include <map>
|
|
||||||
#include <string>
|
|
||||||
#include "dvm.h"
|
|
||||||
#include "graph_calls.h"
|
|
||||||
#include "../../projects/libpredictor/include/libpredict/predictor.h"
|
|
||||||
|
|
||||||
struct PrecomputedDistributeParams {
|
|
||||||
size_t arrayId;
|
|
||||||
size_t elemSize;
|
|
||||||
std::vector<libpredict::DistributeAxisRule> axisDistributions;
|
|
||||||
std::vector<std::pair<size_t, size_t>> shadowEdges;
|
|
||||||
DIST::Array* array;
|
|
||||||
};
|
|
||||||
|
|
||||||
struct PrecomputedAlignParams {
|
|
||||||
size_t arrayId;
|
|
||||||
size_t distributedArrayId;
|
|
||||||
size_t elemSize;
|
|
||||||
std::vector<size_t> dimensions;
|
|
||||||
std::vector<libpredict::AlignDisplay> distributionExpressions;
|
|
||||||
std::vector<std::pair<size_t, size_t>> shadowEdges;
|
|
||||||
DIST::Array* alignArray;
|
|
||||||
DIST::Array* alignWithArray;
|
|
||||||
};
|
|
||||||
|
|
||||||
struct PrecomputedShadowRenewParams {
|
|
||||||
size_t arrayId;
|
|
||||||
std::vector<std::pair<size_t, size_t>> shadow_renew;
|
|
||||||
bool corner;
|
|
||||||
size_t number_loop_iterations;
|
|
||||||
DIST::Array* shadowArray;
|
|
||||||
};
|
|
||||||
|
|
||||||
struct PrecomputedLibpredictParams {
|
|
||||||
std::vector<PrecomputedDistributeParams> distributeParams;
|
|
||||||
std::vector<PrecomputedAlignParams> alignParams;
|
|
||||||
std::vector<PrecomputedShadowRenewParams> shadowRenewParams;
|
|
||||||
};
|
|
||||||
|
|
||||||
PrecomputedLibpredictParams precomputeLibpredictParams(
|
|
||||||
SgProject& project,
|
|
||||||
const std::vector<ParallelRegion*>& parallelRegions,
|
|
||||||
const std::map<std::string, std::vector<LoopGraph*>>& loopGraph,
|
|
||||||
const std::map<size_t, size_t>& templateIdMapping);
|
|
||||||
|
|
||||||
void runPredictScheme(SgProject& project,
|
|
||||||
std::vector<std::vector<size_t>>& topologies,
|
|
||||||
const std::vector<ParallelRegion*>& parallelRegions,
|
|
||||||
std::map<std::string, std::vector<LoopGraph*>>& loopGraph,
|
|
||||||
std::map<std::string, std::vector<Messages>>& SPF_messages);
|
|
||||||
|
|
||||||
double runLibpredictCalc(const std::vector<size_t>& topology,
|
|
||||||
const std::string& clusterConfStr,
|
|
||||||
const PrecomputedLibpredictParams& precomputedParams,
|
|
||||||
std::map<std::string, std::vector<Messages>>& SPF_messages);
|
|
||||||
111
src/Sapfor.cpp
111
src/Sapfor.cpp
@@ -57,7 +57,6 @@
|
|||||||
#include "expr_transform.h"
|
#include "expr_transform.h"
|
||||||
|
|
||||||
#include "Predictor/PredictScheme.h"
|
#include "Predictor/PredictScheme.h"
|
||||||
#include "Predictor/PredictSchemeWithLibrary.h"
|
|
||||||
#include "Predictor/PredictorModel.h"
|
#include "Predictor/PredictorModel.h"
|
||||||
#include "SageAnalysisTool/depInterfaceExt.h"
|
#include "SageAnalysisTool/depInterfaceExt.h"
|
||||||
#include "DvmhRegions/DvmhRegionInserter.h"
|
#include "DvmhRegions/DvmhRegionInserter.h"
|
||||||
@@ -90,6 +89,7 @@
|
|||||||
#include "Transformations/DeadCodeRemoving/dead_code.h"
|
#include "Transformations/DeadCodeRemoving/dead_code.h"
|
||||||
#include "Transformations/RenameSymbols/rename_symbols.h"
|
#include "Transformations/RenameSymbols/rename_symbols.h"
|
||||||
#include "Transformations/FunctionInlining/inliner.h"
|
#include "Transformations/FunctionInlining/inliner.h"
|
||||||
|
#include "Transformations/SwapOperators/swap_operators.h"
|
||||||
|
|
||||||
#include "ProjectParameters/projectParameters.h"
|
#include "ProjectParameters/projectParameters.h"
|
||||||
|
|
||||||
@@ -940,6 +940,8 @@ static bool runAnalysis(SgProject &project, const int curr_regime, const bool ne
|
|||||||
internalExit = err;
|
internalExit = err;
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
else if (curr_regime == SWAP_OPERATORS)
|
||||||
|
runSwapOperators(file, loopGraph, fullIR, countOfTransform);
|
||||||
else if (curr_regime == PRIVATE_REMOVING_ANALYSIS)
|
else if (curr_regime == PRIVATE_REMOVING_ANALYSIS)
|
||||||
{
|
{
|
||||||
auto itFound = loopGraph.find(file->filename());
|
auto itFound = loopGraph.find(file->filename());
|
||||||
@@ -1038,7 +1040,8 @@ static bool runAnalysis(SgProject &project, const int curr_regime, const bool ne
|
|||||||
PRIVATE_REMOVING,
|
PRIVATE_REMOVING,
|
||||||
PRIVATE_ARRAYS_EXPANSION,
|
PRIVATE_ARRAYS_EXPANSION,
|
||||||
PRIVATE_ARRAYS_SHRINKING,
|
PRIVATE_ARRAYS_SHRINKING,
|
||||||
REMOVE_DEAD_CODE };
|
REMOVE_DEAD_CODE,
|
||||||
|
SWAP_OPERATORS };
|
||||||
|
|
||||||
if ((countOfTransform == 0 || internalExit > 0) && applyFor.find(curr_regime) != applyFor.end())
|
if ((countOfTransform == 0 || internalExit > 0) && applyFor.find(curr_regime) != applyFor.end())
|
||||||
{
|
{
|
||||||
@@ -1729,7 +1732,103 @@ static bool runAnalysis(SgProject &project, const int curr_regime, const bool ne
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
else if (curr_regime == PREDICT_SCHEME)
|
else if (curr_regime == PREDICT_SCHEME)
|
||||||
runPredictScheme(project, topologies, parallelRegions, loopGraph, SPF_messages);
|
{
|
||||||
|
int maxSizeDist = 0;
|
||||||
|
for (int z = 0; z < parallelRegions.size(); ++z)
|
||||||
|
{
|
||||||
|
const DataDirective &dataDirectives = parallelRegions[z]->GetDataDir();
|
||||||
|
const vector<int> ¤tVariant = parallelRegions[z]->GetCurrentVariant();
|
||||||
|
|
||||||
|
auto &tmp = dataDirectives.distrRules;
|
||||||
|
vector<pair<DIST::Array*, const DistrVariant*>> currentVar;
|
||||||
|
for (int z1 = 0; z1 < currentVariant.size(); ++z1)
|
||||||
|
currentVar.push_back(make_pair(tmp[z1].first, &tmp[z1].second[currentVariant[z1]]));
|
||||||
|
|
||||||
|
for (auto &elem : currentVar)
|
||||||
|
{
|
||||||
|
DIST::Array *array = elem.first;
|
||||||
|
const DistrVariant *var = elem.second;
|
||||||
|
|
||||||
|
int countBlock = 0;
|
||||||
|
for (int z = 0; z < var->distRule.size(); ++z)
|
||||||
|
if (var->distRule[z] == dist::BLOCK)
|
||||||
|
++countBlock;
|
||||||
|
maxSizeDist = std::max(maxSizeDist, countBlock);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
SpfInterval *mainIterval = getMainInterval(&project, intervals, SPF_messages);
|
||||||
|
topologies.clear();
|
||||||
|
if (maxSizeDist)
|
||||||
|
{
|
||||||
|
const int procNum = 8;
|
||||||
|
//TODO:
|
||||||
|
//topologies = getTopologies(procNum, maxSizeDist);
|
||||||
|
throw -10;
|
||||||
|
|
||||||
|
const int countOfTop = topologies.size();
|
||||||
|
if (countOfTop < 0)
|
||||||
|
printInternalError(convertFileName(__FILE__).c_str(), __LINE__);
|
||||||
|
|
||||||
|
for (auto &inter : intervals)
|
||||||
|
initTimeForIntervalTree(countOfTop, inter.second);
|
||||||
|
|
||||||
|
for (int z = 0; z < parallelRegions.size(); ++z)
|
||||||
|
{
|
||||||
|
const DataDirective &dataDirectives = parallelRegions[z]->GetDataDir();
|
||||||
|
const vector<int> ¤tVariant = parallelRegions[z]->GetCurrentVariant();
|
||||||
|
DIST::Arrays<int> &allArrays = parallelRegions[z]->GetAllArraysToModify();
|
||||||
|
|
||||||
|
auto &tmp = dataDirectives.distrRules;
|
||||||
|
vector<pair<DIST::Array*, const DistrVariant*>> currentVar;
|
||||||
|
for (int z1 = 0; z1 < currentVariant.size(); ++z1)
|
||||||
|
currentVar.push_back(make_pair(tmp[z1].first, &tmp[z1].second[currentVariant[z1]]));
|
||||||
|
|
||||||
|
map<LoopGraph*, ParallelDirective*> parallelDirs;
|
||||||
|
vector<std::tuple<DIST::Array*, vector<long>, pair<string, int>>> allSingleRemotes;
|
||||||
|
for (int i = n - 1; i >= 0; --i)
|
||||||
|
{
|
||||||
|
SgFile *file = &(project.file(i));
|
||||||
|
auto fountInfo = findAllDirectives(file, getObjectForFileFromMap(file->filename(), loopGraph), parallelRegions[z]->GetId());
|
||||||
|
parallelDirs.insert(fountInfo.begin(), fountInfo.end());
|
||||||
|
|
||||||
|
auto fountRem = findAllSingleRemotes(file, parallelRegions[z]->GetId(), parallelRegions);
|
||||||
|
allSingleRemotes.insert(allSingleRemotes.end(), fountRem.begin(), fountRem.end());
|
||||||
|
}
|
||||||
|
//TODO!
|
||||||
|
//int err = predictScheme(parallelRegions[z], currentVar, allArrays.GetArrays(), parallelDirs, intervals, SPF_messages, allSingleRemotes, maxSizeDist, procNum);
|
||||||
|
/*if (err != 0)
|
||||||
|
internalExit = err;*/
|
||||||
|
}
|
||||||
|
|
||||||
|
vector<SpfInterval*> tmp = { mainIterval };
|
||||||
|
aggregatePredictedTimes(tmp);
|
||||||
|
|
||||||
|
int idx = 0;
|
||||||
|
int best = -1;
|
||||||
|
double bestSpeedUp = 0;
|
||||||
|
for (auto &top : topologies)
|
||||||
|
{
|
||||||
|
string outStr = "";
|
||||||
|
for (auto &elem : top)
|
||||||
|
outStr += std::to_string(elem) + " ";
|
||||||
|
double currS = mainIterval->exec_time / mainIterval->predictedTimes[idx];
|
||||||
|
__spf_print(1, "%d: speed up %f for top. %s\n", idx, currS, outStr.c_str());
|
||||||
|
|
||||||
|
if (best == -1 || bestSpeedUp < currS)
|
||||||
|
{
|
||||||
|
bestSpeedUp = currS;
|
||||||
|
best = idx;
|
||||||
|
}
|
||||||
|
++idx;
|
||||||
|
}
|
||||||
|
__spf_print(1, "best topology %d with speed up %f\n", best, bestSpeedUp);
|
||||||
|
}
|
||||||
|
else
|
||||||
|
for (auto &inter : intervals)
|
||||||
|
initTimeForIntervalTree(0, inter.second);
|
||||||
|
|
||||||
|
}
|
||||||
else if (curr_regime == CREATE_INTER_TREE)
|
else if (curr_regime == CREATE_INTER_TREE)
|
||||||
{
|
{
|
||||||
if (keepFiles)
|
if (keepFiles)
|
||||||
@@ -2125,8 +2224,9 @@ void runPass(const int curr_regime, const char *proj_name, const char *folderNam
|
|||||||
|
|
||||||
runAnalysis(*project, CALCULATE_STATS_SCHEME, false);
|
runAnalysis(*project, CALCULATE_STATS_SCHEME, false);
|
||||||
|
|
||||||
if (!folderName && !consoleMode || predictOn)
|
//TODO: need to rewrite this to new algo
|
||||||
runAnalysis(*project, PREDICT_SCHEME, false);
|
/*if (!folderName && !consoleMode || predictOn)
|
||||||
|
runAnalysis(*project, PREDICT_SCHEME, false); */
|
||||||
|
|
||||||
runAnalysis(*project, REMOVE_COPIES, false);
|
runAnalysis(*project, REMOVE_COPIES, false);
|
||||||
runAnalysis(*project, SWAP_LOOPS, false);
|
runAnalysis(*project, SWAP_LOOPS, false);
|
||||||
@@ -2238,6 +2338,7 @@ void runPass(const int curr_regime, const char *proj_name, const char *folderNam
|
|||||||
case INSERT_NO_DISTR_FLAGS_FROM_GUI:
|
case INSERT_NO_DISTR_FLAGS_FROM_GUI:
|
||||||
case PRIVATE_REMOVING:
|
case PRIVATE_REMOVING:
|
||||||
case RENAME_INLCUDES:
|
case RENAME_INLCUDES:
|
||||||
|
case SWAP_OPERATORS:
|
||||||
runAnalysis(*project, curr_regime, true, "", folderName);
|
runAnalysis(*project, curr_regime, true, "", folderName);
|
||||||
break;
|
break;
|
||||||
case INLINE_PROCEDURES:
|
case INLINE_PROCEDURES:
|
||||||
|
|||||||
@@ -122,6 +122,8 @@ enum passes {
|
|||||||
CREATE_INTER_TREE,
|
CREATE_INTER_TREE,
|
||||||
INSERT_INTER_TREE,
|
INSERT_INTER_TREE,
|
||||||
|
|
||||||
|
SWAP_OPERATORS,
|
||||||
|
|
||||||
SHADOW_GROUPING,
|
SHADOW_GROUPING,
|
||||||
INLINE_PROCEDURES,
|
INLINE_PROCEDURES,
|
||||||
FILL_PARALLEL_REG_IR,
|
FILL_PARALLEL_REG_IR,
|
||||||
@@ -319,6 +321,7 @@ static void setPassValues()
|
|||||||
passNames[CHECK_PAR_REG_DIR] = "CHECK_PAR_REG_DIR";
|
passNames[CHECK_PAR_REG_DIR] = "CHECK_PAR_REG_DIR";
|
||||||
passNames[CREATE_INTER_TREE] = "CREATE_INTER_TREE";
|
passNames[CREATE_INTER_TREE] = "CREATE_INTER_TREE";
|
||||||
passNames[INSERT_INTER_TREE] = "INSERT_INTER_TREE";
|
passNames[INSERT_INTER_TREE] = "INSERT_INTER_TREE";
|
||||||
|
passNames[SWAP_OPERATORS] = "SWAP_OPERATORS";
|
||||||
passNames[CREATE_PARALLEL_REGIONS] = "CREATE_PARALLEL_REGIONS";
|
passNames[CREATE_PARALLEL_REGIONS] = "CREATE_PARALLEL_REGIONS";
|
||||||
passNames[PRIVATE_REMOVING_ANALYSIS] = "PRIVATE_REMOVING_ANALYSIS";
|
passNames[PRIVATE_REMOVING_ANALYSIS] = "PRIVATE_REMOVING_ANALYSIS";
|
||||||
passNames[PRIVATE_REMOVING] = "PRIVATE_REMOVING";
|
passNames[PRIVATE_REMOVING] = "PRIVATE_REMOVING";
|
||||||
|
|||||||
@@ -132,7 +132,7 @@ std::map<std::string, PredictorStats> allPredictorStats;
|
|||||||
|
|
||||||
//for DVM INTERVALS
|
//for DVM INTERVALS
|
||||||
std::map<std::string, std::vector<SpfInterval*>> intervals; // file -> intervals
|
std::map<std::string, std::vector<SpfInterval*>> intervals; // file -> intervals
|
||||||
std::vector<std::vector<size_t>> topologies; // current topologies
|
std::vector<std::vector<long>> topologies; // current topologies
|
||||||
//
|
//
|
||||||
|
|
||||||
//for GCOV_PARSER
|
//for GCOV_PARSER
|
||||||
|
|||||||
422
src/Transformations/SwapOperators/swap_operators.cpp
Normal file
422
src/Transformations/SwapOperators/swap_operators.cpp
Normal file
@@ -0,0 +1,422 @@
|
|||||||
|
#include <map>
|
||||||
|
#include <unordered_set>
|
||||||
|
#include <vector>
|
||||||
|
#include <queue>
|
||||||
|
#include <iostream>
|
||||||
|
|
||||||
|
#include "../../Utils/errors.h"
|
||||||
|
#include "../../Utils/SgUtils.h"
|
||||||
|
#include "../../GraphCall/graph_calls.h"
|
||||||
|
#include "../../GraphCall/graph_calls_func.h"
|
||||||
|
#include "../../CFGraph/CFGraph.h"
|
||||||
|
#include "../../CFGraph/IR.h"
|
||||||
|
#include "../../GraphLoop/graph_loops.h"
|
||||||
|
#include "swap_operators.h"
|
||||||
|
|
||||||
|
using namespace std;
|
||||||
|
|
||||||
|
|
||||||
|
unordered_set<int> loop_tags = {FOR_NODE/*, FORALL_NODE, WHILE_NODE, DO_WHILE_NODE*/};
|
||||||
|
unordered_set<int> importantDepsTags = {FOR_NODE, IF_NODE};
|
||||||
|
unordered_set<int> importantUpdDepsTags = {ELSEIF_NODE};
|
||||||
|
unordered_set<int> importantEndTags = {CONTROL_END};
|
||||||
|
|
||||||
|
|
||||||
|
vector<SAPFOR::IR_Block*> findInstructionsFromOperator(SgStatement* st, vector<SAPFOR::BasicBlock*> Blocks)
|
||||||
|
{
|
||||||
|
vector<SAPFOR::IR_Block*> result;
|
||||||
|
string filename = st -> fileName();
|
||||||
|
for (auto& block: Blocks)
|
||||||
|
{
|
||||||
|
vector<SAPFOR::IR_Block*> instructionsInBlock = block -> getInstructions();
|
||||||
|
for (auto& instruction: instructionsInBlock)
|
||||||
|
{
|
||||||
|
SgStatement* curOperator = instruction -> getInstruction() -> getOperator();
|
||||||
|
if (curOperator -> lineNumber() == st -> lineNumber())
|
||||||
|
result.push_back(instruction);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
return result;
|
||||||
|
}
|
||||||
|
|
||||||
|
vector<SAPFOR::BasicBlock*> findFuncBlocksByFuncStatement(SgStatement *st, map<FuncInfo*, vector<SAPFOR::BasicBlock*>>& FullIR)
|
||||||
|
{
|
||||||
|
vector<SAPFOR::BasicBlock*> result;
|
||||||
|
Statement* forSt = (Statement*)st;
|
||||||
|
for (auto& func: FullIR)
|
||||||
|
{
|
||||||
|
if (func.first -> funcPointer -> getCurrProcessFile() == forSt -> getCurrProcessFile()
|
||||||
|
&& func.first -> funcPointer -> lineNumber() == forSt -> lineNumber())
|
||||||
|
result = func.second;
|
||||||
|
}
|
||||||
|
return result;
|
||||||
|
}
|
||||||
|
|
||||||
|
map<SgForStmt*, vector<SAPFOR::BasicBlock*>> findAndAnalyzeLoops(SgStatement *st, vector<SAPFOR::BasicBlock*> blocks)
|
||||||
|
{
|
||||||
|
map<SgForStmt*, vector<SAPFOR::BasicBlock*>> result;
|
||||||
|
SgStatement *lastNode = st->lastNodeOfStmt();
|
||||||
|
while (st && st != lastNode)
|
||||||
|
{
|
||||||
|
if (loop_tags.find(st -> variant()) != loop_tags.end())
|
||||||
|
{
|
||||||
|
// part with find statements of loop
|
||||||
|
SgForStmt *forSt = (SgForStmt*)st;
|
||||||
|
SgStatement *loopBody = forSt -> body();
|
||||||
|
SgStatement *lastLoopNode = st->lastNodeOfStmt();
|
||||||
|
// part with find blocks and instructions of loops
|
||||||
|
unordered_set<int> blocks_nums;
|
||||||
|
while (loopBody && loopBody != lastLoopNode)
|
||||||
|
{
|
||||||
|
SAPFOR::IR_Block* IR = findInstructionsFromOperator(loopBody, blocks).front();
|
||||||
|
if (blocks_nums.find(IR -> getBasicBlock() -> getNumber()) == blocks_nums.end())
|
||||||
|
{
|
||||||
|
result[forSt].push_back(IR -> getBasicBlock());
|
||||||
|
blocks_nums.insert(IR -> getBasicBlock() -> getNumber());
|
||||||
|
}
|
||||||
|
loopBody = loopBody -> lexNext();
|
||||||
|
}
|
||||||
|
std::sort(result[forSt].begin(), result[forSt].end());
|
||||||
|
}
|
||||||
|
st = st -> lexNext();
|
||||||
|
}
|
||||||
|
return result;
|
||||||
|
}
|
||||||
|
|
||||||
|
map<SgStatement*, set<SgStatement*>> AnalyzeLoopAndFindDeps(SgForStmt* forStatement, vector<SAPFOR::BasicBlock*> loopBlocks, map<FuncInfo*, vector<SAPFOR::BasicBlock*>>& FullIR)
|
||||||
|
{
|
||||||
|
map<SgStatement*, set<SgStatement*>> result;
|
||||||
|
for (SAPFOR::BasicBlock* bb: loopBlocks)
|
||||||
|
{
|
||||||
|
map<SAPFOR::Argument*, set<int>> blockReachingDefinitions = bb -> getRD_In();
|
||||||
|
vector<SAPFOR::IR_Block*> instructions = bb -> getInstructions();
|
||||||
|
for (SAPFOR::IR_Block* irBlock: instructions)
|
||||||
|
{
|
||||||
|
// TODO: Think about what to do with function calls and array references. Because there are also dependencies there that are not reflected in RD, but they must be taken into account
|
||||||
|
SAPFOR::Instruction* instr = irBlock -> getInstruction();
|
||||||
|
result[instr -> getOperator()];
|
||||||
|
// take Argument 1 and it's RD and push operators to final set
|
||||||
|
if (instr -> getArg1() != NULL)
|
||||||
|
{
|
||||||
|
SAPFOR::Argument* arg = instr -> getArg1();
|
||||||
|
set<int> prevInstructionsNumbers = blockReachingDefinitions[arg];
|
||||||
|
for (int i: prevInstructionsNumbers)
|
||||||
|
{
|
||||||
|
SAPFOR::Instruction* foundInstruction = getInstructionAndBlockByNumber(FullIR, i).first;
|
||||||
|
if (foundInstruction != NULL)
|
||||||
|
{
|
||||||
|
SgStatement* prevOp = foundInstruction -> getOperator();
|
||||||
|
if (prevOp != forStatement && instr -> getOperator() != forStatement && instr -> getOperator() -> lineNumber() > prevOp -> lineNumber()
|
||||||
|
&& prevOp -> lineNumber() > forStatement -> lineNumber())
|
||||||
|
result[instr -> getOperator()].insert(prevOp);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
// take Argument 2 (if exists) and it's RD and push operators to final set
|
||||||
|
if (instr -> getArg2() != NULL)
|
||||||
|
{
|
||||||
|
SAPFOR::Argument* arg = instr -> getArg2();
|
||||||
|
set<int> prevInstructionsNumbers = blockReachingDefinitions[arg];
|
||||||
|
for (int i: prevInstructionsNumbers)
|
||||||
|
{
|
||||||
|
SAPFOR::Instruction* foundInstruction = getInstructionAndBlockByNumber(FullIR, i).first;
|
||||||
|
if (foundInstruction != NULL)
|
||||||
|
{
|
||||||
|
SgStatement* prevOp = foundInstruction -> getOperator();
|
||||||
|
if (prevOp != forStatement && instr -> getOperator() != forStatement&& instr -> getOperator() -> lineNumber() > prevOp -> lineNumber()
|
||||||
|
&& prevOp -> lineNumber() > forStatement -> lineNumber())
|
||||||
|
result[instr -> getOperator()].insert(prevOp);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
// update RD
|
||||||
|
if (instr -> getResult() != NULL)
|
||||||
|
blockReachingDefinitions[instr -> getResult()] = {instr -> getNumber()};
|
||||||
|
}
|
||||||
|
}
|
||||||
|
return result;
|
||||||
|
}
|
||||||
|
|
||||||
|
void buildAdditionalDeps(SgForStmt* forStatement, map<SgStatement*, set<SgStatement*>>& dependencies)
|
||||||
|
{
|
||||||
|
SgStatement* lastNode = forStatement->lastNodeOfStmt();
|
||||||
|
vector<SgStatement*> importantDeps;
|
||||||
|
SgStatement* st = (SgStatement*) forStatement;
|
||||||
|
st = st -> lexNext();
|
||||||
|
SgStatement* logIfOp = NULL;
|
||||||
|
while (st && st != lastNode)
|
||||||
|
{
|
||||||
|
if(importantDeps.size() != 0)
|
||||||
|
{
|
||||||
|
if (st != importantDeps.back())
|
||||||
|
{
|
||||||
|
dependencies[st].insert(importantDeps.back());
|
||||||
|
}
|
||||||
|
}
|
||||||
|
if (logIfOp != NULL)
|
||||||
|
{
|
||||||
|
dependencies[st].insert(logIfOp);
|
||||||
|
logIfOp = NULL;
|
||||||
|
}
|
||||||
|
if (st -> variant() == LOGIF_NODE)
|
||||||
|
{
|
||||||
|
logIfOp = st;
|
||||||
|
}
|
||||||
|
if (importantDepsTags.find(st -> variant()) != importantDepsTags.end())
|
||||||
|
{
|
||||||
|
importantDeps.push_back(st);
|
||||||
|
}
|
||||||
|
if (importantUpdDepsTags.find(st -> variant()) != importantUpdDepsTags.end())
|
||||||
|
{
|
||||||
|
importantDeps.pop_back();
|
||||||
|
importantDeps.push_back(st);
|
||||||
|
}
|
||||||
|
if (importantEndTags.find(st -> variant()) != importantEndTags.end())
|
||||||
|
{
|
||||||
|
if(importantDeps.size() != 0)
|
||||||
|
{
|
||||||
|
importantDeps.pop_back();
|
||||||
|
}
|
||||||
|
}
|
||||||
|
st = st -> lexNext();
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
struct ReadyOp {
|
||||||
|
SgStatement* stmt;
|
||||||
|
int degree;
|
||||||
|
size_t arrival;
|
||||||
|
ReadyOp(SgStatement* s, int d, size_t a): stmt(s), degree(d), arrival(a) {}
|
||||||
|
};
|
||||||
|
|
||||||
|
struct ReadyOpCompare {
|
||||||
|
bool operator()(const ReadyOp& a, const ReadyOp& b) const {
|
||||||
|
if (a.degree != b.degree)
|
||||||
|
return a.degree > b.degree;
|
||||||
|
else
|
||||||
|
return a.arrival > b.arrival;
|
||||||
|
}
|
||||||
|
};
|
||||||
|
|
||||||
|
vector<SgStatement*> scheduleOperations(const map<SgStatement*, set<SgStatement*>>& dependencies)
|
||||||
|
{
|
||||||
|
// get all statements
|
||||||
|
unordered_set<SgStatement*> allStmtsSet;
|
||||||
|
for (const auto& pair : dependencies)
|
||||||
|
{
|
||||||
|
allStmtsSet.insert(pair.first);
|
||||||
|
for (SgStatement* dep : pair.second)
|
||||||
|
{
|
||||||
|
allStmtsSet.insert(dep);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
vector<SgStatement*> allStmts(allStmtsSet.begin(), allStmtsSet.end());
|
||||||
|
// count deps and build reversed graph
|
||||||
|
unordered_map<SgStatement*, vector<SgStatement*>> graph;
|
||||||
|
unordered_map<SgStatement*, int> inDegree;
|
||||||
|
unordered_map<SgStatement*, int> degree;
|
||||||
|
for (auto op : allStmts)
|
||||||
|
inDegree[op] = 0;
|
||||||
|
// find and remember initial dependencies
|
||||||
|
unordered_set<SgStatement*> dependentStmts;
|
||||||
|
for (const auto& pair : dependencies)
|
||||||
|
{
|
||||||
|
SgStatement* op = pair.first;
|
||||||
|
const auto& deps = pair.second;
|
||||||
|
degree[op] = deps.size();
|
||||||
|
inDegree[op] = deps.size();
|
||||||
|
if (!deps.empty())
|
||||||
|
dependentStmts.insert(op);
|
||||||
|
for (auto dep : deps)
|
||||||
|
graph[dep].push_back(op);
|
||||||
|
}
|
||||||
|
for (SgStatement* op : allStmts)
|
||||||
|
{
|
||||||
|
if (!degree.count(op))
|
||||||
|
{
|
||||||
|
degree[op] = 0;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
// build queues
|
||||||
|
using PQ = priority_queue<ReadyOp, vector<ReadyOp>, ReadyOpCompare>;
|
||||||
|
PQ readyDependent;
|
||||||
|
queue<SgStatement*> readyIndependent;
|
||||||
|
size_t arrivalCounter = 0;
|
||||||
|
for (auto op : allStmts)
|
||||||
|
{
|
||||||
|
if (inDegree[op] == 0)
|
||||||
|
{
|
||||||
|
if (dependentStmts.count(op))
|
||||||
|
{
|
||||||
|
readyDependent.emplace(op, degree[op], arrivalCounter++);
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
readyIndependent.push(op);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
// main sort algorythm
|
||||||
|
vector<SgStatement*> executionOrder;
|
||||||
|
while (!readyDependent.empty() || !readyIndependent.empty())
|
||||||
|
{
|
||||||
|
SgStatement* current = nullptr;
|
||||||
|
if (!readyDependent.empty())
|
||||||
|
{
|
||||||
|
current = readyDependent.top().stmt;
|
||||||
|
readyDependent.pop();
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
current = readyIndependent.front();
|
||||||
|
readyIndependent.pop();
|
||||||
|
}
|
||||||
|
executionOrder.push_back(current);
|
||||||
|
for (SgStatement* neighbor : graph[current])
|
||||||
|
{
|
||||||
|
inDegree[neighbor]--;
|
||||||
|
if (inDegree[neighbor] == 0) {
|
||||||
|
if (dependentStmts.count(neighbor))
|
||||||
|
{
|
||||||
|
readyDependent.emplace(neighbor, degree[neighbor], arrivalCounter++);
|
||||||
|
}
|
||||||
|
else
|
||||||
|
{
|
||||||
|
readyIndependent.push(neighbor);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
return executionOrder;
|
||||||
|
}
|
||||||
|
|
||||||
|
static bool buildNewAST(SgStatement* loop, vector<SgStatement*>& newBody)
|
||||||
|
{
|
||||||
|
if (!loop) {return false;}
|
||||||
|
if (newBody.empty()) {return true;}
|
||||||
|
if (loop->variant() != FOR_NODE) {return false;}
|
||||||
|
|
||||||
|
SgStatement* loopStart = loop->lexNext();
|
||||||
|
SgStatement* loopEnd = loop->lastNodeOfStmt();
|
||||||
|
if (!loopStart || !loopEnd) {return false;}
|
||||||
|
|
||||||
|
for (SgStatement* stmt : newBody) {
|
||||||
|
if (stmt && stmt != loop && stmt != loopEnd) {
|
||||||
|
SgStatement* current = loopStart;
|
||||||
|
bool found = false;
|
||||||
|
while (current && current != loopEnd->lexNext()) {
|
||||||
|
if (current == stmt) {
|
||||||
|
found = true;
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
current = current->lexNext();
|
||||||
|
}
|
||||||
|
if (!found) {return false;}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
vector<SgStatement*> extractedStatements;
|
||||||
|
vector<char*> savedComments;
|
||||||
|
vector<int> savedLineNumbers;
|
||||||
|
|
||||||
|
for (SgStatement* stmt : newBody) {
|
||||||
|
if (stmt && stmt != loop && stmt != loopEnd) {
|
||||||
|
savedComments.push_back(stmt->comments() ? strdup(stmt->comments()) : nullptr);
|
||||||
|
savedLineNumbers.push_back(stmt->lineNumber());
|
||||||
|
SgStatement* extracted = stmt->extractStmt();
|
||||||
|
if (extracted) {extractedStatements.push_back(extracted);}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
SgStatement* currentPos = loop;
|
||||||
|
int lineCounter = loop->lineNumber() + 1;
|
||||||
|
|
||||||
|
for (size_t i = 0; i < extractedStatements.size(); i++) {
|
||||||
|
SgStatement* stmt = extractedStatements[i];
|
||||||
|
if (stmt) {
|
||||||
|
if (i < savedComments.size() && savedComments[i]) {
|
||||||
|
stmt->setComments(savedComments[i]);
|
||||||
|
}
|
||||||
|
stmt->setlineNumber(lineCounter++);
|
||||||
|
currentPos->insertStmtAfter(*stmt, *loop);
|
||||||
|
currentPos = stmt;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
for (char* comment : savedComments) {
|
||||||
|
if (comment) {
|
||||||
|
free(comment);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
if (currentPos && currentPos->lexNext() != loopEnd) {
|
||||||
|
currentPos->setLexNext(*loopEnd);
|
||||||
|
}
|
||||||
|
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
|
||||||
|
static bool validateNewOrder(SgStatement* loop, const vector<SgStatement*>& newOrder)
|
||||||
|
{
|
||||||
|
if (!loop || newOrder.empty()) {
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
unordered_set<SgStatement*> seen;
|
||||||
|
for (SgStatement* stmt : newOrder) {
|
||||||
|
if (stmt && stmt != loop && stmt != loop->lastNodeOfStmt()) {
|
||||||
|
if (seen.count(stmt)) {
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
seen.insert(stmt);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
|
||||||
|
void runSwapOperators(SgFile *file, std::map<std::string, std::vector<LoopGraph*>>& loopGraph, std::map<FuncInfo*, std::vector<SAPFOR::BasicBlock*>>& FullIR, int& countOfTransform)
|
||||||
|
{
|
||||||
|
std::cout << "SWAP_OPERATORS Pass" << std::endl; // to remove
|
||||||
|
countOfTransform += 1; // to remove
|
||||||
|
|
||||||
|
const int funcNum = file -> numberOfFunctions();
|
||||||
|
for (int i = 0; i < funcNum; ++i)
|
||||||
|
{
|
||||||
|
SgStatement *st = file -> functions(i);
|
||||||
|
vector<SAPFOR::BasicBlock*> blocks = findFuncBlocksByFuncStatement(st, FullIR);
|
||||||
|
map<SgForStmt*, vector<SAPFOR::BasicBlock*>> loopsMapping = findAndAnalyzeLoops(st, blocks);
|
||||||
|
for (pair<SgForStmt*, vector<SAPFOR::BasicBlock*>> loopForAnalyze: loopsMapping)
|
||||||
|
{
|
||||||
|
map<SgStatement*, set<SgStatement*>> dependencyGraph = AnalyzeLoopAndFindDeps(loopForAnalyze.first, loopForAnalyze.second, FullIR);
|
||||||
|
// TODO: Write a function that will go through the operators and update all dependencies so that there are no mix-ups and splits inside the semantic blocks (for if, do and may be some other cases)
|
||||||
|
buildAdditionalDeps(loopForAnalyze.first, dependencyGraph);
|
||||||
|
cout << endl;
|
||||||
|
int firstLine = loopForAnalyze.first -> lineNumber();
|
||||||
|
int lastLine = loopForAnalyze.first -> lastNodeOfStmt() -> lineNumber();
|
||||||
|
cout << "LOOP ANALYZE FROM " << firstLine << " TO " << lastLine << " RES" << endl;
|
||||||
|
// for (auto &v: dependencyGraph) {
|
||||||
|
// cout << "OPERATOR: " << v.first -> lineNumber() << " " << v.first -> variant() << "\nDEPENDS ON:" << endl;
|
||||||
|
// if (v.second.size() != 0)
|
||||||
|
// for (auto vv: v.second)
|
||||||
|
// cout << vv -> lineNumber() << " ";
|
||||||
|
// cout << endl;
|
||||||
|
// }
|
||||||
|
vector<SgStatement*> new_order = scheduleOperations(dependencyGraph);
|
||||||
|
cout << "RESULT ORDER:" << endl;
|
||||||
|
for (auto v: new_order)
|
||||||
|
if (v -> lineNumber() > firstLine)
|
||||||
|
cout << v -> lineNumber() << endl;
|
||||||
|
|
||||||
|
if (validateNewOrder(loopForAnalyze.first, new_order)) {
|
||||||
|
buildNewAST(loopForAnalyze.first, new_order);
|
||||||
|
}
|
||||||
|
st = loopForAnalyze.first -> lexNext();
|
||||||
|
while (st != loopForAnalyze.first -> lastNodeOfStmt())
|
||||||
|
{
|
||||||
|
cout << st -> lineNumber() << " " << st -> sunparse() << endl;
|
||||||
|
st = st -> lexNext();
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
return;
|
||||||
|
};
|
||||||
6
src/Transformations/SwapOperators/swap_operators.h
Normal file
6
src/Transformations/SwapOperators/swap_operators.h
Normal file
@@ -0,0 +1,6 @@
|
|||||||
|
#pragma once
|
||||||
|
|
||||||
|
#include "../../GraphLoop/graph_loops.h"
|
||||||
|
#include "../../CFGraph/CFGraph.h"
|
||||||
|
|
||||||
|
void runSwapOperators(SgFile *file, std::map<std::string, std::vector<LoopGraph*>>& loopGraph, std::map<FuncInfo*, std::vector<SAPFOR::BasicBlock*>>& FullIR, int& countOfTransform);
|
||||||
@@ -212,6 +212,8 @@ void InitPassesDependencies(map<passes, vector<passes>> &passDepsIn, set<passes>
|
|||||||
|
|
||||||
Pass(BUILD_IR) <= Pass(SUBST_EXPR_RD) <= Pass(SUBST_EXPR_RD_AND_UNPARSE);
|
Pass(BUILD_IR) <= Pass(SUBST_EXPR_RD) <= Pass(SUBST_EXPR_RD_AND_UNPARSE);
|
||||||
|
|
||||||
|
list({BUILD_IR, CALL_GRAPH2}) <= Pass(SWAP_OPERATORS);
|
||||||
|
|
||||||
list({ LOOP_ANALYZER_DATA_DIST_S1, SUBST_EXPR_RD } ) <= Pass(PRIVATE_REMOVING_ANALYSIS);
|
list({ LOOP_ANALYZER_DATA_DIST_S1, SUBST_EXPR_RD } ) <= Pass(PRIVATE_REMOVING_ANALYSIS);
|
||||||
list({ PRIVATE_REMOVING_ANALYSIS, REVERT_SUBST_EXPR_RD }) <= Pass(PRIVATE_REMOVING);
|
list({ PRIVATE_REMOVING_ANALYSIS, REVERT_SUBST_EXPR_RD }) <= Pass(PRIVATE_REMOVING);
|
||||||
|
|
||||||
|
|||||||
@@ -78,11 +78,6 @@ enum typeMessage { WARR, ERROR, NOTE };
|
|||||||
// 60 "Format misplaced"
|
// 60 "Format misplaced"
|
||||||
// 61 "Array has declaration area conflict"
|
// 61 "Array has declaration area conflict"
|
||||||
// 62 "need to move common declaration to main for DECLATE"
|
// 62 "need to move common declaration to main for DECLATE"
|
||||||
// 63 "Failed to initialize libpredict cluster"
|
|
||||||
// 64 "Failed to initialize libpredict grid"
|
|
||||||
// 65 "Failed to distribute array with libpredict"
|
|
||||||
// 66 "Failed to align array with libpredict"
|
|
||||||
// 67 "Failed to process shadow_renew with libpredict"
|
|
||||||
//
|
//
|
||||||
// 20xx TRANSFORM GROUP
|
// 20xx TRANSFORM GROUP
|
||||||
// 01 "can not convert array assign to loop"
|
// 01 "can not convert array assign to loop"
|
||||||
@@ -310,7 +305,7 @@ static void printStackTrace() { };
|
|||||||
} \
|
} \
|
||||||
} while (0)
|
} while (0)
|
||||||
|
|
||||||
// Свободный - R210
|
// Свободный - R206
|
||||||
// Гайд по русификации сообщений: При добавлении нового сообщения, меняется последний сводобный идентификатор.
|
// Гайд по русификации сообщений: При добавлении нового сообщения, меняется последний сводобный идентификатор.
|
||||||
// В этом файле остаются только спецификаторы, для которых будет заполнен текст. Полный текст пишется в файле
|
// В этом файле остаются только спецификаторы, для которых будет заполнен текст. Полный текст пишется в файле
|
||||||
// russian_errors_text.txt. Спецификаторы там тоже сохраняются, по ним в визуализаторе будет восстановлен
|
// russian_errors_text.txt. Спецификаторы там тоже сохраняются, по ним в визуализаторе будет восстановлен
|
||||||
@@ -509,16 +504,6 @@ static const wchar_t *R183 = L"R183:";
|
|||||||
static const wchar_t *R184 = L"R184:%s";
|
static const wchar_t *R184 = L"R184:%s";
|
||||||
//1062
|
//1062
|
||||||
static const wchar_t* R205 = L"R205:%s#%s";
|
static const wchar_t* R205 = L"R205:%s#%s";
|
||||||
//1063
|
|
||||||
static const wchar_t* R206 = L"R206:";
|
|
||||||
//1064
|
|
||||||
static const wchar_t* R207 = L"R207:";
|
|
||||||
//1065
|
|
||||||
static const wchar_t* R208 = L"R208:";
|
|
||||||
//1066
|
|
||||||
static const wchar_t* R209 = L"R209:";
|
|
||||||
//1067
|
|
||||||
static const wchar_t* R210 = L"R210:";
|
|
||||||
|
|
||||||
//2001
|
//2001
|
||||||
static const wchar_t *R94 = L"R94:";
|
static const wchar_t *R94 = L"R94:";
|
||||||
|
|||||||
@@ -184,18 +184,8 @@ R182 = "Редукционная операция по элементу масс
|
|||||||
R183 = "Расположение операторов FORMAT не поддерживается, попробуйте применить проход Коррекция стиля кода".
|
R183 = "Расположение операторов FORMAT не поддерживается, попробуйте применить проход Коррекция стиля кода".
|
||||||
//1061
|
//1061
|
||||||
R184 = "Область объявления массива '%s' конфликтует с предыдущей областью. Возможно, это вызвано использованием include-файлов. Попробуйте применить проход 'Подстановка заголовочных файлов'".
|
R184 = "Область объявления массива '%s' конфликтует с предыдущей областью. Возможно, это вызвано использованием include-файлов. Попробуйте применить проход 'Подстановка заголовочных файлов'".
|
||||||
//1062
|
//1042
|
||||||
R205 = "Массив '%s' состоящий в common блоке '%s' должен иметь описание в главной программной единице для объявления в директиве DECLARE"
|
R205 = "Массив '%s' состоящий в common блоке '%s' должен иметь описание в главной программной единице для объявления в директиве DECLARE"
|
||||||
//1063
|
|
||||||
R206 = "Ошибка инициализации библиотеки libpredict с конфигурацией кластера: %s, код возврата: %d"
|
|
||||||
//1064
|
|
||||||
R207 = "Ошибка инициализации сетки libpredict с топологией: %zu %zu %zu %zu, код возврата: %d"
|
|
||||||
//1065
|
|
||||||
R208 = "Ошибка распределения массива '%s' с помощью libpredict, код возврата: %d"
|
|
||||||
//1066
|
|
||||||
R209 = "Ошибка выравнивания массива '%s' с массивом '%s' с помощью libpredict, код возврата: %d"
|
|
||||||
//1067
|
|
||||||
R210 = "Ошибка обработки shadow_renew для массива '%s' с помощью libpredict, код возврата: %d"
|
|
||||||
|
|
||||||
//2001
|
//2001
|
||||||
R94 = "Невозможно автоматически преобразовать данное присваивание к циклу"
|
R94 = "Невозможно автоматически преобразовать данное присваивание к циклу"
|
||||||
|
|||||||
@@ -950,7 +950,7 @@ int SPF_ModifyArrayDistribution(void*& context, int winHandler, short *options,
|
|||||||
|
|
||||||
extern map<string, PredictorStats> allPredictorStats;
|
extern map<string, PredictorStats> allPredictorStats;
|
||||||
extern map<string, vector<SpfInterval*>> intervals;
|
extern map<string, vector<SpfInterval*>> intervals;
|
||||||
extern vector<vector<size_t>> topologies;
|
extern vector<vector<long>> topologies;
|
||||||
|
|
||||||
int SPF_CreateParallelVariant(void*& context, int winHandler, short *options, short *projName, short *folderName, int64_t *variants, int *varLen,
|
int SPF_CreateParallelVariant(void*& context, int winHandler, short *options, short *projName, short *folderName, int64_t *variants, int *varLen,
|
||||||
string &output, string &outputMessage, string &predictorStats)
|
string &output, string &outputMessage, string &predictorStats)
|
||||||
@@ -1807,7 +1807,7 @@ static int inline runModificationPass(passes passName, short* projName, short* f
|
|||||||
runPassesForVisualizer(projName, { passName }, folderName);
|
runPassesForVisualizer(projName, { passName }, folderName);
|
||||||
|
|
||||||
//fill data
|
//fill data
|
||||||
// newFiles: <<3C><><EFBFBD><EFBFBD><EFBFBD> <20><><EFBFBD><EFBFBD><EFBFBD><EFBFBD> <20><><EFBFBD> <20><><EFBFBD>, <20><><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD> <20><><EFBFBD><EFBFBD><EFBFBD>>
|
// newFiles: <<3C><><EFBFBD><EFBFBD><EFBFBD> <20><><EFBFBD><EFBFBD><EFBFBD><EFBFBD> <20><><EFBFBD> <20><><EFBFBD>, <20><><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD> <20><><EFBFBD><EFBFBD><EFBFBD>>
|
||||||
string newFile;
|
string newFile;
|
||||||
|
|
||||||
if (SgFile::switchToFile(outFileName.c_str()) == -1)
|
if (SgFile::switchToFile(outFileName.c_str()) == -1)
|
||||||
@@ -2376,7 +2376,7 @@ const wstring Sapfor_RunAnalysis(const char* analysisName_c, const char* options
|
|||||||
retCode = SPF_GetArrayLinks(context, winHandler, optSh, projSh, result, output, outputMessage);
|
retCode = SPF_GetArrayLinks(context, winHandler, optSh, projSh, result, output, outputMessage);
|
||||||
else if (whichRun == "SPF_GetMaxMinBlockDistribution")
|
else if (whichRun == "SPF_GetMaxMinBlockDistribution")
|
||||||
retCode = SPF_GetMaxMinBlockDistribution(context, winHandler, optSh, projSh, result, output, outputMessage);
|
retCode = SPF_GetMaxMinBlockDistribution(context, winHandler, optSh, projSh, result, output, outputMessage);
|
||||||
else if (whichRun == "SPF_<EFBFBD>hangeDirectory") // russian C
|
else if (whichRun == "SPF_<EFBFBD>hangeDirectory") // russian C
|
||||||
{
|
{
|
||||||
if (options_c == NULL)
|
if (options_c == NULL)
|
||||||
printInternalError(convertFileName(__FILE__).c_str(), __LINE__);
|
printInternalError(convertFileName(__FILE__).c_str(), __LINE__);
|
||||||
|
|||||||
Reference in New Issue
Block a user