Page Menu
Home
c4science
Search
Configure Global Search
Log In
Files
F85679760
control.hpp
No One
Temporary
Actions
Download File
Edit File
Delete File
View Transforms
Subscribe
Mute Notifications
Award Token
Subscribers
None
File Metadata
Details
File Info
Storage
Attached
Created
Tue, Oct 1, 03:32
Size
4 KB
Mime Type
text/x-c
Expires
Thu, Oct 3, 03:32 (2 d)
Engine
blob
Format
Raw Data
Handle
21238797
Attached To
rLAMMPS lammps
control.hpp
View Options
#pragma once
#ifndef __CONTROL_HPP__
#define __CONTROL_HPP__
#include "util.hpp"
/// \file control.hpp
/// \brief A collection of control trees composing high-level variants of algorithms.
/// \author Kyungjoo Kim (kyukim@sandia.gov)
/// description is a bit wrong
using
namespace
std
;
namespace
Tacho
{
// forward declaration for control tree
template
<
int
ArgAlgo
,
int
ArgVariant
>
struct
Control
{
static
constexpr
int
Self
[
2
]
=
{
ArgAlgo
,
ArgVariant
};
};
// ----------------------------------------------------------------------------------
// - CholByblocks Variant 1
// * partitioned block matrix (blocks are sparse)
template
<>
struct
Control
<
AlgoChol
::
ByBlocks
,
Variant
::
One
>
{
// chol var 1 : nested data parallel for is applied in the second inner loop
// chol var 2 : nested data parallel for is applied in the most inner loop
static
constexpr
int
Chol
[
2
]
=
{
AlgoChol
::
UnblockedOpt
,
Variant
::
Two
};
static
constexpr
int
Trsm
[
2
]
=
{
AlgoTrsm
::
ForFactorBlocked
,
Variant
::
One
};
static
constexpr
int
Herk
[
2
]
=
{
AlgoHerk
::
ForFactorBlocked
,
Variant
::
One
};
static
constexpr
int
Gemm
[
2
]
=
{
AlgoGemm
::
ForFactorBlocked
,
Variant
::
One
};
};
// - CholByBlocks Variant 2
// * diagonal blocks have nested dense blocks
template
<>
struct
Control
<
AlgoChol
::
ByBlocks
,
Variant
::
Two
>
{
static
constexpr
int
Chol
[
2
]
=
{
AlgoChol
::
UnblockedOpt
,
Variant
::
One
};
static
constexpr
int
Trsm
[
2
]
=
{
AlgoTrsm
::
ForFactorBlocked
,
Variant
::
One
};
static
constexpr
int
Herk
[
2
]
=
{
AlgoHerk
::
ForFactorBlocked
,
Variant
::
One
};
static
constexpr
int
Gemm
[
2
]
=
{
AlgoGemm
::
ForFactorBlocked
,
Variant
::
One
};
};
// - CholByBlocks Variant 3
// * all blocks have nested dense blocks (full supernodal algorithm)
// template<> struct Control<AlgoChol::ByBlocks,Variant::Three> {
// static constexpr int Chol[2] = { AlgoChol::NestedDenseBlock, Variant::One };
// static constexpr int Trsm[2] = { AlgoTrsm::NestedDenseBlock, Variant::One };
// static constexpr int Herk[2] = { AlgoHerk::NestedDenseBlock, Variant::One };
// static constexpr int Gemm[2] = { AlgoGemm::NestedDenseBlock, Variant::One };
// };
// - CholByBlocks Variant 4
// * diagonal blocks have nested hier dense blocks (hierarchical task scheduling)
// template<> struct Control<AlgoChol::ByBlocks,Variant::Four> {
// static constexpr int Chol[2] = { AlgoChol::NestedDenseByBlocks, Variant::One };
// static constexpr int Trsm[2] = { AlgoTrsm::ForFactorBlocked, Variant::One };
// static constexpr int Herk[2] = { AlgoHerk::ForFactorBlocked, Variant::One };
// static constexpr int Gemm[2] = { AlgoGemm::ForFactorBlocked, Variant::One };
//};
// - CholByBlocks Variant 5
// * diagonal blocks have nested hier dense blocks (hierarchical task scheduling)
// template<> struct Control<AlgoChol::ByBlocks,Variant::Four> {
// static constexpr int Chol[2] = { AlgoChol::NestedDenseByBlocks, Variant::One };
// static constexpr int Trsm[2] = { AlgoTrsm::NestedDenseByBlocks, Variant::One };
// static constexpr int Herk[2] = { AlgoHerk::NestedDenseByBlocks, Variant::One };
// static constexpr int Gemm[2] = { AlgoGemm::NestedDenseByBlocks, Variant::One };
// };
// ----------------------------------------------------------------------------------
// - CholNestedDenseBlock
// * branch control between sparse and dense operations
template
<>
struct
Control
<
AlgoChol
::
NestedDenseBlock
,
Variant
::
One
>
{
static
constexpr
int
CholSparse
[
2
]
=
{
AlgoChol
::
UnblockedOpt
,
Variant
::
One
};
static
constexpr
int
CholDense
[
2
]
=
{
AlgoChol
::
ExternalLapack
,
Variant
::
One
};
};
// - CholNestedDenseBlock
// * branch control between sparse and dense operations
template
<>
struct
Control
<
AlgoChol
::
NestedDenseByBlocks
,
Variant
::
One
>
{
static
constexpr
int
CholSparse
[
2
]
=
{
AlgoChol
::
UnblockedOpt
,
Variant
::
One
};
static
constexpr
int
CholDenseByBlocks
[
2
]
=
{
AlgoChol
::
DenseByBlocks
,
Variant
::
One
};
};
// ----------------------------------------------------------------------------------
// - CholDenseBlock
// * dense matrix Cholesky-by-blocks
template
<>
struct
Control
<
AlgoChol
::
DenseByBlocks
,
Variant
::
One
>
{
static
constexpr
int
Chol
[
2
]
=
{
AlgoChol
::
ExternalLapack
,
Variant
::
One
};
static
constexpr
int
Trsm
[
2
]
=
{
AlgoTrsm
::
ExternalBlas
,
Variant
::
One
};
static
constexpr
int
Herk
[
2
]
=
{
AlgoHerk
::
ExternalBlas
,
Variant
::
One
};
static
constexpr
int
Gemm
[
2
]
=
{
AlgoGemm
::
ExternalBlas
,
Variant
::
One
};
};
template
<>
struct
Control
<
AlgoGemm
::
DenseByBlocks
,
Variant
::
One
>
{
static
constexpr
int
Gemm
[
2
]
=
{
AlgoGemm
::
ExternalBlas
,
Variant
::
One
};
};
template
<>
struct
Control
<
AlgoTrsm
::
DenseByBlocks
,
Variant
::
One
>
{
static
constexpr
int
Gemm
[
2
]
=
{
AlgoGemm
::
ExternalBlas
,
Variant
::
One
};
static
constexpr
int
Trsm
[
2
]
=
{
AlgoTrsm
::
ExternalBlas
,
Variant
::
One
};
};
}
#endif
Event Timeline
Log In to Comment