feat(reduction): add reduction generic PII int
This commit is contained in:
@@ -0,0 +1,194 @@
|
||||
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
|
||||
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
|
||||
<head>
|
||||
<meta http-equiv="content-type" content="text/html; charset=utf-8" />
|
||||
<meta name="generator" content="CppTest - https://github.com/cpptest/cpptest" />
|
||||
|
||||
<title>Reduce_Generic_IntII_justesse </title>
|
||||
|
||||
<style type="text/css" media="screen">
|
||||
<!--
|
||||
hr {
|
||||
width: 100%;
|
||||
border-width: 0px;
|
||||
height: 1px;
|
||||
color: #cccccc;
|
||||
background-color: #cccccc;
|
||||
padding: 0px;
|
||||
}
|
||||
|
||||
table {
|
||||
width:100%;
|
||||
border-collapse:separate;
|
||||
border-spacing: 2px;
|
||||
border:0px;
|
||||
}
|
||||
tr {
|
||||
margin:0px;
|
||||
padding:0px;
|
||||
}
|
||||
td {
|
||||
margin:0px;
|
||||
padding:1px;
|
||||
}
|
||||
.table_summary {
|
||||
}
|
||||
.table_suites {
|
||||
}
|
||||
.table_suite {
|
||||
}
|
||||
.table_result {
|
||||
margin: 0px 0px 1em 0px;
|
||||
}
|
||||
.tablecell_title {
|
||||
background-color: #a5cef7;
|
||||
font-weight: bold;
|
||||
}
|
||||
|
||||
.tablecell_success {
|
||||
background-color: #efefe7;
|
||||
}
|
||||
|
||||
.tablecell_error {
|
||||
color: #ff0808;
|
||||
background-color: #efefe7;
|
||||
font-weight: bold;
|
||||
}
|
||||
p.spaced {
|
||||
margin: 0px;
|
||||
padding: 1em 0px 2em 0px;
|
||||
}
|
||||
p.unspaced {
|
||||
margin: 0px;
|
||||
padding: 0px 0px 2em 0px;
|
||||
}
|
||||
-->
|
||||
</style>
|
||||
</head>
|
||||
|
||||
<body>
|
||||
|
||||
<h1><a name="top"></a>Reduce_Generic_IntII_justesse </h1>
|
||||
|
||||
<div style="text-align:right">
|
||||
Designed by <a href="https://github.com/cpptest/cpptest">CppTest</a>
|
||||
</div>
|
||||
<hr />
|
||||
|
||||
<h2>Summary</h2>
|
||||
<table summary="Summary of test results" class="table_summary">
|
||||
<tr>
|
||||
<td style="width:30%" class="tablecell_title">Tests</td>
|
||||
<td style="width:30%" class="tablecell_title">Errors</td>
|
||||
<td style="width:30%" class="tablecell_title">Success</td>
|
||||
<td style="width:10%" class="tablecell_title">Time (s)</td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td style="width:30%" class="tablecell_success">0</td>
|
||||
<td style="width:30%" class="tablecell_success">0</td>
|
||||
<td style="width:30%" class="tablecell_success">100%</td>
|
||||
<td style="width:10%" class="tablecell_success">0.000000</td>
|
||||
</tr>
|
||||
</table>
|
||||
<hr />
|
||||
|
||||
<h2>Test suites</h2>
|
||||
<table summary="Test Suites" class="table_suites">
|
||||
<tr>
|
||||
<td class="tablecell_title">Name</td>
|
||||
<td style="width:10%" class="tablecell_title">Tests</td>
|
||||
<td style="width:10%" class="tablecell_title">Errors</td>
|
||||
<td style="width:10%" class="tablecell_title">Success</td>
|
||||
<td style="width:10%" class="tablecell_title">Time (s)</td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td class="tablecell_success"><a href="#TestReductionGenericII">TestReductionGenericII</a></td>
|
||||
<td style="width:10%" class="tablecell_success">10</td>
|
||||
<td style="width:10%" class="tablecell_success">0</td>
|
||||
<td style="width:10%" class="tablecell_success">100%</td>
|
||||
<td style="width:10%" class="tablecell_success">0.000000</td>
|
||||
</tr>
|
||||
</table>
|
||||
<hr />
|
||||
|
||||
<h3><a name="TestReductionGenericII"></a>Suite: TestReductionGenericII</h3>
|
||||
<table summary="Details for suite TestReductionGenericII" class="table_suite">
|
||||
<tr>
|
||||
<td class="tablecell_title">Name</td>
|
||||
<td style="width:10%" class="tablecell_title">Errors</td>
|
||||
<td style="width:10%" class="tablecell_title">Success</td>
|
||||
<td style="width:10%" class="tablecell_title">Time (s)</td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td class="tablecell_success">testDB2</td>
|
||||
<td class="tablecell_success">0</td>
|
||||
<td class="tablecell_success">true</td>
|
||||
<td class="tablecell_success">0.000000</td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td class="tablecell_success">testDB4</td>
|
||||
<td class="tablecell_success">0</td>
|
||||
<td class="tablecell_success">true</td>
|
||||
<td class="tablecell_success">0.000000</td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td class="tablecell_success">testDB8</td>
|
||||
<td class="tablecell_success">0</td>
|
||||
<td class="tablecell_success">true</td>
|
||||
<td class="tablecell_success">0.000000</td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td class="tablecell_success">testDB16</td>
|
||||
<td class="tablecell_success">0</td>
|
||||
<td class="tablecell_success">true</td>
|
||||
<td class="tablecell_success">0.000000</td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td class="tablecell_success">testDB32</td>
|
||||
<td class="tablecell_success">0</td>
|
||||
<td class="tablecell_success">true</td>
|
||||
<td class="tablecell_success">0.000000</td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td class="tablecell_success">testDB64</td>
|
||||
<td class="tablecell_success">0</td>
|
||||
<td class="tablecell_success">true</td>
|
||||
<td class="tablecell_success">0.000000</td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td class="tablecell_success">testDB128</td>
|
||||
<td class="tablecell_success">0</td>
|
||||
<td class="tablecell_success">true</td>
|
||||
<td class="tablecell_success">0.000000</td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td class="tablecell_success">testGrid</td>
|
||||
<td class="tablecell_success">0</td>
|
||||
<td class="tablecell_success">true</td>
|
||||
<td class="tablecell_success">0.000000</td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td class="tablecell_success">testMonoBlock</td>
|
||||
<td class="tablecell_success">0</td>
|
||||
<td class="tablecell_success">true</td>
|
||||
<td class="tablecell_success">0.000000</td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td class="tablecell_success">testSpecialeMax</td>
|
||||
<td class="tablecell_success">0</td>
|
||||
<td class="tablecell_success">true</td>
|
||||
<td class="tablecell_success">0.000000</td>
|
||||
</tr>
|
||||
</table>
|
||||
<p class="spaced"><a href="#top">Back to top</a>
|
||||
</p>
|
||||
<hr />
|
||||
|
||||
|
||||
<p>
|
||||
<a href="http://validator.w3.org/#validate-by-upload">
|
||||
Valid XHTML 1.0 Strict
|
||||
</a>
|
||||
</p>
|
||||
</body>
|
||||
</html>
|
||||
@@ -0,0 +1,140 @@
|
||||
<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Strict//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-strict.dtd">
|
||||
<html xmlns="http://www.w3.org/1999/xhtml" xml:lang="en" lang="en">
|
||||
<head>
|
||||
<meta http-equiv="content-type" content="text/html; charset=utf-8" />
|
||||
<meta name="generator" content="CppTest - https://github.com/cpptest/cpptest" />
|
||||
|
||||
<title>Reduce_Generic_IntII_performance </title>
|
||||
|
||||
<style type="text/css" media="screen">
|
||||
<!--
|
||||
hr {
|
||||
width: 100%;
|
||||
border-width: 0px;
|
||||
height: 1px;
|
||||
color: #cccccc;
|
||||
background-color: #cccccc;
|
||||
padding: 0px;
|
||||
}
|
||||
|
||||
table {
|
||||
width:100%;
|
||||
border-collapse:separate;
|
||||
border-spacing: 2px;
|
||||
border:0px;
|
||||
}
|
||||
tr {
|
||||
margin:0px;
|
||||
padding:0px;
|
||||
}
|
||||
td {
|
||||
margin:0px;
|
||||
padding:1px;
|
||||
}
|
||||
.table_summary {
|
||||
}
|
||||
.table_suites {
|
||||
}
|
||||
.table_suite {
|
||||
}
|
||||
.table_result {
|
||||
margin: 0px 0px 1em 0px;
|
||||
}
|
||||
.tablecell_title {
|
||||
background-color: #a5cef7;
|
||||
font-weight: bold;
|
||||
}
|
||||
|
||||
.tablecell_success {
|
||||
background-color: #efefe7;
|
||||
}
|
||||
|
||||
.tablecell_error {
|
||||
color: #ff0808;
|
||||
background-color: #efefe7;
|
||||
font-weight: bold;
|
||||
}
|
||||
p.spaced {
|
||||
margin: 0px;
|
||||
padding: 1em 0px 2em 0px;
|
||||
}
|
||||
p.unspaced {
|
||||
margin: 0px;
|
||||
padding: 0px 0px 2em 0px;
|
||||
}
|
||||
-->
|
||||
</style>
|
||||
</head>
|
||||
|
||||
<body>
|
||||
|
||||
<h1><a name="top"></a>Reduce_Generic_IntII_performance </h1>
|
||||
|
||||
<div style="text-align:right">
|
||||
Designed by <a href="https://github.com/cpptest/cpptest">CppTest</a>
|
||||
</div>
|
||||
<hr />
|
||||
|
||||
<h2>Summary</h2>
|
||||
<table summary="Summary of test results" class="table_summary">
|
||||
<tr>
|
||||
<td style="width:30%" class="tablecell_title">Tests</td>
|
||||
<td style="width:30%" class="tablecell_title">Errors</td>
|
||||
<td style="width:30%" class="tablecell_title">Success</td>
|
||||
<td style="width:10%" class="tablecell_title">Time (s)</td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td style="width:30%" class="tablecell_success">1</td>
|
||||
<td style="width:30%" class="tablecell_success">0</td>
|
||||
<td style="width:30%" class="tablecell_success">100%</td>
|
||||
<td style="width:10%" class="tablecell_success">11.000000</td>
|
||||
</tr>
|
||||
</table>
|
||||
<hr />
|
||||
|
||||
<h2>Test suites</h2>
|
||||
<table summary="Test Suites" class="table_suites">
|
||||
<tr>
|
||||
<td class="tablecell_title">Name</td>
|
||||
<td style="width:10%" class="tablecell_title">Tests</td>
|
||||
<td style="width:10%" class="tablecell_title">Errors</td>
|
||||
<td style="width:10%" class="tablecell_title">Success</td>
|
||||
<td style="width:10%" class="tablecell_title">Time (s)</td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td class="tablecell_success"><a href="#TestPerformance_RunnableGPU_A">TestPerformance_RunnableGPU_A</a></td>
|
||||
<td style="width:10%" class="tablecell_success">1</td>
|
||||
<td style="width:10%" class="tablecell_success">0</td>
|
||||
<td style="width:10%" class="tablecell_success">100%</td>
|
||||
<td style="width:10%" class="tablecell_success">11.000000</td>
|
||||
</tr>
|
||||
</table>
|
||||
<hr />
|
||||
|
||||
<h3><a name="TestPerformance_RunnableGPU_A"></a>Suite: TestPerformance_RunnableGPU_A</h3>
|
||||
<table summary="Details for suite TestPerformance_RunnableGPU_A" class="table_suite">
|
||||
<tr>
|
||||
<td class="tablecell_title">Name</td>
|
||||
<td style="width:10%" class="tablecell_title">Errors</td>
|
||||
<td style="width:10%" class="tablecell_title">Success</td>
|
||||
<td style="width:10%" class="tablecell_title">Time (s)</td>
|
||||
</tr>
|
||||
<tr>
|
||||
<td class="tablecell_success">performanceOnly</td>
|
||||
<td class="tablecell_success">0</td>
|
||||
<td class="tablecell_success">true</td>
|
||||
<td class="tablecell_success">11.000000</td>
|
||||
</tr>
|
||||
</table>
|
||||
<p class="spaced"><a href="#top">Back to top</a>
|
||||
</p>
|
||||
<hr />
|
||||
|
||||
|
||||
<p>
|
||||
<a href="http://validator.w3.org/#validate-by-upload">
|
||||
Valid XHTML 1.0 Strict
|
||||
</a>
|
||||
</p>
|
||||
</body>
|
||||
</html>
|
||||
@@ -1,4 +1,4 @@
|
||||
#include "Thread1D.cu.h"
|
||||
#include "Thread2D.cu.h"
|
||||
#include "cudas.h"
|
||||
|
||||
#include "Reduction.cu.h"
|
||||
@@ -24,10 +24,16 @@ static __device__ void addAtomicV2(int* ptrX , int y);
|
||||
/**
|
||||
* TID partout en tabSM
|
||||
*/
|
||||
__global__ void KIntProtocoleII(int* ptrSumGM)
|
||||
{
|
||||
__global__
|
||||
void KIntProtocoleII(int* ptrSumGM) {
|
||||
// TODO ReductionIntII
|
||||
}
|
||||
|
||||
extern __shared__ int tabSM[];
|
||||
reductionIntraThread(tabSM);
|
||||
__syncthreads();
|
||||
|
||||
Reduction::reduce(add, addAtomicV1, tabSM, ptrSumGM);
|
||||
}
|
||||
|
||||
/*--------------------------------------*\
|
||||
|* Private *|
|
||||
@@ -36,46 +42,52 @@ __global__ void KIntProtocoleII(int* ptrSumGM)
|
||||
/**
|
||||
* TID partout en tabSM
|
||||
*/
|
||||
__device__ void reductionIntraThread(int* tabSM)
|
||||
{
|
||||
__device__
|
||||
void reductionIntraThread(int* tabSM) {
|
||||
// TODO ReductionIntII
|
||||
}
|
||||
const int TID = Thread2D::tid();
|
||||
const int tidLocal = Thread2D::tidLocal();
|
||||
|
||||
tabSM[tidLocal] = TID;
|
||||
}
|
||||
|
||||
/*----------------------------*\
|
||||
|* Operateur reduction *|
|
||||
\*---------------------------*/
|
||||
|
||||
__inline__
|
||||
__device__ int add(int x , int y)
|
||||
{
|
||||
__device__
|
||||
int add(int x , int y) {
|
||||
// TODO ReductionIntII
|
||||
}
|
||||
return x + y;
|
||||
}
|
||||
|
||||
/**
|
||||
* Utiliser la methode system : atomicAdd(pointeurDestination, valeurSource);
|
||||
*/
|
||||
__inline__
|
||||
__device__ void addAtomicV1(int* ptrX , int y)
|
||||
{
|
||||
__device__
|
||||
void addAtomicV1(int* ptrX , int y) {
|
||||
// TODO ReductionIntII
|
||||
}
|
||||
atomicAdd(ptrX, y);
|
||||
}
|
||||
|
||||
/**
|
||||
* Une alternative, moins performante, mais generalisable serait d'employer un lock
|
||||
* Tip : le Lock est implementer avec deux methodes atomic
|
||||
*/
|
||||
__device__ int volatile mutex = 0; //variable global
|
||||
__device__ void addAtomicV2(int* ptrX , int y)
|
||||
{
|
||||
__device__
|
||||
void addAtomicV2(int* ptrX , int y) {
|
||||
Lock locker(&mutex);
|
||||
locker.lock();
|
||||
|
||||
// TODO ReductionIntII
|
||||
*ptrX = *ptrX + y;
|
||||
|
||||
locker.unlock();
|
||||
}
|
||||
}
|
||||
|
||||
/*----------------------------------------------------------------------*\
|
||||
|* End *|
|
||||
\*---------------------------------------------------------------------*/
|
||||
|
||||
|
||||
@@ -27,25 +27,29 @@ extern __global__ void KIntProtocoleII(int* ptrSumGM);
|
||||
ReductionIntII::ReductionIntII(const Grid& grid , int* ptrSum,bool isVerbose) :
|
||||
//RunnableGPU(grid, "Reduce_Generic_IntII_" + to_string(grid.threadCounts()),isVerbose), // classe parente
|
||||
RunnableGPU(grid, "Reduce_Generic_IntII" ,isVerbose), // classe parente
|
||||
ptrSum(ptrSum)
|
||||
{
|
||||
ptrSum(ptrSum) {
|
||||
// TODO ReductionIntII
|
||||
this->sizeSM = -1;
|
||||
}
|
||||
this->sizeSM = grid.threadByBlock() * sizeof(int);
|
||||
|
||||
ReductionIntII::~ReductionIntII()
|
||||
{
|
||||
GM::mallocInt0(&ptrSumGM);
|
||||
}
|
||||
|
||||
ReductionIntII::~ReductionIntII() {
|
||||
// TODO ReductionIntII
|
||||
}
|
||||
|
||||
GM::free(ptrSumGM);
|
||||
}
|
||||
|
||||
/*--------------------------------------*\
|
||||
|* Methode *|
|
||||
\*-------------------------------------*/
|
||||
|
||||
void ReductionIntII::run()
|
||||
{
|
||||
void ReductionIntII::run() {
|
||||
// TODO ReductionIntII
|
||||
}
|
||||
|
||||
KIntProtocoleII<<<dg, db, this->sizeSM>>>(ptrSumGM);
|
||||
GM::memcpyDToH_int(ptrSum, ptrSumGM);
|
||||
}
|
||||
|
||||
/*----------------------------------------------------------------------*\
|
||||
|* End *|
|
||||
|
||||
@@ -8,8 +8,7 @@
|
||||
|* Declaration *|
|
||||
\*---------------------------------------------------------------------*/
|
||||
|
||||
class ReductionIntII: public RunnableGPU
|
||||
{
|
||||
class ReductionIntII: public RunnableGPU {
|
||||
/*--------------------------------------*\
|
||||
|* Constructor *|
|
||||
\*-------------------------------------*/
|
||||
@@ -44,7 +43,7 @@ class ReductionIntII: public RunnableGPU
|
||||
int* ptrSumGM;
|
||||
size_t sizeSM;
|
||||
|
||||
};
|
||||
};
|
||||
|
||||
/*----------------------------------------------------------------------*\
|
||||
|* End *|
|
||||
|
||||
@@ -58,8 +58,8 @@ void generic() {
|
||||
VTReductionGenericII test2;
|
||||
VTReductionGenericLongII test3;
|
||||
|
||||
test1.run();
|
||||
// test2.run();
|
||||
// test1.run();
|
||||
test2.run();
|
||||
// test3.run();
|
||||
}
|
||||
|
||||
|
||||
@@ -70,17 +70,17 @@ void reduction_add(bool& isOk) {
|
||||
*/
|
||||
void reduction_generic(bool& isOk) {
|
||||
// InbI
|
||||
{
|
||||
UseReductionIntI algo(IS_VERBOSE);
|
||||
isOk &= algo.isOk(IS_VERBOSE);
|
||||
}
|
||||
|
||||
// IntII
|
||||
// {
|
||||
// UseReductionIntII algo(IS_VERBOSE);
|
||||
// UseReductionIntI algo(IS_VERBOSE);
|
||||
// isOk &= algo.isOk(IS_VERBOSE);
|
||||
// }
|
||||
|
||||
// IntII
|
||||
{
|
||||
UseReductionIntII algo(IS_VERBOSE);
|
||||
isOk &= algo.isOk(IS_VERBOSE);
|
||||
}
|
||||
|
||||
// LongII
|
||||
// {
|
||||
// UseReductionLongII algo(IS_VERBOSE);
|
||||
|
||||
Reference in New Issue
Block a user