Implement the reduction in OpenACC

This commit is contained in:
Tom Deakin 2016-10-14 14:40:08 +01:00
parent 614613e7d4
commit 0ef9b6691b
2 changed files with 19 additions and 0 deletions

View File

@ -112,6 +112,24 @@ void ACCStream<T>::triad()
a[i] = b[i] + scalar * c[i];
}
}
// Dot-product kernel: returns the sum over i of a[i] * b[i] for the
// first array_size elements of the a and b arrays held by this stream.
//
// The arrays are named in a present() clause, i.e. they are expected to
// already be resident on the device when this is called (presumably set
// up by the constructor / write_arrays -- not visible in this chunk).
template <class T>
T ACCStream<T>::dot()
{
  T sum = 0.0;

  // Local copies so the pragma can name plain variables rather than
  // members reached through `this`.
  unsigned int array_size = this->array_size;
  T * restrict a = this->a;
  T * restrict b = this->b;

  // Spell the reduction out explicitly: a bare `kernels` region only works
  // if the compiler happens to recognise the `sum +=` pattern by itself.
  // `wait` is kept from the original so the launch is ordered after any
  // outstanding asynchronous device work.
  #pragma acc parallel loop reduction(+:sum) present(a[0:array_size], b[0:array_size]) wait
  for (unsigned int i = 0; i < array_size; i++)  // index type matches array_size (no signed/unsigned mix)
  {
    sum += a[i] * b[i];
  }

  return sum;
}
void listDevices(void)
{
// Get number of devices

View File

@ -35,6 +35,7 @@ class ACCStream : public Stream<T>
virtual void add() override;
virtual void mul() override;
virtual void triad() override;
// Reduction kernel: returns the sum of a[i] * b[i] over the stream's a and b arrays.
virtual T dot() override;
virtual void write_arrays(const std::vector<T>& a, const std::vector<T>& b, const std::vector<T>& c) override;
virtual void read_arrays(std::vector<T>& a, std::vector<T>& b, std::vector<T>& c) override;