Add dot kernel to OpenMP 4.5 - tested with clang-ykt
This commit is contained in:
parent
abe423ac6b
commit
8a100f07b4
@ -111,6 +111,26 @@ void OMP45Stream<T>::triad()
|
|||||||
a[i] = b[i] + scalar * c[i];
|
a[i] = b[i] + scalar * c[i];
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
template <class T>
|
||||||
|
T OMP45Stream<T>::dot()
|
||||||
|
{
|
||||||
|
T sum = 0.0;
|
||||||
|
|
||||||
|
unsigned int array_size = this->array_size;
|
||||||
|
T *a = this->a;
|
||||||
|
T *b = this->b;
|
||||||
|
#pragma omp target teams distribute parallel for simd reduction(+:sum) map(tofrom: sum)
|
||||||
|
for (int i = 0; i < array_size; i++)
|
||||||
|
{
|
||||||
|
sum += a[i] * b[i];
|
||||||
|
}
|
||||||
|
|
||||||
|
return sum;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
void listDevices(void)
|
void listDevices(void)
|
||||||
{
|
{
|
||||||
// Get number of devices
|
// Get number of devices
|
||||||
|
|||||||
@ -36,6 +36,7 @@ class OMP45Stream : public Stream<T>
|
|||||||
virtual void add() override;
|
virtual void add() override;
|
||||||
virtual void mul() override;
|
virtual void mul() override;
|
||||||
virtual void triad() override;
|
virtual void triad() override;
|
||||||
|
// Dot-product kernel: returns the sum over i of a[i] * b[i].
virtual T dot() override;
|
||||||
|
|
||||||
virtual void write_arrays(const std::vector<T>& a, const std::vector<T>& b, const std::vector<T>& c) override;
|
virtual void write_arrays(const std::vector<T>& a, const std::vector<T>& b, const std::vector<T>& c) override;
|
||||||
virtual void read_arrays(std::vector<T>& a, std::vector<T>& b, std::vector<T>& c) override;
|
virtual void read_arrays(std::vector<T>& a, std::vector<T>& b, std::vector<T>& c) override;
|
||||||
|
|||||||
Loading…
Reference in New Issue
Block a user