do initial assignment through parallel_for_each
This commit is contained in:
parent
383c5a3ae7
commit
3fc0b57a2c
80
HCStream.cpp
80
HCStream.cpp
@ -78,65 +78,38 @@ HCStream<T>::~HCStream()
|
|||||||
template <class T>
|
template <class T>
|
||||||
void HCStream<T>::init_arrays(T _a, T _b, T _c)
|
void HCStream<T>::init_arrays(T _a, T _b, T _c)
|
||||||
{
|
{
|
||||||
// hc::array_view<T,1> view_a(this->d_a);
|
hc::array_view<T,1> view_a(this->d_a);
|
||||||
// hc::array_view<T,1> view_b(this->d_b);
|
hc::array_view<T,1> view_b(this->d_b);
|
||||||
// hc::array_view<T,1> view_c(this->d_c);
|
hc::array_view<T,1> view_c(this->d_c);
|
||||||
|
|
||||||
// hc::completion_future future_a= hc::parallel_for_each(hc::extent<1>(array_size)
|
hc::completion_future future_a= hc::parallel_for_each(hc::extent<1>(array_size)
|
||||||
// , [=](hc::index<1> i) [[hc]] {
|
, [=](hc::index<1> i) [[hc]] {
|
||||||
// view_a[i] = _a;
|
view_a[i] = _a;
|
||||||
// });
|
});
|
||||||
|
|
||||||
// hc::completion_future future_b= hc::parallel_for_each(hc::extent<1>(array_size)
|
hc::completion_future future_b= hc::parallel_for_each(hc::extent<1>(array_size)
|
||||||
// , [=](hc::index<1> i) [[hc]] {
|
, [=](hc::index<1> i) [[hc]] {
|
||||||
// view_b[i] = _b;
|
view_b[i] = _b;
|
||||||
// });
|
});
|
||||||
// hc::completion_future future_c= hc::parallel_for_each(hc::extent<1>(array_size)
|
hc::completion_future future_c= hc::parallel_for_each(hc::extent<1>(array_size)
|
||||||
// , [=](hc::index<1> i) [[hc]] {
|
, [=](hc::index<1> i) [[hc]] {
|
||||||
// view_c[i] = _c;
|
view_c[i] = _c;
|
||||||
// });
|
});
|
||||||
// try{
|
try{
|
||||||
// future_a.wait();
|
future_a.wait();
|
||||||
// }
|
future_b.wait();
|
||||||
// catch(std::exception& e){
|
future_c.wait();
|
||||||
// std::cout << __FILE__ << ":" << __LINE__ << "\t future_a " << e.what() << std::endl;
|
}
|
||||||
// throw;
|
catch(std::exception& e){
|
||||||
// }
|
std::cout << __FILE__ << ":" << __LINE__ << "\t future_{a,b,c} " << e.what() << std::endl;
|
||||||
|
throw;
|
||||||
// try{
|
}
|
||||||
// future_b.wait();
|
|
||||||
// }
|
|
||||||
// catch(std::exception& e){
|
|
||||||
// std::cout << __FILE__ << ":" << __LINE__ << "\t future_b " << e.what() << std::endl;
|
|
||||||
// throw;
|
|
||||||
// }
|
|
||||||
|
|
||||||
|
|
||||||
// try{
|
|
||||||
// future_c.wait();
|
|
||||||
// }
|
|
||||||
// catch(std::exception& e){
|
|
||||||
// std::cout << __FILE__ << ":" << __LINE__ << "\t future_c " << e.what() << std::endl;
|
|
||||||
// throw;
|
|
||||||
// }
|
|
||||||
|
|
||||||
|
|
||||||
std::vector<T> temp(array_size,_a);
|
|
||||||
hc::copy(temp.begin(), temp.end(),this->d_a);
|
|
||||||
|
|
||||||
std::fill(temp.begin(), temp.end(),_b);
|
|
||||||
hc::copy(temp.begin(), temp.end(),this->d_b);
|
|
||||||
|
|
||||||
std::fill(temp.begin(), temp.end(),_c);
|
|
||||||
hc::copy(temp.begin(), temp.end(),this->d_c);
|
|
||||||
|
|
||||||
}
|
}
|
||||||
|
|
||||||
template <class T>
|
template <class T>
|
||||||
void HCStream<T>::read_arrays(std::vector<T>& a, std::vector<T>& b, std::vector<T>& c)
|
void HCStream<T>::read_arrays(std::vector<T>& a, std::vector<T>& b, std::vector<T>& c)
|
||||||
{
|
{
|
||||||
|
|
||||||
// Copy device memory to host
|
|
||||||
hc::copy(d_a,a.begin());
|
hc::copy(d_a,a.begin());
|
||||||
hc::copy(d_b,b.begin());
|
hc::copy(d_b,b.begin());
|
||||||
hc::copy(d_c,c.begin());
|
hc::copy(d_c,c.begin());
|
||||||
@ -151,7 +124,6 @@ void HCStream<T>::copy()
|
|||||||
hc::array_view<T,1> view_c = this->d_c;
|
hc::array_view<T,1> view_c = this->d_c;
|
||||||
|
|
||||||
try{
|
try{
|
||||||
// launch a GPU kernel to compute the saxpy in parallel
|
|
||||||
hc::completion_future future_kernel = hc::parallel_for_each(hc::extent<1>(array_size)
|
hc::completion_future future_kernel = hc::parallel_for_each(hc::extent<1>(array_size)
|
||||||
, [=](hc::index<1> index) [[hc]] {
|
, [=](hc::index<1> index) [[hc]] {
|
||||||
view_c[index] = view_a[index];
|
view_c[index] = view_a[index];
|
||||||
@ -173,7 +145,6 @@ void HCStream<T>::mul()
|
|||||||
hc::array_view<T,1> view_c = this->d_c;
|
hc::array_view<T,1> view_c = this->d_c;
|
||||||
|
|
||||||
try{
|
try{
|
||||||
// launch a GPU kernel to compute the saxpy in parallel
|
|
||||||
hc::completion_future future_kernel = hc::parallel_for_each(hc::extent<1>(array_size)
|
hc::completion_future future_kernel = hc::parallel_for_each(hc::extent<1>(array_size)
|
||||||
, [=](hc::index<1> i) [[hc]] {
|
, [=](hc::index<1> i) [[hc]] {
|
||||||
view_b[i] = scalar*view_c[i];
|
view_b[i] = scalar*view_c[i];
|
||||||
@ -196,7 +167,6 @@ void HCStream<T>::add()
|
|||||||
hc::array_view<T,1> view_c(this->d_c);
|
hc::array_view<T,1> view_c(this->d_c);
|
||||||
|
|
||||||
try{
|
try{
|
||||||
// launch a GPU kernel to compute the saxpy in parallel
|
|
||||||
hc::completion_future future_kernel = hc::parallel_for_each(hc::extent<1>(array_size)
|
hc::completion_future future_kernel = hc::parallel_for_each(hc::extent<1>(array_size)
|
||||||
, [=](hc::index<1> i) [[hc]] {
|
, [=](hc::index<1> i) [[hc]] {
|
||||||
view_c[i] = view_a[i]+view_b[i];
|
view_c[i] = view_a[i]+view_b[i];
|
||||||
@ -219,7 +189,6 @@ void HCStream<T>::triad()
|
|||||||
hc::array_view<T,1> view_c(this->d_c);
|
hc::array_view<T,1> view_c(this->d_c);
|
||||||
|
|
||||||
try{
|
try{
|
||||||
// launch a GPU kernel to compute the saxpy in parallel
|
|
||||||
hc::completion_future future_kernel = hc::parallel_for_each(hc::extent<1>(array_size)
|
hc::completion_future future_kernel = hc::parallel_for_each(hc::extent<1>(array_size)
|
||||||
, [=](hc::index<1> i) [[hc]] {
|
, [=](hc::index<1> i) [[hc]] {
|
||||||
view_a[i] = view_b[i] + scalar*view_c[i];
|
view_a[i] = view_b[i] + scalar*view_c[i];
|
||||||
@ -242,7 +211,6 @@ T HCStream<T>::dot()
|
|||||||
T sum = static_cast<T>(0);
|
T sum = static_cast<T>(0);
|
||||||
|
|
||||||
try{
|
try{
|
||||||
// launch a GPU kernel to compute the saxpy in parallel
|
|
||||||
hc::completion_future future_kernel = hc::parallel_for_each(view_a.get_extent(),
|
hc::completion_future future_kernel = hc::parallel_for_each(view_a.get_extent(),
|
||||||
[=](hc::index<1> i) [[hc]] {
|
[=](hc::index<1> i) [[hc]] {
|
||||||
view_p[i] = view_p[i]*view_a[i];
|
view_p[i] = view_p[i]*view_a[i];
|
||||||
|
|||||||
Loading…
Reference in New Issue
Block a user