У меня есть следующий код
int main(int argc, char** argv )
{
std::cout<<"running Lenna..\n";
cv::Mat mat = imread("lena.bmp", cv::IMREAD_GRAYSCALE );
//convert to vec
std::vector<double> BWvec;
BWvec.assign((double*)mat.data, (double*)mat.data + mat.total());
std::vector < std::vector<double>> vec2D;
for (int i = 0; i < mat.rows; i++) {
auto first = BWvec.begin() + (mat.rows * i);
auto last = BWvec.begin() + (mat.rows * i) + mat.rows;
std::vector<double> vec0(first, last);
vec2D.push_back(vec0);
}
//#pragma acc parallel loop
for (int i = 0; i <= 5; i++) {
for (int j = 0; j <= 5; j++) {
mat(cv::Rect(i,j, (4 - 0), (4 - 0)));
//sub-vector[5:10][25:100]:
std::vector<std::vector<double>> sub_vector;
sub_vector.reserve(5);
for (std::size_t k = 5; k < 10; ++k) {
sub_vector.emplace_back(vec2D[k+i].begin() + 25, vec2D[k+i].begin() + 100);
}
}
}
return 0;
}
Когда я набираю pgc++ -fast -ta=nvidia:cuda9.2,managed -Minfo=accel -o lenna lenna.cpp -std=c++11
pkg-config --cflags --libs opencv -lgomp && ./lenna
, он отлично работает последовательно, но когда я раскомментирую #pragma acc parallel loop
, я получаю сообщение об ошибке
procedures called in a compute region must have acc routine information
accelerator region ignored, accelerator restriction .. no acc routine information
Я получаю эту ошибку также, если я закомментирую mat(cv::Rect(i,j,(4-0),(4-0)))
и оставлю часть после sub-vector[5:10][25:100]
, или если я раскомментирую mat(cv::Rect(i,j,(4-0),(4-0)))
и прокомментирую часть после sub-vector[5:10][25:100]
Как я могу это исправить?
ИЗМЕНИТЬ
Чтобы сделать это проще, я предоставил 2 отдельных кода и ошибки, которые они дают:
lenna1.cpp
:
#include <stdio.h>
#include <cmath>
#include <omp.h>
#include <opencv2/opencv.hpp>
using namespace std;
using namespace cv;
//pgc++ -fast -ta=nvidia:cuda9.2,managed -Minfo=accel -o lenna lenna.cpp -std=c++11 `pkg-config --cflags --libs opencv` -lgomp && ./lenna
int main(int argc, char** argv )
{
std::cout<<"running Lenna..\n";
cv::Mat mat = imread("lena.bmp", cv::IMREAD_GRAYSCALE );
#pragma acc parallel loop
for (int i = 0; i <= 5; i++) {
for (int j = 0; j <= 5; j++) {
mat(cv::Rect(i, j, (4 - 0), (4 - 0)));
}
}
return 0;
}
ошибка от lenna1.cpp
:
pgc++ -fast -ta=nvidia:cuda9.2,managed -Minfo=accel -o lenna1 lenna1.cpp -std=c++11 `pkg-config --cflags --libs opencv` -lgomp && ./lenna1
lenna1.cpp:
"lenna1.cpp", line 23: warning: last line of file ends without a newline
}
^
PGCC-S-0155-Procedures called in a compute region must have acc routine information: cv::Mat::Mat(const cv::Mat&, const cv::Rect_<int> &) (lenna1.cpp: 379)
PGCC-S-0155-Accelerator region ignored; see -Minfo messages (lenna1.cpp: 14)
main:
14, Accelerator region ignored
379, Accelerator restriction: call to 'cv::Mat::Mat(const cv::Mat&, const cv::Rect_<int> &)' with no acc routine information
PGCC/x86-64 Linux 19.10-0: compilation completed with severe errors
lenna2.cpp
:
#include <stdio.h>
#include <cmath>
#include <omp.h>
#include <opencv2/opencv.hpp>
using namespace std;
using namespace cv;
//pgc++ -fast -ta=nvidia:cuda9.2,managed -Minfo=accel -o lenna lenna.cpp -std=c++11 `pkg-config --cflags --libs opencv` -lgomp && ./lenna
int main(int argc, char** argv )
{
std::cout<<"running Lenna..\n";
cv::Mat mat = imread("lena.bmp", cv::IMREAD_GRAYSCALE );
//convert to vec
std::vector<double> BWvec;
BWvec.assign((double*)mat.data, (double*)mat.data + mat.total());
std::vector < std::vector<double>> vec2D;
for (int i = 0; i < mat.rows; i++) {
auto first = BWvec.begin() + (mat.rows * i);
auto last = BWvec.begin() + (mat.rows * i) + mat.rows;
std::vector<double> vec0(first, last);
vec2D.push_back(vec0);
}
#pragma acc parallel loop
for (int i = 0; i <= 5; i++) {
for (int j = 0; j <= 5; j++) {
//sub-vector[5:10][25:100]:
std::vector<std::vector<double>> sub_vector;
sub_vector.reserve(5);
for (std::size_t i = 5; i < 10; ++i) {
sub_vector.emplace_back(vec2D[i].begin() + 25, vec2D[i].begin() + 100);
}
}
}
return 0;
}
ошибка от lenna2.cpp
:
pgc++ -fast -ta=nvidia:cuda9.2,managed -Minfo=accel -o lenna2 lenna2.cpp -std=c++11 `pkg-config --cflags --libs opencv` -lgomp && ./lenna2
lenna2.cpp:
"lenna2.cpp", line 40: warning: last line of file ends without a newline
}
^
operator new (unsigned long, void *):
4, include "opencv.hpp"
47, include "core.hpp"
56, include "algorithm"
10, include "algorithm"
62, include "stl_algo.h"
62, include "stl_tempbuf.h"
60, include "stl_construct.h"
59, include "new"
130, Generating implicit acc routine seq
Generating acc routine seq
Generating Tesla code
operator delete (void *, void *):
4, include "opencv.hpp"
47, include "core.hpp"
56, include "algorithm"
10, include "algorithm"
62, include "stl_algo.h"
62, include "stl_tempbuf.h"
60, include "stl_construct.h"
59, include "new"
135, Generating implicit acc routine seq
Generating acc routine seq
Generating Tesla code
PGCC-S-0155-Procedures called in a compute region must have acc routine information: std::__throw_length_error(const char *) (lenna2.cpp: 69)
PGCC-S-0155-Accelerator region ignored; see -Minfo messages (lenna2.cpp: 25)
main:
25, Accelerator region ignored
69, Accelerator restriction: call to 'std::__throw_length_error(const char *)' with no acc routine information
PGCC/x86-64 Linux 19.10-0: compilation completed with severe errors