mirror of
https://github.com/NVIDIA/cuda-samples.git
synced 2024-11-28 14:09:17 +08:00
428 lines
14 KiB
C++
428 lines
14 KiB
C++
/* Copyright (c) 2022, NVIDIA CORPORATION. All rights reserved.
|
|
*
|
|
* Redistribution and use in source and binary forms, with or without
|
|
* modification, are permitted provided that the following conditions
|
|
* are met:
|
|
* * Redistributions of source code must retain the above copyright
|
|
* notice, this list of conditions and the following disclaimer.
|
|
* * Redistributions in binary form must reproduce the above copyright
|
|
* notice, this list of conditions and the following disclaimer in the
|
|
* documentation and/or other materials provided with the distribution.
|
|
* * Neither the name of NVIDIA CORPORATION nor the names of its
|
|
* contributors may be used to endorse or promote products derived
|
|
* from this software without specific prior written permission.
|
|
*
|
|
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS ``AS IS'' AND ANY
|
|
* EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
|
|
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
|
|
* PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
|
|
* CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
|
|
* EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
|
|
* PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
|
|
* PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
|
|
* OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
|
|
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
|
|
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
|
|
*/
|
|
|
|
// This sample needs at least CUDA 10.1.
|
|
// It demonstrates usages of the nvJPEG library
|
|
|
|
#ifndef NV_JPEG_EXAMPLE
|
|
#define NV_JPEG_EXAMPLE
|
|
|
|
#ifdef _WIN64
|
|
#include <windows.h>
|
|
#endif
|
|
|
|
#include "cuda_runtime.h"
|
|
#include "nvjpeg.h"
|
|
#include "helper_cuda.h"
|
|
#include "helper_timer.h"
|
|
|
|
#include <cstdlib>
|
|
#include <fstream>
|
|
#include <iostream>
|
|
#include <sstream>
|
|
#include <string>
|
|
#include <vector>
|
|
|
|
#include <string.h> // strcmpi
|
|
#ifndef _WIN64
|
|
#include <sys/time.h> // timings
|
|
|
|
#include <dirent.h> // linux dir traverse
|
|
#include <unistd.h>
|
|
#endif
|
|
#include <sys/stat.h>
|
|
#include <sys/types.h>
|
|
|
|
// write bmp, input - RGB, device
|
|
int writeBMP(const char *filename, const unsigned char *d_chanR, int pitchR,
|
|
const unsigned char *d_chanG, int pitchG,
|
|
const unsigned char *d_chanB, int pitchB, int width, int height) {
|
|
unsigned int headers[13];
|
|
FILE *outfile;
|
|
int extrabytes;
|
|
int paddedsize;
|
|
int x;
|
|
int y;
|
|
int n;
|
|
int red, green, blue;
|
|
|
|
std::vector<unsigned char> vchanR(height * width);
|
|
std::vector<unsigned char> vchanG(height * width);
|
|
std::vector<unsigned char> vchanB(height * width);
|
|
unsigned char *chanR = vchanR.data();
|
|
unsigned char *chanG = vchanG.data();
|
|
unsigned char *chanB = vchanB.data();
|
|
checkCudaErrors(cudaMemcpy2D(chanR, (size_t)width, d_chanR, (size_t)pitchR,
|
|
width, height, cudaMemcpyDeviceToHost));
|
|
checkCudaErrors(cudaMemcpy2D(chanG, (size_t)width, d_chanG, (size_t)pitchR,
|
|
width, height, cudaMemcpyDeviceToHost));
|
|
checkCudaErrors(cudaMemcpy2D(chanB, (size_t)width, d_chanB, (size_t)pitchR,
|
|
width, height, cudaMemcpyDeviceToHost));
|
|
|
|
extrabytes =
|
|
4 - ((width * 3) % 4); // How many bytes of padding to add to each
|
|
// horizontal line - the size of which must
|
|
// be a multiple of 4 bytes.
|
|
if (extrabytes == 4) extrabytes = 0;
|
|
|
|
paddedsize = ((width * 3) + extrabytes) * height;
|
|
|
|
// Headers...
|
|
// Note that the "BM" identifier in bytes 0 and 1 is NOT included in these
|
|
// "headers".
|
|
|
|
headers[0] = paddedsize + 54; // bfSize (whole file size)
|
|
headers[1] = 0; // bfReserved (both)
|
|
headers[2] = 54; // bfOffbits
|
|
headers[3] = 40; // biSize
|
|
headers[4] = width; // biWidth
|
|
headers[5] = height; // biHeight
|
|
|
|
// Would have biPlanes and biBitCount in position 6, but they're shorts.
|
|
// It's easier to write them out separately (see below) than pretend
|
|
// they're a single int, especially with endian issues...
|
|
|
|
headers[7] = 0; // biCompression
|
|
headers[8] = paddedsize; // biSizeImage
|
|
headers[9] = 0; // biXPelsPerMeter
|
|
headers[10] = 0; // biYPelsPerMeter
|
|
headers[11] = 0; // biClrUsed
|
|
headers[12] = 0; // biClrImportant
|
|
|
|
if (!(outfile = fopen(filename, "wb"))) {
|
|
std::cerr << "Cannot open file: " << filename << std::endl;
|
|
return 1;
|
|
}
|
|
|
|
//
|
|
// Headers begin...
|
|
// When printing ints and shorts, we write out 1 character at a time to avoid
|
|
// endian issues.
|
|
//
|
|
fprintf(outfile, "BM");
|
|
|
|
for (n = 0; n <= 5; n++) {
|
|
fprintf(outfile, "%c", headers[n] & 0x000000FF);
|
|
fprintf(outfile, "%c", (headers[n] & 0x0000FF00) >> 8);
|
|
fprintf(outfile, "%c", (headers[n] & 0x00FF0000) >> 16);
|
|
fprintf(outfile, "%c", (headers[n] & (unsigned int)0xFF000000) >> 24);
|
|
}
|
|
|
|
// These next 4 characters are for the biPlanes and biBitCount fields.
|
|
|
|
fprintf(outfile, "%c", 1);
|
|
fprintf(outfile, "%c", 0);
|
|
fprintf(outfile, "%c", 24);
|
|
fprintf(outfile, "%c", 0);
|
|
|
|
for (n = 7; n <= 12; n++) {
|
|
fprintf(outfile, "%c", headers[n] & 0x000000FF);
|
|
fprintf(outfile, "%c", (headers[n] & 0x0000FF00) >> 8);
|
|
fprintf(outfile, "%c", (headers[n] & 0x00FF0000) >> 16);
|
|
fprintf(outfile, "%c", (headers[n] & (unsigned int)0xFF000000) >> 24);
|
|
}
|
|
|
|
//
|
|
// Headers done, now write the data...
|
|
//
|
|
|
|
for (y = height - 1; y >= 0;
|
|
y--) // BMP image format is written from bottom to top...
|
|
{
|
|
for (x = 0; x <= width - 1; x++) {
|
|
red = chanR[y * width + x];
|
|
green = chanG[y * width + x];
|
|
blue = chanB[y * width + x];
|
|
|
|
if (red > 255) red = 255;
|
|
if (red < 0) red = 0;
|
|
if (green > 255) green = 255;
|
|
if (green < 0) green = 0;
|
|
if (blue > 255) blue = 255;
|
|
if (blue < 0) blue = 0;
|
|
// Also, it's written in (b,g,r) format...
|
|
|
|
fprintf(outfile, "%c", blue);
|
|
fprintf(outfile, "%c", green);
|
|
fprintf(outfile, "%c", red);
|
|
}
|
|
if (extrabytes) // See above - BMP lines must be of lengths divisible by 4.
|
|
{
|
|
for (n = 1; n <= extrabytes; n++) {
|
|
fprintf(outfile, "%c", 0);
|
|
}
|
|
}
|
|
}
|
|
|
|
fclose(outfile);
|
|
return 0;
|
|
}
|
|
|
|
// write bmp, input - RGB, device
|
|
int writeBMPi(const char *filename, const unsigned char *d_RGB, int pitch,
|
|
int width, int height) {
|
|
unsigned int headers[13];
|
|
FILE *outfile;
|
|
int extrabytes;
|
|
int paddedsize;
|
|
int x;
|
|
int y;
|
|
int n;
|
|
int red, green, blue;
|
|
|
|
std::vector<unsigned char> vchanRGB(height * width * 3);
|
|
unsigned char *chanRGB = vchanRGB.data();
|
|
checkCudaErrors(cudaMemcpy2D(chanRGB, (size_t)width * 3, d_RGB, (size_t)pitch,
|
|
width * 3, height, cudaMemcpyDeviceToHost));
|
|
|
|
extrabytes =
|
|
4 - ((width * 3) % 4); // How many bytes of padding to add to each
|
|
// horizontal line - the size of which must
|
|
// be a multiple of 4 bytes.
|
|
if (extrabytes == 4) extrabytes = 0;
|
|
|
|
paddedsize = ((width * 3) + extrabytes) * height;
|
|
|
|
// Headers...
|
|
// Note that the "BM" identifier in bytes 0 and 1 is NOT included in these
|
|
// "headers".
|
|
headers[0] = paddedsize + 54; // bfSize (whole file size)
|
|
headers[1] = 0; // bfReserved (both)
|
|
headers[2] = 54; // bfOffbits
|
|
headers[3] = 40; // biSize
|
|
headers[4] = width; // biWidth
|
|
headers[5] = height; // biHeight
|
|
|
|
// Would have biPlanes and biBitCount in position 6, but they're shorts.
|
|
// It's easier to write them out separately (see below) than pretend
|
|
// they're a single int, especially with endian issues...
|
|
|
|
headers[7] = 0; // biCompression
|
|
headers[8] = paddedsize; // biSizeImage
|
|
headers[9] = 0; // biXPelsPerMeter
|
|
headers[10] = 0; // biYPelsPerMeter
|
|
headers[11] = 0; // biClrUsed
|
|
headers[12] = 0; // biClrImportant
|
|
|
|
if (!(outfile = fopen(filename, "wb"))) {
|
|
std::cerr << "Cannot open file: " << filename << std::endl;
|
|
return 1;
|
|
}
|
|
|
|
//
|
|
// Headers begin...
|
|
// When printing ints and shorts, we write out 1 character at a time to avoid
|
|
// endian issues.
|
|
//
|
|
|
|
fprintf(outfile, "BM");
|
|
|
|
for (n = 0; n <= 5; n++) {
|
|
fprintf(outfile, "%c", headers[n] & 0x000000FF);
|
|
fprintf(outfile, "%c", (headers[n] & 0x0000FF00) >> 8);
|
|
fprintf(outfile, "%c", (headers[n] & 0x00FF0000) >> 16);
|
|
fprintf(outfile, "%c", (headers[n] & (unsigned int)0xFF000000) >> 24);
|
|
}
|
|
|
|
// These next 4 characters are for the biPlanes and biBitCount fields.
|
|
|
|
fprintf(outfile, "%c", 1);
|
|
fprintf(outfile, "%c", 0);
|
|
fprintf(outfile, "%c", 24);
|
|
fprintf(outfile, "%c", 0);
|
|
|
|
for (n = 7; n <= 12; n++) {
|
|
fprintf(outfile, "%c", headers[n] & 0x000000FF);
|
|
fprintf(outfile, "%c", (headers[n] & 0x0000FF00) >> 8);
|
|
fprintf(outfile, "%c", (headers[n] & 0x00FF0000) >> 16);
|
|
fprintf(outfile, "%c", (headers[n] & (unsigned int)0xFF000000) >> 24);
|
|
}
|
|
|
|
//
|
|
// Headers done, now write the data...
|
|
//
|
|
for (y = height - 1; y >= 0;
|
|
y--) // BMP image format is written from bottom to top...
|
|
{
|
|
for (x = 0; x <= width - 1; x++) {
|
|
red = chanRGB[(y * width + x) * 3];
|
|
green = chanRGB[(y * width + x) * 3 + 1];
|
|
blue = chanRGB[(y * width + x) * 3 + 2];
|
|
|
|
if (red > 255) red = 255;
|
|
if (red < 0) red = 0;
|
|
if (green > 255) green = 255;
|
|
if (green < 0) green = 0;
|
|
if (blue > 255) blue = 255;
|
|
if (blue < 0) blue = 0;
|
|
// Also, it's written in (b,g,r) format...
|
|
|
|
fprintf(outfile, "%c", blue);
|
|
fprintf(outfile, "%c", green);
|
|
fprintf(outfile, "%c", red);
|
|
}
|
|
if (extrabytes) // See above - BMP lines must be of lengths divisible by 4.
|
|
{
|
|
for (n = 1; n <= extrabytes; n++) {
|
|
fprintf(outfile, "%c", 0);
|
|
}
|
|
}
|
|
}
|
|
|
|
fclose(outfile);
|
|
return 0;
|
|
}
|
|
|
|
int inputDirExists(const char *pathname) {
|
|
struct stat info;
|
|
if (stat(pathname, &info) != 0) {
|
|
return 0; // Directory does not exists
|
|
} else if (info.st_mode & S_IFDIR) {
|
|
// is a directory
|
|
return 1;
|
|
} else {
|
|
// is not a directory
|
|
return 0;
|
|
}
|
|
}
|
|
|
|
int readInput(const std::string &sInputPath,
|
|
std::vector<std::string> &filelist) {
|
|
int error_code = 1;
|
|
#ifndef _WIN64
|
|
struct stat s;
|
|
|
|
if (stat(sInputPath.c_str(), &s) == 0) {
|
|
if (s.st_mode & S_IFREG) {
|
|
filelist.push_back(sInputPath);
|
|
} else if (s.st_mode & S_IFDIR) {
|
|
// processing each file in directory
|
|
DIR *dir_handle;
|
|
struct dirent *dir;
|
|
dir_handle = opendir(sInputPath.c_str());
|
|
std::vector<std::string> filenames;
|
|
if (dir_handle) {
|
|
error_code = 0;
|
|
while ((dir = readdir(dir_handle)) != NULL) {
|
|
std::string sFileName = sInputPath + dir->d_name;
|
|
if (inputDirExists(sFileName.c_str()))
|
|
{
|
|
std::string sname = dir->d_name;
|
|
if (sname != "." && sname != "..") {
|
|
readInput(sInputPath + sname + "/", filelist);
|
|
}
|
|
}
|
|
else
|
|
{
|
|
filelist.push_back(sFileName);
|
|
}
|
|
}
|
|
closedir(dir_handle);
|
|
} else {
|
|
std::cout << "Cannot open input directory: " << sInputPath << std::endl;
|
|
return error_code;
|
|
}
|
|
} else {
|
|
std::cout << "Cannot open input: " << sInputPath << std::endl;
|
|
return error_code;
|
|
}
|
|
} else {
|
|
std::cout << "Cannot find input path " << sInputPath << std::endl;
|
|
return error_code;
|
|
}
|
|
#else
|
|
std::string search_path = sInputPath + "/*.*";
|
|
WIN32_FIND_DATA fd;
|
|
HANDLE hFind = ::FindFirstFile(search_path.c_str(), &fd);
|
|
if (hFind != INVALID_HANDLE_VALUE) {
|
|
do {
|
|
// read all (real) files in current folder
|
|
// , delete '!' read other 2 default folder . and ..
|
|
if (!(fd.dwFileAttributes & FILE_ATTRIBUTE_DIRECTORY)) {
|
|
std::string temp(sInputPath + "\\" + fd.cFileName);
|
|
filelist.push_back(temp);
|
|
}
|
|
} while (::FindNextFile(hFind, &fd));
|
|
::FindClose(hFind);
|
|
} else {
|
|
std::cout << "Cannot open input directory: " << sInputPath << std::endl;
|
|
return error_code;
|
|
}
|
|
#endif
|
|
return 0;
|
|
}
|
|
|
|
|
|
int getInputDir(std::string &input_dir, const char *executable_path) {
|
|
int found = 0;
|
|
if (executable_path != 0) {
|
|
std::string executable_name = std::string(executable_path);
|
|
#if defined(WIN32) || defined(_WIN32) || defined(WIN64) || defined(_WIN64)
|
|
// Windows path delimiter
|
|
size_t delimiter_pos = executable_name.find_last_of('\\');
|
|
executable_name.erase(0, delimiter_pos + 1);
|
|
|
|
if (executable_name.rfind(".exe") != std::string::npos) {
|
|
// we strip .exe, only if the .exe is found
|
|
executable_name.resize(executable_name.size() - 4);
|
|
}
|
|
#else
|
|
// Linux & OSX path delimiter
|
|
size_t delimiter_pos = executable_name.find_last_of('/');
|
|
executable_name.erase(0, delimiter_pos + 1);
|
|
#endif
|
|
|
|
// Search in default paths for input images.
|
|
std::string pathname = "";
|
|
const char *searchPath[] = {
|
|
"./images",
|
|
"../../../../Samples/4_CUDA_Libraries/<executable_name>/images",
|
|
"../../../Samples/4_CUDA_Libraries/<executable_name>/images",
|
|
"../../Samples/4_CUDA_Libraries/<executable_name>/images"};
|
|
|
|
for (unsigned int i = 0; i < sizeof(searchPath) / sizeof(char *); ++i) {
|
|
std::string pathname(searchPath[i]);
|
|
size_t executable_name_pos = pathname.find("<executable_name>");
|
|
|
|
// If there is executable_name variable in the searchPath
|
|
// replace it with the value
|
|
if (executable_name_pos != std::string::npos) {
|
|
pathname.replace(executable_name_pos, strlen("<executable_name>"),
|
|
executable_name);
|
|
}
|
|
|
|
if (inputDirExists(pathname.c_str())) {
|
|
input_dir = pathname + "/";
|
|
found = 1;
|
|
break;
|
|
}
|
|
}
|
|
}
|
|
return found;
|
|
}
|
|
|
|
#endif |