You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
428 lines
14 KiB
428 lines
14 KiB
/* Copyright (c) 2022, NVIDIA CORPORATION. All rights reserved. |
|
* |
|
* Redistribution and use in source and binary forms, with or without |
|
* modification, are permitted provided that the following conditions |
|
* are met: |
|
* * Redistributions of source code must retain the above copyright |
|
* notice, this list of conditions and the following disclaimer. |
|
* * Redistributions in binary form must reproduce the above copyright |
|
* notice, this list of conditions and the following disclaimer in the |
|
* documentation and/or other materials provided with the distribution. |
|
* * Neither the name of NVIDIA CORPORATION nor the names of its |
|
* contributors may be used to endorse or promote products derived |
|
* from this software without specific prior written permission. |
|
* |
|
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS ``AS IS'' AND ANY |
|
* EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE |
|
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR |
|
* PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR |
|
* CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, |
|
* EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, |
|
* PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR |
|
* PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY |
|
* OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
|
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE |
|
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
|
*/ |
|
|
|
// This sample needs at least CUDA 10.1. |
|
// It demonstrates usages of the nvJPEG library |
|
|
|
#ifndef NV_JPEG_EXAMPLE |
|
#define NV_JPEG_EXAMPLE |
|
|
|
#ifdef _WIN64 |
|
#include <windows.h> |
|
#endif |
|
|
|
#include "cuda_runtime.h" |
|
#include "nvjpeg.h" |
|
#include "helper_cuda.h" |
|
#include "helper_timer.h" |
|
|
|
#include <cstdlib> |
|
#include <fstream> |
|
#include <iostream> |
|
#include <sstream> |
|
#include <string> |
|
#include <vector> |
|
|
|
#include <string.h> // strcmpi |
|
#ifndef _WIN64 |
|
#include <sys/time.h> // timings |
|
|
|
#include <dirent.h> // linux dir traverse |
|
#include <unistd.h> |
|
#endif |
|
#include <sys/stat.h> |
|
#include <sys/types.h> |
|
|
|
// write bmp, input - RGB, device |
|
int writeBMP(const char *filename, const unsigned char *d_chanR, int pitchR, |
|
const unsigned char *d_chanG, int pitchG, |
|
const unsigned char *d_chanB, int pitchB, int width, int height) { |
|
unsigned int headers[13]; |
|
FILE *outfile; |
|
int extrabytes; |
|
int paddedsize; |
|
int x; |
|
int y; |
|
int n; |
|
int red, green, blue; |
|
|
|
std::vector<unsigned char> vchanR(height * width); |
|
std::vector<unsigned char> vchanG(height * width); |
|
std::vector<unsigned char> vchanB(height * width); |
|
unsigned char *chanR = vchanR.data(); |
|
unsigned char *chanG = vchanG.data(); |
|
unsigned char *chanB = vchanB.data(); |
|
checkCudaErrors(cudaMemcpy2D(chanR, (size_t)width, d_chanR, (size_t)pitchR, |
|
width, height, cudaMemcpyDeviceToHost)); |
|
checkCudaErrors(cudaMemcpy2D(chanG, (size_t)width, d_chanG, (size_t)pitchR, |
|
width, height, cudaMemcpyDeviceToHost)); |
|
checkCudaErrors(cudaMemcpy2D(chanB, (size_t)width, d_chanB, (size_t)pitchR, |
|
width, height, cudaMemcpyDeviceToHost)); |
|
|
|
extrabytes = |
|
4 - ((width * 3) % 4); // How many bytes of padding to add to each |
|
// horizontal line - the size of which must |
|
// be a multiple of 4 bytes. |
|
if (extrabytes == 4) extrabytes = 0; |
|
|
|
paddedsize = ((width * 3) + extrabytes) * height; |
|
|
|
// Headers... |
|
// Note that the "BM" identifier in bytes 0 and 1 is NOT included in these |
|
// "headers". |
|
|
|
headers[0] = paddedsize + 54; // bfSize (whole file size) |
|
headers[1] = 0; // bfReserved (both) |
|
headers[2] = 54; // bfOffbits |
|
headers[3] = 40; // biSize |
|
headers[4] = width; // biWidth |
|
headers[5] = height; // biHeight |
|
|
|
// Would have biPlanes and biBitCount in position 6, but they're shorts. |
|
// It's easier to write them out separately (see below) than pretend |
|
// they're a single int, especially with endian issues... |
|
|
|
headers[7] = 0; // biCompression |
|
headers[8] = paddedsize; // biSizeImage |
|
headers[9] = 0; // biXPelsPerMeter |
|
headers[10] = 0; // biYPelsPerMeter |
|
headers[11] = 0; // biClrUsed |
|
headers[12] = 0; // biClrImportant |
|
|
|
if (!(outfile = fopen(filename, "wb"))) { |
|
std::cerr << "Cannot open file: " << filename << std::endl; |
|
return 1; |
|
} |
|
|
|
// |
|
// Headers begin... |
|
// When printing ints and shorts, we write out 1 character at a time to avoid |
|
// endian issues. |
|
// |
|
fprintf(outfile, "BM"); |
|
|
|
for (n = 0; n <= 5; n++) { |
|
fprintf(outfile, "%c", headers[n] & 0x000000FF); |
|
fprintf(outfile, "%c", (headers[n] & 0x0000FF00) >> 8); |
|
fprintf(outfile, "%c", (headers[n] & 0x00FF0000) >> 16); |
|
fprintf(outfile, "%c", (headers[n] & (unsigned int)0xFF000000) >> 24); |
|
} |
|
|
|
// These next 4 characters are for the biPlanes and biBitCount fields. |
|
|
|
fprintf(outfile, "%c", 1); |
|
fprintf(outfile, "%c", 0); |
|
fprintf(outfile, "%c", 24); |
|
fprintf(outfile, "%c", 0); |
|
|
|
for (n = 7; n <= 12; n++) { |
|
fprintf(outfile, "%c", headers[n] & 0x000000FF); |
|
fprintf(outfile, "%c", (headers[n] & 0x0000FF00) >> 8); |
|
fprintf(outfile, "%c", (headers[n] & 0x00FF0000) >> 16); |
|
fprintf(outfile, "%c", (headers[n] & (unsigned int)0xFF000000) >> 24); |
|
} |
|
|
|
// |
|
// Headers done, now write the data... |
|
// |
|
|
|
for (y = height - 1; y >= 0; |
|
y--) // BMP image format is written from bottom to top... |
|
{ |
|
for (x = 0; x <= width - 1; x++) { |
|
red = chanR[y * width + x]; |
|
green = chanG[y * width + x]; |
|
blue = chanB[y * width + x]; |
|
|
|
if (red > 255) red = 255; |
|
if (red < 0) red = 0; |
|
if (green > 255) green = 255; |
|
if (green < 0) green = 0; |
|
if (blue > 255) blue = 255; |
|
if (blue < 0) blue = 0; |
|
// Also, it's written in (b,g,r) format... |
|
|
|
fprintf(outfile, "%c", blue); |
|
fprintf(outfile, "%c", green); |
|
fprintf(outfile, "%c", red); |
|
} |
|
if (extrabytes) // See above - BMP lines must be of lengths divisible by 4. |
|
{ |
|
for (n = 1; n <= extrabytes; n++) { |
|
fprintf(outfile, "%c", 0); |
|
} |
|
} |
|
} |
|
|
|
fclose(outfile); |
|
return 0; |
|
} |
|
|
|
// write bmp, input - RGB, device |
|
int writeBMPi(const char *filename, const unsigned char *d_RGB, int pitch, |
|
int width, int height) { |
|
unsigned int headers[13]; |
|
FILE *outfile; |
|
int extrabytes; |
|
int paddedsize; |
|
int x; |
|
int y; |
|
int n; |
|
int red, green, blue; |
|
|
|
std::vector<unsigned char> vchanRGB(height * width * 3); |
|
unsigned char *chanRGB = vchanRGB.data(); |
|
checkCudaErrors(cudaMemcpy2D(chanRGB, (size_t)width * 3, d_RGB, (size_t)pitch, |
|
width * 3, height, cudaMemcpyDeviceToHost)); |
|
|
|
extrabytes = |
|
4 - ((width * 3) % 4); // How many bytes of padding to add to each |
|
// horizontal line - the size of which must |
|
// be a multiple of 4 bytes. |
|
if (extrabytes == 4) extrabytes = 0; |
|
|
|
paddedsize = ((width * 3) + extrabytes) * height; |
|
|
|
// Headers... |
|
// Note that the "BM" identifier in bytes 0 and 1 is NOT included in these |
|
// "headers". |
|
headers[0] = paddedsize + 54; // bfSize (whole file size) |
|
headers[1] = 0; // bfReserved (both) |
|
headers[2] = 54; // bfOffbits |
|
headers[3] = 40; // biSize |
|
headers[4] = width; // biWidth |
|
headers[5] = height; // biHeight |
|
|
|
// Would have biPlanes and biBitCount in position 6, but they're shorts. |
|
// It's easier to write them out separately (see below) than pretend |
|
// they're a single int, especially with endian issues... |
|
|
|
headers[7] = 0; // biCompression |
|
headers[8] = paddedsize; // biSizeImage |
|
headers[9] = 0; // biXPelsPerMeter |
|
headers[10] = 0; // biYPelsPerMeter |
|
headers[11] = 0; // biClrUsed |
|
headers[12] = 0; // biClrImportant |
|
|
|
if (!(outfile = fopen(filename, "wb"))) { |
|
std::cerr << "Cannot open file: " << filename << std::endl; |
|
return 1; |
|
} |
|
|
|
// |
|
// Headers begin... |
|
// When printing ints and shorts, we write out 1 character at a time to avoid |
|
// endian issues. |
|
// |
|
|
|
fprintf(outfile, "BM"); |
|
|
|
for (n = 0; n <= 5; n++) { |
|
fprintf(outfile, "%c", headers[n] & 0x000000FF); |
|
fprintf(outfile, "%c", (headers[n] & 0x0000FF00) >> 8); |
|
fprintf(outfile, "%c", (headers[n] & 0x00FF0000) >> 16); |
|
fprintf(outfile, "%c", (headers[n] & (unsigned int)0xFF000000) >> 24); |
|
} |
|
|
|
// These next 4 characters are for the biPlanes and biBitCount fields. |
|
|
|
fprintf(outfile, "%c", 1); |
|
fprintf(outfile, "%c", 0); |
|
fprintf(outfile, "%c", 24); |
|
fprintf(outfile, "%c", 0); |
|
|
|
for (n = 7; n <= 12; n++) { |
|
fprintf(outfile, "%c", headers[n] & 0x000000FF); |
|
fprintf(outfile, "%c", (headers[n] & 0x0000FF00) >> 8); |
|
fprintf(outfile, "%c", (headers[n] & 0x00FF0000) >> 16); |
|
fprintf(outfile, "%c", (headers[n] & (unsigned int)0xFF000000) >> 24); |
|
} |
|
|
|
// |
|
// Headers done, now write the data... |
|
// |
|
for (y = height - 1; y >= 0; |
|
y--) // BMP image format is written from bottom to top... |
|
{ |
|
for (x = 0; x <= width - 1; x++) { |
|
red = chanRGB[(y * width + x) * 3]; |
|
green = chanRGB[(y * width + x) * 3 + 1]; |
|
blue = chanRGB[(y * width + x) * 3 + 2]; |
|
|
|
if (red > 255) red = 255; |
|
if (red < 0) red = 0; |
|
if (green > 255) green = 255; |
|
if (green < 0) green = 0; |
|
if (blue > 255) blue = 255; |
|
if (blue < 0) blue = 0; |
|
// Also, it's written in (b,g,r) format... |
|
|
|
fprintf(outfile, "%c", blue); |
|
fprintf(outfile, "%c", green); |
|
fprintf(outfile, "%c", red); |
|
} |
|
if (extrabytes) // See above - BMP lines must be of lengths divisible by 4. |
|
{ |
|
for (n = 1; n <= extrabytes; n++) { |
|
fprintf(outfile, "%c", 0); |
|
} |
|
} |
|
} |
|
|
|
fclose(outfile); |
|
return 0; |
|
} |
|
|
|
int inputDirExists(const char *pathname) { |
|
struct stat info; |
|
if (stat(pathname, &info) != 0) { |
|
return 0; // Directory does not exists |
|
} else if (info.st_mode & S_IFDIR) { |
|
// is a directory |
|
return 1; |
|
} else { |
|
// is not a directory |
|
return 0; |
|
} |
|
} |
|
|
|
int readInput(const std::string &sInputPath, |
|
std::vector<std::string> &filelist) { |
|
int error_code = 1; |
|
#ifndef _WIN64 |
|
struct stat s; |
|
|
|
if (stat(sInputPath.c_str(), &s) == 0) { |
|
if (s.st_mode & S_IFREG) { |
|
filelist.push_back(sInputPath); |
|
} else if (s.st_mode & S_IFDIR) { |
|
// processing each file in directory |
|
DIR *dir_handle; |
|
struct dirent *dir; |
|
dir_handle = opendir(sInputPath.c_str()); |
|
std::vector<std::string> filenames; |
|
if (dir_handle) { |
|
error_code = 0; |
|
while ((dir = readdir(dir_handle)) != NULL) { |
|
std::string sFileName = sInputPath + dir->d_name; |
|
if (inputDirExists(sFileName.c_str())) |
|
{ |
|
std::string sname = dir->d_name; |
|
if (sname != "." && sname != "..") { |
|
readInput(sInputPath + sname + "/", filelist); |
|
} |
|
} |
|
else |
|
{ |
|
filelist.push_back(sFileName); |
|
} |
|
} |
|
closedir(dir_handle); |
|
} else { |
|
std::cout << "Cannot open input directory: " << sInputPath << std::endl; |
|
return error_code; |
|
} |
|
} else { |
|
std::cout << "Cannot open input: " << sInputPath << std::endl; |
|
return error_code; |
|
} |
|
} else { |
|
std::cout << "Cannot find input path " << sInputPath << std::endl; |
|
return error_code; |
|
} |
|
#else |
|
std::string search_path = sInputPath + "/*.*"; |
|
WIN32_FIND_DATA fd; |
|
HANDLE hFind = ::FindFirstFile(search_path.c_str(), &fd); |
|
if (hFind != INVALID_HANDLE_VALUE) { |
|
do { |
|
// read all (real) files in current folder |
|
// , delete '!' read other 2 default folder . and .. |
|
if (!(fd.dwFileAttributes & FILE_ATTRIBUTE_DIRECTORY)) { |
|
std::string temp(sInputPath + "\\" + fd.cFileName); |
|
filelist.push_back(temp); |
|
} |
|
} while (::FindNextFile(hFind, &fd)); |
|
::FindClose(hFind); |
|
} else { |
|
std::cout << "Cannot open input directory: " << sInputPath << std::endl; |
|
return error_code; |
|
} |
|
#endif |
|
return 0; |
|
} |
|
|
|
|
|
int getInputDir(std::string &input_dir, const char *executable_path) { |
|
int found = 0; |
|
if (executable_path != 0) { |
|
std::string executable_name = std::string(executable_path); |
|
#if defined(WIN32) || defined(_WIN32) || defined(WIN64) || defined(_WIN64) |
|
// Windows path delimiter |
|
size_t delimiter_pos = executable_name.find_last_of('\\'); |
|
executable_name.erase(0, delimiter_pos + 1); |
|
|
|
if (executable_name.rfind(".exe") != std::string::npos) { |
|
// we strip .exe, only if the .exe is found |
|
executable_name.resize(executable_name.size() - 4); |
|
} |
|
#else |
|
// Linux & OSX path delimiter |
|
size_t delimiter_pos = executable_name.find_last_of('/'); |
|
executable_name.erase(0, delimiter_pos + 1); |
|
#endif |
|
|
|
// Search in default paths for input images. |
|
std::string pathname = ""; |
|
const char *searchPath[] = { |
|
"./images", |
|
"../../../../Samples/4_CUDA_Libraries/<executable_name>/images", |
|
"../../../Samples/4_CUDA_Libraries/<executable_name>/images", |
|
"../../Samples/4_CUDA_Libraries/<executable_name>/images"}; |
|
|
|
for (unsigned int i = 0; i < sizeof(searchPath) / sizeof(char *); ++i) { |
|
std::string pathname(searchPath[i]); |
|
size_t executable_name_pos = pathname.find("<executable_name>"); |
|
|
|
// If there is executable_name variable in the searchPath |
|
// replace it with the value |
|
if (executable_name_pos != std::string::npos) { |
|
pathname.replace(executable_name_pos, strlen("<executable_name>"), |
|
executable_name); |
|
} |
|
|
|
if (inputDirExists(pathname.c_str())) { |
|
input_dir = pathname + "/"; |
|
found = 1; |
|
break; |
|
} |
|
} |
|
} |
|
return found; |
|
} |
|
|
|
#endif |