43#include "MagickCore/studio.h"
44#include "MagickCore/accelerate-kernels-private.h"
45#include "MagickCore/artifact.h"
46#include "MagickCore/cache.h"
47#include "MagickCore/cache-private.h"
48#include "MagickCore/color.h"
49#include "MagickCore/compare.h"
50#include "MagickCore/constitute.h"
51#include "MagickCore/configure.h"
52#include "MagickCore/distort.h"
53#include "MagickCore/draw.h"
54#include "MagickCore/effect.h"
55#include "MagickCore/exception.h"
56#include "MagickCore/exception-private.h"
57#include "MagickCore/fx.h"
58#include "MagickCore/gem.h"
59#include "MagickCore/geometry.h"
60#include "MagickCore/image.h"
61#include "MagickCore/image-private.h"
62#include "MagickCore/layer.h"
63#include "MagickCore/locale_.h"
64#include "MagickCore/mime-private.h"
65#include "MagickCore/memory_.h"
66#include "MagickCore/memory-private.h"
67#include "MagickCore/monitor.h"
68#include "MagickCore/montage.h"
69#include "MagickCore/morphology.h"
70#include "MagickCore/nt-base.h"
71#include "MagickCore/nt-base-private.h"
72#include "MagickCore/opencl.h"
73#include "MagickCore/opencl-private.h"
74#include "MagickCore/option.h"
75#include "MagickCore/policy.h"
76#include "MagickCore/property.h"
77#include "MagickCore/quantize.h"
78#include "MagickCore/quantum.h"
79#include "MagickCore/random_.h"
80#include "MagickCore/random-private.h"
81#include "MagickCore/resample.h"
82#include "MagickCore/resource_.h"
83#include "MagickCore/splay-tree.h"
84#include "MagickCore/semaphore.h"
85#include "MagickCore/statistic.h"
86#include "MagickCore/string_.h"
87#include "MagickCore/string-private.h"
88#include "MagickCore/token.h"
89#include "MagickCore/utility.h"
90#include "MagickCore/utility-private.h"
92#if defined(MAGICKCORE_OPENCL_SUPPORT)
93#if defined(MAGICKCORE_LTDL_DELEGATE)
100#define IMAGEMAGICK_PROFILE_FILE "ImagemagickOpenCLDeviceProfile.xml"
126} MagickCLDeviceBenchmark;
132static MagickBooleanType
133 HasOpenCLDevices(MagickCLEnv,ExceptionInfo *),
134 LoadOpenCLLibrary(
void);
137 RelinquishMagickCLDevice(MagickCLDevice);
140 RelinquishMagickCLEnv(MagickCLEnv);
143 BenchmarkOpenCLDevices(MagickCLEnv);
161 *cache_directory_lock;
163static inline MagickBooleanType IsSameOpenCLDevice(MagickCLDevice a,
166 if ((LocaleCompare(a->platform_name,b->platform_name) == 0) &&
167 (LocaleCompare(a->vendor_name,b->vendor_name) == 0) &&
168 (LocaleCompare(a->name,b->name) == 0) &&
169 (LocaleCompare(a->version,b->version) == 0) &&
170 (a->max_clock_frequency == b->max_clock_frequency) &&
171 (a->max_compute_units == b->max_compute_units))
177static inline MagickBooleanType IsBenchmarkedOpenCLDevice(MagickCLDevice a,
178 MagickCLDeviceBenchmark *b)
180 if ((LocaleCompare(a->platform_name,b->platform_name) == 0) &&
181 (LocaleCompare(a->vendor_name,b->vendor_name) == 0) &&
182 (LocaleCompare(a->name,b->name) == 0) &&
183 (LocaleCompare(a->version,b->version) == 0) &&
184 (a->max_clock_frequency == b->max_clock_frequency) &&
185 (a->max_compute_units == b->max_compute_units))
191static inline void RelinquishMagickCLDevices(MagickCLEnv clEnv)
196 if (clEnv->devices != (MagickCLDevice *) NULL)
198 for (i = 0; i < clEnv->number_devices; i++)
199 clEnv->devices[i]=RelinquishMagickCLDevice(clEnv->devices[i]);
200 clEnv->devices=(MagickCLDevice *) RelinquishMagickMemory(clEnv->devices);
202 clEnv->number_devices=0;
205static inline MagickBooleanType MagickCreateDirectory(
const char *path)
210#ifdef MAGICKCORE_WINDOWS_SUPPORT
213 status=mkdir(path,0777);
215 return(status == 0 ? MagickTrue : MagickFalse);
218static inline void InitAccelerateTimer(AccelerateTimer *timer)
221 QueryPerformanceFrequency((LARGE_INTEGER*)&timer->freq);
223 timer->freq=(
long long)1.0E3;
229static inline double ReadAccelerateTimer(AccelerateTimer *timer)
231 return (
double)timer->clocks/(double)timer->freq;
234static inline void StartAccelerateTimer(AccelerateTimer* timer)
237 QueryPerformanceCounter((LARGE_INTEGER*)&timer->start);
242 timer->start=(
long long)s.tv_sec*(
long long)1.0E3+(
long long)s.tv_usec/
247static inline void StopAccelerateTimer(AccelerateTimer *timer)
254 QueryPerformanceCounter((LARGE_INTEGER*)&(n));
259 n=(
long long)s.tv_sec*(
long long)1.0E3+(
long long)s.tv_usec/
267static const char *GetOpenCLCacheDirectory()
269 if (cache_directory == (
char *) NULL)
272 ActivateSemaphoreInfo(&cache_directory_lock);
273 LockSemaphoreInfo(cache_directory_lock);
274 if (cache_directory == (
char *) NULL)
278 path[MagickPathExtent],
288 home=GetEnvironmentValue(
"MAGICK_OPENCL_CACHE_DIR");
289 if (home == (
char *) NULL)
291 home=GetEnvironmentValue(
"XDG_CACHE_HOME");
292#if defined(MAGICKCORE_WINDOWS_SUPPORT) || defined(__MINGW32__)
293 if (home == (
char *) NULL)
294 home=GetEnvironmentValue(
"LOCALAPPDATA");
295 if (home == (
char *) NULL)
296 home=GetEnvironmentValue(
"APPDATA");
297 if (home == (
char *) NULL)
298 home=GetEnvironmentValue(
"USERPROFILE");
302 if (home != (
char *) NULL)
305 (void) FormatLocaleString(path,MagickPathExtent,
"%s",home);
306 status=GetPathAttributes(path,&attributes);
307 if (status == MagickFalse)
308 status=MagickCreateDirectory(path);
311 if (status != MagickFalse)
313 (void) FormatLocaleString(path,MagickPathExtent,
314 "%s%sImageMagick",home,DirectorySeparator);
316 status=GetPathAttributes(path,&attributes);
317 if (status == MagickFalse)
318 status=MagickCreateDirectory(path);
321 if (status != MagickFalse)
323 temp=(
char*) AcquireCriticalMemory(strlen(path)+1);
324 (void) CopyMagickString(temp,path,strlen(path)+1);
326 home=DestroyString(home);
330 home=GetEnvironmentValue(
"HOME");
331 if (home != (
char *) NULL)
334 (void) FormatLocaleString(path,MagickPathExtent,
"%s%s.cache",
335 home,DirectorySeparator);
336 status=GetPathAttributes(path,&attributes);
337 if (status == MagickFalse)
338 status=MagickCreateDirectory(path);
341 if (status != MagickFalse)
343 (void) FormatLocaleString(path,MagickPathExtent,
344 "%s%s.cache%sImageMagick",home,DirectorySeparator,
346 status=GetPathAttributes(path,&attributes);
347 if (status == MagickFalse)
348 status=MagickCreateDirectory(path);
351 if (status != MagickFalse)
353 temp=(
char*) AcquireCriticalMemory(strlen(path)+1);
354 (void) CopyMagickString(temp,path,strlen(path)+1);
356 home=DestroyString(home);
359 if (temp == (
char *) NULL)
361 temp=AcquireString(
"?");
362 (void) LogMagickEvent(AccelerateEvent,GetMagickModule(),
363 "Cannot use cache directory: \"%s\"",path);
366 (
void) LogMagickEvent(AccelerateEvent,GetMagickModule(),
367 "Using cache directory: \"%s\"",temp);
368 cache_directory=temp;
370 UnlockSemaphoreInfo(cache_directory_lock);
372 if (*cache_directory ==
'?')
373 return((
const char *) NULL);
374 return(cache_directory);
377static void SelectOpenCLDevice(MagickCLEnv clEnv,cl_device_type type)
386 (void) LogMagickEvent(AccelerateEvent,GetMagickModule(),
387 "Selecting device for type: %d",(
int) type);
388 for (i = 0; i < clEnv->number_devices; i++)
389 clEnv->devices[i]->enabled=MagickFalse;
391 for (i = 0; i < clEnv->number_devices; i++)
393 device=clEnv->devices[i];
394 if (device->type != type)
397 device->enabled=MagickTrue;
398 (void) LogMagickEvent(AccelerateEvent,GetMagickModule(),
399 "Selected device: %s",device->name);
400 for (j = i+1; j < clEnv->number_devices; j++)
405 other_device=clEnv->devices[j];
406 if (IsSameOpenCLDevice(device,other_device))
407 other_device->enabled=MagickTrue;
412static size_t StringSignature(
const char*
string)
427 stringLength=(size_t) strlen(
string);
428 signature=stringLength;
429 n=stringLength/
sizeof(size_t);
431 for (i = 0; i < n; i++)
433 if (n *
sizeof(
size_t) != stringLength)
439 for (i = 0; i < 4; i++, j++)
441 if (j < stringLength)
452static void DestroyMagickCLCacheInfo(MagickCLCacheInfo info)
457 for (i=0; i < (ssize_t) info->event_count; i++)
458 openCL_library->clReleaseEvent(info->events[i]);
459 info->events=(cl_event *) RelinquishMagickMemory(info->events);
460 if (info->buffer != (cl_mem) NULL)
461 openCL_library->clReleaseMemObject(info->buffer);
462 RelinquishSemaphoreInfo(&info->events_semaphore);
463 ReleaseOpenCLDevice(info->device);
464 RelinquishMagickMemory(info);
471MagickPrivate cl_mem CreateOpenCLBuffer(MagickCLDevice device,
472 cl_mem_flags flags,
size_t size,
void *host_ptr)
474 return(openCL_library->clCreateBuffer(device->context,flags,size,host_ptr,
478MagickPrivate
void ReleaseOpenCLKernel(cl_kernel kernel)
480 (void) openCL_library->clReleaseKernel(kernel);
483MagickPrivate
void ReleaseOpenCLMemObject(cl_mem memobj)
485 (void) openCL_library->clReleaseMemObject(memobj);
488MagickPrivate
void RetainOpenCLMemObject(cl_mem memobj)
490 (void) openCL_library->clRetainMemObject(memobj);
493MagickPrivate cl_int SetOpenCLKernelArg(cl_kernel kernel,
size_t arg_index,
494 size_t arg_size,
const void *arg_value)
496 return(openCL_library->clSetKernelArg(kernel,(cl_uint) arg_index,arg_size,
528MagickPrivate MagickCLCacheInfo AcquireMagickCLCacheInfo(MagickCLDevice device,
529 Quantum *pixels,
const MagickSizeType length)
537 info=(MagickCLCacheInfo) AcquireCriticalMemory(
sizeof(*info));
538 (void) memset(info,0,
sizeof(*info));
539 LockSemaphoreInfo(openCL_lock);
541 UnlockSemaphoreInfo(openCL_lock);
545 info->events_semaphore=AcquireSemaphoreInfo();
546 info->buffer=openCL_library->clCreateBuffer(device->context,
547 CL_MEM_READ_WRITE | CL_MEM_USE_HOST_PTR,(
size_t) length,(
void *) pixels,
549 if (status == CL_SUCCESS)
551 DestroyMagickCLCacheInfo(info);
552 return((MagickCLCacheInfo) NULL);
574static MagickCLDevice AcquireMagickCLDevice()
579 device=(MagickCLDevice) AcquireMagickMemory(
sizeof(*device));
582 (void) memset(device,0,
sizeof(*device));
583 ActivateSemaphoreInfo(&device->lock);
584 device->score=MAGICKCORE_OPENCL_UNDEFINED_SCORE;
585 device->command_queues_index=-1;
586 device->enabled=MagickTrue;
606static MagickCLEnv AcquireMagickCLEnv(
void)
614 clEnv=(MagickCLEnv) AcquireMagickMemory(
sizeof(*clEnv));
615 if (clEnv != (MagickCLEnv) NULL)
617 (void) memset(clEnv,0,
sizeof(*clEnv));
618 ActivateSemaphoreInfo(&clEnv->lock);
619 clEnv->cpu_score=MAGICKCORE_OPENCL_UNDEFINED_SCORE;
620 clEnv->enabled=MagickFalse;
621 option=GetEnvironmentValue(
"MAGICK_OCL_DEVICE");
622 if (option != (
const char *) NULL)
624 if ((IsStringTrue(option) != MagickFalse) ||
625 (strcmp(option,
"GPU") == 0) ||
626 (strcmp(option,
"CPU") == 0))
627 clEnv->enabled=MagickTrue;
628 option=DestroyString(option);
657MagickPrivate cl_command_queue AcquireOpenCLCommandQueue(MagickCLDevice device)
662 cl_command_queue_properties
665 assert(device != (MagickCLDevice) NULL);
666 LockSemaphoreInfo(device->lock);
667 if ((device->profile_kernels == MagickFalse) &&
668 (device->command_queues_index >= 0))
670 queue=device->command_queues[device->command_queues_index--];
671 UnlockSemaphoreInfo(device->lock);
675 UnlockSemaphoreInfo(device->lock);
677 if (device->profile_kernels != MagickFalse)
678 properties=CL_QUEUE_PROFILING_ENABLE;
679 queue=openCL_library->clCreateCommandQueue(device->context,
680 device->deviceID,properties,(cl_int *) NULL);
713MagickPrivate cl_kernel AcquireOpenCLKernel(MagickCLDevice device,
714 const char *kernel_name)
719 assert(device != (MagickCLDevice) NULL);
720 (void) LogMagickEvent(AccelerateEvent,GetMagickModule(),
"Using kernel: %s",
722 kernel=openCL_library->clCreateKernel(device->program,kernel_name,
753#if !MAGICKCORE_ZERO_CONFIGURATION_SUPPORT
754static MagickCLDeviceBenchmark* RelinquishDeviceBenchmark(
755 MagickCLDeviceBenchmark *device_benchmark)
757 if (device_benchmark == (MagickCLDeviceBenchmark*) NULL)
758 return((MagickCLDeviceBenchmark *) NULL);
760 device_benchmark->platform_name=(
char *) RelinquishMagickMemory(
761 device_benchmark->platform_name);
762 device_benchmark->vendor_name=(
char *) RelinquishMagickMemory(
763 device_benchmark->vendor_name);
764 device_benchmark->name=(
char *) RelinquishMagickMemory(
765 device_benchmark->name);
766 device_benchmark->version=(
char *) RelinquishMagickMemory(
767 device_benchmark->version);
768 return((MagickCLDeviceBenchmark *) RelinquishMagickMemory(
772static void LoadOpenCLDeviceBenchmark(MagickCLEnv clEnv,
const char *xml)
775 keyword[MagickPathExtent],
781 MagickCLDeviceBenchmark
788 if (xml == (
char *) NULL)
790 device_benchmark=(MagickCLDeviceBenchmark *) NULL;
791 token=AcquireString(xml);
792 extent=strlen(token)+MagickPathExtent;
793 for (q=(
char *) xml; *q !=
'\0'; )
798 (void) GetNextToken(q,&q,extent,token);
801 (void) CopyMagickString(keyword,token,MagickPathExtent);
802 if (LocaleNCompare(keyword,
"<!DOCTYPE",9) == 0)
807 while ((LocaleNCompare(q,
"]>",2) != 0) && (*q !=
'\0'))
808 (void) GetNextToken(q,&q,extent,token);
811 if (LocaleNCompare(keyword,
"<!--",4) == 0)
816 while ((LocaleNCompare(q,
"->",2) != 0) && (*q !=
'\0'))
817 (void) GetNextToken(q,&q,extent,token);
820 if (LocaleCompare(keyword,
"<device") == 0)
825 device_benchmark=(MagickCLDeviceBenchmark *) AcquireQuantumMemory(1,
826 sizeof(*device_benchmark));
827 if (device_benchmark == (MagickCLDeviceBenchmark *) NULL)
829 (void) memset(device_benchmark,0,
sizeof(*device_benchmark));
830 device_benchmark->score=MAGICKCORE_OPENCL_UNDEFINED_SCORE;
833 if (device_benchmark == (MagickCLDeviceBenchmark *) NULL)
835 if (LocaleCompare(keyword,
"/>") == 0)
837 if (device_benchmark->score != MAGICKCORE_OPENCL_UNDEFINED_SCORE)
839 if (LocaleCompare(device_benchmark->name,
"CPU") == 0)
840 clEnv->cpu_score=device_benchmark->score;
849 for (i = 0; i < clEnv->number_devices; i++)
851 device=clEnv->devices[i];
852 if (IsBenchmarkedOpenCLDevice(device,device_benchmark))
853 device->score=device_benchmark->score;
857 device_benchmark=RelinquishDeviceBenchmark(device_benchmark);
860 (void) GetNextToken(q,(
const char **) NULL,extent,token);
863 (void) GetNextToken(q,&q,extent,token);
864 (void) GetNextToken(q,&q,extent,token);
870 if (LocaleCompare((
char *) keyword,
"maxClockFrequency") == 0)
872 device_benchmark->max_clock_frequency=StringToInteger(token);
875 if (LocaleCompare((
char *) keyword,
"maxComputeUnits") == 0)
877 device_benchmark->max_compute_units=StringToInteger(token);
885 if (LocaleCompare((
char *) keyword,
"name") == 0)
886 device_benchmark->name=ConstantString(token);
892 if (LocaleCompare((
char *) keyword,
"platform") == 0)
893 device_benchmark->platform_name=ConstantString(token);
899 if (LocaleCompare((
char *) keyword,
"score") == 0)
900 device_benchmark->score=StringToDouble(token,(
char **) NULL);
906 if (LocaleCompare((
char *) keyword,
"vendor") == 0)
907 device_benchmark->vendor_name=ConstantString(token);
908 if (LocaleCompare((
char *) keyword,
"version") == 0)
909 device_benchmark->version=ConstantString(token);
916 token=(
char *) RelinquishMagickMemory(token);
917 device_benchmark=RelinquishDeviceBenchmark(device_benchmark);
920static MagickBooleanType CanWriteProfileToFile(
const char *filename)
925 profileFile=fopen_utf8(filename,
"ab");
927 if (profileFile == (FILE *) NULL)
929 (void) LogMagickEvent(AccelerateEvent,GetMagickModule(),
930 "Unable to save profile to: \"%s\"",filename);
939static MagickBooleanType LoadOpenCLBenchmarks(MagickCLEnv clEnv)
941#if !MAGICKCORE_ZERO_CONFIGURATION_SUPPORT
943 filename[MagickPathExtent];
948 (void) FormatLocaleString(filename,MagickPathExtent,
"%s%s%s",
949 GetOpenCLCacheDirectory(),DirectorySeparator,IMAGEMAGICK_PROFILE_FILE);
955 if (CanWriteProfileToFile(filename) == MagickFalse)
961 for (i = 0; i < clEnv->number_devices; i++)
962 clEnv->devices[i]->score=1.0;
964 SelectOpenCLDevice(clEnv,CL_DEVICE_TYPE_GPU);
967#if !MAGICKCORE_ZERO_CONFIGURATION_SUPPORT
968 option=ConfigureFileToStringInfo(filename);
969 LoadOpenCLDeviceBenchmark(clEnv,(
const char *) GetStringInfoDatum(option));
970 option=DestroyStringInfo(option);
975static void AutoSelectOpenCLDevices(MagickCLEnv clEnv)
989 option=GetEnvironmentValue(
"MAGICK_OCL_DEVICE");
990 if (option != (
const char *) NULL)
992 if (strcmp(option,
"GPU") == 0)
993 SelectOpenCLDevice(clEnv,CL_DEVICE_TYPE_GPU);
994 else if (strcmp(option,
"CPU") == 0)
995 SelectOpenCLDevice(clEnv,CL_DEVICE_TYPE_CPU);
996 option=DestroyString(option);
999 if (LoadOpenCLBenchmarks(clEnv) == MagickFalse)
1002 benchmark=MagickFalse;
1003 if (clEnv->cpu_score == MAGICKCORE_OPENCL_UNDEFINED_SCORE)
1004 benchmark=MagickTrue;
1007 for (i = 0; i < clEnv->number_devices; i++)
1009 if (clEnv->devices[i]->score == MAGICKCORE_OPENCL_UNDEFINED_SCORE)
1011 benchmark=MagickTrue;
1017 if (benchmark != MagickFalse)
1018 BenchmarkOpenCLDevices(clEnv);
1020 best_score=clEnv->cpu_score;
1021 for (i = 0; i < clEnv->number_devices; i++)
1022 best_score=MagickMin(clEnv->devices[i]->score,best_score);
1024 for (i = 0; i < clEnv->number_devices; i++)
1026 if (clEnv->devices[i]->score != best_score)
1027 clEnv->devices[i]->enabled=MagickFalse;
1056static double RunOpenCLBenchmark(MagickBooleanType is_cpu)
1073 exception=AcquireExceptionInfo();
1074 imageInfo=AcquireImageInfo();
1075 CloneString(&imageInfo->size,
"2048x1536");
1076 (void) CopyMagickString(imageInfo->filename,
"xc:none",MagickPathExtent);
1077 inputImage=ReadImage(imageInfo,exception);
1078 if (inputImage == (Image *) NULL)
1081 InitAccelerateTimer(&timer);
1083 for (i=0; i<=2; i++)
1091 StartAccelerateTimer(&timer);
1093 blurredImage=BlurImage(inputImage,10.0f,3.5f,exception);
1094 unsharpedImage=UnsharpMaskImage(blurredImage,2.0f,2.0f,50.0f,10.0f,
1096 resizedImage=ResizeImage(unsharpedImage,640,480,LanczosFilter,
1103 if (is_cpu == MagickFalse)
1108 cache_info=(CacheInfo *) resizedImage->cache;
1109 if (cache_info->opencl != (MagickCLCacheInfo) NULL)
1110 openCL_library->clWaitForEvents(cache_info->opencl->event_count,
1111 cache_info->opencl->events);
1115 StopAccelerateTimer(&timer);
1117 if (blurredImage != (Image *) NULL)
1118 DestroyImage(blurredImage);
1119 if (unsharpedImage != (Image *) NULL)
1120 DestroyImage(unsharpedImage);
1121 if (resizedImage != (Image *) NULL)
1122 DestroyImage(resizedImage);
1124 DestroyImage(inputImage);
1125 return(ReadAccelerateTimer(&timer));
1128static void RunDeviceBenchmark(MagickCLEnv clEnv,MagickCLEnv testEnv,
1129 MagickCLDevice device)
1131 testEnv->devices[0]=device;
1132 default_CLEnv=testEnv;
1133 device->score=RunOpenCLBenchmark(MagickFalse);
1134 default_CLEnv=clEnv;
1135 testEnv->devices[0]=(MagickCLDevice) NULL;
1138static void CacheOpenCLBenchmarks(MagickCLEnv clEnv)
1141 filename[MagickPathExtent];
1153 (void) FormatLocaleString(filename,MagickPathExtent,
"%s%s%s",
1154 GetOpenCLCacheDirectory(),DirectorySeparator,
1155 IMAGEMAGICK_PROFILE_FILE);
1157 cache_file=fopen_utf8(filename,
"wb");
1158 if (cache_file == (FILE *) NULL)
1160 fwrite(
"<devices>\n",
sizeof(
char),10,cache_file);
1161 fprintf(cache_file,
" <device name=\"CPU\" score=\"%.4g\"/>\n",
1163 for (i = 0; i < clEnv->number_devices; i++)
1168 device=clEnv->devices[i];
1169 duplicate=MagickFalse;
1170 for (j = 0; j < i; j++)
1172 if (IsSameOpenCLDevice(clEnv->devices[j],device))
1174 duplicate=MagickTrue;
1182 if (device->score != MAGICKCORE_OPENCL_UNDEFINED_SCORE)
1183 fprintf(cache_file,
" <device platform=\"%s\" vendor=\"%s\" name=\"%s\"\
1184 version=\"%s\" maxClockFrequency=\"%d\" maxComputeUnits=\"%d\"\
1185 score=\"%.4g\"/>\n",
1186 device->platform_name,device->vendor_name,device->name,device->version,
1187 (
int)device->max_clock_frequency,(
int)device->max_compute_units,
1190 fwrite(
"</devices>",
sizeof(
char),10,cache_file);
1195static void BenchmarkOpenCLDevices(MagickCLEnv clEnv)
1207 (void) LogMagickEvent(AccelerateEvent,GetMagickModule(),
1208 "Starting benchmark");
1209 testEnv=AcquireMagickCLEnv();
1210 testEnv->library=openCL_library;
1211 testEnv->devices=(MagickCLDevice *) AcquireCriticalMemory(
1212 sizeof(MagickCLDevice));
1213 testEnv->number_devices=1;
1214 testEnv->benchmark_thread_id=GetMagickThreadId();
1215 testEnv->initialized=MagickTrue;
1217 for (i = 0; i < clEnv->number_devices; i++)
1218 clEnv->devices[i]->score=MAGICKCORE_OPENCL_UNDEFINED_SCORE;
1220 for (i = 0; i < clEnv->number_devices; i++)
1222 device=clEnv->devices[i];
1223 if (device->score == MAGICKCORE_OPENCL_UNDEFINED_SCORE)
1224 RunDeviceBenchmark(clEnv,testEnv,device);
1227 for (j = i+1; j < clEnv->number_devices; j++)
1232 other_device=clEnv->devices[j];
1233 if (IsSameOpenCLDevice(device,other_device))
1234 other_device->score=device->score;
1238 testEnv->enabled=MagickFalse;
1239 default_CLEnv=testEnv;
1240 clEnv->cpu_score=RunOpenCLBenchmark(MagickTrue);
1241 default_CLEnv=clEnv;
1243 testEnv=RelinquishMagickCLEnv(testEnv);
1244 CacheOpenCLBenchmarks(clEnv);
1281static void CacheOpenCLKernel(MagickCLDevice device,
char *filename,
1282 ExceptionInfo *exception)
1293 status=openCL_library->clGetProgramInfo(device->program,
1294 CL_PROGRAM_BINARY_SIZES,
sizeof(
size_t),&binaryProgramSize,NULL);
1295 if (status != CL_SUCCESS)
1297 binaryProgram=(
unsigned char*) AcquireQuantumMemory(1,binaryProgramSize);
1298 if (binaryProgram == (
unsigned char *) NULL)
1300 (void) ThrowMagickException(exception,GetMagickModule(),
1301 ResourceLimitError,
"MemoryAllocationFailed",
"`%s'",filename);
1304 status=openCL_library->clGetProgramInfo(device->program,
1305 CL_PROGRAM_BINARIES,
sizeof(
unsigned char*),&binaryProgram,NULL);
1306 if (status == CL_SUCCESS)
1308 (void) LogMagickEvent(AccelerateEvent,GetMagickModule(),
1309 "Creating cache file: \"%s\"",filename);
1310 (void) BlobToFile(filename,binaryProgram,binaryProgramSize,exception);
1312 binaryProgram=(
unsigned char *) RelinquishMagickMemory(binaryProgram);
1315static MagickBooleanType LoadCachedOpenCLKernels(MagickCLDevice device,
1316 const char *filename)
1331 sans_exception=AcquireExceptionInfo();
1332 binaryProgram=(
unsigned char *) FileToBlob(filename,SIZE_MAX,&length,
1334 sans_exception=DestroyExceptionInfo(sans_exception);
1335 if (binaryProgram == (
unsigned char *) NULL)
1336 return(MagickFalse);
1337 (void) LogMagickEvent(AccelerateEvent,GetMagickModule(),
1338 "Loaded cached kernels: \"%s\"",filename);
1339 device->program=openCL_library->clCreateProgramWithBinary(device->context,1,
1340 &device->deviceID,&length,(
const unsigned char**)&binaryProgram,
1341 &binaryStatus,&status);
1342 binaryProgram=(
unsigned char *) RelinquishMagickMemory(binaryProgram);
1343 return((status != CL_SUCCESS) || (binaryStatus != CL_SUCCESS) ? MagickFalse :
1347static void LogOpenCLBuildFailure(MagickCLDevice device,
const char *kernel,
1348 ExceptionInfo *exception)
1351 filename[MagickPathExtent],
1357 (void) FormatLocaleString(filename,MagickPathExtent,
"%s%s%s",
1358 GetOpenCLCacheDirectory(),DirectorySeparator,
"magick_badcl.cl");
1360 (void) remove_utf8(filename);
1361 (void) BlobToFile(filename,kernel,strlen(kernel),exception);
1363 openCL_library->clGetProgramBuildInfo(device->program,device->deviceID,
1364 CL_PROGRAM_BUILD_LOG,0,NULL,&log_size);
1365 log=(
char*)AcquireCriticalMemory(log_size);
1366 openCL_library->clGetProgramBuildInfo(device->program,device->deviceID,
1367 CL_PROGRAM_BUILD_LOG,log_size,log,&log_size);
1369 (void) FormatLocaleString(filename,MagickPathExtent,
"%s%s%s",
1370 GetOpenCLCacheDirectory(),DirectorySeparator,
"magick_badcl.log");
1372 (void) remove_utf8(filename);
1373 (void) BlobToFile(filename,log,log_size,exception);
1374 log=(
char*)RelinquishMagickMemory(log);
1377static MagickBooleanType CompileOpenCLKernel(MagickCLDevice device,
1378 const char *kernel,
const char *options,
size_t signature,
1379 ExceptionInfo *exception)
1382 deviceName[MagickPathExtent],
1383 filename[MagickPathExtent],
1395 (void) CopyMagickString(deviceName,device->name,MagickPathExtent);
1398 while (*ptr !=
'\0')
1400 if ((*ptr ==
' ') || (*ptr ==
'\\') || (*ptr ==
'/') || (*ptr ==
':') ||
1401 (*ptr ==
'*') || (*ptr ==
'?') || (*ptr ==
'"') || (*ptr ==
'<') ||
1402 (*ptr ==
'>' || *ptr ==
'|'))
1406 (void) FormatLocaleString(filename,MagickPathExtent,
1407 "%s%s%s_%s_%08x_%.20g.bin",GetOpenCLCacheDirectory(),
1408 DirectorySeparator,
"magick_opencl",deviceName,(
unsigned int) signature,
1409 (
double)
sizeof(
char*)*8);
1410 loaded=LoadCachedOpenCLKernels(device,filename);
1411 if (loaded == MagickFalse)
1414 length=strlen(kernel);
1415 device->program=openCL_library->clCreateProgramWithSource(
1416 device->context,1,&kernel,&length,&status);
1417 if (status != CL_SUCCESS)
1418 return(MagickFalse);
1421 status=openCL_library->clBuildProgram(device->program,1,&device->deviceID,
1423 if (status != CL_SUCCESS)
1425 (void) ThrowMagickException(exception,GetMagickModule(),DelegateWarning,
1426 "clBuildProgram failed.",
"(%d)",(
int)status);
1427 LogOpenCLBuildFailure(device,kernel,exception);
1428 return(MagickFalse);
1432 if (loaded == MagickFalse)
1433 CacheOpenCLKernel(device,filename,exception);
1438static cl_event* CopyOpenCLEvents(MagickCLCacheInfo first,
1439 MagickCLCacheInfo second,cl_uint *event_count)
1450 assert(first != (MagickCLCacheInfo) NULL);
1451 assert(event_count != (cl_uint *) NULL);
1452 events=(cl_event *) NULL;
1453 LockSemaphoreInfo(first->events_semaphore);
1454 if (second != (MagickCLCacheInfo) NULL)
1455 LockSemaphoreInfo(second->events_semaphore);
1456 *event_count=first->event_count;
1457 if (second != (MagickCLCacheInfo) NULL)
1458 *event_count+=second->event_count;
1459 if (*event_count > 0)
1461 events=(cl_event *) AcquireQuantumMemory(*event_count,
sizeof(*events));
1462 if (events == (cl_event *) NULL)
1467 for (i=0; i < first->event_count; i++, j++)
1468 events[j]=first->events[i];
1469 if (second != (MagickCLCacheInfo) NULL)
1471 for (i=0; i < second->event_count; i++, j++)
1472 events[j]=second->events[i];
1476 UnlockSemaphoreInfo(first->events_semaphore);
1477 if (second != (MagickCLCacheInfo) NULL)
1478 UnlockSemaphoreInfo(second->events_semaphore);
1504MagickPrivate MagickCLCacheInfo CopyMagickCLCacheInfo(MagickCLCacheInfo info)
1518 if (info == (MagickCLCacheInfo) NULL)
1519 return((MagickCLCacheInfo) NULL);
1520 events=CopyOpenCLEvents(info,(MagickCLCacheInfo) NULL,&event_count);
1521 if (events != (cl_event *) NULL)
1523 queue=AcquireOpenCLCommandQueue(info->device);
1524 pixels=(Quantum *) openCL_library->clEnqueueMapBuffer(queue,info->buffer,
1525 CL_TRUE,CL_MAP_READ | CL_MAP_WRITE,0,(
size_t) info->length,event_count,
1527 (cl_event *) NULL,(cl_int *) NULL);
1528 assert(pixels == info->pixels);
1529 ReleaseOpenCLCommandQueue(info->device,queue);
1530 events=(cl_event *) RelinquishMagickMemory(events);
1532 return(RelinquishMagickCLCacheInfo(info,MagickFalse));
1554MagickPrivate
void DumpOpenCLProfileData()
1556#define OpenCLLog(message) \
1557 fwrite(message,sizeof(char),strlen(message),log); \
1558 fwrite("\n",sizeof(char),1,log);
1562 filename[MagickPathExtent],
1572 if (default_CLEnv == (MagickCLEnv) NULL)
1575 for (i = 0; i < default_CLEnv->number_devices; i++)
1576 if (default_CLEnv->devices[i]->profile_kernels != MagickFalse)
1578 if (i == default_CLEnv->number_devices)
1581 (void) FormatLocaleString(filename,MagickPathExtent,
"%s%s%s",
1582 GetOpenCLCacheDirectory(),DirectorySeparator,
"ImageMagickOpenCL.log");
1584 log=fopen_utf8(filename,
"wb");
1585 if (log == (FILE *) NULL)
1587 for (i = 0; i < default_CLEnv->number_devices; i++)
1592 device=default_CLEnv->devices[i];
1593 if ((device->profile_kernels == MagickFalse) ||
1594 (device->profile_records == (KernelProfileRecord *) NULL))
1597 OpenCLLog(
"====================================================");
1598 fprintf(log,
"Device: %s\n",device->name);
1599 fprintf(log,
"Version: %s\n",device->version);
1600 OpenCLLog(
"====================================================");
1601 OpenCLLog(
" average calls min max");
1602 OpenCLLog(
" ------- ----- --- ---");
1604 while (device->profile_records[j] != (KernelProfileRecord) NULL)
1609 profile=device->profile_records[j];
1610 (void) CopyMagickString(indent,
" ",
1612 (void) CopyMagickString(indent,profile->kernel_name,MagickMin(strlen(
1613 profile->kernel_name),strlen(indent)));
1614 (void) FormatLocaleString(buf,
sizeof(buf),
"%s %7d %7d %7d %7d",indent,
1615 (
int) (profile->total/profile->count),(
int) profile->count,
1616 (
int) profile->min,(
int) profile->max);
1620 OpenCLLog(
"====================================================");
1621 fwrite(
"\n\n",
sizeof(
char),2,log);
1673static MagickBooleanType RegisterCacheEvent(MagickCLCacheInfo info,
1676 assert(info != (MagickCLCacheInfo) NULL);
1677 assert(event != (cl_event) NULL);
1678 if (openCL_library->clRetainEvent(event) != CL_SUCCESS)
1680 openCL_library->clWaitForEvents(1,&event);
1681 return(MagickFalse);
1683 LockSemaphoreInfo(info->events_semaphore);
1684 if (info->events == (cl_event *) NULL)
1686 info->events=(cl_event *) AcquireMagickMemory(
sizeof(*info->events));
1687 info->event_count=1;
1690 info->events=(cl_event *) ResizeQuantumMemory(info->events,
1691 ++info->event_count,
sizeof(*info->events));
1692 if (info->events == (cl_event *) NULL)
1693 ThrowFatalException(ResourceLimitFatalError,
"MemoryAllocationFailed");
1694 info->events[info->event_count-1]=event;
1695 UnlockSemaphoreInfo(info->events_semaphore);
1699MagickPrivate MagickBooleanType EnqueueOpenCLKernel(cl_command_queue queue,
1700 cl_kernel kernel,cl_uint work_dim,
const size_t *offset,
const size_t *gsize,
1701 const size_t *lsize,
const Image *input_image,
const Image *output_image,
1702 MagickBooleanType flush,ExceptionInfo *exception)
1718 assert(input_image != (
const Image *) NULL);
1719 input_info=(CacheInfo *) input_image->cache;
1720 assert(input_info != (CacheInfo *) NULL);
1721 assert(input_info->opencl != (MagickCLCacheInfo) NULL);
1722 output_info=(CacheInfo *) NULL;
1723 if (output_image == (
const Image *) NULL)
1724 events=CopyOpenCLEvents(input_info->opencl,(MagickCLCacheInfo) NULL,
1728 output_info=(CacheInfo *) output_image->cache;
1729 assert(output_info != (CacheInfo *) NULL);
1730 assert(output_info->opencl != (MagickCLCacheInfo) NULL);
1731 events=CopyOpenCLEvents(input_info->opencl,output_info->opencl,
1734 status=openCL_library->clEnqueueNDRangeKernel(queue,kernel,work_dim,offset,
1735 gsize,lsize,event_count,events,&event);
1737 if ((status != CL_SUCCESS) && (event_count > 0))
1739 openCL_library->clFinish(queue);
1740 status=openCL_library->clEnqueueNDRangeKernel(queue,kernel,work_dim,
1741 offset,gsize,lsize,event_count,events,&event);
1743 events=(cl_event *) RelinquishMagickMemory(events);
1744 if (status != CL_SUCCESS)
1746 (void) OpenCLThrowMagickException(input_info->opencl->device,exception,
1747 GetMagickModule(),ResourceLimitWarning,
1748 "clEnqueueNDRangeKernel failed.",
"'%s'",
".");
1749 return(MagickFalse);
1751 if (flush != MagickFalse)
1752 openCL_library->clFlush(queue);
1753 if (RecordProfileData(input_info->opencl->device,kernel,event) == MagickFalse)
1755 if (RegisterCacheEvent(input_info->opencl,event) != MagickFalse)
1757 if (output_info != (CacheInfo *) NULL)
1758 (void) RegisterCacheEvent(output_info->opencl,event);
1761 openCL_library->clReleaseEvent(event);
1784MagickPrivate MagickCLEnv GetCurrentOpenCLEnv(
void)
1786 if (default_CLEnv != (MagickCLEnv) NULL)
1788 if ((default_CLEnv->benchmark_thread_id != (MagickThreadType) 0) &&
1789 (default_CLEnv->benchmark_thread_id != GetMagickThreadId()))
1790 return((MagickCLEnv) NULL);
1792 return(default_CLEnv);
1795 if (GetOpenCLCacheDirectory() == (
char *) NULL)
1796 return((MagickCLEnv) NULL);
1799 ActivateSemaphoreInfo(&openCL_lock);
1801 LockSemaphoreInfo(openCL_lock);
1802 if (default_CLEnv == (MagickCLEnv) NULL)
1803 default_CLEnv=AcquireMagickCLEnv();
1804 UnlockSemaphoreInfo(openCL_lock);
1806 return(default_CLEnv);
1833MagickExport
double GetOpenCLDeviceBenchmarkScore(
1834 const MagickCLDevice device)
1836 if (device == (MagickCLDevice) NULL)
1837 return(MAGICKCORE_OPENCL_UNDEFINED_SCORE);
1838 return(device->score);
1863MagickExport MagickBooleanType GetOpenCLDeviceEnabled(
1864 const MagickCLDevice device)
1866 if (device == (MagickCLDevice) NULL)
1867 return(MagickFalse);
1868 return(device->enabled);
1893MagickExport
const char *GetOpenCLDeviceName(
const MagickCLDevice device)
1895 if (device == (MagickCLDevice) NULL)
1896 return((
const char *) NULL);
1897 return(device->name);
1922MagickExport
const char *GetOpenCLDeviceVendorName(
const MagickCLDevice device)
1924 if (device == (MagickCLDevice) NULL)
1925 return((
const char *) NULL);
1926 return(device->vendor_name);
1956MagickExport MagickCLDevice *GetOpenCLDevices(
size_t *length,
1957 ExceptionInfo *exception)
1962 clEnv=GetCurrentOpenCLEnv();
1963 if (clEnv == (MagickCLEnv) NULL)
1965 if (length != (
size_t *) NULL)
1967 return((MagickCLDevice *) NULL);
1969 InitializeOpenCL(clEnv,exception);
1970 if (length != (
size_t *) NULL)
1971 *length=clEnv->number_devices;
1972 return(clEnv->devices);
1997MagickExport MagickCLDeviceType GetOpenCLDeviceType(
1998 const MagickCLDevice device)
2000 if (device == (MagickCLDevice) NULL)
2001 return(UndefinedCLDeviceType);
2002 if (device->type == CL_DEVICE_TYPE_GPU)
2003 return(GpuCLDeviceType);
2004 if (device->type == CL_DEVICE_TYPE_CPU)
2005 return(CpuCLDeviceType);
2006 return(UndefinedCLDeviceType);
2031MagickExport
const char *GetOpenCLDeviceVersion(
const MagickCLDevice device)
2033 if (device == (MagickCLDevice) NULL)
2034 return((
const char *) NULL);
2035 return(device->version);
2057MagickExport MagickBooleanType GetOpenCLEnabled(
void)
2062 clEnv=GetCurrentOpenCLEnv();
2063 if (clEnv == (MagickCLEnv) NULL)
2064 return(MagickFalse);
2065 return(clEnv->enabled);
2091MagickExport
const KernelProfileRecord *GetOpenCLKernelProfileRecords(
2092 const MagickCLDevice device,
size_t *length)
2094 if ((device == (
const MagickCLDevice) NULL) || (device->profile_records ==
2095 (KernelProfileRecord *) NULL))
2097 if (length != (
size_t *) NULL)
2099 return((
const KernelProfileRecord *) NULL);
2101 if (length != (
size_t *) NULL)
2104 LockSemaphoreInfo(device->lock);
2105 while (device->profile_records[*length] != (KernelProfileRecord) NULL)
2107 UnlockSemaphoreInfo(device->lock);
2109 return(device->profile_records);
2140static MagickBooleanType HasOpenCLDevices(MagickCLEnv clEnv,
2141 ExceptionInfo *exception)
2144 *accelerateKernelsBuffer,
2145 options[MagickPathExtent];
2157 for (i = 0; i < clEnv->number_devices; i++)
2159 if ((clEnv->devices[i]->enabled != MagickFalse))
2162 if (i == clEnv->number_devices)
2163 return(MagickFalse);
2167 for (i = 0; i < clEnv->number_devices; i++)
2169 if ((clEnv->devices[i]->enabled != MagickFalse) &&
2170 (clEnv->devices[i]->program == (cl_program) NULL))
2176 if (status != MagickFalse)
2180 (void) FormatLocaleString(options,MagickPathExtent,CLOptions,
2181 (
float)QuantumRange,(
float)CLCharQuantumScale,(
float)MagickEpsilon,
2182 (
float)MagickPI,(
unsigned int)MaxMap,(
unsigned int)MAGICKCORE_QUANTUM_DEPTH);
2184 signature=StringSignature(options);
2185 accelerateKernelsBuffer=(
char*) AcquireQuantumMemory(1,
2186 strlen(accelerateKernels)+strlen(accelerateKernels2)+1);
2187 if (accelerateKernelsBuffer == (
char*) NULL)
2188 return(MagickFalse);
2189 (void) FormatLocaleString(accelerateKernelsBuffer,strlen(accelerateKernels)+
2190 strlen(accelerateKernels2)+1,
"%s%s",accelerateKernels,accelerateKernels2);
2191 signature^=StringSignature(accelerateKernelsBuffer);
2194 for (i = 0; i < clEnv->number_devices; i++)
2202 device=clEnv->devices[i];
2203 if ((device->enabled == MagickFalse) ||
2204 (device->program != (cl_program) NULL))
2207 LockSemaphoreInfo(device->lock);
2208 if (device->program != (cl_program) NULL)
2210 UnlockSemaphoreInfo(device->lock);
2213 device_signature=signature;
2214 device_signature^=StringSignature(device->platform_name);
2215 status=CompileOpenCLKernel(device,accelerateKernelsBuffer,options,
2216 device_signature,exception);
2217 UnlockSemaphoreInfo(device->lock);
2218 if (status == MagickFalse)
2221 accelerateKernelsBuffer=(
char *) RelinquishMagickMemory(
2222 accelerateKernelsBuffer);
2250static cl_uint GetOpenCLDeviceCount(MagickCLEnv clEnv,cl_platform_id platform)
2253 version[MagickPathExtent];
2258 if (clEnv->library->clGetPlatformInfo(platform,CL_PLATFORM_VERSION,
2259 MagickPathExtent,version,NULL) != CL_SUCCESS)
2261 if (strncmp(version,
"OpenCL 1.0 ",11) == 0)
2263 if (clEnv->library->clGetDeviceIDs(platform,
2264 CL_DEVICE_TYPE_CPU|CL_DEVICE_TYPE_GPU,0,NULL,&num) != CL_SUCCESS)
2269static inline char *GetOpenCLPlatformString(cl_platform_id platform,
2270 cl_platform_info param_name)
2278 openCL_library->clGetPlatformInfo(platform,param_name,0,NULL,&length);
2279 value=(
char *) AcquireCriticalMemory(length*
sizeof(*value));
2280 openCL_library->clGetPlatformInfo(platform,param_name,length,value,NULL);
2284static inline char *GetOpenCLDeviceString(cl_device_id device,
2285 cl_device_info param_name)
2293 openCL_library->clGetDeviceInfo(device,param_name,0,NULL,&length);
2294 value=(
char *) AcquireCriticalMemory(length*
sizeof(*value));
2295 openCL_library->clGetDeviceInfo(device,param_name,length,value,NULL);
2299static void LoadOpenCLDevices(MagickCLEnv clEnv)
2301 cl_context_properties
2321 if (openCL_library->clGetPlatformIDs(0,NULL,&number_platforms) != CL_SUCCESS)
2323 if (number_platforms == 0)
2325 platforms=(cl_platform_id *) AcquireQuantumMemory(1,number_platforms*
2326 sizeof(cl_platform_id));
2327 if (platforms == (cl_platform_id *) NULL)
2329 if (openCL_library->clGetPlatformIDs(number_platforms,platforms,NULL) != CL_SUCCESS)
2331 platforms=(cl_platform_id *) RelinquishMagickMemory(platforms);
2334 for (i = 0; i < number_platforms; i++)
2336 number_devices=GetOpenCLDeviceCount(clEnv,platforms[i]);
2337 if (number_devices == 0)
2338 platforms[i]=(cl_platform_id) NULL;
2340 clEnv->number_devices+=number_devices;
2342 if (clEnv->number_devices == 0)
2344 platforms=(cl_platform_id *) RelinquishMagickMemory(platforms);
2347 clEnv->devices=(MagickCLDevice *) AcquireQuantumMemory(clEnv->number_devices,
2348 sizeof(MagickCLDevice));
2349 if (clEnv->devices == (MagickCLDevice *) NULL)
2351 RelinquishMagickCLDevices(clEnv);
2352 platforms=(cl_platform_id *) RelinquishMagickMemory(platforms);
2355 (void) memset(clEnv->devices,0,clEnv->number_devices*
sizeof(MagickCLDevice));
2356 devices=(cl_device_id *) AcquireQuantumMemory(clEnv->number_devices,
2357 sizeof(cl_device_id));
2358 if (devices == (cl_device_id *) NULL)
2360 platforms=(cl_platform_id *) RelinquishMagickMemory(platforms);
2361 RelinquishMagickCLDevices(clEnv);
2364 (void) memset(devices,0,clEnv->number_devices*
sizeof(cl_device_id));
2365 clEnv->number_contexts=(size_t) number_platforms;
2366 clEnv->contexts=(cl_context *) AcquireQuantumMemory(clEnv->number_contexts,
2367 sizeof(cl_context));
2368 if (clEnv->contexts == (cl_context *) NULL)
2370 devices=(cl_device_id *) RelinquishMagickMemory(devices);
2371 platforms=(cl_platform_id *) RelinquishMagickMemory(platforms);
2372 RelinquishMagickCLDevices(clEnv);
2375 (void) memset(clEnv->contexts,0,clEnv->number_contexts*
sizeof(cl_context));
2377 for (i = 0; i < number_platforms; i++)
2379 if (platforms[i] == (cl_platform_id) NULL)
2382 status=clEnv->library->clGetDeviceIDs(platforms[i],CL_DEVICE_TYPE_CPU |
2383 CL_DEVICE_TYPE_GPU,(cl_uint) clEnv->number_devices,devices,&number_devices);
2384 if (status != CL_SUCCESS)
2387 properties[0]=CL_CONTEXT_PLATFORM;
2388 properties[1]=(cl_context_properties) platforms[i];
2390 clEnv->contexts[i]=openCL_library->clCreateContext(properties,number_devices,
2391 devices,NULL,NULL,&status);
2392 if (status != CL_SUCCESS)
2395 for (j = 0; j < number_devices; j++,next++)
2400 device=AcquireMagickCLDevice();
2401 if (device == (MagickCLDevice) NULL)
2404 device->context=clEnv->contexts[i];
2405 device->deviceID=devices[j];
2407 device->platform_name=GetOpenCLPlatformString(platforms[i],
2410 device->vendor_name=GetOpenCLPlatformString(platforms[i],
2411 CL_PLATFORM_VENDOR);
2413 device->name=GetOpenCLDeviceString(devices[j],CL_DEVICE_NAME);
2415 device->version=GetOpenCLDeviceString(devices[j],CL_DRIVER_VERSION);
2417 openCL_library->clGetDeviceInfo(devices[j],CL_DEVICE_MAX_CLOCK_FREQUENCY,
2418 sizeof(cl_uint),&device->max_clock_frequency,NULL);
2420 openCL_library->clGetDeviceInfo(devices[j],CL_DEVICE_MAX_COMPUTE_UNITS,
2421 sizeof(cl_uint),&device->max_compute_units,NULL);
2423 openCL_library->clGetDeviceInfo(devices[j],CL_DEVICE_TYPE,
2424 sizeof(cl_device_type),&device->type,NULL);
2426 openCL_library->clGetDeviceInfo(devices[j],CL_DEVICE_LOCAL_MEM_SIZE,
2427 sizeof(cl_ulong),&device->local_memory_size,NULL);
2429 clEnv->devices[next]=device;
2430 (void) LogMagickEvent(AccelerateEvent,GetMagickModule(),
2431 "Found device: %s (%s)",device->name,device->platform_name);
2434 if (next != clEnv->number_devices)
2435 RelinquishMagickCLDevices(clEnv);
2436 platforms=(cl_platform_id *) RelinquishMagickMemory(platforms);
2437 devices=(cl_device_id *) RelinquishMagickMemory(devices);
2440MagickPrivate MagickBooleanType InitializeOpenCL(MagickCLEnv clEnv,
2441 ExceptionInfo *exception)
2443 LockSemaphoreInfo(clEnv->lock);
2444 if (clEnv->initialized != MagickFalse)
2446 UnlockSemaphoreInfo(clEnv->lock);
2447 return(HasOpenCLDevices(clEnv,exception));
2449 if (LoadOpenCLLibrary() != MagickFalse)
2451 clEnv->library=openCL_library;
2452 LoadOpenCLDevices(clEnv);
2453 if (clEnv->number_devices > 0)
2454 AutoSelectOpenCLDevices(clEnv);
2456 clEnv->initialized=MagickTrue;
2457 UnlockSemaphoreInfo(clEnv->lock);
2458 return(HasOpenCLDevices(clEnv,exception));
2480void *OsLibraryGetFunctionAddress(
void *library,
const char *functionName)
2482 if ((library == (
void *) NULL) || (functionName == (
const char *) NULL))
2483 return (
void *) NULL;
2484 return lt_dlsym(library,functionName);
2487static MagickBooleanType BindOpenCLFunctions()
2489#ifdef MAGICKCORE_HAVE_OPENCL_CL_H
2490#define BIND(X) openCL_library->X= &X;
2492 (void) memset(openCL_library,0,
sizeof(MagickLibrary));
2493#ifdef MAGICKCORE_WINDOWS_SUPPORT
2494 openCL_library->library=(
void *)lt_dlopen(
"OpenCL.dll");
2496 openCL_library->library=(
void *)lt_dlopen(
"libOpenCL.so");
2499 if ((openCL_library->X=(MAGICKpfn_##X)OsLibraryGetFunctionAddress(openCL_library->library,#X)) == NULL) \
2500 return(MagickFalse);
2503 if (openCL_library->library == (
void*) NULL)
2504 return(MagickFalse);
2506 BIND(clGetPlatformIDs);
2507 BIND(clGetPlatformInfo);
2509 BIND(clGetDeviceIDs);
2510 BIND(clGetDeviceInfo);
2512 BIND(clCreateBuffer);
2513 BIND(clReleaseMemObject);
2514 BIND(clRetainMemObject);
2516 BIND(clCreateContext);
2517 BIND(clReleaseContext);
2519 BIND(clCreateCommandQueue);
2520 BIND(clReleaseCommandQueue);
2524 BIND(clCreateProgramWithSource);
2525 BIND(clCreateProgramWithBinary);
2526 BIND(clReleaseProgram);
2527 BIND(clBuildProgram);
2528 BIND(clGetProgramBuildInfo);
2529 BIND(clGetProgramInfo);
2531 BIND(clCreateKernel);
2532 BIND(clReleaseKernel);
2533 BIND(clSetKernelArg);
2534 BIND(clGetKernelInfo);
2536 BIND(clEnqueueReadBuffer);
2537 BIND(clEnqueueMapBuffer);
2538 BIND(clEnqueueUnmapMemObject);
2539 BIND(clEnqueueNDRangeKernel);
2541 BIND(clGetEventInfo);
2542 BIND(clWaitForEvents);
2543 BIND(clReleaseEvent);
2544 BIND(clRetainEvent);
2545 BIND(clSetEventCallback);
2547 BIND(clGetEventProfilingInfo);
2552static MagickBooleanType LoadOpenCLLibrary(
void)
2554 openCL_library=(MagickLibrary *) AcquireMagickMemory(
sizeof(MagickLibrary));
2555 if (openCL_library == (MagickLibrary *) NULL)
2556 return(MagickFalse);
2558 if (BindOpenCLFunctions() == MagickFalse)
2560 openCL_library=(MagickLibrary *)RelinquishMagickMemory(openCL_library);
2561 return(MagickFalse);
2586MagickPrivate
void OpenCLTerminus()
2588 DumpOpenCLProfileData();
2589 if (cache_directory != (
char *) NULL)
2590 cache_directory=DestroyString(cache_directory);
2592 RelinquishSemaphoreInfo(&cache_directory_lock);
2593 if (default_CLEnv != (MagickCLEnv) NULL)
2594 default_CLEnv=RelinquishMagickCLEnv(default_CLEnv);
2596 RelinquishSemaphoreInfo(&openCL_lock);
2597 if (openCL_library != (MagickLibrary *) NULL)
2599 if (openCL_library->library != (
void *) NULL)
2600 (void) lt_dlclose(openCL_library->library);
2601 openCL_library=(MagickLibrary *) RelinquishMagickMemory(openCL_library);
2644MagickPrivate MagickBooleanType OpenCLThrowMagickException(
2645 MagickCLDevice device,ExceptionInfo *exception,
const char *module,
2646 const char *function,
const size_t line,
const ExceptionType severity,
2647 const char *tag,
const char *format,...)
2652 assert(device != (MagickCLDevice) NULL);
2653 assert(exception != (ExceptionInfo *) NULL);
2654 assert(exception->signature == MagickCoreSignature);
2659 if (device->type == CL_DEVICE_TYPE_CPU)
2663 if (strncmp(device->platform_name,
"Intel",5) == 0)
2664 default_CLEnv->enabled=MagickFalse;
2668#ifdef OPENCLLOG_ENABLED
2672 va_start(operands,format);
2673 status=ThrowMagickExceptionList(exception,module,function,line,severity,tag,
2678 magick_unreferenced(module);
2679 magick_unreferenced(function);
2680 magick_unreferenced(line);
2681 magick_unreferenced(tag);
2682 magick_unreferenced(format);
2714MagickPrivate MagickBooleanType RecordProfileData(MagickCLDevice device,
2715 cl_kernel kernel,cl_event event)
2735 if (device->profile_kernels == MagickFalse)
2736 return(MagickFalse);
2737 status=openCL_library->clWaitForEvents(1,&event);
2738 if (status != CL_SUCCESS)
2739 return(MagickFalse);
2740 status=openCL_library->clGetKernelInfo(kernel,CL_KERNEL_FUNCTION_NAME,0,NULL,
2742 if (status != CL_SUCCESS)
2744 name=(
char *) AcquireQuantumMemory(length,
sizeof(*name));
2745 if (name == (
char *) NULL)
2747 start=end=elapsed=0;
2748 status=openCL_library->clGetKernelInfo(kernel,CL_KERNEL_FUNCTION_NAME,length,
2749 name,(
size_t *) NULL);
2750 status|=openCL_library->clGetEventProfilingInfo(event,
2751 CL_PROFILING_COMMAND_START,
sizeof(cl_ulong),&start,NULL);
2752 status|=openCL_library->clGetEventProfilingInfo(event,
2753 CL_PROFILING_COMMAND_END,
sizeof(cl_ulong),&end,NULL);
2754 if (status != CL_SUCCESS)
2756 name=DestroyString(name);
2762 LockSemaphoreInfo(device->lock);
2764 profile_record=(KernelProfileRecord) NULL;
2765 if (device->profile_records != (KernelProfileRecord *) NULL)
2767 while (device->profile_records[i] != (KernelProfileRecord) NULL)
2769 if (LocaleCompare(device->profile_records[i]->kernel_name,name) == 0)
2771 profile_record=device->profile_records[i];
2777 if (profile_record != (KernelProfileRecord) NULL)
2778 name=DestroyString(name);
2781 profile_record=(KernelProfileRecord) AcquireCriticalMemory(
2782 sizeof(*profile_record));
2783 (void) memset(profile_record,0,
sizeof(*profile_record));
2784 profile_record->kernel_name=name;
2785 device->profile_records=(KernelProfileRecord *) ResizeQuantumMemory(
2786 device->profile_records,(i+2),
sizeof(*device->profile_records));
2787 if (device->profile_records == (KernelProfileRecord *) NULL)
2788 ThrowFatalException(ResourceLimitFatalError,
"MemoryAllocationFailed");
2789 device->profile_records[i]=profile_record;
2790 device->profile_records[i+1]=(KernelProfileRecord) NULL;
2792 if ((elapsed < profile_record->min) || (profile_record->count == 0))
2793 profile_record->min=(
unsigned long) elapsed;
2794 if (elapsed > profile_record->max)
2795 profile_record->max=(
unsigned long) elapsed;
2796 profile_record->total+=(
unsigned long) elapsed;
2797 profile_record->count+=1;
2798 UnlockSemaphoreInfo(device->lock);
2827MagickPrivate
void ReleaseOpenCLCommandQueue(MagickCLDevice device,
2828 cl_command_queue queue)
2830 if (queue == (cl_command_queue) NULL)
2833 assert(device != (MagickCLDevice) NULL);
2834 LockSemaphoreInfo(device->lock);
2835 if ((device->profile_kernels != MagickFalse) ||
2836 (device->command_queues_index >= MAGICKCORE_OPENCL_COMMAND_QUEUES-1))
2838 UnlockSemaphoreInfo(device->lock);
2839 openCL_library->clFinish(queue);
2840 (void) openCL_library->clReleaseCommandQueue(queue);
2844 openCL_library->clFlush(queue);
2845 device->command_queues[++device->command_queues_index]=queue;
2846 UnlockSemaphoreInfo(device->lock);
2873MagickPrivate
void ReleaseOpenCLDevice(MagickCLDevice device)
2875 assert(device != (MagickCLDevice) NULL);
2876 LockSemaphoreInfo(openCL_lock);
2877 device->requested--;
2878 UnlockSemaphoreInfo(openCL_lock);
2908static void CL_API_CALL DestroyMagickCLCacheInfoAndPixels(
2909 cl_event magick_unused(event),
2910 cl_int magick_unused(event_command_exec_status),
void *user_data)
2921 magick_unreferenced(event);
2922 magick_unreferenced(event_command_exec_status);
2923 info=(MagickCLCacheInfo) user_data;
2924 for (i=(ssize_t)info->event_count-1; i >= 0; i--)
2932 status=openCL_library->clGetEventInfo(info->events[i],
2933 CL_EVENT_COMMAND_EXECUTION_STATUS,
sizeof(event_status),&event_status,
2935 if ((status == CL_SUCCESS) && (event_status > CL_COMPLETE))
2937 openCL_library->clSetEventCallback(info->events[i],CL_COMPLETE,
2938 &DestroyMagickCLCacheInfoAndPixels,info);
2942 pixels=info->pixels;
2943 RelinquishMagickResource(MemoryResource,info->length);
2944 DestroyMagickCLCacheInfo(info);
2945 (void) RelinquishAlignedMemory(pixels);
2948MagickPrivate MagickCLCacheInfo RelinquishMagickCLCacheInfo(
2949 MagickCLCacheInfo info,
const MagickBooleanType relinquish_pixels)
2951 if (info == (MagickCLCacheInfo) NULL)
2952 return((MagickCLCacheInfo) NULL);
2953 if (relinquish_pixels != MagickFalse)
2954 DestroyMagickCLCacheInfoAndPixels((cl_event) NULL,0,info);
2956 DestroyMagickCLCacheInfo(info);
2957 return((MagickCLCacheInfo) NULL);
2983static MagickCLDevice RelinquishMagickCLDevice(MagickCLDevice device)
2985 if (device == (MagickCLDevice) NULL)
2986 return((MagickCLDevice) NULL);
2988 device->platform_name=(
char *) RelinquishMagickMemory(device->platform_name);
2989 device->vendor_name=(
char *) RelinquishMagickMemory(device->vendor_name);
2990 device->name=(
char *) RelinquishMagickMemory(device->name);
2991 device->version=(
char *) RelinquishMagickMemory(device->version);
2992 if (device->program != (cl_program) NULL)
2993 (void) openCL_library->clReleaseProgram(device->program);
2994 while (device->command_queues_index >= 0)
2995 (void) openCL_library->clReleaseCommandQueue(
2996 device->command_queues[device->command_queues_index--]);
2997 RelinquishSemaphoreInfo(&device->lock);
2998 return((MagickCLDevice) RelinquishMagickMemory(device));
3024static MagickCLEnv RelinquishMagickCLEnv(MagickCLEnv clEnv)
3026 if (clEnv == (MagickCLEnv) NULL)
3027 return((MagickCLEnv) NULL);
3029 RelinquishSemaphoreInfo(&clEnv->lock);
3030 RelinquishMagickCLDevices(clEnv);
3031 if (clEnv->contexts != (cl_context *) NULL)
3036 for (i=0; i < (ssize_t) clEnv->number_contexts; i++)
3037 if (clEnv->contexts[i] != (cl_context) NULL)
3038 (void) openCL_library->clReleaseContext(clEnv->contexts[i]);
3039 clEnv->contexts=(cl_context *) RelinquishMagickMemory(clEnv->contexts);
3041 return((MagickCLEnv) RelinquishMagickMemory(clEnv));
3066MagickPrivate MagickCLDevice RequestOpenCLDevice(MagickCLEnv clEnv)
3078 if (clEnv == (MagickCLEnv) NULL)
3079 return((MagickCLDevice) NULL);
3081 if (clEnv->number_devices == 1)
3083 if (clEnv->devices[0]->enabled)
3084 return(clEnv->devices[0]);
3086 return((MagickCLDevice) NULL);
3089 device=(MagickCLDevice) NULL;
3091 LockSemaphoreInfo(openCL_lock);
3092 for (i = 0; i < clEnv->number_devices; i++)
3094 if (clEnv->devices[i]->enabled == MagickFalse)
3097 score=clEnv->devices[i]->score+(clEnv->devices[i]->score*
3098 clEnv->devices[i]->requested);
3099 if ((device == (MagickCLDevice) NULL) || (score < best_score))
3101 device=clEnv->devices[i];
3105 if (device != (MagickCLDevice)NULL)
3106 device->requested++;
3107 UnlockSemaphoreInfo(openCL_lock);
3137MagickExport
void SetOpenCLDeviceEnabled(MagickCLDevice device,
3138 const MagickBooleanType value)
3140 if (device == (MagickCLDevice) NULL)
3142 device->enabled=value;
3172MagickExport
void SetOpenCLKernelProfileEnabled(MagickCLDevice device,
3173 const MagickBooleanType value)
3175 if (device == (MagickCLDevice) NULL)
3177 device->profile_kernels=value;
3202MagickExport MagickBooleanType SetOpenCLEnabled(
const MagickBooleanType value)
3207 clEnv=GetCurrentOpenCLEnv();
3208 if (clEnv == (MagickCLEnv) NULL)
3209 return(MagickFalse);
3210 clEnv->enabled=value;
3211 return(clEnv->enabled);
3216MagickExport
double GetOpenCLDeviceBenchmarkScore(
3217 const MagickCLDevice magick_unused(device))
3219 magick_unreferenced(device);
3223MagickExport MagickBooleanType GetOpenCLDeviceEnabled(
3224 const MagickCLDevice magick_unused(device))
3226 magick_unreferenced(device);
3227 return(MagickFalse);
3230MagickExport
const char *GetOpenCLDeviceName(
3231 const MagickCLDevice magick_unused(device))
3233 magick_unreferenced(device);
3234 return((
const char *) NULL);
3237MagickExport MagickCLDevice *GetOpenCLDevices(
size_t *length,
3238 ExceptionInfo *magick_unused(exception))
3240 magick_unreferenced(exception);
3241 if (length != (
size_t *) NULL)
3243 return((MagickCLDevice *) NULL);
3246MagickExport MagickCLDeviceType GetOpenCLDeviceType(
3247 const MagickCLDevice magick_unused(device))
3249 magick_unreferenced(device);
3250 return(UndefinedCLDeviceType);
3253MagickExport
const KernelProfileRecord *GetOpenCLKernelProfileRecords(
3254 const MagickCLDevice magick_unused(device),
size_t *length)
3256 magick_unreferenced(device);
3257 if (length != (
size_t *) NULL)
3259 return((
const KernelProfileRecord *) NULL);
3262MagickExport
const char *GetOpenCLDeviceVersion(
3263 const MagickCLDevice magick_unused(device))
3265 magick_unreferenced(device);
3266 return((
const char *) NULL);
3269MagickExport MagickBooleanType GetOpenCLEnabled(
void)
3271 return(MagickFalse);
3274MagickExport
void SetOpenCLDeviceEnabled(
3275 MagickCLDevice magick_unused(device),
3276 const MagickBooleanType magick_unused(value))
3278 magick_unreferenced(device);
3279 magick_unreferenced(value);
3282MagickExport MagickBooleanType SetOpenCLEnabled(
3283 const MagickBooleanType magick_unused(value))
3285 magick_unreferenced(value);
3286 return(MagickFalse);
3289MagickExport
void SetOpenCLKernelProfileEnabled(
3290 MagickCLDevice magick_unused(device),
3291 const MagickBooleanType magick_unused(value))
3293 magick_unreferenced(device);
3294 magick_unreferenced(value);