program.hpp 20 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650
  1. //---------------------------------------------------------------------------//
  2. // Copyright (c) 2013 Kyle Lutz <kyle.r.lutz@gmail.com>
  3. //
  4. // Distributed under the Boost Software License, Version 1.0
  5. // See accompanying file LICENSE_1_0.txt or copy at
  6. // http://www.boost.org/LICENSE_1_0.txt
  7. //
  8. // See http://boostorg.github.com/compute for more information.
  9. //---------------------------------------------------------------------------//
  10. #ifndef BOOST_COMPUTE_PROGRAM_HPP
  11. #define BOOST_COMPUTE_PROGRAM_HPP
  12. #include <string>
  13. #include <vector>
  14. #include <fstream>
  15. #include <streambuf>
  16. #ifdef BOOST_COMPUTE_DEBUG_KERNEL_COMPILATION
  17. #include <iostream>
  18. #endif
  19. #include <boost/compute/config.hpp>
  20. #include <boost/compute/context.hpp>
  21. #include <boost/compute/exception.hpp>
  22. #include <boost/compute/detail/assert_cl_success.hpp>
  23. #ifdef BOOST_COMPUTE_USE_OFFLINE_CACHE
  24. #include <sstream>
  25. #include <boost/optional.hpp>
  26. #include <boost/compute/platform.hpp>
  27. #include <boost/compute/detail/getenv.hpp>
  28. #include <boost/compute/detail/path.hpp>
  29. #include <boost/compute/detail/sha1.hpp>
  30. #endif
  31. namespace boost {
  32. namespace compute {
  33. class kernel;
  34. /// \class program
  35. /// \brief A compute program.
  36. ///
  37. /// The program class represents an OpenCL program.
  38. ///
  39. /// Program objects are created with one of the static \c create_with_*
  40. /// functions. For example, to create a program from a source string:
  41. ///
  42. /// \snippet test/test_program.cpp create_with_source
  43. ///
  44. /// And to create a program from a source file:
  45. /// \code
  46. /// boost::compute::program bar_program =
  47. /// boost::compute::program::create_with_source_file("/path/to/bar.cl", context);
  48. /// \endcode
  49. ///
  50. /// Once a program object has been succesfully created, it can be compiled
  51. /// using the \c build() method:
  52. /// \code
  53. /// // build the program
  54. /// foo_program.build();
  55. /// \endcode
  56. ///
  57. /// Once the program is built, \ref kernel objects can be created using the
  58. /// \c create_kernel() method by passing their name:
  59. /// \code
  60. /// // create a kernel from the compiled program
  61. /// boost::compute::kernel foo_kernel = foo_program.create_kernel("foo");
  62. /// \endcode
  63. ///
  64. /// \see kernel
  65. class program
  66. {
  67. public:
  68. /// Creates a null program object.
  69. program()
  70. : m_program(0)
  71. {
  72. }
  73. /// Creates a program object for \p program. If \p retain is \c true,
  74. /// the reference count for \p program will be incremented.
  75. explicit program(cl_program program, bool retain = true)
  76. : m_program(program)
  77. {
  78. if(m_program && retain){
  79. clRetainProgram(m_program);
  80. }
  81. }
  82. /// Creates a new program object as a copy of \p other.
  83. program(const program &other)
  84. : m_program(other.m_program)
  85. {
  86. if(m_program){
  87. clRetainProgram(m_program);
  88. }
  89. }
  90. /// Copies the program object from \p other to \c *this.
  91. program& operator=(const program &other)
  92. {
  93. if(this != &other){
  94. if(m_program){
  95. clReleaseProgram(m_program);
  96. }
  97. m_program = other.m_program;
  98. if(m_program){
  99. clRetainProgram(m_program);
  100. }
  101. }
  102. return *this;
  103. }
  104. #ifndef BOOST_COMPUTE_NO_RVALUE_REFERENCES
  105. /// Move-constructs a new program object from \p other.
  106. program(program&& other) BOOST_NOEXCEPT
  107. : m_program(other.m_program)
  108. {
  109. other.m_program = 0;
  110. }
  111. /// Move-assigns the program from \p other to \c *this.
  112. program& operator=(program&& other) BOOST_NOEXCEPT
  113. {
  114. if(m_program){
  115. clReleaseProgram(m_program);
  116. }
  117. m_program = other.m_program;
  118. other.m_program = 0;
  119. return *this;
  120. }
  121. #endif // BOOST_COMPUTE_NO_RVALUE_REFERENCES
  122. /// Destroys the program object.
  123. ~program()
  124. {
  125. if(m_program){
  126. BOOST_COMPUTE_ASSERT_CL_SUCCESS(
  127. clReleaseProgram(m_program)
  128. );
  129. }
  130. }
  131. /// Returns the underlying OpenCL program.
  132. cl_program& get() const
  133. {
  134. return const_cast<cl_program &>(m_program);
  135. }
  136. /// Returns the source code for the program.
  137. std::string source() const
  138. {
  139. return get_info<std::string>(CL_PROGRAM_SOURCE);
  140. }
  141. /// Returns the binary for the program.
  142. std::vector<unsigned char> binary() const
  143. {
  144. size_t binary_size = get_info<size_t>(CL_PROGRAM_BINARY_SIZES);
  145. std::vector<unsigned char> binary(binary_size);
  146. unsigned char *binary_ptr = &binary[0];
  147. cl_int error = clGetProgramInfo(m_program,
  148. CL_PROGRAM_BINARIES,
  149. sizeof(unsigned char **),
  150. &binary_ptr,
  151. 0);
  152. if(error != CL_SUCCESS){
  153. BOOST_THROW_EXCEPTION(opencl_error(error));
  154. }
  155. return binary;
  156. }
  157. std::vector<device> get_devices() const
  158. {
  159. std::vector<cl_device_id> device_ids =
  160. get_info<std::vector<cl_device_id> >(CL_PROGRAM_DEVICES);
  161. std::vector<device> devices;
  162. for(size_t i = 0; i < device_ids.size(); i++){
  163. devices.push_back(device(device_ids[i]));
  164. }
  165. return devices;
  166. }
  167. /// Returns the context for the program.
  168. context get_context() const
  169. {
  170. return context(get_info<cl_context>(CL_PROGRAM_CONTEXT));
  171. }
  172. /// Returns information about the program.
  173. ///
  174. /// \see_opencl_ref{clGetProgramInfo}
  175. template<class T>
  176. T get_info(cl_program_info info) const
  177. {
  178. return detail::get_object_info<T>(clGetProgramInfo, m_program, info);
  179. }
  180. /// \overload
  181. template<int Enum>
  182. typename detail::get_object_info_type<program, Enum>::type
  183. get_info() const;
  184. /// Returns build information about the program.
  185. ///
  186. /// For example, this function can be used to retreive the options used
  187. /// to build the program:
  188. /// \code
  189. /// std::string build_options =
  190. /// program.get_build_info<std::string>(CL_PROGRAM_BUILD_OPTIONS);
  191. /// \endcode
  192. ///
  193. /// \see_opencl_ref{clGetProgramInfo}
  194. template<class T>
  195. T get_build_info(cl_program_build_info info, const device &device) const
  196. {
  197. return detail::get_object_info<T>(clGetProgramBuildInfo, m_program, info, device.id());
  198. }
  199. /// Builds the program with \p options.
  200. ///
  201. /// If the program fails to compile, this function will throw an
  202. /// opencl_error exception.
  203. /// \code
  204. /// try {
  205. /// // attempt to compile to program
  206. /// program.build();
  207. /// }
  208. /// catch(boost::compute::opencl_error &e){
  209. /// // program failed to compile, print out the build log
  210. /// std::cout << program.build_log() << std::endl;
  211. /// }
  212. /// \endcode
  213. ///
  214. /// \see_opencl_ref{clBuildProgram}
  215. void build(const std::string &options = std::string())
  216. {
  217. const char *options_string = 0;
  218. if(!options.empty()){
  219. options_string = options.c_str();
  220. }
  221. cl_int ret = clBuildProgram(m_program, 0, 0, options_string, 0, 0);
  222. #ifdef BOOST_COMPUTE_DEBUG_KERNEL_COMPILATION
  223. if(ret != CL_SUCCESS){
  224. // print the error, source code and build log
  225. std::cerr << "Boost.Compute: "
  226. << "kernel compilation failed (" << ret << ")\n"
  227. << "--- source ---\n"
  228. << source()
  229. << "\n--- build log ---\n"
  230. << build_log()
  231. << std::endl;
  232. }
  233. #endif
  234. if(ret != CL_SUCCESS){
  235. BOOST_THROW_EXCEPTION(opencl_error(ret));
  236. }
  237. }
  238. #if defined(CL_VERSION_1_2) || defined(BOOST_COMPUTE_DOXYGEN_INVOKED)
  239. /// Compiles the program with \p options.
  240. ///
  241. /// \opencl_version_warning{1,2}
  242. ///
  243. /// \see_opencl_ref{clCompileProgram}
  244. void compile(const std::string &options = std::string())
  245. {
  246. const char *options_string = 0;
  247. if(!options.empty()){
  248. options_string = options.c_str();
  249. }
  250. cl_int ret = clCompileProgram(
  251. m_program, 0, 0, options_string, 0, 0, 0, 0, 0
  252. );
  253. if(ret != CL_SUCCESS){
  254. BOOST_THROW_EXCEPTION(opencl_error(ret));
  255. }
  256. }
  257. /// Links the programs in \p programs with \p options in \p context.
  258. ///
  259. /// \opencl_version_warning{1,2}
  260. ///
  261. /// \see_opencl_ref{clLinkProgram}
  262. static program link(const std::vector<program> &programs,
  263. const context &context,
  264. const std::string &options = std::string())
  265. {
  266. const char *options_string = 0;
  267. if(!options.empty()){
  268. options_string = options.c_str();
  269. }
  270. cl_int ret;
  271. cl_program program_ = clLinkProgram(
  272. context.get(),
  273. 0,
  274. 0,
  275. options_string,
  276. static_cast<uint_>(programs.size()),
  277. reinterpret_cast<const cl_program*>(&programs[0]),
  278. 0,
  279. 0,
  280. &ret
  281. );
  282. if(!program_){
  283. BOOST_THROW_EXCEPTION(opencl_error(ret));
  284. }
  285. return program(program_, false);
  286. }
  287. #endif // CL_VERSION_1_2
  288. /// Returns the build log.
  289. std::string build_log() const
  290. {
  291. return get_build_info<std::string>(CL_PROGRAM_BUILD_LOG, get_devices().front());
  292. }
  293. /// Creates and returns a new kernel object for \p name.
  294. ///
  295. /// For example, to create the \c "foo" kernel (after the program has been
  296. /// created and built):
  297. /// \code
  298. /// boost::compute::kernel foo_kernel = foo_program.create_kernel("foo");
  299. /// \endcode
  300. kernel create_kernel(const std::string &name) const;
  301. /// Returns \c true if the program is the same at \p other.
  302. bool operator==(const program &other) const
  303. {
  304. return m_program == other.m_program;
  305. }
  306. /// Returns \c true if the program is different from \p other.
  307. bool operator!=(const program &other) const
  308. {
  309. return m_program != other.m_program;
  310. }
  311. /// \internal_
  312. operator cl_program() const
  313. {
  314. return m_program;
  315. }
  316. /// Creates a new program with \p source in \p context.
  317. ///
  318. /// \see_opencl_ref{clCreateProgramWithSource}
  319. static program create_with_source(const std::string &source,
  320. const context &context)
  321. {
  322. const char *source_string = source.c_str();
  323. cl_int error = 0;
  324. cl_program program_ = clCreateProgramWithSource(context,
  325. uint_(1),
  326. &source_string,
  327. 0,
  328. &error);
  329. if(!program_){
  330. BOOST_THROW_EXCEPTION(opencl_error(error));
  331. }
  332. return program(program_, false);
  333. }
  334. /// Creates a new program with \p sources in \p context.
  335. ///
  336. /// \see_opencl_ref{clCreateProgramWithSource}
  337. static program create_with_source(const std::vector<std::string> &sources,
  338. const context &context)
  339. {
  340. std::vector<const char*> source_strings(sources.size());
  341. for(size_t i = 0; i < sources.size(); i++){
  342. source_strings[i] = sources[i].c_str();
  343. }
  344. cl_int error = 0;
  345. cl_program program_ = clCreateProgramWithSource(context,
  346. uint_(sources.size()),
  347. &source_strings[0],
  348. 0,
  349. &error);
  350. if(!program_){
  351. BOOST_THROW_EXCEPTION(opencl_error(error));
  352. }
  353. return program(program_, false);
  354. }
  355. /// Creates a new program with \p file in \p context.
  356. ///
  357. /// \see_opencl_ref{clCreateProgramWithSource}
  358. static program create_with_source_file(const std::string &file,
  359. const context &context)
  360. {
  361. // open file stream
  362. std::ifstream stream(file.c_str());
  363. if(stream.fail()){
  364. BOOST_THROW_EXCEPTION(std::ios_base::failure("failed to create stream."));
  365. }
  366. // read source
  367. std::string source(
  368. (std::istreambuf_iterator<char>(stream)),
  369. std::istreambuf_iterator<char>()
  370. );
  371. // create program
  372. return create_with_source(source, context);
  373. }
  374. /// Creates a new program with \p binary of \p binary_size in
  375. /// \p context.
  376. ///
  377. /// \see_opencl_ref{clCreateProgramWithBinary}
  378. static program create_with_binary(const unsigned char *binary,
  379. size_t binary_size,
  380. const context &context)
  381. {
  382. const cl_device_id device = context.get_device().id();
  383. cl_int error = 0;
  384. cl_int binary_status = 0;
  385. cl_program program_ = clCreateProgramWithBinary(context,
  386. uint_(1),
  387. &device,
  388. &binary_size,
  389. &binary,
  390. &binary_status,
  391. &error);
  392. if(!program_){
  393. BOOST_THROW_EXCEPTION(opencl_error(error));
  394. }
  395. if(binary_status != CL_SUCCESS){
  396. BOOST_THROW_EXCEPTION(opencl_error(binary_status));
  397. }
  398. return program(program_, false);
  399. }
  400. /// Creates a new program with \p binary in \p context.
  401. ///
  402. /// \see_opencl_ref{clCreateProgramWithBinary}
  403. static program create_with_binary(const std::vector<unsigned char> &binary,
  404. const context &context)
  405. {
  406. return create_with_binary(&binary[0], binary.size(), context);
  407. }
  408. /// Creates a new program with \p file in \p context.
  409. ///
  410. /// \see_opencl_ref{clCreateProgramWithBinary}
  411. static program create_with_binary_file(const std::string &file,
  412. const context &context)
  413. {
  414. // open file stream
  415. std::ifstream stream(file.c_str(), std::ios::in | std::ios::binary);
  416. // read binary
  417. std::vector<unsigned char> binary(
  418. (std::istreambuf_iterator<char>(stream)),
  419. std::istreambuf_iterator<char>()
  420. );
  421. // create program
  422. return create_with_binary(&binary[0], binary.size(), context);
  423. }
  424. #if defined(CL_VERSION_1_2) || defined(BOOST_COMPUTE_DOXYGEN_INVOKED)
  425. /// Creates a new program with the built-in kernels listed in
  426. /// \p kernel_names for \p devices in \p context.
  427. ///
  428. /// \opencl_version_warning{1,2}
  429. ///
  430. /// \see_opencl_ref{clCreateProgramWithBuiltInKernels}
  431. static program create_with_builtin_kernels(const context &context,
  432. const std::vector<device> &devices,
  433. const std::string &kernel_names)
  434. {
  435. cl_int error = 0;
  436. cl_program program_ = clCreateProgramWithBuiltInKernels(
  437. context.get(),
  438. static_cast<uint_>(devices.size()),
  439. reinterpret_cast<const cl_device_id *>(&devices[0]),
  440. kernel_names.c_str(),
  441. &error
  442. );
  443. if(!program_){
  444. BOOST_THROW_EXCEPTION(opencl_error(error));
  445. }
  446. return program(program_, false);
  447. }
  448. #endif // CL_VERSION_1_2
  449. /// Create a new program with \p source in \p context and builds it with \p options.
  450. /**
  451. * In case BOOST_COMPUTE_USE_OFFLINE_CACHE macro is defined,
  452. * the compiled binary is stored for reuse in the offline cache located in
  453. * $HOME/.boost_compute on UNIX-like systems and in %APPDATA%/boost_compute
  454. * on Windows.
  455. */
  456. static program build_with_source(
  457. const std::string &source,
  458. const context &context,
  459. const std::string &options = std::string()
  460. )
  461. {
  462. #ifdef BOOST_COMPUTE_USE_OFFLINE_CACHE
  463. // Get hash string for the kernel.
  464. device d = context.get_device();
  465. platform p = d.platform();
  466. detail::sha1 hash;
  467. hash.process( p.name() )
  468. .process( p.version() )
  469. .process( d.name() )
  470. .process( options )
  471. .process( source )
  472. ;
  473. // Try to get cached program binaries:
  474. try {
  475. boost::optional<program> prog = load_program_binary(hash, context);
  476. if (prog) {
  477. prog->build(options);
  478. return *prog;
  479. }
  480. } catch (...) {
  481. // Something bad happened. Fallback to normal compilation.
  482. }
  483. // Cache is apparently not available. Just compile the sources.
  484. #endif
  485. const char *source_string = source.c_str();
  486. cl_int error = 0;
  487. cl_program program_ = clCreateProgramWithSource(context,
  488. uint_(1),
  489. &source_string,
  490. 0,
  491. &error);
  492. if(!program_){
  493. BOOST_THROW_EXCEPTION(opencl_error(error));
  494. }
  495. program prog(program_, false);
  496. prog.build(options);
  497. #ifdef BOOST_COMPUTE_USE_OFFLINE_CACHE
  498. // Save program binaries for future reuse.
  499. save_program_binary(hash, prog);
  500. #endif
  501. return prog;
  502. }
  503. private:
  504. #ifdef BOOST_COMPUTE_USE_OFFLINE_CACHE
  505. // Saves program binaries for future reuse.
  506. static void save_program_binary(const std::string &hash, const program &prog)
  507. {
  508. std::string fname = detail::program_binary_path(hash, true) + "kernel";
  509. std::ofstream bfile(fname.c_str(), std::ios::binary);
  510. if (!bfile) return;
  511. std::vector<unsigned char> binary = prog.binary();
  512. size_t binary_size = binary.size();
  513. bfile.write((char*)&binary_size, sizeof(size_t));
  514. bfile.write((char*)binary.data(), binary_size);
  515. }
  516. // Tries to read program binaries from file cache.
  517. static boost::optional<program> load_program_binary(
  518. const std::string &hash, const context &ctx
  519. )
  520. {
  521. std::string fname = detail::program_binary_path(hash) + "kernel";
  522. std::ifstream bfile(fname.c_str(), std::ios::binary);
  523. if (!bfile) return boost::optional<program>();
  524. size_t binary_size;
  525. std::vector<unsigned char> binary;
  526. bfile.read((char*)&binary_size, sizeof(size_t));
  527. binary.resize(binary_size);
  528. bfile.read((char*)binary.data(), binary_size);
  529. return boost::optional<program>(
  530. program::create_with_binary(
  531. binary.data(), binary_size, ctx
  532. )
  533. );
  534. }
  535. #endif // BOOST_COMPUTE_USE_OFFLINE_CACHE
  536. private:
  537. cl_program m_program;
  538. };
  539. /// \internal_ define get_info() specializations for program
  540. BOOST_COMPUTE_DETAIL_DEFINE_GET_INFO_SPECIALIZATIONS(program,
  541. ((cl_uint, CL_PROGRAM_REFERENCE_COUNT))
  542. ((cl_context, CL_PROGRAM_CONTEXT))
  543. ((cl_uint, CL_PROGRAM_NUM_DEVICES))
  544. ((std::vector<cl_device_id>, CL_PROGRAM_DEVICES))
  545. ((std::string, CL_PROGRAM_SOURCE))
  546. ((std::vector<size_t>, CL_PROGRAM_BINARY_SIZES))
  547. ((std::vector<unsigned char *>, CL_PROGRAM_BINARIES))
  548. )
  549. #ifdef CL_VERSION_1_2
  550. BOOST_COMPUTE_DETAIL_DEFINE_GET_INFO_SPECIALIZATIONS(program,
  551. ((size_t, CL_PROGRAM_NUM_KERNELS))
  552. ((std::string, CL_PROGRAM_KERNEL_NAMES))
  553. )
  554. #endif // CL_VERSION_1_2
  555. } // end compute namespace
  556. } // end boost namespace
  557. #endif // BOOST_COMPUTE_PROGRAM_HPP