offload_target_main.cpp 10 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368
  1. /* Plugin for offload execution on Intel MIC devices.
  2. Copyright (C) 2014 Free Software Foundation, Inc.
  3. Contributed by Ilya Verbin <ilya.verbin@intel.com>.
  4. This file is part of the GNU Offloading and Multi Processing Library
  5. (libgomp).
  6. Libgomp is free software; you can redistribute it and/or modify it
  7. under the terms of the GNU General Public License as published by
  8. the Free Software Foundation; either version 3, or (at your option)
  9. any later version.
  10. Libgomp is distributed in the hope that it will be useful, but WITHOUT ANY
  11. WARRANTY; without even the implied warranty of MERCHANTABILITY or FITNESS
  12. FOR A PARTICULAR PURPOSE. See the GNU General Public License for
  13. more details.
  14. Under Section 7 of GPL version 3, you are granted additional
  15. permissions described in the GCC Runtime Library Exception, version
  16. 3.1, as published by the Free Software Foundation.
  17. You should have received a copy of the GNU General Public License and
  18. a copy of the GCC Runtime Library Exception along with this program;
  19. see the files COPYING3 and COPYING.RUNTIME respectively. If not, see
  20. <http://www.gnu.org/licenses/>. */
  21. /* Target side part of a libgomp plugin. */
  22. #include <stdint.h>
  23. #include <stdio.h>
  24. #include <stdlib.h>
  25. #include "compiler_if_target.h"
  26. #ifdef DEBUG
  27. #define TRACE(...) \
  28. { \
  29. fprintf (stderr, "TARGET:\t%s:%s ", __FILE__, __FUNCTION__); \
  30. fprintf (stderr, __VA_ARGS__); \
  31. fprintf (stderr, "\n"); \
  32. }
  33. #else
  34. #define TRACE { }
  35. #endif
  36. static VarDesc vd_host2tgt = {
  37. { 1, 1 }, /* dst, src */
  38. { 1, 0 }, /* in, out */
  39. 1, /* alloc_if */
  40. 1, /* free_if */
  41. 4, /* align */
  42. 0, /* mic_offset */
  43. { 0, 0, 0, 0, 0, 0, 0, 0 }, /* is_static, is_static_dstn, has_length,
  44. is_stack_buf, sink_addr, alloc_disp,
  45. is_noncont_src, is_noncont_dst */
  46. 0, /* offset */
  47. 0, /* size */
  48. 1, /* count */
  49. 0, /* alloc */
  50. 0, /* into */
  51. 0 /* ptr */
  52. };
  53. static VarDesc vd_tgt2host = {
  54. { 1, 1 }, /* dst, src */
  55. { 0, 1 }, /* in, out */
  56. 1, /* alloc_if */
  57. 1, /* free_if */
  58. 4, /* align */
  59. 0, /* mic_offset */
  60. { 0, 0, 0, 0, 0, 0, 0, 0 }, /* is_static, is_static_dstn, has_length,
  61. is_stack_buf, sink_addr, alloc_disp,
  62. is_noncont_src, is_noncont_dst */
  63. 0, /* offset */
  64. 0, /* size */
  65. 1, /* count */
  66. 0, /* alloc */
  67. 0, /* into */
  68. 0 /* ptr */
  69. };
  70. /* Pointer to the descriptor of the last loaded shared library. */
  71. static void *last_loaded_library = NULL;
  72. /* Pointer and size of the variable, used in __offload_target_host2tgt_p[12]
  73. and __offload_target_tgt2host_p[12]. */
  74. static void *last_var_ptr = NULL;
  75. static int last_var_size = 0;
  76. /* Override the corresponding functions from libgomp. */
  77. extern "C" int
  78. omp_is_initial_device (void) __GOMP_NOTHROW
  79. {
  80. return 0;
  81. }
  82. extern "C" int32_t
  83. omp_is_initial_device_ (void)
  84. {
  85. return omp_is_initial_device ();
  86. }
  87. /* Dummy function needed for the initialization of target process during the
  88. first call to __offload_offload1. */
  89. static void
  90. __offload_target_init_proc (OFFLOAD ofldt)
  91. {
  92. TRACE ("");
  93. }
  94. /* Collect addresses of the offload functions and of the global variables from
  95. the library descriptor and send them to host.
  96. Part 1: Send num_funcs and num_vars to host. */
  97. static void
  98. __offload_target_table_p1 (OFFLOAD ofldt)
  99. {
  100. void ***lib_descr = (void ***) last_loaded_library;
  101. if (lib_descr == NULL)
  102. {
  103. TRACE ("");
  104. fprintf (stderr, "Error! No shared libraries loaded on target.\n");
  105. return;
  106. }
  107. void **func_table_begin = lib_descr[0];
  108. void **func_table_end = lib_descr[1];
  109. void **var_table_begin = lib_descr[2];
  110. void **var_table_end = lib_descr[3];
  111. /* The func table contains only addresses, the var table contains addresses
  112. and corresponding sizes. */
  113. int num_funcs = func_table_end - func_table_begin;
  114. int num_vars = (var_table_end - var_table_begin) / 2;
  115. TRACE ("(num_funcs = %d, num_vars = %d)", num_funcs, num_vars);
  116. VarDesc vd1[2] = { vd_tgt2host, vd_tgt2host };
  117. vd1[0].ptr = &num_funcs;
  118. vd1[0].size = sizeof (num_funcs);
  119. vd1[1].ptr = &num_vars;
  120. vd1[1].size = sizeof (num_vars);
  121. VarDesc2 vd2[2] = { { "num_funcs", 0 }, { "num_vars", 0 } };
  122. __offload_target_enter (ofldt, 2, vd1, vd2);
  123. __offload_target_leave (ofldt);
  124. }
  125. /* Part 2: Send the table with addresses to host. */
  126. static void
  127. __offload_target_table_p2 (OFFLOAD ofldt)
  128. {
  129. void ***lib_descr = (void ***) last_loaded_library;
  130. void **func_table_begin = lib_descr[0];
  131. void **func_table_end = lib_descr[1];
  132. void **var_table_begin = lib_descr[2];
  133. void **var_table_end = lib_descr[3];
  134. int num_funcs = func_table_end - func_table_begin;
  135. int num_vars = (var_table_end - var_table_begin) / 2;
  136. int table_size = (num_funcs + 2 * num_vars) * sizeof (void *);
  137. void **table = (void **) malloc (table_size);
  138. TRACE ("(table_size = %d)", table_size);
  139. VarDesc vd1;
  140. vd1 = vd_tgt2host;
  141. vd1.ptr = table;
  142. vd1.size = table_size;
  143. VarDesc2 vd2 = { "table", 0 };
  144. __offload_target_enter (ofldt, 1, &vd1, &vd2);
  145. void **p;
  146. int i = 0;
  147. for (p = func_table_begin; p < func_table_end; p++, i++)
  148. table[i] = *p;
  149. for (p = var_table_begin; p < var_table_end; p++, i++)
  150. table[i] = *p;
  151. __offload_target_leave (ofldt);
  152. free (table);
  153. }
  154. /* Allocate size bytes and send a pointer to the allocated memory to host. */
  155. static void
  156. __offload_target_alloc (OFFLOAD ofldt)
  157. {
  158. size_t size = 0;
  159. void *ptr = NULL;
  160. VarDesc vd1[2] = { vd_host2tgt, vd_tgt2host };
  161. vd1[0].ptr = &size;
  162. vd1[0].size = sizeof (size);
  163. vd1[1].ptr = &ptr;
  164. vd1[1].size = sizeof (void *);
  165. VarDesc2 vd2[2] = { { "size", 0 }, { "ptr", 0 } };
  166. __offload_target_enter (ofldt, 2, vd1, vd2);
  167. ptr = malloc (size);
  168. TRACE ("(size = %d): ptr = %p", size, ptr);
  169. __offload_target_leave (ofldt);
  170. }
  171. /* Free the memory space pointed to by ptr. */
  172. static void
  173. __offload_target_free (OFFLOAD ofldt)
  174. {
  175. void *ptr = 0;
  176. VarDesc vd1 = vd_host2tgt;
  177. vd1.ptr = &ptr;
  178. vd1.size = sizeof (void *);
  179. VarDesc2 vd2 = { "ptr", 0 };
  180. __offload_target_enter (ofldt, 1, &vd1, &vd2);
  181. TRACE ("(ptr = %p)", ptr);
  182. free (ptr);
  183. __offload_target_leave (ofldt);
  184. }
  185. /* Receive var_size bytes from host and store to var_ptr.
  186. Part 1: Receive var_ptr and var_size from host. */
  187. static void
  188. __offload_target_host2tgt_p1 (OFFLOAD ofldt)
  189. {
  190. void *var_ptr = NULL;
  191. size_t var_size = 0;
  192. VarDesc vd1[2] = { vd_host2tgt, vd_host2tgt };
  193. vd1[0].ptr = &var_ptr;
  194. vd1[0].size = sizeof (void *);
  195. vd1[1].ptr = &var_size;
  196. vd1[1].size = sizeof (var_size);
  197. VarDesc2 vd2[2] = { { "var_ptr", 0 }, { "var_size", 0 } };
  198. __offload_target_enter (ofldt, 2, vd1, vd2);
  199. TRACE ("(var_ptr = %p, var_size = %d)", var_ptr, var_size);
  200. last_var_ptr = var_ptr;
  201. last_var_size = var_size;
  202. __offload_target_leave (ofldt);
  203. }
  204. /* Part 2: Receive the data from host. */
  205. static void
  206. __offload_target_host2tgt_p2 (OFFLOAD ofldt)
  207. {
  208. TRACE ("(last_var_ptr = %p, last_var_size = %d)",
  209. last_var_ptr, last_var_size);
  210. VarDesc vd1 = vd_host2tgt;
  211. vd1.ptr = last_var_ptr;
  212. vd1.size = last_var_size;
  213. VarDesc2 vd2 = { "var", 0 };
  214. __offload_target_enter (ofldt, 1, &vd1, &vd2);
  215. __offload_target_leave (ofldt);
  216. }
  217. /* Send var_size bytes from var_ptr to host.
  218. Part 1: Receive var_ptr and var_size from host. */
  219. static void
  220. __offload_target_tgt2host_p1 (OFFLOAD ofldt)
  221. {
  222. void *var_ptr = NULL;
  223. size_t var_size = 0;
  224. VarDesc vd1[2] = { vd_host2tgt, vd_host2tgt };
  225. vd1[0].ptr = &var_ptr;
  226. vd1[0].size = sizeof (void *);
  227. vd1[1].ptr = &var_size;
  228. vd1[1].size = sizeof (var_size);
  229. VarDesc2 vd2[2] = { { "var_ptr", 0 }, { "var_size", 0 } };
  230. __offload_target_enter (ofldt, 2, vd1, vd2);
  231. TRACE ("(var_ptr = %p, var_size = %d)", var_ptr, var_size);
  232. last_var_ptr = var_ptr;
  233. last_var_size = var_size;
  234. __offload_target_leave (ofldt);
  235. }
  236. /* Part 2: Send the data to host. */
  237. static void
  238. __offload_target_tgt2host_p2 (OFFLOAD ofldt)
  239. {
  240. TRACE ("(last_var_ptr = %p, last_var_size = %d)",
  241. last_var_ptr, last_var_size);
  242. VarDesc vd1 = vd_tgt2host;
  243. vd1.ptr = last_var_ptr;
  244. vd1.size = last_var_size;
  245. VarDesc2 vd2 = { "var", 0 };
  246. __offload_target_enter (ofldt, 1, &vd1, &vd2);
  247. __offload_target_leave (ofldt);
  248. }
  249. /* Call offload function by the address fn_ptr and pass vars_ptr to it. */
  250. static void
  251. __offload_target_run (OFFLOAD ofldt)
  252. {
  253. void *fn_ptr;
  254. void *vars_ptr;
  255. VarDesc vd1[2] = { vd_host2tgt, vd_host2tgt };
  256. vd1[0].ptr = &fn_ptr;
  257. vd1[0].size = sizeof (void *);
  258. vd1[1].ptr = &vars_ptr;
  259. vd1[1].size = sizeof (void *);
  260. VarDesc2 vd2[2] = { { "fn_ptr", 0 }, { "vars_ptr", 0 } };
  261. __offload_target_enter (ofldt, 2, vd1, vd2);
  262. TRACE ("(fn_ptr = %p, vars_ptr = %p)", fn_ptr, vars_ptr);
  263. void (*fn)(void *) = (void (*)(void *)) fn_ptr;
  264. fn (vars_ptr);
  265. __offload_target_leave (ofldt);
  266. }
  267. /* This should be called from every library with offloading. */
  268. extern "C" void
  269. target_register_lib (const void *target_table)
  270. {
  271. TRACE ("(target_table = %p { %p, %p, %p, %p })", target_table,
  272. ((void **) target_table)[0], ((void **) target_table)[1],
  273. ((void **) target_table)[2], ((void **) target_table)[3]);
  274. last_loaded_library = (void *) target_table;
  275. }
  276. /* Use __offload_target_main from liboffload. */
  277. int
  278. main (int argc, char **argv)
  279. {
  280. __offload_target_main ();
  281. return 0;
  282. }
  283. /* Register offload_target_main's functions in the liboffload. */
  284. struct Entry {
  285. const char *name;
  286. void *func;
  287. };
  288. #define REGISTER(f) \
  289. extern "C" const Entry __offload_target_##f##_$entry \
  290. __attribute__ ((section(".OffloadEntryTable."))) = { \
  291. "__offload_target_"#f, \
  292. (void *) __offload_target_##f \
  293. }
  294. REGISTER (init_proc);
  295. REGISTER (table_p1);
  296. REGISTER (table_p2);
  297. REGISTER (alloc);
  298. REGISTER (free);
  299. REGISTER (host2tgt_p1);
  300. REGISTER (host2tgt_p2);
  301. REGISTER (tgt2host_p1);
  302. REGISTER (tgt2host_p2);
  303. REGISTER (run);
  304. #undef REGISTER