// shader_gles3.cpp (26 KB)
/**************************************************************************/
/*  shader_gles3.cpp                                                      */
/**************************************************************************/
/*                         This file is part of:                          */
/*                             GODOT ENGINE                               */
/*                        https://godotengine.org                         */
/**************************************************************************/
/* Copyright (c) 2014-present Godot Engine contributors (see AUTHORS.md). */
/* Copyright (c) 2007-2014 Juan Linietsky, Ariel Manzur.                  */
/*                                                                        */
/* Permission is hereby granted, free of charge, to any person obtaining  */
/* a copy of this software and associated documentation files (the        */
/* "Software"), to deal in the Software without restriction, including    */
/* without limitation the rights to use, copy, modify, merge, publish,    */
/* distribute, sublicense, and/or sell copies of the Software, and to     */
/* permit persons to whom the Software is furnished to do so, subject to  */
/* the following conditions:                                              */
/*                                                                        */
/* The above copyright notice and this permission notice shall be         */
/* included in all copies or substantial portions of the Software.        */
/*                                                                        */
/* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,        */
/* EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF     */
/* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. */
/* IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY   */
/* CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT,   */
/* TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE      */
/* SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.                 */
/**************************************************************************/
  30. #include "shader_gles3.h"
  31. #ifdef GLES3_ENABLED
  32. #include "core/io/compression.h"
  33. #include "core/io/dir_access.h"
  34. #include "core/io/file_access.h"
  35. static String _mkid(const String &p_id) {
  36. String id = "m_" + p_id.replace("__", "_dus_");
  37. return id.replace("__", "_dus_"); //doubleunderscore is reserved in glsl
  38. }
  39. void ShaderGLES3::_add_stage(const char *p_code, StageType p_stage_type) {
  40. Vector<String> lines = String(p_code).split("\n");
  41. String text;
  42. for (int i = 0; i < lines.size(); i++) {
  43. String l = lines[i];
  44. bool push_chunk = false;
  45. StageTemplate::Chunk chunk;
  46. if (l.begins_with("#GLOBALS")) {
  47. switch (p_stage_type) {
  48. case STAGE_TYPE_VERTEX:
  49. chunk.type = StageTemplate::Chunk::TYPE_VERTEX_GLOBALS;
  50. break;
  51. case STAGE_TYPE_FRAGMENT:
  52. chunk.type = StageTemplate::Chunk::TYPE_FRAGMENT_GLOBALS;
  53. break;
  54. default: {
  55. }
  56. }
  57. push_chunk = true;
  58. } else if (l.begins_with("#MATERIAL_UNIFORMS")) {
  59. chunk.type = StageTemplate::Chunk::TYPE_MATERIAL_UNIFORMS;
  60. push_chunk = true;
  61. } else if (l.begins_with("#CODE")) {
  62. chunk.type = StageTemplate::Chunk::TYPE_CODE;
  63. push_chunk = true;
  64. chunk.code = l.replace_first("#CODE", String()).replace(":", "").strip_edges().to_upper();
  65. } else {
  66. text += l + "\n";
  67. }
  68. if (push_chunk) {
  69. if (text != String()) {
  70. StageTemplate::Chunk text_chunk;
  71. text_chunk.type = StageTemplate::Chunk::TYPE_TEXT;
  72. text_chunk.text = text.utf8();
  73. stage_templates[p_stage_type].chunks.push_back(text_chunk);
  74. text = String();
  75. }
  76. stage_templates[p_stage_type].chunks.push_back(chunk);
  77. }
  78. if (text != String()) {
  79. StageTemplate::Chunk text_chunk;
  80. text_chunk.type = StageTemplate::Chunk::TYPE_TEXT;
  81. text_chunk.text = text.utf8();
  82. stage_templates[p_stage_type].chunks.push_back(text_chunk);
  83. text = String();
  84. }
  85. }
  86. }
  87. void ShaderGLES3::_setup(const char *p_vertex_code, const char *p_fragment_code, const char *p_name, int p_uniform_count, const char **p_uniform_names, int p_ubo_count, const UBOPair *p_ubos, int p_feedback_count, const Feedback *p_feedback, int p_texture_count, const TexUnitPair *p_tex_units, int p_specialization_count, const Specialization *p_specializations, int p_variant_count, const char **p_variants) {
  88. name = p_name;
  89. if (p_vertex_code) {
  90. _add_stage(p_vertex_code, STAGE_TYPE_VERTEX);
  91. }
  92. if (p_fragment_code) {
  93. _add_stage(p_fragment_code, STAGE_TYPE_FRAGMENT);
  94. }
  95. uniform_names = p_uniform_names;
  96. uniform_count = p_uniform_count;
  97. ubo_pairs = p_ubos;
  98. ubo_count = p_ubo_count;
  99. texunit_pairs = p_tex_units;
  100. texunit_pair_count = p_texture_count;
  101. specializations = p_specializations;
  102. specialization_count = p_specialization_count;
  103. specialization_default_mask = 0;
  104. for (int i = 0; i < specialization_count; i++) {
  105. if (specializations[i].default_value) {
  106. specialization_default_mask |= (uint64_t(1) << uint64_t(i));
  107. }
  108. }
  109. variant_defines = p_variants;
  110. variant_count = p_variant_count;
  111. feedbacks = p_feedback;
  112. feedback_count = p_feedback_count;
  113. StringBuilder tohash;
  114. /*
  115. tohash.append("[SpirvCacheKey]");
  116. tohash.append(RenderingDevice::get_singleton()->shader_get_spirv_cache_key());
  117. tohash.append("[BinaryCacheKey]");
  118. tohash.append(RenderingDevice::get_singleton()->shader_get_binary_cache_key());
  119. */
  120. tohash.append("[Vertex]");
  121. tohash.append(p_vertex_code ? p_vertex_code : "");
  122. tohash.append("[Fragment]");
  123. tohash.append(p_fragment_code ? p_fragment_code : "");
  124. base_sha256 = tohash.as_string().sha256_text();
  125. }
  126. RID ShaderGLES3::version_create() {
  127. //initialize() was never called
  128. ERR_FAIL_COND_V(variant_count == 0, RID());
  129. Version version;
  130. return version_owner.make_rid(version);
  131. }
  132. void ShaderGLES3::_build_variant_code(StringBuilder &builder, uint32_t p_variant, const Version *p_version, StageType p_stage_type, uint64_t p_specialization) {
  133. #ifdef GLES_OVER_GL
  134. builder.append("#version 330\n");
  135. builder.append("#define USE_GLES_OVER_GL\n");
  136. #else
  137. builder.append("#version 300 es\n");
  138. #endif
  139. for (int i = 0; i < specialization_count; i++) {
  140. if (p_specialization & (uint64_t(1) << uint64_t(i))) {
  141. builder.append("#define " + String(specializations[i].name) + "\n");
  142. }
  143. }
  144. if (p_version->uniforms.size()) {
  145. builder.append("#define MATERIAL_UNIFORMS_USED\n");
  146. }
  147. for (const KeyValue<StringName, CharString> &E : p_version->code_sections) {
  148. builder.append(String("#define ") + String(E.key) + "_CODE_USED\n");
  149. }
  150. builder.append("\n"); //make sure defines begin at newline
  151. builder.append(general_defines.get_data());
  152. builder.append(variant_defines[p_variant]);
  153. builder.append("\n");
  154. for (int j = 0; j < p_version->custom_defines.size(); j++) {
  155. builder.append(p_version->custom_defines[j].get_data());
  156. }
  157. builder.append("\n"); //make sure defines begin at newline
  158. // Insert multiview extension loading, because it needs to appear before
  159. // any non-preprocessor code (like the "precision highp..." lines below).
  160. builder.append("#ifdef USE_MULTIVIEW\n");
  161. builder.append("#if defined(GL_OVR_multiview2)\n");
  162. builder.append("#extension GL_OVR_multiview2 : require\n");
  163. builder.append("#elif defined(GL_OVR_multiview)\n");
  164. builder.append("#extension GL_OVR_multiview : require\n");
  165. builder.append("#endif\n");
  166. if (p_stage_type == StageType::STAGE_TYPE_VERTEX) {
  167. builder.append("layout(num_views=2) in;\n");
  168. }
  169. builder.append("#define ViewIndex gl_ViewID_OVR\n");
  170. builder.append("#define MAX_VIEWS 2\n");
  171. builder.append("#else\n");
  172. builder.append("#define ViewIndex uint(0)\n");
  173. builder.append("#define MAX_VIEWS 1\n");
  174. builder.append("#endif\n");
  175. // Default to highp precision unless specified otherwise.
  176. builder.append("precision highp float;\n");
  177. builder.append("precision highp int;\n");
  178. #ifndef GLES_OVER_GL
  179. builder.append("precision highp sampler2D;\n");
  180. builder.append("precision highp samplerCube;\n");
  181. builder.append("precision highp sampler2DArray;\n");
  182. #endif
  183. const StageTemplate &stage_template = stage_templates[p_stage_type];
  184. for (uint32_t i = 0; i < stage_template.chunks.size(); i++) {
  185. const StageTemplate::Chunk &chunk = stage_template.chunks[i];
  186. switch (chunk.type) {
  187. case StageTemplate::Chunk::TYPE_MATERIAL_UNIFORMS: {
  188. builder.append(p_version->uniforms.get_data()); //uniforms (same for vertex and fragment)
  189. } break;
  190. case StageTemplate::Chunk::TYPE_VERTEX_GLOBALS: {
  191. builder.append(p_version->vertex_globals.get_data()); // vertex globals
  192. } break;
  193. case StageTemplate::Chunk::TYPE_FRAGMENT_GLOBALS: {
  194. builder.append(p_version->fragment_globals.get_data()); // fragment globals
  195. } break;
  196. case StageTemplate::Chunk::TYPE_CODE: {
  197. if (p_version->code_sections.has(chunk.code)) {
  198. builder.append(p_version->code_sections[chunk.code].get_data());
  199. }
  200. } break;
  201. case StageTemplate::Chunk::TYPE_TEXT: {
  202. builder.append(chunk.text.get_data());
  203. } break;
  204. }
  205. }
  206. }
  207. static void _display_error_with_code(const String &p_error, const String &p_code) {
  208. int line = 1;
  209. Vector<String> lines = p_code.split("\n");
  210. for (int j = 0; j < lines.size(); j++) {
  211. print_line(itos(line) + ": " + lines[j]);
  212. line++;
  213. }
  214. ERR_PRINT(p_error);
  215. }
  216. void ShaderGLES3::_get_uniform_locations(Version::Specialization &spec, Version *p_version) {
  217. glUseProgram(spec.id);
  218. spec.uniform_location.resize(uniform_count);
  219. for (int i = 0; i < uniform_count; i++) {
  220. spec.uniform_location[i] = glGetUniformLocation(spec.id, uniform_names[i]);
  221. }
  222. for (int i = 0; i < texunit_pair_count; i++) {
  223. GLint loc = glGetUniformLocation(spec.id, texunit_pairs[i].name);
  224. if (loc >= 0) {
  225. if (texunit_pairs[i].index < 0) {
  226. glUniform1i(loc, max_image_units + texunit_pairs[i].index);
  227. } else {
  228. glUniform1i(loc, texunit_pairs[i].index);
  229. }
  230. }
  231. }
  232. for (int i = 0; i < ubo_count; i++) {
  233. GLint loc = glGetUniformBlockIndex(spec.id, ubo_pairs[i].name);
  234. if (loc >= 0) {
  235. glUniformBlockBinding(spec.id, loc, ubo_pairs[i].index);
  236. }
  237. }
  238. // textures
  239. int texture_index = 0;
  240. for (uint32_t i = 0; i < p_version->texture_uniforms.size(); i++) {
  241. String native_uniform_name = _mkid(p_version->texture_uniforms[i].name);
  242. GLint location = glGetUniformLocation(spec.id, (native_uniform_name).ascii().get_data());
  243. Vector<int32_t> texture_uniform_bindings;
  244. int texture_count = p_version->texture_uniforms[i].array_size;
  245. for (int j = 0; j < texture_count; j++) {
  246. texture_uniform_bindings.append(texture_index + base_texture_index);
  247. texture_index++;
  248. }
  249. glUniform1iv(location, texture_uniform_bindings.size(), texture_uniform_bindings.ptr());
  250. }
  251. glUseProgram(0);
  252. }
  253. void ShaderGLES3::_compile_specialization(Version::Specialization &spec, uint32_t p_variant, Version *p_version, uint64_t p_specialization) {
  254. spec.id = glCreateProgram();
  255. spec.ok = false;
  256. GLint status;
  257. //vertex stage
  258. {
  259. StringBuilder builder;
  260. _build_variant_code(builder, p_variant, p_version, STAGE_TYPE_VERTEX, p_specialization);
  261. spec.vert_id = glCreateShader(GL_VERTEX_SHADER);
  262. String builder_string = builder.as_string();
  263. CharString cs = builder_string.utf8();
  264. const char *cstr = cs.ptr();
  265. glShaderSource(spec.vert_id, 1, &cstr, nullptr);
  266. glCompileShader(spec.vert_id);
  267. glGetShaderiv(spec.vert_id, GL_COMPILE_STATUS, &status);
  268. if (status == GL_FALSE) {
  269. GLsizei iloglen;
  270. glGetShaderiv(spec.vert_id, GL_INFO_LOG_LENGTH, &iloglen);
  271. if (iloglen < 0) {
  272. glDeleteShader(spec.vert_id);
  273. glDeleteProgram(spec.id);
  274. spec.id = 0;
  275. ERR_PRINT("No OpenGL vertex shader compiler log.");
  276. } else {
  277. if (iloglen == 0) {
  278. iloglen = 4096; // buggy driver (Adreno 220+)
  279. }
  280. char *ilogmem = (char *)Memory::alloc_static(iloglen + 1);
  281. ilogmem[iloglen] = '\0';
  282. glGetShaderInfoLog(spec.vert_id, iloglen, &iloglen, ilogmem);
  283. String err_string = name + ": Vertex shader compilation failed:\n";
  284. err_string += ilogmem;
  285. _display_error_with_code(err_string, builder_string);
  286. Memory::free_static(ilogmem);
  287. glDeleteShader(spec.vert_id);
  288. glDeleteProgram(spec.id);
  289. spec.id = 0;
  290. }
  291. ERR_FAIL();
  292. }
  293. }
  294. //fragment stage
  295. {
  296. StringBuilder builder;
  297. _build_variant_code(builder, p_variant, p_version, STAGE_TYPE_FRAGMENT, p_specialization);
  298. spec.frag_id = glCreateShader(GL_FRAGMENT_SHADER);
  299. String builder_string = builder.as_string();
  300. CharString cs = builder_string.utf8();
  301. const char *cstr = cs.ptr();
  302. glShaderSource(spec.frag_id, 1, &cstr, nullptr);
  303. glCompileShader(spec.frag_id);
  304. glGetShaderiv(spec.frag_id, GL_COMPILE_STATUS, &status);
  305. if (status == GL_FALSE) {
  306. GLsizei iloglen;
  307. glGetShaderiv(spec.frag_id, GL_INFO_LOG_LENGTH, &iloglen);
  308. if (iloglen < 0) {
  309. glDeleteShader(spec.frag_id);
  310. glDeleteProgram(spec.id);
  311. spec.id = 0;
  312. ERR_PRINT("No OpenGL fragment shader compiler log.");
  313. } else {
  314. if (iloglen == 0) {
  315. iloglen = 4096; // buggy driver (Adreno 220+)
  316. }
  317. char *ilogmem = (char *)Memory::alloc_static(iloglen + 1);
  318. ilogmem[iloglen] = '\0';
  319. glGetShaderInfoLog(spec.frag_id, iloglen, &iloglen, ilogmem);
  320. String err_string = name + ": Fragment shader compilation failed:\n";
  321. err_string += ilogmem;
  322. _display_error_with_code(err_string, builder_string);
  323. Memory::free_static(ilogmem);
  324. glDeleteShader(spec.frag_id);
  325. glDeleteProgram(spec.id);
  326. spec.id = 0;
  327. }
  328. ERR_FAIL();
  329. }
  330. }
  331. glAttachShader(spec.id, spec.frag_id);
  332. glAttachShader(spec.id, spec.vert_id);
  333. // If feedback exists, set it up.
  334. if (feedback_count) {
  335. Vector<const char *> feedback;
  336. for (int i = 0; i < feedback_count; i++) {
  337. if (feedbacks[i].specialization == 0 || (feedbacks[i].specialization & p_specialization)) {
  338. // Specialization for this feedback is enabled
  339. feedback.push_back(feedbacks[i].name);
  340. }
  341. }
  342. if (feedback.size()) {
  343. glTransformFeedbackVaryings(spec.id, feedback.size(), feedback.ptr(), GL_INTERLEAVED_ATTRIBS);
  344. }
  345. }
  346. glLinkProgram(spec.id);
  347. glGetProgramiv(spec.id, GL_LINK_STATUS, &status);
  348. if (status == GL_FALSE) {
  349. GLsizei iloglen;
  350. glGetProgramiv(spec.id, GL_INFO_LOG_LENGTH, &iloglen);
  351. if (iloglen < 0) {
  352. glDeleteShader(spec.frag_id);
  353. glDeleteShader(spec.vert_id);
  354. glDeleteProgram(spec.id);
  355. spec.id = 0;
  356. ERR_PRINT("No OpenGL program link log. Something is wrong.");
  357. ERR_FAIL();
  358. }
  359. if (iloglen == 0) {
  360. iloglen = 4096; // buggy driver (Adreno 220+)
  361. }
  362. char *ilogmem = (char *)Memory::alloc_static(iloglen + 1);
  363. ilogmem[iloglen] = '\0';
  364. glGetProgramInfoLog(spec.id, iloglen, &iloglen, ilogmem);
  365. String err_string = name + ": Program linking failed:\n";
  366. err_string += ilogmem;
  367. _display_error_with_code(err_string, String());
  368. Memory::free_static(ilogmem);
  369. glDeleteShader(spec.frag_id);
  370. glDeleteShader(spec.vert_id);
  371. glDeleteProgram(spec.id);
  372. spec.id = 0;
  373. ERR_FAIL();
  374. }
  375. _get_uniform_locations(spec, p_version);
  376. spec.ok = true;
  377. }
  378. RS::ShaderNativeSourceCode ShaderGLES3::version_get_native_source_code(RID p_version) {
  379. Version *version = version_owner.get_or_null(p_version);
  380. RS::ShaderNativeSourceCode source_code;
  381. ERR_FAIL_COND_V(!version, source_code);
  382. source_code.versions.resize(variant_count);
  383. for (int i = 0; i < source_code.versions.size(); i++) {
  384. //vertex stage
  385. {
  386. StringBuilder builder;
  387. _build_variant_code(builder, i, version, STAGE_TYPE_VERTEX, specialization_default_mask);
  388. RS::ShaderNativeSourceCode::Version::Stage stage;
  389. stage.name = "vertex";
  390. stage.code = builder.as_string();
  391. source_code.versions.write[i].stages.push_back(stage);
  392. }
  393. //fragment stage
  394. {
  395. StringBuilder builder;
  396. _build_variant_code(builder, i, version, STAGE_TYPE_FRAGMENT, specialization_default_mask);
  397. RS::ShaderNativeSourceCode::Version::Stage stage;
  398. stage.name = "fragment";
  399. stage.code = builder.as_string();
  400. source_code.versions.write[i].stages.push_back(stage);
  401. }
  402. }
  403. return source_code;
  404. }
  405. String ShaderGLES3::_version_get_sha1(Version *p_version) const {
  406. StringBuilder hash_build;
  407. hash_build.append("[uniforms]");
  408. hash_build.append(p_version->uniforms.get_data());
  409. hash_build.append("[vertex_globals]");
  410. hash_build.append(p_version->vertex_globals.get_data());
  411. hash_build.append("[fragment_globals]");
  412. hash_build.append(p_version->fragment_globals.get_data());
  413. Vector<StringName> code_sections;
  414. for (const KeyValue<StringName, CharString> &E : p_version->code_sections) {
  415. code_sections.push_back(E.key);
  416. }
  417. code_sections.sort_custom<StringName::AlphCompare>();
  418. for (int i = 0; i < code_sections.size(); i++) {
  419. hash_build.append(String("[code:") + String(code_sections[i]) + "]");
  420. hash_build.append(p_version->code_sections[code_sections[i]].get_data());
  421. }
  422. for (int i = 0; i < p_version->custom_defines.size(); i++) {
  423. hash_build.append("[custom_defines:" + itos(i) + "]");
  424. hash_build.append(p_version->custom_defines[i].get_data());
  425. }
  426. return hash_build.as_string().sha1_text();
  427. }
  428. #ifndef WEB_ENABLED // not supported in webgl
  429. static const char *shader_file_header = "GLSC";
  430. static const uint32_t cache_file_version = 3;
  431. #endif
  432. bool ShaderGLES3::_load_from_cache(Version *p_version) {
  433. #ifdef WEB_ENABLED // not supported in webgl
  434. return false;
  435. #else
  436. #ifdef GLES_OVER_GL
  437. if (glProgramBinary == NULL) { // ARB_get_program_binary extension not available
  438. return false;
  439. }
  440. #endif
  441. String sha1 = _version_get_sha1(p_version);
  442. String path = shader_cache_dir.path_join(name).path_join(base_sha256).path_join(sha1) + ".cache";
  443. Ref<FileAccess> f = FileAccess::open(path, FileAccess::READ);
  444. if (f.is_null()) {
  445. return false;
  446. }
  447. char header[5] = {};
  448. f->get_buffer((uint8_t *)header, 4);
  449. ERR_FAIL_COND_V(header != String(shader_file_header), false);
  450. uint32_t file_version = f->get_32();
  451. if (file_version != cache_file_version) {
  452. return false; // wrong version
  453. }
  454. int cache_variant_count = static_cast<int>(f->get_32());
  455. ERR_FAIL_COND_V_MSG(cache_variant_count != this->variant_count, false, "shader cache variant count mismatch, expected " + itos(this->variant_count) + " got " + itos(cache_variant_count)); //should not happen but check
  456. LocalVector<OAHashMap<uint64_t, Version::Specialization>> variants;
  457. for (int i = 0; i < cache_variant_count; i++) {
  458. uint32_t cache_specialization_count = f->get_32();
  459. OAHashMap<uint64_t, Version::Specialization> variant;
  460. for (uint32_t j = 0; j < cache_specialization_count; j++) {
  461. uint64_t specialization_key = f->get_64();
  462. uint32_t variant_size = f->get_32();
  463. if (variant_size == 0) {
  464. continue;
  465. }
  466. uint32_t variant_format = f->get_32();
  467. Vector<uint8_t> variant_bytes;
  468. variant_bytes.resize(variant_size);
  469. uint32_t br = f->get_buffer(variant_bytes.ptrw(), variant_size);
  470. ERR_FAIL_COND_V(br != variant_size, false);
  471. Version::Specialization specialization;
  472. specialization.id = glCreateProgram();
  473. glProgramBinary(specialization.id, variant_format, variant_bytes.ptr(), variant_bytes.size());
  474. GLint link_status = 0;
  475. glGetProgramiv(specialization.id, GL_LINK_STATUS, &link_status);
  476. if (link_status != GL_TRUE) {
  477. WARN_PRINT_ONCE("Failed to load cached shader, recompiling.");
  478. return false;
  479. }
  480. _get_uniform_locations(specialization, p_version);
  481. specialization.ok = true;
  482. variant.insert(specialization_key, specialization);
  483. }
  484. variants.push_back(variant);
  485. }
  486. p_version->variants = variants;
  487. return true;
  488. #endif // WEB_ENABLED
  489. }
  490. void ShaderGLES3::_save_to_cache(Version *p_version) {
  491. #ifdef WEB_ENABLED // not supported in webgl
  492. return;
  493. #else
  494. #ifdef GLES_OVER_GL
  495. if (glGetProgramBinary == NULL) { // ARB_get_program_binary extension not available
  496. return;
  497. }
  498. #endif
  499. String sha1 = _version_get_sha1(p_version);
  500. String path = shader_cache_dir.path_join(name).path_join(base_sha256).path_join(sha1) + ".cache";
  501. Error error;
  502. Ref<FileAccess> f = FileAccess::open(path, FileAccess::WRITE, &error);
  503. ERR_FAIL_COND(f.is_null());
  504. f->store_buffer((const uint8_t *)shader_file_header, 4);
  505. f->store_32(cache_file_version);
  506. f->store_32(variant_count);
  507. for (int i = 0; i < variant_count; i++) {
  508. int cache_specialization_count = p_version->variants[i].get_num_elements();
  509. f->store_32(cache_specialization_count);
  510. for (OAHashMap<uint64_t, ShaderGLES3::Version::Specialization>::Iterator it = p_version->variants[i].iter(); it.valid; it = p_version->variants[i].next_iter(it)) {
  511. const uint64_t specialization_key = *it.key;
  512. f->store_64(specialization_key);
  513. const Version::Specialization *specialization = it.value;
  514. if (specialization == nullptr) {
  515. f->store_32(0);
  516. continue;
  517. }
  518. GLint program_size = 0;
  519. glGetProgramiv(specialization->id, GL_PROGRAM_BINARY_LENGTH, &program_size);
  520. if (program_size == 0) {
  521. f->store_32(0);
  522. continue;
  523. }
  524. PackedByteArray compiled_program;
  525. compiled_program.resize(program_size);
  526. GLenum binary_format = 0;
  527. glGetProgramBinary(specialization->id, program_size, nullptr, &binary_format, compiled_program.ptrw());
  528. if (program_size != compiled_program.size()) {
  529. f->store_32(0);
  530. continue;
  531. }
  532. f->store_32(program_size);
  533. f->store_32(binary_format);
  534. f->store_buffer(compiled_program.ptr(), compiled_program.size());
  535. }
  536. }
  537. #endif // WEB_ENABLED
  538. }
  539. void ShaderGLES3::_clear_version(Version *p_version) {
  540. // Variants not compiled yet, just return
  541. if (p_version->variants.size() == 0) {
  542. return;
  543. }
  544. for (int i = 0; i < variant_count; i++) {
  545. for (OAHashMap<uint64_t, Version::Specialization>::Iterator it = p_version->variants[i].iter(); it.valid; it = p_version->variants[i].next_iter(it)) {
  546. if (it.value->id != 0) {
  547. glDeleteShader(it.value->vert_id);
  548. glDeleteShader(it.value->frag_id);
  549. glDeleteProgram(it.value->id);
  550. }
  551. }
  552. }
  553. p_version->variants.clear();
  554. }
  555. void ShaderGLES3::_initialize_version(Version *p_version) {
  556. ERR_FAIL_COND(p_version->variants.size() > 0);
  557. if (_load_from_cache(p_version)) {
  558. return;
  559. }
  560. p_version->variants.reserve(variant_count);
  561. for (int i = 0; i < variant_count; i++) {
  562. OAHashMap<uint64_t, Version::Specialization> variant;
  563. p_version->variants.push_back(variant);
  564. Version::Specialization spec;
  565. _compile_specialization(spec, i, p_version, specialization_default_mask);
  566. p_version->variants[i].insert(specialization_default_mask, spec);
  567. }
  568. _save_to_cache(p_version);
  569. }
  570. void ShaderGLES3::version_set_code(RID p_version, const HashMap<String, String> &p_code, const String &p_uniforms, const String &p_vertex_globals, const String &p_fragment_globals, const Vector<String> &p_custom_defines, const LocalVector<ShaderGLES3::TextureUniformData> &p_texture_uniforms, bool p_initialize) {
  571. Version *version = version_owner.get_or_null(p_version);
  572. ERR_FAIL_COND(!version);
  573. _clear_version(version); //clear if existing
  574. version->vertex_globals = p_vertex_globals.utf8();
  575. version->fragment_globals = p_fragment_globals.utf8();
  576. version->uniforms = p_uniforms.utf8();
  577. version->code_sections.clear();
  578. version->texture_uniforms = p_texture_uniforms;
  579. for (const KeyValue<String, String> &E : p_code) {
  580. version->code_sections[StringName(E.key.to_upper())] = E.value.utf8();
  581. }
  582. version->custom_defines.clear();
  583. for (int i = 0; i < p_custom_defines.size(); i++) {
  584. version->custom_defines.push_back(p_custom_defines[i].utf8());
  585. }
  586. if (p_initialize) {
  587. _initialize_version(version);
  588. }
  589. }
  590. bool ShaderGLES3::version_is_valid(RID p_version) {
  591. Version *version = version_owner.get_or_null(p_version);
  592. return version != nullptr;
  593. }
  594. bool ShaderGLES3::version_free(RID p_version) {
  595. if (version_owner.owns(p_version)) {
  596. Version *version = version_owner.get_or_null(p_version);
  597. _clear_version(version);
  598. version_owner.free(p_version);
  599. } else {
  600. return false;
  601. }
  602. return true;
  603. }
  604. bool ShaderGLES3::shader_cache_cleanup_on_start = false;
  605. ShaderGLES3::ShaderGLES3() {
  606. }
  607. void ShaderGLES3::initialize(const String &p_general_defines, int p_base_texture_index) {
  608. general_defines = p_general_defines.utf8();
  609. base_texture_index = p_base_texture_index;
  610. _init();
  611. if (shader_cache_dir != String()) {
  612. StringBuilder hash_build;
  613. hash_build.append("[base_hash]");
  614. hash_build.append(base_sha256);
  615. hash_build.append("[general_defines]");
  616. hash_build.append(general_defines.get_data());
  617. for (int i = 0; i < variant_count; i++) {
  618. hash_build.append("[variant_defines:" + itos(i) + "]");
  619. hash_build.append(variant_defines[i]);
  620. }
  621. base_sha256 = hash_build.as_string().sha256_text();
  622. Ref<DirAccess> d = DirAccess::open(shader_cache_dir);
  623. ERR_FAIL_COND(d.is_null());
  624. if (d->change_dir(name) != OK) {
  625. Error err = d->make_dir(name);
  626. ERR_FAIL_COND(err != OK);
  627. d->change_dir(name);
  628. }
  629. //erase other versions?
  630. if (shader_cache_cleanup_on_start) {
  631. }
  632. //
  633. if (d->change_dir(base_sha256) != OK) {
  634. Error err = d->make_dir(base_sha256);
  635. ERR_FAIL_COND(err != OK);
  636. }
  637. shader_cache_dir_valid = true;
  638. print_verbose("Shader '" + name + "' SHA256: " + base_sha256);
  639. }
  640. glGetInteger64v(GL_MAX_TEXTURE_IMAGE_UNITS, &max_image_units);
  641. }
  642. void ShaderGLES3::set_shader_cache_dir(const String &p_dir) {
  643. shader_cache_dir = p_dir;
  644. }
  645. void ShaderGLES3::set_shader_cache_save_compressed(bool p_enable) {
  646. shader_cache_save_compressed = p_enable;
  647. }
  648. void ShaderGLES3::set_shader_cache_save_compressed_zstd(bool p_enable) {
  649. shader_cache_save_compressed_zstd = p_enable;
  650. }
  651. void ShaderGLES3::set_shader_cache_save_debug(bool p_enable) {
  652. shader_cache_save_debug = p_enable;
  653. }
  654. String ShaderGLES3::shader_cache_dir;
  655. bool ShaderGLES3::shader_cache_save_compressed = true;
  656. bool ShaderGLES3::shader_cache_save_compressed_zstd = true;
  657. bool ShaderGLES3::shader_cache_save_debug = true;
  658. ShaderGLES3::~ShaderGLES3() {
  659. List<RID> remaining;
  660. version_owner.get_owned_list(&remaining);
  661. if (remaining.size()) {
  662. ERR_PRINT(itos(remaining.size()) + " shaders of type " + name + " were never freed");
  663. while (remaining.size()) {
  664. version_free(remaining.front()->get());
  665. remaining.pop_front();
  666. }
  667. }
  668. }
  669. #endif