From 7c7836d9d4062d6858e3fb337b135c417ccee6ce Mon Sep 17 00:00:00 2001
From: 0cc4m
Date: Sun, 16 Jun 2024 07:17:31 +0200
Subject: Vulkan Shader Refactor, Memory Debugging Option (#7947)

* Refactor shaders, extract GLSL code from ggml_vk_generate_shaders.py into vulkan-shaders directory
* Improve debug log code
* Add memory debug output option
* Fix flake8
* Fix unnecessary high llama-3 VRAM use
---
 vulkan-shaders/relu.comp | 28 ++++++++++++++++++++++++++++
 1 file changed, 28 insertions(+)
 create mode 100644 vulkan-shaders/relu.comp

(limited to 'vulkan-shaders/relu.comp')

diff --git a/vulkan-shaders/relu.comp b/vulkan-shaders/relu.comp
new file mode 100644
index 00000000..7e5baa5b
--- /dev/null
+++ b/vulkan-shaders/relu.comp
@@ -0,0 +1,28 @@
+#version 450
+
+// Kept ahead of the includes: `p` is not declared in this file, so the includes
+// must emit declarations, and GLSL wants #extension before any such tokens.
+#extension GL_EXT_control_flow_attributes : enable
+
+#include "generic_head.comp"
+#include "types.comp"
+
+layout(local_size_x = 512, local_size_y = 1, local_size_z = 1) in;
+
+layout (binding = 0) readonly buffer X {A_TYPE data_a[];};
+layout (binding = 1) writeonly buffer D {D_TYPE data_d[];};
+
+// Element-wise ReLU: data_d[i] = max(data_a[i], 0) for each index i < p.KX.
+// Every invocation handles the single element selected by its global x index.
+void main() {
+    const uint i = gl_GlobalInvocationID.x;
+
+    // Indices at or beyond p.KX have no element to process.
+    if (i >= p.KX) {
+        return;
+    }
+
+    // Clamp in float, then convert explicitly so the store does not rely on an
+    // implicit float -> D_TYPE conversion.
+    data_d[i] = D_TYPE(max(float(data_a[i]), 0.0));
+}
-- 
cgit v1.2.3