|
|
@@ -16,7 +16,8 @@
|
|
|
"HARDSWISH_FUNC": "{{MUTATE}}[dst_i] = src[src_i] * min(1.0, max(0.0, (src[src_i] + 3.0) / 6.0));",
|
|
|
"GELU_FUNC": "{{MUTATE}}[dst_i] = 0.5 * src[src_i] * (1.0 + tanh(clamp(sqrt(2.0 / 3.14159265) * (src[src_i] + 0.044715 * pow(src[src_i], 3.0)), -9.010913, 9.010913))); // Regarding tanh() domain restrictions in wgsl https://github.com/gpuweb/gpuweb/issues/4458",
|
|
|
"GELU_QUICK_FUNC": "{{MUTATE}}[dst_i] = src[src_i] * 0.5 * (1.0 + tanh(clamp(0.79788456 * (src[src_i] + 0.044715 * src[src_i] * src[src_i] * src[src_i]), -9.010913, 9.010913))); // Regarding tanh() domain restrictions in wgsl https://github.com/gpuweb/gpuweb/issues/4458",
|
|
|
- "GELU_ERF_FUNC": "{{MUTATE}}[dst_i] = 0.5 * src[src_i] * (1.0 + tanh(clamp(0.79788456 * (src[src_i] + 0.044715 * src[src_i] * src[src_i] * src[src_i]), -9.010913, 9.010913))); // Regarding tanh() domain restrictions in wgsl https://github.com/gpuweb/gpuweb/issues/4458"
|
|
|
+ "GELU_ERF_FUNC": "{{MUTATE}}[dst_i] = 0.5 * src[src_i] * (1.0 + tanh(clamp(0.79788456 * (src[src_i] + 0.044715 * src[src_i] * src[src_i] * src[src_i]), -9.010913, 9.010913))); // Regarding tanh() domain restrictions in wgsl https://github.com/gpuweb/gpuweb/issues/4458",
|
|
|
+ "CEIL_FUNC": "{{MUTATE}}[dst_i] = ceil(src[src_i]);"
|
|
|
}
|
|
|
|
|
|
#end(REPL_TEMPLATES)
|
|
|
@@ -357,6 +358,27 @@
|
|
|
"SHADER_NAME": "gelu_erf_inplace_f16",
|
|
|
"REPLS": { "TYPE": "f16", "FUNC": "GELU_ERF_FUNC", "EXT_PARAMS": "", "MUTATE": "src" },
|
|
|
"DECLS": ["INPLACE"]
|
|
|
+ },
|
|
|
+
|
|
|
+ {
|
|
|
+ "SHADER_NAME": "ceil_f32",
|
|
|
+ "REPLS": { "TYPE": "f32", "FUNC": "CEIL_FUNC", "EXT_PARAMS": "", "MUTATE": "dst" },
|
|
|
+ "DECLS": ["NOT_INPLACE"]
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "SHADER_NAME": "ceil_f16",
|
|
|
+ "REPLS": { "TYPE": "f16", "FUNC": "CEIL_FUNC", "EXT_PARAMS": "", "MUTATE": "dst" },
|
|
|
+ "DECLS": ["NOT_INPLACE"]
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "SHADER_NAME": "ceil_inplace_f32",
|
|
|
+ "REPLS": { "TYPE": "f32", "FUNC": "CEIL_FUNC", "EXT_PARAMS": "", "MUTATE": "src" },
|
|
|
+ "DECLS": ["INPLACE"]
|
|
|
+ },
|
|
|
+ {
|
|
|
+ "SHADER_NAME": "ceil_inplace_f16",
|
|
|
+ "REPLS": { "TYPE": "f16", "FUNC": "CEIL_FUNC", "EXT_PARAMS": "", "MUTATE": "src" },
|
|
|
+ "DECLS": ["INPLACE"]
|
|
|
}
|
|
|
]
|
|
|
|