há 2 anos atrás · 5ec8dd5a3c
--- a/ggml-cuda.cu
+++ b/ggml-cuda.cu
@@ -2635,7 +2635,7 @@ void ggml_cuda_free_scratch() {
 
				 bool ggml_cuda_compute_forward(struct ggml_compute_params * params, struct ggml_tensor * tensor){
			
 
				     ggml_cuda_func_t func;
			
 
				     const bool any_on_device = tensor->backend == GGML_BACKEND_GPU
			
 
				-        || tensor->src0->backend == GGML_BACKEND_GPU || tensor->src0->backend == GGML_BACKEND_GPU_SPLIT
			
 
				+        || (tensor->src0 != nullptr && (tensor->src0->backend == GGML_BACKEND_GPU || tensor->src0->backend == GGML_BACKEND_GPU_SPLIT))
			
 
				         || (tensor->src1 != nullptr && tensor->src1->backend == GGML_BACKEND_GPU);
			
 
				 
			
 
				     switch (tensor->op) {
			
--- a/ggml.c
+++ b/ggml.c
@@ -14911,7 +14911,7 @@ static void ggml_compute_forward(struct ggml_compute_params * params, struct ggm
 
				     if (skip_cpu) {
			
 
				         return;
			
 
				     }
			
 
				-    GGML_ASSERT(tensor->src0->backend == GGML_BACKEND_CPU);
			
 
				+    GGML_ASSERT(tensor->src0 == NULL || tensor->src0->backend == GGML_BACKEND_CPU);
			
 
				     GGML_ASSERT(tensor->src1 == NULL || tensor->src1->backend == GGML_BACKEND_CPU);
			
 
				 #endif // GGML_USE_CUBLAS