Skip to content

Commit 421e39b

Browse files
committed
use ggml_backend_tensor_get_async and sync for cuda backend
1 parent 9ea2bcd commit 421e39b

File tree

1 file changed

+6
-2
lines changed

1 file changed

+6
-2
lines changed

stable-diffusion.cpp

Lines changed: 6 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -606,8 +606,12 @@ std::pair<std::unordered_map<std::string, float>, std::string> extract_and_remov
606606
}
607607

608608
// Rendered diff hunk: a line following an "NNN-" marker belongs to the removed
// version of the function, a line following an "NNN+" marker to the added one.
//
// Forwards (tensor, data, offset, size) to a ggml tensor read call.
// After this change:
//   - when SD_USE_CUBLAS is defined, the read is issued through
//     ggml_backend_tensor_get_async() on `backend`, followed by
//     ggml_backend_synchronize(backend) before the function returns;
//   - otherwise ggml_backend_tensor_get() is called and `backend` is unused.
// Before this change, ggml_backend_tensor_get() and ggml_backend_synchronize()
// were both called unconditionally.
// NOTE(review): the #else branch no longer synchronizes; this presumably relies
// on ggml_backend_tensor_get() being a blocking call. Confirm against ggml-backend.h.
void ggml_backend_tensor_get_and_sync(ggml_backend_t backend, const struct ggml_tensor * tensor, void * data, size_t offset, size_t size) {
609-
ggml_backend_tensor_get(tensor, data, offset, size);
610-
ggml_backend_synchronize(backend);
609+
#ifdef SD_USE_CUBLAS
610+
ggml_backend_tensor_get_async(backend, tensor, data, offset, size);
611+
ggml_backend_synchronize(backend);
612+
#else
613+
ggml_backend_tensor_get(tensor, data, offset, size);
614+
#endif
611615
}
612616

613617
/*================================================== CLIPTokenizer ===================================================*/

0 commit comments

Comments
 (0)