diff --git a/llama.cpp b/llama.cpp index 08d6c162a5d7c..81083e167c3aa 100644 --- a/llama.cpp +++ b/llama.cpp @@ -6639,6 +6639,7 @@ static void llama_model_quantize_internal(const std::string & fname_inp, const s } std::ofstream fout(fname_out, std::ios::binary); + fout.exceptions(std::ofstream::failbit); // fail fast on write errors const size_t meta_size = gguf_get_meta_size(ctx_out);