Skip to content

Commit f061021

Browse files
authored
llama : print size and type of overridden tensors (#13364)
1 parent 8733e0c commit f061021

File tree

1 file changed

+4
-1
lines changed

1 file changed

+4
-1
lines changed

src/llama-model.cpp

Lines changed: 4 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -1651,8 +1651,11 @@ bool llama_model::load_tensors(llama_model_loader & ml) {
1651 1651
for (const auto * overrides = ml.tensor_buft_overrides; overrides->pattern != nullptr; ++overrides) {
1652 1652
std::regex pattern(overrides->pattern);
1653 1653
if (std::regex_search(tensor_name, pattern)) {
1654-
LLAMA_LOG_DEBUG("tensor %s buffer type overriden to %s\n", tensor_name.c_str(), ggml_backend_buft_name(overrides->buft));
1655 1654
buft = overrides->buft;
1655+
LLAMA_LOG_DEBUG("tensor %s (%zu MiB %s) buffer type overridden to %s\n",
1656+
tensor_name.c_str(),
1657+
ggml_nbytes(t_meta) / 1024 / 1024, ggml_type_name(t_meta->type),
1658+
ggml_backend_buft_name(buft));
1656 1659
break;
1657 1660
}
1658 1661
}

0 commit comments

Comments
 (0)