1 file changed: +1 -4 lines changed
Original file line number | Diff line number | Diff line change
@@ -5469,9 +5469,6 @@ static struct ggml_cgraph * llama_build_graph(
5469
5469
// check if we should build the worst-case graph (for memory measurement)
5470
5470
const bool worst_case = ggml_allocr_is_measure (lctx.alloc );
5471
5471
5472
- // count the number of times a tensor with a given name has been offloaded
5473
- std::unordered_map<std::string, int > offload_n;
5474
-
5475
5472
// keep track of the input that has already been allocated
5476
5473
bool alloc_inp_tokens = false ;
5477
5474
bool alloc_inp_embd = false ;
@@ -5654,7 +5651,7 @@ static struct ggml_cgraph * llama_build_graph(
5654
5651
break ;
5655
5652
case OFFLOAD_FUNC:
5656
5653
if (n_gpu_layers < n_layer) {
5657
- if (offload_n[name]++ < i_gpu_start) {
5654
+ if (il < i_gpu_start) {
5658
5655
func_e = OFFLOAD_FUNC_NOP;
5659
5656
}
5660
5657
}
You can’t perform that action at this time.
0 commit comments