File tree Expand file tree Collapse file tree 2 files changed +0
-11
lines changed Expand file tree Collapse file tree 2 files changed +0
-11
lines changed Original file line number Diff line number Diff line change @@ -72,11 +72,3 @@ class ggml_tensor_extra_split_expert : public ggml_tensor_extra_interface {
72
72
void *get_expert_param (int expert_id) override ;
73
73
void *get_expert_param_gpu (int expert_id) override ;
74
74
};
75
-
76
- class ggml_tensor_extra_gpu_cache : public ggml_tensor_extra_interface {
77
- public:
78
- void * data_cache_host;
79
- size_t per_expert_nbytes;
80
- long get_per_expert_alloc_nbytes () override { return per_expert_nbytes; }
81
- void * get_expert_param (int expert_id) override ;
82
- };
Original file line number Diff line number Diff line change @@ -117,9 +117,6 @@ void sparse_llm_cache_context::init_gpu_states() {
117
117
states->prefetch_mngr ->launch_thread ();
118
118
}
119
119
120
- void * ggml_tensor_extra_gpu_cache::get_expert_param (int expert_id) {
121
- return (uint8_t *)data_cache_host + expert_id*this ->per_expert_nbytes ;
122
- }
123
120
void * ggml_tensor_extra_split_expert::get_expert_param (int expert_id) {
124
121
// return this->get_expert_param_gpu(expert_id);
125
122
return this ->per_expert_host_data [expert_id];
You can’t perform that action at this time.
0 commit comments