File tree Expand file tree Collapse file tree 3 files changed +3
-3
lines changed
components/backends/trtllm/engine_configs/llama4/eagle_one_model Expand file tree Collapse file tree 3 files changed +3
-3
lines changed Original file line number Diff line number Diff line change @@ -24,7 +24,7 @@ disable_overlap_scheduler: true # disable_overlap_scheduler is having acc issue
 speculative_config:
   decoding_type: Eagle
   max_draft_len: 3
-  pytorch_weights_path: nvidia/Llama-4-Maverick-17B-128E-Eagle3
+  speculative_model_dir: nvidia/Llama-4-Maverick-17B-128E-Eagle3
   eagle3_one_model: true

 kv_cache_config:
Original file line number Diff line number Diff line change @@ -26,7 +26,7 @@ disable_overlap_scheduler: true
 speculative_config:
   decoding_type: Eagle
   max_draft_len: 3
-  pytorch_weights_path: nvidia/Llama-4-Maverick-17B-128E-Eagle3
+  speculative_model_dir: nvidia/Llama-4-Maverick-17B-128E-Eagle3
   eagle3_one_model: True

 kv_cache_config:
Original file line number Diff line number Diff line change @@ -26,7 +26,7 @@ disable_overlap_scheduler: true
 speculative_config:
   decoding_type: Eagle
   max_draft_len: 3
-  pytorch_weights_path: nvidia/Llama-4-Maverick-17B-128E-Eagle3
+  speculative_model_dir: nvidia/Llama-4-Maverick-17B-128E-Eagle3
   eagle3_one_model: True

 kv_cache_config:
You can’t perform that action at this time.
0 commit comments