[Core] Support dynamically loading Lora adapter from HuggingFace (#6234)
Co-authored-by: Antoni Baum <antoni.baum@protonmail.com>
This commit is contained in:
@@ -29,7 +29,7 @@ def _create_lora_request(lora_id, long_context_infos):
     context_len = long_context_infos[lora_id]["context_length"]
     scaling_factor = context_len_to_scaling_factor[context_len]
     return LoRARequest(context_len, lora_id,
-                       long_context_infos[lora_id]["lora"],
+                       long_context_infos[lora_id]["lora"], None,
                        4096 * scaling_factor)
 
 
Reference in New Issue
Block a user