diff --git a/fastchat/model/model_adapter.py b/fastchat/model/model_adapter.py index afe79a6bf..8c2fbde32 100644 --- a/fastchat/model/model_adapter.py +++ b/fastchat/model/model_adapter.py @@ -1339,7 +1339,8 @@ def load_model(self, model_path: str, from_pretrained_kwargs: dict): model_path, trust_remote_code=True, ) - config.use_flash_attn = False + # NOTE: if you use an old version of the model files, uncomment the line below + # config.use_flash_attn = False config.fp16 = True generation_config = GenerationConfig.from_pretrained( model_path, trust_remote_code=True