Skip to content
Merged
Changes from 2 commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
5 changes: 5 additions & 0 deletions fastchat/serve/model_worker.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -82,6 +82,7 @@ def __init__(
gptq_config=gptq_config,
awq_config=awq_config,
exllama_config=exllama_config,
debug=kwargs["debug"],
)
self.device = device
if self.tokenizer.pad_token == None:
Expand Down Expand Up @@ -283,6 +284,9 @@ def create_model_worker():
default=None,
help="Overwrite the random seed for each generation.",
)
parser.add_argument(
"--debug", type=bool, default=False, help="Print debugging messages"
)
args = parser.parse_args()
logger.info(f"args: {args}")

Expand Down Expand Up @@ -333,6 +337,7 @@ def create_model_worker():
conv_template=args.conv_template,
embed_in_truncate=args.embed_in_truncate,
seed=args.seed,
debug=args.debug,
)
return args, worker

Expand Down