diff --git a/server/lorax_server/models/flash_causal_lm.py b/server/lorax_server/models/flash_causal_lm.py index 1de051999..4ec97c5d6 100644 --- a/server/lorax_server/models/flash_causal_lm.py +++ b/server/lorax_server/models/flash_causal_lm.py @@ -271,7 +271,6 @@ def from_pb( max_length = max(max_length, input_length + max_new_tokens) adapter_indices = torch.cat(adapter_indices_list).to(dtype=torch.int64, device=device) - print("!!! ADAPTER INDICES", adapter_indices) request_tokenizers = [ tokenizers.get_tokenizer(r.adapter_index, tokenizer)