mirror of
https://github.com/deepseek-ai/DeepSeek-VL2
synced 2025-01-22 12:25:32 +00:00
Update inference.py
This commit is contained in:
parent
9789f97283
commit
66ec91081c
@@ -127,10 +127,10 @@ def main(args):
|
||||
|
||||
with torch.no_grad():
|
||||
|
||||
inputs_embeds = None
|
||||
past_key_values = None
|
||||
|
||||
if args.chunk_size > 0:
|
||||
if args.chunk_size == -1:
|
||||
inputs_embeds = vl_gpt.prepare_inputs_embeds(**prepare_inputs)
|
||||
past_key_values = None
|
||||
else:
|
||||
# incremental_prefilling when using 40G GPU for vl2-small
|
||||
inputs_embeds, past_key_values = vl_gpt.incremental_prefilling(
|
||||
input_ids=prepare_inputs.input_ids,
|
||||
|
Loading…
Reference in New Issue
Block a user