mirror of
https://github.com/deepseek-ai/DeepSeek-VL2
synced 2025-06-26 18:25:56 +00:00
Update inference.py
This commit is contained in:
@@ -127,10 +127,10 @@ def main(args):
|
||||
|
||||
with torch.no_grad():
|
||||
|
||||
inputs_embeds = None
|
||||
past_key_values = None
|
||||
|
||||
if args.chunk_size > 0:
|
||||
if args.chunk_size == -1:
|
||||
inputs_embeds = vl_gpt.prepare_inputs_embeds(**prepare_inputs)
|
||||
past_key_values = None
|
||||
else:
|
||||
# incremental_prefilling when using 40G GPU for vl2-small
|
||||
inputs_embeds, past_key_values = vl_gpt.incremental_prefilling(
|
||||
input_ids=prepare_inputs.input_ids,
|
||||
|
||||
Reference in New Issue
Block a user