[infer] vllm video/audio inference (#7566)
This commit is contained in:
@@ -262,9 +262,7 @@ _register_composite_model(
|
||||
projector_key="visual.merger",
|
||||
vision_model_keys=["visual.patch_embed", "visual.blocks", "audio_tower"],
|
||||
language_model_keys=["model", "lm_head"],
|
||||
lora_conflict_keys=[
|
||||
"patch_embed",
|
||||
],
|
||||
lora_conflict_keys=["patch_embed"],
|
||||
)
|
||||
|
||||
|
||||
|
||||
Reference in New Issue
Block a user