import torch
from transformers import AutoProcessor, Qwen2AudioForConditionalGeneration

# The processor and the model weights are loaded from two different
# checkpoint ids: the processor from the Qwen2-Audio instruct repo, the
# weights from a separate repo.
# NOTE(review): presumably the second repo is a fine-tune of the first and
# shares its processor configuration -- confirm against the checkpoint card.
PROCESSOR_CHECKPOINT = "Qwen/Qwen2-Audio-7B-Instruct"
MODEL_CHECKPOINT = "danielwusg/svco_qwins7b_len192_ep2_ckpt468_20250304"

processor = AutoProcessor.from_pretrained(PROCESSOR_CHECKPOINT)

# Weights are requested in half precision (float16). `torch` must be imported
# for this dtype reference; without the import the script fails with NameError.
model = Qwen2AudioForConditionalGeneration.from_pretrained(
    MODEL_CHECKPOINT,
    torch_dtype=torch.float16,
)