Spaces:
Running
on
Zero
Running
on
Zero
Disable speech generation to stabilize the demo
Browse files
app.py
CHANGED
@@ -57,7 +57,7 @@ from ola.utils import disable_torch_init
|
|
57 |
from ola.datasets.preprocess import tokenizer_image_token, tokenizer_speech_image_token, tokenizer_speech_question_image_token
|
58 |
from ola.mm_utils import get_model_name_from_path, KeywordsStoppingCriteria, process_anyres_video, process_anyres_highres_image_genli
|
59 |
from ola.constants import IGNORE_INDEX, DEFAULT_IMAGE_TOKEN, IMAGE_TOKEN_INDEX, DEFAULT_SPEECH_TOKEN
|
60 |
-
from ola.CosyVoice_main.cosyvoice.cli.cosyvoice import CosyVoice
|
61 |
|
62 |
from huggingface_hub import hf_hub_download
|
63 |
|
@@ -81,7 +81,7 @@ model = model.bfloat16()
|
|
81 |
|
82 |
# tts_model = CosyVoice('iic/CosyVoice-300M-SFT', load_jit=False, fp16=True)
|
83 |
# tts_model = CosyVoice('FunAudioLLM/CosyVoice-300M-SFT', load_jit=True, fp16=True)
|
84 |
-
OUTPUT_SPEECH
|
85 |
|
86 |
USE_SPEECH=False
|
87 |
|
|
|
57 |
from ola.datasets.preprocess import tokenizer_image_token, tokenizer_speech_image_token, tokenizer_speech_question_image_token
|
58 |
from ola.mm_utils import get_model_name_from_path, KeywordsStoppingCriteria, process_anyres_video, process_anyres_highres_image_genli
|
59 |
from ola.constants import IGNORE_INDEX, DEFAULT_IMAGE_TOKEN, IMAGE_TOKEN_INDEX, DEFAULT_SPEECH_TOKEN
|
60 |
+
# from ola.CosyVoice_main.cosyvoice.cli.cosyvoice import CosyVoice
|
61 |
|
62 |
from huggingface_hub import hf_hub_download
|
63 |
|
|
|
81 |
|
82 |
# tts_model = CosyVoice('iic/CosyVoice-300M-SFT', load_jit=False, fp16=True)
|
83 |
# tts_model = CosyVoice('FunAudioLLM/CosyVoice-300M-SFT', load_jit=True, fp16=True)
|
84 |
+
OUTPUT_SPEECH=False
|
85 |
|
86 |
USE_SPEECH=False
|
87 |
|