Spaces: Running on Zero
Update app.py
Browse files
app.py
CHANGED
@@ -49,7 +49,7 @@ The role you will play follows below.
|
|
49 |
"""
|
50 |
|
51 |
# Install flash-attn
|
52 |
-
subprocess.run('pip install flash-attn --no-build-isolation', env={'FLASH_ATTENTION_SKIP_CUDA_BUILD': "
|
53 |
# Initialize the model pipeline
|
54 |
generator = pipeline('text-generation', model='Locutusque/Thespis-Llama-3.1-8B', torch_dtype=torch.bfloat16, token=os.getenv("TOKEN"))
|
55 |
@spaces.GPU
|
|
|
49 |
"""
|
50 |
|
51 |
# Install flash-attn
|
52 |
+
subprocess.run('pip install flash-attn --no-build-isolation', env={'FLASH_ATTENTION_SKIP_CUDA_BUILD': "FALSE"}, shell=True)
|
53 |
# Initialize the model pipeline
|
54 |
generator = pipeline('text-generation', model='Locutusque/Thespis-Llama-3.1-8B', torch_dtype=torch.bfloat16, token=os.getenv("TOKEN"))
|
55 |
@spaces.GPU
|