archit11 committed on
Commit
8cacf45
1 Parent(s): dfc51c7

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +2 -1
app.py CHANGED
@@ -2,7 +2,8 @@ import spaces
2
  import gradio as gr
3
  from cartesia_pytorch import ReneLMHeadModel
4
  from transformers import AutoTokenizer
5
-
 
6
  # Load model and tokenizer
7
  model = ReneLMHeadModel.from_pretrained("cartesia-ai/Rene-v0.1-1.3b-pytorch").half().cuda()
8
  tokenizer = AutoTokenizer.from_pretrained("allenai/OLMo-1B-hf")
 
2
  import gradio as gr
3
  from cartesia_pytorch import ReneLMHeadModel
4
  from transformers import AutoTokenizer
5
+ import subprocess
6
+ subprocess.run('pip install flash-attn --no-build-isolation', env={'FLASH_ATTENTION_SKIP_CUDA_BUILD': "TRUE"}, shell=True)
7
  # Load model and tokenizer
8
  model = ReneLMHeadModel.from_pretrained("cartesia-ai/Rene-v0.1-1.3b-pytorch").half().cuda()
9
  tokenizer = AutoTokenizer.from_pretrained("allenai/OLMo-1B-hf")