saucam committed on
Commit
1134e5f
1 Parent(s): d3f5dae

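More changes: comment out the runtime `pip install flash-attn` call in app.py and add flash-attn to requirements.txt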

Browse files
Files changed (2) hide show
  1. app.py +1 -1
  2. requirements.txt +1 -0
app.py CHANGED
@@ -8,7 +8,7 @@ import spaces
8
  import gradio as gr
9
  from transformers import AutoModelForCausalLM, AutoTokenizer, BitsAndBytesConfig, TextIteratorStreamer
10
 
11
- subprocess.run('pip install flash-attn --no-build-isolation', env={'FLASH_ATTENTION_SKIP_CUDA_BUILD': "TRUE"}, shell=True)
12
 
13
  MODEL_ID = os.environ.get("MODEL_ID")
14
  CHAT_TEMPLATE = os.environ.get("CHAT_TEMPLATE")
 
8
  import gradio as gr
9
  from transformers import AutoModelForCausalLM, AutoTokenizer, BitsAndBytesConfig, TextIteratorStreamer
10
 
11
+ #subprocess.run('pip install flash-attn --no-build-isolation', env={'FLASH_ATTENTION_SKIP_CUDA_BUILD': "TRUE"}, shell=True)
12
 
13
  MODEL_ID = os.environ.get("MODEL_ID")
14
  CHAT_TEMPLATE = os.environ.get("CHAT_TEMPLATE")
requirements.txt CHANGED
@@ -1,4 +1,5 @@
1
  transformers==4.39.2
2
  accelerate
3
  bitsandbytes
 
4
  optimum
 
1
  transformers==4.39.2
2
  accelerate
3
  bitsandbytes
4
+ flash-attn
5
  optimum