sagar007 committed on
Commit
20d8ecd
·
verified ·
1 Parent(s): 08b6fa7

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +3 -0
app.py CHANGED
@@ -2,6 +2,9 @@ import gradio as gr
2
  import torch
3
  from transformers import AutoTokenizer, LlamaForCausalLM
4
  import spaces
 
 
 
5
 
6
  # Initialize model and tokenizer
7
  model_id = 'akjindal53244/Llama-3.1-Storm-8B'
 
2
  import torch
3
  from transformers import AutoTokenizer, LlamaForCausalLM
4
  import spaces
5
+ import subprocess
6
+ subprocess.run('pip install flash-attn --no-build-isolation', env={'FLASH_ATTENTION_SKIP_CUDA_BUILD': "TRUE"}, shell=True)
7
+
8
 
9
  # Initialize model and tokenizer
10
  model_id = 'akjindal53244/Llama-3.1-Storm-8B'