GilbertAkham committed on
Commit
337042d
·
verified ·
1 Parent(s): e811003

Upload app.py

Browse files
Files changed (1) hide show
  1. app.py +4 -1
app.py CHANGED
@@ -1,3 +1,4 @@
 
1
  import gradio as gr
2
  from transformers import AutoTokenizer, AutoModelForCausalLM
3
  from peft import PeftModel
@@ -8,7 +9,8 @@ LORA = "GilbertAkham/openlm-llama-lora-codetrans" # your LoRA on HF
8
  tokenizer = AutoTokenizer.from_pretrained(BASE)
9
  model = AutoModelForCausalLM.from_pretrained(
10
  BASE,
11
- load_in_8bit=True, # fits on T4/low VRAM
 
12
  device_map="auto"
13
  )
14
  model = PeftModel.from_pretrained(model, LORA)
@@ -34,3 +36,4 @@ demo = gr.Interface(
34
  )
35
 
36
  demo.launch(share=True) # share=True gives you a free public link
 
 
1
+
2
  import gradio as gr
3
  from transformers import AutoTokenizer, AutoModelForCausalLM
4
  from peft import PeftModel
 
9
  tokenizer = AutoTokenizer.from_pretrained(BASE)
10
  model = AutoModelForCausalLM.from_pretrained(
11
  BASE,
12
+ load_in_8bit=True,
13
+ use_fast=False, # fits on T4/low VRAM
14
  device_map="auto"
15
  )
16
  model = PeftModel.from_pretrained(model, LORA)
 
36
  )
37
 
38
  demo.launch(share=True) # share=True gives you a free public link
39
+