Spaces:

TeamTonic
/

TonicsYI-6B-200k

Paused

Tonic committed on Nov 22, 2023

Commit

4d0d5e0

1 Parent(s): 91969b4

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -10,12 +10,14 @@ model_id = "TheBloke/Yi-34B-200K-Llamafied-GPTQ"
 gptq_config = GPTQConfig(
     bits=4,
     exllama_config={"version": 2}
 )
 tokenizer = YiTokenizer.from_pretrained("./")
 model = AutoModelForCausalLM.from_pretrained(
     model_id,
     device_map="auto",
     quantization_config=gptq_config
 )
 def run(message, chat_history, max_new_tokens=4056, temperature=3.5, top_p=0.9, top_k=800):
     prompt = get_prompt(message, chat_history)

 gptq_config = GPTQConfig(
     bits=4,
     exllama_config={"version": 2}
+    disable_exllama=True
 )
 tokenizer = YiTokenizer.from_pretrained("./")
 model = AutoModelForCausalLM.from_pretrained(
     model_id,
     device_map="auto",
     quantization_config=gptq_config
 )
 def run(message, chat_history, max_new_tokens=4056, temperature=3.5, top_p=0.9, top_k=800):
     prompt = get_prompt(message, chat_history)