wxgeorge committed on
Commit
f02037a
1 Parent(s): 75d7eaa

:wrench: drop reflection. add Nemotron. make default model.

Browse files
Files changed (3) hide show
  1. README.md +1 -1
  2. app.py +6 -3
  3. readme-generator/generate.sh +1 -1
README.md CHANGED
@@ -1977,7 +1977,7 @@ models:
1977
  - ziniuli/Mistral-7B-ReMax-v0.1
1978
  - zmzmxz/NeuralPipe-7B-slerp
1979
  - Qwen/Qwen2.5-72B
1980
- - mattshumer/Reflection-Llama-3.1-70B
1981
  ---
1982
 
1983
  # Overview
 
1977
  - ziniuli/Mistral-7B-ReMax-v0.1
1978
  - zmzmxz/NeuralPipe-7B-slerp
1979
  - Qwen/Qwen2.5-72B
1980
+ - nvidia/Llama-3.1-Nemotron-70B-Instruct-HF
1981
  ---
1982
 
1983
  # Overview
app.py CHANGED
@@ -40,12 +40,14 @@ model_class_filter = {
40
  # we run a few other models here as well
41
  REFLECTION="mattshumer/Reflection-Llama-3.1-70B"
42
  QWEN25_72B="Qwen/Qwen2.5-72B"
 
43
  bigger_whitelisted_models = [
44
- REFLECTION,
45
- QWEN25_72B
46
  ]
47
  # REFLECTION is in backup hosting
48
  model_class_from_model_id[REFLECTION] = 'llama31-70b-16k'
 
49
  def build_model_choices():
50
  all_choices = []
51
  for model_class in model_cache:
@@ -72,6 +74,7 @@ def model_in_list(model):
72
  key=os.environ.get('RANDOM_SEED', 'kcOtfNHA+e')
73
  o = random.Random(f"{key}-{datetime.date.today().strftime('%Y-%m-%d')}")
74
  initial_model = o.choice(model_choices)[1]
 
75
  # this doesn't work in HF spaces because we're iframed :(
76
  # def initial_model(referer=None):
77
  # return REFLECTION
@@ -105,7 +108,7 @@ def respond(message, history, model):
105
  history_openai_format.append({"role": "assistant", "content":assistant})
106
  history_openai_format.append({"role": "user", "content": message})
107
 
108
- if model == "mattshumer/Reflection-Llama-3.1-70B":
109
  history_openai_format = [
110
  {"role": "system", "content": REFLECTION_SYSTEM_PROMPT},
111
  *history_openai_format
 
40
  # we run a few other models here as well
41
  REFLECTION="mattshumer/Reflection-Llama-3.1-70B"
42
  QWEN25_72B="Qwen/Qwen2.5-72B"
43
+ NEMOTRON="nvidia/Llama-3.1-Nemotron-70B-Instruct-HF"
44
  bigger_whitelisted_models = [
45
+ QWEN25_72B,
46
+ NEMOTRON
47
  ]
48
  # REFLECTION is in backup hosting
49
  model_class_from_model_id[REFLECTION] = 'llama31-70b-16k'
50
+ model_class_from_model_id[NEMOTRON] = 'llama31-70b-16k'
51
  def build_model_choices():
52
  all_choices = []
53
  for model_class in model_cache:
 
74
  key=os.environ.get('RANDOM_SEED', 'kcOtfNHA+e')
75
  o = random.Random(f"{key}-{datetime.date.today().strftime('%Y-%m-%d')}")
76
  initial_model = o.choice(model_choices)[1]
77
+ initial_model = NEMOTRON
78
  # this doesn't work in HF spaces because we're iframed :(
79
  # def initial_model(referer=None):
80
  # return REFLECTION
 
108
  history_openai_format.append({"role": "assistant", "content":assistant})
109
  history_openai_format.append({"role": "user", "content": message})
110
 
111
+ if model == REFLECTION:
112
  history_openai_format = [
113
  {"role": "system", "content": REFLECTION_SYSTEM_PROMPT},
114
  *history_openai_format
readme-generator/generate.sh CHANGED
@@ -20,7 +20,7 @@ $(cat ../model-cache.json \
20
  console.log(yamlStr);"
21
  )
22
  - Qwen/Qwen2.5-72B
23
- - mattshumer/Reflection-Llama-3.1-70B
24
  ---
25
 
26
  $(cat body.md)
 
20
  console.log(yamlStr);"
21
  )
22
  - Qwen/Qwen2.5-72B
23
+ - nvidia/Llama-3.1-Nemotron-70B-Instruct-HF
24
  ---
25
 
26
  $(cat body.md)