Mathias Lux committed on
Commit
14e9219
·
1 Parent(s): 0b72e22

Switched to granite for long contexts.

Browse files
Files changed (1) hide show
  1. app.py +2 -1
app.py CHANGED
@@ -4,7 +4,8 @@ from huggingface_hub import InferenceClient
4
  """
5
  For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
6
  """
7
- client = InferenceClient("meta-llama/Llama-3.2-3B-Instruct")
 
8
  # client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
9
 
10
  _sys_msg = """
 
4
  """
5
  For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
6
  """
7
+ client = InferenceClient("ibm-granite/granite-3.1-2b-instruct") # specifically for long contexts.
8
+ # client = InferenceClient("meta-llama/Llama-3.2-3B-Instruct") # too small context window
9
  # client = InferenceClient("HuggingFaceH4/zephyr-7b-beta")
10
 
11
  _sys_msg = """