Files
test-small-llms/suite_settings/models.py
Lennart J. Kurzweg (Nx2) e3df5d3e78 models fix
2024-08-30 18:58:33 +02:00

35 lines
4.1 KiB
Python

from libs.classes import Model
# Registry of the language models available to the test suite.
#
# Each entry maps an integer ID to a `Model` carrying:
#   display_name         - human-readable label
#   identifier           - model identifier string in `name:tag` form
#                          (NOTE(review): these look like Ollama tags -- confirm)
#   supports_tools       - whether the model is flagged as tool-calling capable
#   parameter_count_in_b - model size; presumably in billions of parameters
#
# NOTE(review): the integer keys are neither sorted nor sequential; presumably
# they are stable handles referenced elsewhere, so do not renumber them without
# checking the callers.
# NOTE(review): the two Mixtral MoE rows use 13 and 39, which look like
# active-parameter counts rather than totals -- confirm this is intended.
models = {
    245: Model(display_name="llama3.1 8b", identifier="llama3.1:8b", supports_tools=True, parameter_count_in_b=8),
    238: Model(display_name="llama3.1 70b", identifier="llama3.1:70b", supports_tools=True, parameter_count_in_b=70),
    # Disabled entry kept for reference; the reason for disabling is not recorded here.
    # 539: Model(display_name="llama3.1 405b", identifier="llama3.1:405b", supports_tools=True, parameter_count_in_b=405),
    120: Model(display_name="llama3 groq TU 8b", identifier="llama3-groq-tool-use:8b", supports_tools=True, parameter_count_in_b=8),
    890: Model(display_name="llama3 groq TU 70b", identifier="llama3-groq-tool-use:70b", supports_tools=True, parameter_count_in_b=70),
    639: Model(display_name="Mistral Large 123b", identifier="mistral-large:123b", supports_tools=True, parameter_count_in_b=123),
    982: Model(display_name="Mistral 0.3 7b", identifier="mistral:7b", supports_tools=True, parameter_count_in_b=7),
    670: Model(display_name="Mistral Nemo 12b", identifier="mistral-nemo:12b", supports_tools=True, parameter_count_in_b=12),
    348: Model(display_name="Mixtral MoE 8x7b", identifier="mixtral:8x7b", supports_tools=False, parameter_count_in_b=13),
    789: Model(display_name="Mixtral MoE 8x22b", identifier="mixtral:8x22b", supports_tools=True, parameter_count_in_b=39),
    453: Model(display_name="Zephyr 7b", identifier="zephyr:7b", supports_tools=False, parameter_count_in_b=7),
    445: Model(display_name="Gemma2 2b", identifier="gemma2:2b", supports_tools=False, parameter_count_in_b=2),
    475: Model(display_name="Gemma2 9b", identifier="gemma2:9b", supports_tools=False, parameter_count_in_b=9),
    626: Model(display_name="Gemma2 27b", identifier="gemma2:27b", supports_tools=False, parameter_count_in_b=27),
    229: Model(display_name="Phi3 3.8b", identifier="phi3:3.8b", supports_tools=False, parameter_count_in_b=3.8),
    329: Model(display_name="Phi3 14b", identifier="phi3:14b", supports_tools=False, parameter_count_in_b=14),
    251: Model(display_name="Phi3.5 3.8b", identifier="phi3.5:3.8b", supports_tools=False, parameter_count_in_b=3.8),
    903: Model(display_name="Tinyllama 1.1b", identifier="tinyllama:1.1b", supports_tools=False, parameter_count_in_b=1.1),
    409: Model(display_name="Command R 35b", identifier="command-r:35b", supports_tools=False, parameter_count_in_b=35),
    404: Model(display_name="Command R+ 104b", identifier="command-r-plus:104b", supports_tools=True, parameter_count_in_b=104),
    701: Model(display_name="Yi 6b", identifier="yi:6b", supports_tools=False, parameter_count_in_b=6),
    # Fixed: this row previously declared 6, duplicated from the Yi 6b row above.
    704: Model(display_name="Yi 9b", identifier="yi:9b", supports_tools=False, parameter_count_in_b=9),
    724: Model(display_name="Yi 34b", identifier="yi:34b", supports_tools=False, parameter_count_in_b=34),
    853: Model(display_name="Qwen2 0.5b", identifier="qwen2:0.5b", supports_tools=False, parameter_count_in_b=0.5),
    23: Model(display_name="Qwen2 1.5b", identifier="qwen2:1.5b", supports_tools=False, parameter_count_in_b=1.5),
    295: Model(display_name="Qwen2 7b", identifier="qwen2:7b", supports_tools=False, parameter_count_in_b=7),
    655: Model(display_name="Qwen2 72b", identifier="qwen2:72b", supports_tools=False, parameter_count_in_b=72),
    780: Model(display_name="Hermes3 8b", identifier="hermes3:8b", supports_tools=True, parameter_count_in_b=8),
    68: Model(display_name="Aya 8b", identifier="aya:8b", supports_tools=False, parameter_count_in_b=8),
    397: Model(display_name="Aya 35b", identifier="aya:35b", supports_tools=False, parameter_count_in_b=35),
}