descriptions = {
    'gemma2': _("Google Gemma 2 is now available in 2 sizes, 9B and 27B."),
    'llama3': _("Meta Llama 3: The most capable openly available LLM to date."),
    'qwen2': _("Qwen2 is a new series of large language models from Alibaba Group."),
    'deepseek-coder-v2': _("An open-source Mixture-of-Experts code language model that achieves performance comparable to GPT4-Turbo in code-specific tasks."),
    'phi3': _("Phi-3 is a family of lightweight 3B (Mini) and 14B (Medium) state-of-the-art open models by Microsoft."),
    'aya': _("Aya 23, released by Cohere, is a new family of state-of-the-art, multilingual models that support 23 languages."),
    'mistral': _("The 7B model released by Mistral AI, updated to version 0.3."),
    'mixtral': _("A set of Mixture of Experts (MoE) models with open weights by Mistral AI in 8x7b and 8x22b parameter sizes."),
    'codegemma': _("CodeGemma is a collection of powerful, lightweight models that can perform a variety of coding tasks like fill-in-the-middle code completion, code generation, natural language understanding, mathematical reasoning, and instruction following."),
    'command-r': _("Command R is a Large Language Model optimized for conversational interaction and long context tasks."),
    'command-r-plus': _("Command R+ is a powerful, scalable large language model purpose-built to excel at real-world enterprise use cases."),
    'llava': _("🌋 LLaVA is a novel end-to-end trained large multimodal model that combines a vision encoder and Vicuna for general-purpose visual and language understanding. Updated to version 1.6."),
    'gemma': _("Gemma is a family of lightweight, state-of-the-art open models built by Google DeepMind. Updated to version 1.1."),
    'qwen': _("Qwen 1.5 is a series of large language models by Alibaba Cloud spanning from 0.5B to 110B parameters."),
    'llama2': _("Llama 2 is a collection of foundation language models ranging from 7B to 70B parameters."),
    'codellama': _("A large language model that can use text prompts to generate and discuss code."),
    'dolphin-mixtral': _("Uncensored, 8x7b and 8x22b fine-tuned models based on the Mixtral mixture of experts models that excel at coding tasks. Created by Eric Hartford."),
    'llama2-uncensored': _("Uncensored Llama 2 model by George Sung and Jarrad Hope."),
    'deepseek-coder': _("DeepSeek Coder is a capable coding model trained on two trillion code and natural language tokens."),
    'nomic-embed-text': _("A high-performing open embedding model with a large token context window."),
    'phi': _("Phi-2: a 2.7B language model by Microsoft Research that demonstrates outstanding reasoning and language understanding capabilities."),
    'dolphin-mistral': _("The uncensored Dolphin model based on Mistral that excels at coding tasks. Updated to version 2.8."),
    'mistral-openorca': _("Mistral OpenOrca is a 7 billion parameter model, fine-tuned on top of the Mistral 7B model using the OpenOrca dataset."),
    'orca-mini': _("A general-purpose model ranging from 3 billion parameters to 70 billion, suitable for entry-level hardware."),
    'mxbai-embed-large': _("State-of-the-art large embedding model from mixedbread.ai."),
    'dolphin-llama3': _("Dolphin 2.9 is a new model with 8B and 70B sizes by Eric Hartford based on Llama 3 that has a variety of instruction, conversational, and coding skills."),
    'starcoder2': _("StarCoder2 is the next generation of transparently trained open code LLMs that comes in three sizes: 3B, 7B and 15B parameters."),
    'llama2-chinese': _("Llama 2 based model fine-tuned to improve Chinese dialogue ability."),
    'zephyr': _("Zephyr is a series of fine-tuned versions of the Mistral and Mixtral models that are trained to act as helpful assistants."),
    'yi': _("Yi 1.5 is a high-performing, bilingual language model."),
    'nous-hermes2': _("The powerful family of models by Nous Research that excels at scientific discussion and coding tasks."),
    'vicuna': _("General use chat model based on Llama and Llama 2 with 2K to 16K context sizes."),
    'wizard-vicuna-uncensored': _("Wizard Vicuna Uncensored is a 7B, 13B, and 30B parameter model based on Llama 2, uncensored by Eric Hartford."),
    'tinyllama': _("The TinyLlama project is an open endeavor to train a compact 1.1B Llama model on 3 trillion tokens."),
    'wizardlm2': _("State-of-the-art large language model from Microsoft AI with improved performance on complex chat, multilingual, reasoning and agent use cases."),
    'starcoder': _("StarCoder is a code generation model trained on 80+ programming languages."),
    'codestral': _("Codestral is Mistral AI’s first-ever code model designed for code generation tasks."),
    'openchat': _("A family of open-source models trained on a wide variety of data, surpassing ChatGPT on various benchmarks. Updated to version 3.5-0106."),
    'tinydolphin': _("An experimental 1.1B parameter model trained on the new Dolphin 2.8 dataset by Eric Hartford and based on TinyLlama."),
    'openhermes': _("OpenHermes 2.5 is a 7B model fine-tuned by Teknium on Mistral with fully open datasets."),
    'wizardcoder': _("State-of-the-art code generation model."),
    'stable-code': _("Stable Code 3B is a coding model with instruct and code completion variants on par with models such as Code Llama 7B that are 2.5x larger."),
    'neural-chat': _("A fine-tuned model based on Mistral with good domain and language coverage."),
    'wizard-math': _("Model focused on math and logic problems."),
    'codeqwen': _("CodeQwen1.5 is a large language model pretrained on a large amount of code data."),
    'phind-codellama': _("Code generation model based on Code Llama."),
    'stablelm2': _("Stable LM 2 is a state-of-the-art 1.6B and 12B parameter language model trained on multilingual data in English, Spanish, German, Italian, French, Portuguese, and Dutch."),
    'dolphincoder': _("A 7B and 15B uncensored variant of the Dolphin model family that excels at coding, based on StarCoder2."),
    'all-minilm': _("Embedding models trained on very large sentence-level datasets."),
    'nous-hermes': _("General use models based on Llama and Llama 2 from Nous Research."),
    'starling-lm': _("Starling is a large language model trained by reinforcement learning from AI feedback focused on improving chatbot helpfulness."),
    'sqlcoder': _("SQLCoder is a code completion model fine-tuned on StarCoder for SQL generation tasks."),
    'orca2': _("Orca 2 is built by Microsoft Research and is a fine-tuned version of Meta's Llama 2 models. The model is designed to excel particularly in reasoning."),
    'llama3-gradient': _("This model extends Llama 3 8B's context length from 8K to over 1M tokens."),
    'deepseek-llm': _("An advanced language model crafted with 2 trillion bilingual tokens."),
    'yarn-llama2': _("An extension of Llama 2 that supports a context of up to 128K tokens."),
    'llama3-chatqa': _("A model from NVIDIA based on Llama 3 that excels at conversational question answering (QA) and retrieval-augmented generation (RAG)."),
    'solar': _("A compact, yet powerful 10.7B large language model designed for single-turn conversation."),
    'xwinlm': _("Conversational model based on Llama 2 that performs competitively on various benchmarks."),
    'granite-code': _("A family of open foundation models by IBM for code intelligence."),
    'dolphin-phi': _("2.7B uncensored Dolphin model by Eric Hartford, based on the Phi language model by Microsoft Research."),
    'wizardlm': _("General use model based on Llama 2."),
    'samantha-mistral': _("A companion assistant trained in philosophy, psychology, and personal relationships. Based on Mistral."),
    'stable-beluga': _("Llama 2 based model fine-tuned on an Orca-style dataset. Originally called Free Willy."),
    'bakllava': _("BakLLaVA is a multimodal model consisting of the Mistral 7B base model augmented with the LLaVA architecture."),
    'llava-llama3': _("A LLaVA model fine-tuned from Llama 3 Instruct with better scores in several benchmarks."),
    'wizardlm-uncensored': _("Uncensored version of the Wizard LM model."),
    'medllama2': _("Fine-tuned Llama 2 model to answer medical questions based on an open-source medical dataset."),
    'nous-hermes2-mixtral': _("The Nous Hermes 2 model from Nous Research, now trained over Mixtral."),
    'yarn-mistral': _("An extension of Mistral to support context windows of 64K or 128K."),
    'snowflake-arctic-embed': _("A suite of text embedding models by Snowflake, optimized for performance."),
    'llama-pro': _("An expansion of Llama 2 that specializes in integrating both general language understanding and domain-specific knowledge, particularly in programming and mathematics."),
    'codeup': _("Great code generation model based on Llama 2."),
    'meditron': _("Open-source medical large language model adapted from Llama 2 to the medical domain."),
    'moondream': _("moondream2 is a small vision language model designed to run efficiently on edge devices."),
    'everythinglm': _("Uncensored Llama 2 based model with support for a 16K context window."),
    'nexusraven': _("Nexus Raven is a 13B instruction-tuned model for function calling tasks."),
    'magicoder': _("🎩 Magicoder is a family of 7B parameter models trained on 75K synthetic instruction data using OSS-Instruct, a novel approach to enlightening LLMs with open-source code snippets."),
    'deepseek-v2': _("A strong, economical, and efficient Mixture-of-Experts language model."),
    'stablelm-zephyr': _("A lightweight chat model allowing accurate and responsive output without requiring high-end hardware."),
    'codebooga': _("A high-performing code instruct model created by merging two existing code models."),
    'llava-phi3': _("A new small LLaVA model fine-tuned from Phi 3 Mini."),
    'mistrallite': _("MistralLite is a fine-tuned model based on Mistral with enhanced capabilities for processing long contexts."),
    'wizard-vicuna': _("Wizard Vicuna is a 13B parameter model based on Llama 2 trained by MelodysDreamj."),
    'duckdb-nsql': _("7B parameter text-to-SQL model made by MotherDuck and Numbers Station."),
    'goliath': _("A language model created by combining two fine-tuned Llama 2 70B models into one."),
    'megadolphin': _("MegaDolphin-2.2-120b is a transformation of Dolphin-2.2-70b created by interleaving the model with itself."),
    'open-orca-platypus2': _("Merge of the Open Orca OpenChat model and the Garage-bAInd Platypus 2 model. Designed for chat and code generation."),
    'notux': _("A top-performing mixture of experts model, fine-tuned with high-quality data."),
    'notus': _("A 7B chat model fine-tuned with high-quality data and based on Zephyr."),
    'dbrx': _("DBRX is an open, general-purpose LLM created by Databricks."),
    'falcon2': _("Falcon2 is an 11B parameter causal decoder-only model built by TII and trained on over 5T tokens."),
    'alfred': _("A robust conversational model designed to be used for both chat and instruct use cases."),
}
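
# A minimal usage sketch for the dict above. It assumes gettext's `_` is
# installed before this module is imported, as the `_()` wrappers require.
# The `get_description` helper and the ':tag' normalization are illustrative
# assumptions, not part of the upstream API.
def get_description(model_name: str) -> str:
    """Return the translated description for a model, or '' if unknown."""
    # Reduce a tagged model reference such as 'llama3:70b' to its base
    # name ('llama3'), since the dict is keyed by base names only.
    base_name = model_name.split(':', 1)[0]
    return descriptions.get(base_name, '')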