---
# Metadata front matter, delimited by the `---` markers.
datasets:
  - argilla/ultrafeedback-binarized-preferences
language:
  - en
base_model: argilla/notus-7b-v1
library_name: transformers
pipeline_tag: text-generation
tags:
  - dpo
  - rlaif
  - preference
  - ultrafeedback
  - TensorBlock
  - GGUF
license: mit
# Evaluation results: one entry per benchmark, each made of a task, the
# dataset it was run on, the reported metrics, and the source of the figures.
model-index:
  - name: notus-7b-v1
    results:
      - task:
          type: text-generation
          name: Text Generation
        dataset:
          name: AI2 Reasoning Challenge (25-Shot)
          type: ai2_arc
          config: ARC-Challenge
          split: test
          args:
            num_few_shot: 25
        metrics:
          - type: acc_norm
            value: 0.6459044368600683
            name: normalized accuracy
        source:
          url: https://huggingface.co/datasets/open-llm-leaderboard/results/blob/main/argilla/notus-7b-v1/results_2023-11-29T22-16-51.521321.json
          name: Open LLM Leaderboard Results
      - task:
          type: text-generation
          name: Text Generation
        dataset:
          name: HellaSwag (10-Shot)
          type: hellaswag
          split: validation
          args:
            num_few_shot: 10
        metrics:
          - type: acc_norm
            value: 0.8478390758812986
            name: normalized accuracy
        source:
          url: https://huggingface.co/datasets/open-llm-leaderboard/results/blob/main/argilla/notus-7b-v1/results_2023-11-29T22-16-51.521321.json
          name: Open LLM Leaderboard Results
      - task:
          type: text-generation
          name: Text Generation
        dataset:
          name: TruthfulQA (0-shot)
          type: truthful_qa
          config: multiple_choice
          split: validation
          args:
            num_few_shot: 0
        metrics:
          # No metric `name` is recorded for this entry.
          - type: mc2
            value: 0.5436768358952805
        source:
          url: https://huggingface.co/datasets/open-llm-leaderboard/results/blob/main/argilla/notus-7b-v1/results_2023-11-29T22-16-51.521321.json
          name: Open LLM Leaderboard Results
      - task:
          type: text-generation
          name: Text Generation
        dataset:
          name: MMLU (5-Shot)
          type: cais/mmlu
          config: all
          split: test
          args:
            num_few_shot: 5
        metrics:
          - type: acc
            value: 0.6303308230938872
            name: accuracy
        source:
          url: https://huggingface.co/datasets/open-llm-leaderboard/results/blob/main/argilla/notus-7b-v1/results_2023-11-29T22-16-51.521321.json
          name: Open LLM Leaderboard Results
      - task:
          type: text-generation
          name: Text Generation
        dataset:
          name: GSM8k (5-shot)
          type: gsm8k
          config: main
          split: test
          args:
            num_few_shot: 5
        metrics:
          - type: acc
            value: 0.1516300227445034
            name: accuracy
        source:
          url: https://huggingface.co/datasets/open-llm-leaderboard/results/blob/main/argilla/notus-7b-v1/results_2023-11-29T22-16-51.521321.json
          name: Open LLM Leaderboard Results
      - task:
          type: text-generation
          name: Text Generation
        dataset:
          name: Winogrande (5-shot)
          type: winogrande
          config: winogrande_xl
          split: validation
          args:
            num_few_shot: 5
        metrics:
          - type: acc
            value: 0.7940015785319653
            name: accuracy
        source:
          url: https://huggingface.co/datasets/open-llm-leaderboard/results/blob/main/argilla/notus-7b-v1/results_2023-11-29T22-16-51.521321.json
          name: Open LLM Leaderboard Results
      - task:
          type: text-generation
          name: Text Generation
        dataset:
          name: AlpacaEval
          type: tatsu-lab/alpaca_eval
        metrics:
          - type: tatsu-lab/alpaca_eval
            value: 0.9142
            name: win rate
        source:
          url: https://tatsu-lab.github.io/alpaca_eval/
      - task:
          type: text-generation
          name: Text Generation
        dataset:
          name: MT-Bench
          # Dataset and metric type are both recorded as `unknown` here.
          type: unknown
        metrics:
          - type: unknown
            value: 7.3
            name: score
        source:
          url: https://huggingface.co/spaces/lmsys/mt-bench
---
Feedback and support: TensorBlock's Twitter/X, Telegram Group and Discord server
| Awesome MCP Servers | TensorBlock Studio |
|---|---|
| ![]() | ![]() |
| A comprehensive collection of Model Context Protocol (MCP) servers. | A lightweight, open, and extensible multi-LLM interaction studio. |
| 👀 See what we built 👀 | 👀 See what we built 👀 |