---
# Metadata mapping delimited by `---` markers.
# NOTE(review): the key set looks like Hugging Face model-card front matter;
# confirm against the consuming tool before adding or renaming keys.

# Dataset identifiers, each written as `owner/name`.
datasets:
  - maidalun1020/CrosslingualMultiDomainsDataset
  - nvidia/Llama-Nemotron-Post-Training-Dataset
  - reasonir/reasonir-data
  - KShivendu/dbpedia-entities-openai-1M
  - openai/openai_humaneval
  - Rapidata/OpenAI-4o_t2i_human_preference
  - open-thoughts/OpenThoughts-114k
  - openai/MMMLU
  - openbmb/Ultra-FineWeb
  - nvidia/describe-anything-dataset
  - open-llm-leaderboard/NousResearch__DeepHermes-3-Mistral-24B-Preview-details
  - reedmayhew/claude-3.7-sonnet-reasoning
  - open-llm-leaderboard-old/details_mvpmaster__Einstein-4D-Marcoro14-7b-full-slerp
  - MBZUAI-IFM/qwen32b-r1distill-final
  - open-llm-leaderboard-old/details_gagan3012__MetaModel_moe_multilingualv1
  - wikimedia/structured-wikipedia
  - google-research-datasets/go_emotions
  - google-research-datasets/mbpp
  - meta-llama/Llama-3.2-1B-Instruct-evals
  - Jofthomas/hermes-function-calling-thinking-V1
  - TIGER-Lab/WebInstruct-verified
  - a-m-team/AM-DeepSeek-Distilled-40M
  - future-technologies/Universal-Transformers-Dataset
  - DMindAI/DMind_Benchmark
  - SWE-bench/SWE-smith
  - SWE-bench/SWE-smith-trajectories
  - R-Bench/R-Bench
  - R-Bench/R-Bench-V
  - CohereLabs/Global-MMLU

# Language codes.
language:
  - en

# Metric names.
metrics:
  - chrf
  - bertscore
  - accuracy

# Model identifiers, each written as `owner/name`.
base_model:
  - deepseek-ai/DeepSeek-Prover-V2-671B
  - Salesforce/blip2-flan-t5-xl
  - piotr-ai/polanka_4b_v0.1_qwen3_250505_gguf
  - tomaszki/mistral-8
  - CohereLabs/aya-23-35B
  - nvidia/Llama-3_1-Nemotron-Ultra-253B-v1
  - unsloth/Llama-4-Maverick-17B-128E-Instruct-GGUF
  - Qwen/Qwen3-235B-A22B
  - unsloth/Phi-4-reasoning-plus-GGUF
  - tngtech/DeepSeek-R1T-Chimera
  - a-m-team/AM-Thinking-v1
  - bartowski/Meta-Llama-3-120B-Instruct-GGUF
  - microsoft/MAI-DS-R1
  - Skywork/Skywork-R1V2-38B
  - Skywork/Skywork-R1V-38B
  - mradermacher/R1V-Free-2.5VL-7B-GGUF
  - MaziyarPanahi/calme-3.2-instruct-78b
  - google-bert/bert-large-uncased-whole-word-masking-finetuned-squad
  - amd/Mixtral-8x22B-Instruct-v0.1-FP8-KV
  - ginipick/Gemma-3-R1984-4B
  - perplexity-ai/r1-1776
  - bartowski/perplexity-ai_r1-1776-distill-llama-70b-GGUF
  - silx-ai/Quasar-3.0-400B-1M
  - manycore-research/SpatialLM-Llama-1B
  - databricks/dbrx-instruct
  - THUDM/GLM-Z1-Rumination-32B-0414
  - deepseek-ai/DeepSeek-V3-0324
  - cognition-ai/Kevin-32B
  - unsloth/c4ai-command-a-03-2025-GGUF
  - unsloth/Hermes-3-Llama-3.1-405B-bnb-4bit
  - alpindale/WizardLM-2-8x22B
  - allenai/OLMo-2-0325-32B-Instruct
  - mancer-Carmen/1
  - Kaspar/siglip-heritage-weaver-best

library_name: adapter-transformers

# Free-form tag strings.
tags:
  - text-generation-inference
  - moe
  - merge
  - code

license: apache-2.0

# Single identifier in the same `owner/name` form as the base_model entries.
new_version: Qwen/Qwen3-30B-A3B

pipeline_tag: any-to-any
---