---
license: apache-2.0
datasets:
- open-r1/Mixture-of-Thoughts
- openbmb/Ultra-FineWeb
- yandex/yambda
- nvidia/OpenCodeReasoning
- nvidia/OpenMathReasoning
- fka/awesome-chatgpt-prompts
- DMindAI/DMind_Benchmark
- MiniMaxAI/SynLogic
- FreedomIntelligence/medical-o1-reasoning-SFT
language:
- en
metrics:
- accuracy
- bertscore
- bleu
- bleurt
- brier_score
- cer
- character
- charcut_mt
- chrf
- code_eval
base_model:
- deepseek-ai/DeepSeek-R1-0528
- ByteDance-Seed/BAGEL-7B-MoT
- Gapeleon/bytedance_BAGEL-7B-MoT-INT8
- google/gemma-3n-E4B-it-litert-preview
- nvidia/parakeet-tdt-0.6b-v2
- mistralai/Devstral-Small-2505
- deepseek-ai/DeepSeek-R1-0528-Qwen3-8B
- nari-labs/Dia-1.6B
- ResembleAI/chatterbox
- Lightricks/LTX-Video
- ACE-Step/ACE-Step-v1-3.5B
new_version: deepseek-ai/DeepSeek-R1-0528
library_name: diffusers
tags:
- art
- code
- not-for-all-audiences
- merge
- text-generation-inference
---