{"type": "article", "title": "VibeThinker: 3B param model that beats Opus 4.5 on reasoning with novel SFT+GRPO", "publisher": "Web Pulse", "url": "https://wpnews.pro/news/vibethinker-3b-param-model-that-beats-opus-4-5-on-reasoning-with-novel-sft-grpo", "original_source": "https://arxiv.org/abs/2606.16140", "published": "2026-06-23T02:01:25+00:00", "accessed": "2026-06-25", "id": "vibethinker-3b-param-model-that-beats-opus-4-5-on-reasoning-with-novel-sft-grpo"}