{"type": "article", "title": "Beyond Trajectory Imitation: Strategy-Guided Policy Optimization for LLM Reasoning", "publisher": "Web Pulse", "url": "https://wpnews.pro/news/beyond-trajectory-imitation-strategy-guided-policy-optimization-for-llm", "original_source": "https://arxiv.org/abs/2606.24064", "published": "2026-06-24T04:00:00+00:00", "accessed": "2026-06-25", "id": "beyond-trajectory-imitation-strategy-guided-policy-optimization-for-llm"}