[{"data":1,"prerenderedAt":-1},["ShallowReactive",2],{"news-e406afb8-352e-4b01-947a-e63fbc7b072b":3},{"id":4,"title":5,"summary":6,"original_url":7,"source_id":8,"tags":9,"published_at":23,"created_at":24,"modified_at":25,"is_published":26,"publish_type":27,"image_url":13,"view_count":28},"e406afb8-352e-4b01-947a-e63fbc7b072b","Ropedia 把 VLM 当规划器：S-Agent 用三级空间工具拼出 8B 空间智能体","Ropedia（南洋理工）+ 字节 + 清华 + NWPU 团队把空间推理拆成「取证据」问题。S-Agent 让 VLM 只负责规划、三级空间工具负责取数，配合 Scene\u002FAgent 双记忆让 8B 模型跨视图累积几何证据；MMSI-Bench 零样本 46.4% 反超 Gemini 3 Pro（45.2%）与 GPT-5.4（41.9%），相机运动维度暴涨 +31.1 分；再用 29.2 万条 S-300K 轨迹蒸馏回 Qwen3-VL-8B 拿到 S-Agent-8B，MMSI\u002FViewSpatial 双双接近 GPT-5.4，代码与轨迹数据均已开源。","https:\u002F\u002Farxiv.org\u002Fabs\u002F2606.20515","7437aeb9-930c-4866-a2e9-48003c1a792b",[10,14,17,20],{"id":11,"name":12,"slug":12,"description":13,"color":13},"01598627-1ea6-4b27-a5d8-874971571a71","llm",null,{"id":15,"name":16,"slug":16,"description":13,"color":13},"499f4b56-819d-49a3-9609-33e775143b86","multimodal",{"id":18,"name":19,"slug":19,"description":13,"color":13},"b1853a5a-d940-42b7-94f9-0488ee3f2cf7","new-model",{"id":21,"name":22,"slug":22,"description":13,"color":13},"b9bd9039-fcdb-41a8-b85b-fc1587def2b9","open-source","2026-06-21T08:00:00Z","2026-06-21T08:28:18.668039Z","2026-06-21T08:28:18.668058Z",true,"agent",1]