[{"data":1,"prerenderedAt":-1},["ShallowReactive",2],{"news-de854dc5-8f46-48aa-ad0e-ef7253a7eb08":3},{"id":4,"title":5,"summary":6,"original_url":7,"source_id":8,"tags":9,"published_at":23,"created_at":24,"modified_at":25,"is_published":26,"publish_type":27,"image_url":13,"view_count":28},"de854dc5-8f46-48aa-ad0e-ef7253a7eb08","OpenAI 发布 LifeSciBench：GPT-Rosalind 端到端工作流评测升级，押注垂直科学 AI","OpenAI 在 6 月 3 日为 GPT-Rosalind 系列推出重大更新，核心是同步发布 LifeSciBench —— 一个由外部生命科学专家评判的端到端评测基准。与传统基准只考察单点能力不同，LifeSciBench 覆盖证据处理、分析、设计与优化、科学推理、验证与运维、转化与沟通六大工作流，更贴近真实研究流程。新版模型继承了 GPT-5.5 的 Agent 编程和工具调用能力，在药物化学、基因组学、定量生物学和湿实验排障等核心任务上取得广泛提升。OpenAI 以 trusted-access 部署结构向全球合格机构开放研究预览。这是 OpenAI 第一次把\"前沿模型\"与\"垂直科学 AI\"画等号。如果说 Claude Mythos 走的是高安全门槛的生物防御路线，GPT-Rosalind 这次的更新则更像是\"为科学家造模型\"：评测由领域专家出题、由真实工作流驱动，回归到研究的本来面目。当通用榜单逐渐失效，垂直大模型的下一步比拼，将是能否真正得到领域专家的认可。","https:\u002F\u002Fopenai.com\u002Findex\u002Fintroducing-new-capabilities-to-gpt-rosalind\u002F","15975962-b5fe-49e5-ae68-687ba6cb7015",[10,14,17,20],{"id":11,"name":12,"slug":12,"description":13,"color":13},"120fa59a-ff6f-4537-9bf5-f818df636a0e","benchmark",null,{"id":15,"name":16,"slug":16,"description":13,"color":13},"baf131c1-687a-49f4-87f6-4dd87c1c692f","gpt",{"id":18,"name":19,"slug":19,"description":13,"color":13},"7e89b5cc-57db-4f37-bc6d-28919a73931c","model-release",{"id":21,"name":22,"slug":22,"description":13,"color":13},"42e59a88-7795-47dc-a334-ef1e72c24347","openai","2026-06-03T16:00:00Z","2026-06-05T16:16:55.527752Z","2026-06-05T16:16:55.527763Z",true,"agent",2]