[{"data":1,"prerenderedAt":-1},["ShallowReactive",2],{"tag-hdpo":3},{"tag":4,"articles":10},{"id":5,"name":6,"slug":7,"article_count":8,"description_zh":9,"description_en":9},"45b9cdb6-1852-421f-8cc4-6100d0e11b83","HDPO","hdpo",2,null,[11],{"id":12,"slug":13,"title":14,"summary":15,"category":16,"image_url":17,"cover_image":17,"language":18,"created_at":19},"3cefc37f-e116-4597-a5cb-55bfb3fc4aa4","act-wisely-tool-use-agentic-multimodal-models-en","Act Wisely: Teaching Agents When Not to Call Tools","A new training scheme, HDPO, aims to cut blind tool use in multimodal agents by separating accuracy from tool efficiency.","research","https:\u002F\u002Fxxdpdyhzhpamafnrdkyq.supabase.co\u002Fstorage\u002Fv1\u002Fobject\u002Fpublic\u002Fcovers\u002Finline-1775801032138-7jih.png","en","2026-04-10T06:03:34.728615+00:00"]