[{"data":1,"prerenderedAt":-1},["ShallowReactive",2],{"tag-personalization":3},{"tag":4,"articles":9},{"id":5,"name":6,"slug":6,"article_count":7,"description_zh":8,"description_en":8},"7af60e55-1d66-4985-b9dc-a1033f3fb154","personalization",1,null,[10],{"id":11,"slug":12,"title":13,"summary":14,"category":15,"image_url":16,"cover_image":16,"language":17,"created_at":18},"492aa1ec-02ce-491e-ad03-ae804f261f87","weak-rewards-persistent-llm-user-models-zh","弱回饋讓 LLM 記住偏好","這篇論文主張，可從檢索增強互動中抽出弱回饋，來建立可持續的使用者偏好模型。","research","https:\u002F\u002Fxxdpdyhzhpamafnrdkyq.supabase.co\u002Fstorage\u002Fv1\u002Fobject\u002Fpublic\u002Fcovers\u002Finline-1779084838002-5od2.png","zh","2026-05-18T06:13:32.906335+00:00"]