[{"data":1,"prerenderedAt":-1},["ShallowReactive",2],{"tag-gpu-成本":3},{"tag":4,"articles":10},{"id":5,"name":6,"slug":7,"article_count":8,"description_zh":9,"description_en":9},"8632f48c-900c-46c6-9a8f-30466b3afd81","GPU 成本","gpu-成本",1,null,[11],{"id":12,"slug":13,"title":14,"summary":15,"category":16,"image_url":17,"cover_image":17,"language":18,"created_at":19},"82766fdc-4368-445d-bb4a-03377726df02","turboquant-cuts-memory-use-without-accuracy-loss-zh","TurboQuant 省 6 倍記憶體，還不掉準確率","Google Research 發表 TurboQuant，主打記憶體用量降到 1\u002F6、推論快 8 倍，且在報告測試中沒有準確率損失。這篇看它怎麼改 AI 伺服器成本。","research","https:\u002F\u002Fxxdpdyhzhpamafnrdkyq.supabase.co\u002Fstorage\u002Fv1\u002Fobject\u002Fpublic\u002Fcovers\u002Finline-1775161134112-ftrj.png","zh","2026-04-02T20:18:39.266389+00:00"]