[{"data":1,"prerenderedAt":-1},["ShallowReactive",2],{"tag-model-serving":3},{"tag":4,"articles":10},{"id":5,"name":6,"slug":7,"article_count":8,"description_zh":9,"description_en":9},"07239fc7-2352-4389-833a-9ee6a34426d9","Model Serving","model-serving",0,null,[11,20,27,35],{"id":12,"slug":13,"title":14,"summary":15,"category":16,"image_url":17,"cover_image":17,"language":18,"created_at":19},"47ce5058-3c10-4d7c-ad89-053b8f8d953e","databricks-custom-models-aws-overview-zh","Databricks AWS 自訂模型重點","Databricks 說明如何在 AWS 上打包、部署與擴展自訂模型，重點是 MLflow、CPU\u002FGPU 選擇、冷啟動、重載規則與容量規劃。","tools","https:\u002F\u002Fxxdpdyhzhpamafnrdkyq.supabase.co\u002Fstorage\u002Fv1\u002Fobject\u002Fpublic\u002Fcovers\u002Finline-1780378383303-0zt9.png","zh","2026-06-02T05:32:34.88582+00:00",{"id":21,"slug":22,"title":23,"summary":24,"category":16,"image_url":25,"cover_image":25,"language":18,"created_at":26},"4adef3ab-9f07-4970-91cf-77b8b581b348","why-databricks-model-serving-is-right-default-zh","為什麼 Databricks Model Serving 是生產推論的正確預設","Databricks Model Serving 應該成為生產推論的預設選項，因為它把部署、治理與擴展整合在同一個平台，降低多模型團隊的營運成本。","https:\u002F\u002Fxxdpdyhzhpamafnrdkyq.supabase.co\u002Fstorage\u002Fv1\u002Fobject\u002Fpublic\u002Fcovers\u002Finline-1778692245329-a2wt.png","2026-05-13T17:10:30.659153+00:00",{"id":28,"slug":29,"title":30,"summary":31,"category":32,"image_url":33,"cover_image":33,"language":18,"created_at":34},"5b27896f-ad48-4a9a-8b6e-823568d8c669","wei-shen-me-lu-you-cai-shi-mo-xing-fu-wu-de-zhen-zheng-ping-zh","為什麼路由才是模型服務的真正瓶頸","模型服務的主要限制不是推理本身，而是路由決策；誰、何時、送到哪個模型與副本，才決定延遲、成本與穩定性。","industry","https:\u002F\u002Fxxdpdyhzhpamafnrdkyq.supabase.co\u002Fstorage\u002Fv1\u002Fobject\u002Fpublic\u002Fcovers\u002Finline-1778278838578-nms7.png","2026-05-08T22:20:22.020009+00:00",{"id":36,"slug":37,"title":38,"summary":39,"category":32,"image_url":40,"cover_image":40,"language":18,"created_at":41},"54b3fd97-c8e6-4b92-b87b-40913f024775","why-routing-belongs-at-the-center-of-model-serving-zh","為什麼 routing 應該放在 model serving 的中心","Routing 應該是 model serving 的單一入口，因為它能加快模型迭代，也能把服務層變成產品能力的一部分。","https:\u002F\u002Fxxdpdyhzhpamafnrdkyq.supabase.co\u002Fstorage\u002Fv1\u002Fobject\u002Fpublic\u002Fcovers\u002Finline-1777882252815-32q6.png","2026-05-04T08:10:33.607394+00:00"]