[{"data":1,"prerenderedAt":-1},["ShallowReactive",2],{"tag-self-hosted-llm":3},{"tag":4,"articles":10},{"id":5,"name":6,"slug":7,"article_count":8,"description_zh":9,"description_en":9},"6887b472-fd9b-4ff4-9cd7-e26d292e7170","self-hosted LLM","self-hosted-llm",0,null,[11],{"id":12,"slug":13,"title":14,"summary":15,"category":16,"image_url":17,"cover_image":17,"language":18,"created_at":19},"97d1ef0a-fdc0-4421-abb1-e1e8a9c5ba8e","llama-3-1-70b-specs-benchmarks-deployment-en","Llama 3.1 70B: Specs, Benchmarks, Deployment","Meta’s Llama 3.1 70B offers 128K context, 88.6% MMLU, and self-hosted deployment for teams that want control and lower inference costs.","model-release","https:\u002F\u002Fxxdpdyhzhpamafnrdkyq.supabase.co\u002Fstorage\u002Fv1\u002Fobject\u002Fpublic\u002Fcovers\u002Finline-1780395489574-1mhf.png","en","2026-06-02T10:17:33.495371+00:00"]