15:[["$","meta","0",{"name":"viewport","content":"width=device-width, initial-scale=1"}],["$","meta","1",{"name":"theme-color","media":"(prefers-color-scheme: light)","content":"#ffffff"}],["$","meta","2",{"name":"theme-color","media":"(prefers-color-scheme: dark)","content":"#09090b"}],["$","meta","3",{"charSet":"utf-8"}],["$","title","4",{"children":"Slow performance Unsloth Gemma 12B Q8 — ANGESTROM — ANGESTROM"}],["$","meta","5",{"name":"description","content":"

I recently replaced GPT-OSS 20B Q4 with Gemma 4 12B Q8 but i went from roughly 70 t/s to 10 t/s.

Am I doing something w"}],["$","link","6",{"rel":"author","href":"https://angestrom.com"}],["$","meta","7",{"name":"author","content":"ANGESTROM"}],["$","link","8",{"rel":"manifest","href":"/manifest.webmanifest","crossOrigin":"use-credentials"}],["$","meta","9",{"name":"keywords","content":"artificial intelligence,AI knowledge graph,machine learning,large language models,AI research papers,AI models,AI news,AI tutorials,generative AI"}],["$","meta","10",{"name":"creator","content":"ANGESTROM"}],["$","meta","11",{"name":"publisher","content":"ANGESTROM"}],["$","meta","12",{"name":"robots","content":"index, follow"}],["$","meta","13",{"name":"googlebot","content":"index, follow, max-video-preview:-1, max-image-preview:large, max-snippet:-1"}],["$","link","14",{"rel":"canonical","href":"https://angestrom.com/news/news-slow-performance-unsloth-gemma-12b-q8"}],["$","link","15",{"rel":"alternate","hrefLang":"en","href":"https://angestrom.com/NodeType.newss/news-slow-performance-unsloth-gemma-12b-q8"}],["$","meta","16",{"name":"format-detection","content":"telephone=no, address=no, email=no"}],["$","meta","17",{"property":"og:title","content":"Slow performance Unsloth Gemma 12B Q8 — ANGESTROM"}],["$","meta","18",{"property":"og:description","content":"

I recently replaced GPT-OSS 20B Q4 with Gemma 4 12B Q8 but i went from roughly 70 t/s to 10 t/s.

Am I doing something w"}],["$","meta","19",{"property":"og:url","content":"https://angestrom.com/news/news-slow-performance-unsloth-gemma-12b-q8"}],["$","meta","20",{"property":"og:site_name","content":"ANGESTROM"}],["$","meta","21",{"property":"og:locale","content":"en_US"}],["$","meta","22",{"property":"og:image","content":"https://angestrom.com/icon-512.png"}],["$","meta","23",{"property":"og:image:width","content":"1200"}],["$","meta","24",{"property":"og:image:height","content":"630"}],["$","meta","25",{"property":"og:image:alt","content":"Slow performance Unsloth Gemma 12B Q8 — ANGESTROM"}],["$","meta","26",{"property":"og:type","content":"article"}],["$","meta","27",{"name":"twitter:card","content":"summary_large_image"}],["$","meta","28",{"name":"twitter:title","content":"Slow performance Unsloth Gemma 12B Q8 — ANGESTROM"}],["$","meta","29",{"name":"twitter:description","content":"

I recently replaced GPT-OSS 20B Q4 with Gemma 4 12B Q8 but i went from roughly 70 t/s to 10 t/s.

Am I doing something w"}],["$","meta","30",{"name":"twitter:image","content":"https://angestrom.com/icon-512.png"}],["$","link","31",{"rel":"icon","href":"/icon.png?f6ba7b6d65559612","type":"image/png","sizes":"512x512"}],["$","link","32",{"rel":"apple-touch-icon","href":"/apple-icon.png?2e9defbef5afb45a","type":"image/png","sizes":"180x180"}]]