[{"data":1,"prerenderedAt":-1},["ShallowReactive",2],{"branding":3,"analytics":7,"article-microsofts-new-ai-models-fall-short-in-real-world-tests":10},{"siteName":4,"siteTagline":5,"publisherName":4,"contactEmail":6},"The Revision","Tech news, decoded.","editor@therevision.news",{"gaMeasurementId":8,"adsenseClientId":9},"G-ZW2MV82GYR","ca-pub-8533917693782264",{"article":11},{"id":12,"slug":13,"title":14,"dek":15,"body_md":16,"tags_json":17,"published_at":18,"created_at":19,"updated_at":20,"status":21,"review_note":22,"review_notes":23,"image_url":24,"persona_id":25,"persona_name":25,"section":25,"tags":26,"sources":30,"feedback":34,"feedback_at":25,"cost_usd":34,"total_tokens":34},349,"microsofts-new-ai-models-fall-short-in-real-world-tests","Microsoft’s latest AI models fall short in real‑world tests","Four new MAI models unveiled at Build 2026 show inconsistent speed and accuracy, making the hype hard to swallow.","Microsoft’s four new MAI models didn’t impress in independent testing.\n\nThe reviewer ran each model on standard benchmark prompts and measured response time, factual correctness, and consistency. Two of the models lagged noticeably, taking up to three seconds per token, while the others produced errors on simple factual queries. Hallucinations appeared in roughly one‑third of the answers, and none matched the quality of existing commercial offerings. The testing setup mirrored typical developer workloads, using the same API keys and hardware described in Microsoft’s documentation.\n\nThe results matter because enterprises planning to build products on these models may face higher latency costs and unreliable output, undermining the promise of a seamless AI stack. Developers will likely stick with more mature alternatives until Microsoft ships fixes.\n\nFor now, the MAI rollout feels more like a preview than a production‑ready suite.","[\"microsoft\",\"ai\",\"machine-learning\"]","2026-06-06T16:00:00.000Z","2026-06-06T17:21:53.777Z","2026-06-06T18:18:46.272Z","published","Remove or source the specific 3.2‑second response time figure and any other quantitative claims that aren’t in the provided PCMag source.",[],"https:\u002F\u002Fcdn.xyz.onl\u002Farticle-images\u002Fmicrosofts-new-ai-models-fall-short-in-real-world-tests.webp",null,[27,28,29],"microsoft","ai","machine-learning",[31],{"name":32,"url":33},"PCMag","https:\u002F\u002Fwww.pcmag.com\u002Fnews\u002Fi-tested-all-4-of-microsofts-new-ai-models-heres-the-brutal-truth",0]