<?xml version="1.0" encoding="UTF-8"?>
<!--
  News sitemap: a sitemaps.org 0.9 <urlset> extended with the "news" namespace
  (sitemap-news 0.9). Each <url> carries the article location in <loc> and the
  article metadata in a <news:news> child: publication name and language,
  publication date, title, and keywords.
  NOTE(review): if this file is produced by a build step, these comments will
  be lost on regeneration; confirm before relying on them.
-->
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9"
        xmlns:news="http://www.google.com/schemas/sitemap-news/0.9">
  <!-- Entry 1: Claude Sonnet 5 vs GLM 5.2 comparison article. -->
  <url>
    <loc>https://llmrequirements.com/news/2026-06-30-claude-sonnet-5-vs-glm-5-2</loc>
    <news:news>
      <news:publication>
        <news:name>LLMRequirements.com</news:name>
        <news:language>en</news:language>
      </news:publication>
      <!-- NOTE(review): timestamp is exactly midnight UTC; presumably a date-only value expanded to a full timestamp. Confirm. -->
      <news:publication_date>2026-06-30T00:00:00.000Z</news:publication_date>
      <news:title>Claude Sonnet 5 vs GLM 5.2: the closed benchmark king vs the open model you can actually run</news:title>
      <!-- NOTE(review): current Google News sitemap documentation appears to no longer list news:keywords; confirm whether any consumer still reads it. -->
      <news:keywords>software, models, comparison, anthropic, open-weights</news:keywords>
    </news:news>
  </url>
  <!-- Entry 2: DGX Spark / Qwen3.5-122B speculative decoding article. -->
  <url>
    <loc>https://llmrequirements.com/news/2026-06-30-dgx-spark-122b-dflash-speculative-decoding</loc>
    <news:news>
      <news:publication>
        <news:name>LLMRequirements.com</news:name>
        <news:language>en</news:language>
      </news:publication>
      <!-- NOTE(review): timestamp is exactly midnight UTC; presumably a date-only value expanded to a full timestamp. Confirm. -->
      <news:publication_date>2026-06-30T00:00:00.000Z</news:publication_date>
      <news:title>DGX Spark runs Qwen3.5-122B at 59 tok/s general and 81 on agent traffic, with speculative decoding (not NVFP4)</news:title>
      <!-- NOTE(review): current Google News sitemap documentation appears to no longer list news:keywords; confirm whether any consumer still reads it. -->
      <news:keywords>performance, nvidia, dgx-spark, speculative-decoding, qwen, agentic</news:keywords>
    </news:news>
  </url>
</urlset>
