<?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">
<url>
<loc>https://gingerlabs.ai/</loc>
<lastmod>2026-06-12T20:58:58.082Z</lastmod>
<changefreq>weekly</changefreq>
<priority>1</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog</loc>
<lastmod>2026-06-12T20:58:58.082Z</lastmod>
<changefreq>daily</changefreq>
<priority>0.8</priority>
</url>
<url>
<loc>https://gingerlabs.ai/resources</loc>
<lastmod>2026-06-12T20:58:58.082Z</lastmod>
<changefreq>weekly</changefreq>
<priority>0.7</priority>
</url>
<url>
<loc>https://gingerlabs.ai/privacy</loc>
<lastmod>2026-06-12T20:58:58.082Z</lastmod>
<changefreq>yearly</changefreq>
<priority>0.2</priority>
</url>
<url>
<loc>https://gingerlabs.ai/terms</loc>
<lastmod>2026-06-12T20:58:58.082Z</lastmod>
<changefreq>yearly</changefreq>
<priority>0.2</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/70b-on-single-rtx-4090</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/anthropic-prompt-caching</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/awq-vs-gptq-benchmarks</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/bit-width-accuracy-memory-tradeoffs</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/category-aware-semantic-caching</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/context-engineering-llm-accuracy</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/cut-llm-api-costs</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/gguf-vs-awq-vs-gptq</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/hidden-llm-costs-production</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/hipaa-gdpr-llm-on-premises</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/kubernetes-llm-inference-llmd</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/kv-cache-reuse-vllm</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/litellm-router-setup-guide</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/llm-inference-costs-enterprise</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/llm-quantization-int4-int8-fp16</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/llm-semantic-routing</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/lora-vs-full-finetuning</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/multi-tier-llm-cache</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/off-peak-cache-prewarming-support-bots</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/openai-vs-anthropic-prompt-caching</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/pagedattention-vllm-throughput</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/prefill-activation-routing</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/prefix-caching-vs-semantic-caching</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/prompt-caching-break-even-analysis</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/quantization-edge-devices-under-4gb</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/quantize-llama3-4bit-guide</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/routellm-vs-vllm-semantic-router</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/self-hosting-vs-openai-api-tco</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/signal-driven-mixture-of-models</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/smoothquant-activation-aware-quantization</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/vllm-vs-ollama-vs-tgi</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/when-to-use-reasoning-models</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/category/caching</loc>
<lastmod>2026-06-12T20:58:58.082Z</lastmod>
<changefreq>weekly</changefreq>
<priority>0.5</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/category/quantization</loc>
<lastmod>2026-06-12T20:58:58.082Z</lastmod>
<changefreq>weekly</changefreq>
<priority>0.5</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/category/routing</loc>
<lastmod>2026-06-12T20:58:58.082Z</lastmod>
<changefreq>weekly</changefreq>
<priority>0.5</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/category/inference</loc>
<lastmod>2026-06-12T20:58:58.082Z</lastmod>
<changefreq>weekly</changefreq>
<priority>0.5</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/category/cost-optimization</loc>
<lastmod>2026-06-12T20:58:58.082Z</lastmod>
<changefreq>weekly</changefreq>
<priority>0.5</priority>
</url>
<url>
<loc>https://gingerlabs.ai/blog/category/self-hosting</loc>
<lastmod>2026-06-12T20:58:58.082Z</lastmod>
<changefreq>weekly</changefreq>
<priority>0.5</priority>
</url>
<url>
<loc>https://gingerlabs.ai/resources/cloud-gpu-pricing</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/resources/llm-cost-per-token</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/resources/model-cascade-vs-single-model</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/resources/open-source-llm-comparison</loc>
<lastmod>2026-06-08T00:00:00.000Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.6</priority>
</url>
<url>
<loc>https://gingerlabs.ai/solutions/construction-tech</loc>
<lastmod>2026-06-12T20:58:58.082Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.7</priority>
</url>
<url>
<loc>https://gingerlabs.ai/solutions/legal-tech</loc>
<lastmod>2026-06-12T20:58:58.082Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.7</priority>
</url>
<url>
<loc>https://gingerlabs.ai/solutions/crm-sales</loc>
<lastmod>2026-06-12T20:58:58.082Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.7</priority>
</url>
<url>
<loc>https://gingerlabs.ai/solutions/fintech-saas</loc>
<lastmod>2026-06-12T20:58:58.082Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.7</priority>
</url>
<url>
<loc>https://gingerlabs.ai/solutions/hr-tech</loc>
<lastmod>2026-06-12T20:58:58.082Z</lastmod>
<changefreq>monthly</changefreq>
<priority>0.7</priority>
</url>
</urlset>
