<?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9" xmlns:image="http://www.google.com/schemas/sitemap-image/1.1">
<!-- Home page: core fields first, image extensions last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/</loc>
  <lastmod>2026-04-13</lastmod>
  <changefreq>weekly</changefreq>
  <priority>1</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/images/Google%20Thumbnail%20Logo.001.jpeg</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://www.hermitedge.com/images/home-page.jpeg</image:loc>
  </image:image>
</url>
<!-- About page: core fields first, image extensions last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/about</loc>
  <lastmod>2026-04-13</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.9</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/images/about-page.jpeg</image:loc>
  </image:image>
  <image:image>
    <image:loc>https://www.hermitedge.com/images/Google%20Thumbnail%20Logo.001.jpeg</image:loc>
  </image:image>
</url>
<!-- Services page entry; no extension elements. -->
<url>
  <loc>https://www.hermitedge.com/services</loc>
  <lastmod>2026-04-13</lastmod>
  <changefreq>weekly</changefreq>
  <priority>0.9</priority>
</url>
<!-- Portfolio page entry; no extension elements. -->
<url>
  <loc>https://www.hermitedge.com/portfolio</loc>
  <lastmod>2026-04-13</lastmod>
  <changefreq>weekly</changefreq>
  <priority>0.8</priority>
</url>
<!-- Blog index entry; no extension elements. -->
<url>
  <loc>https://www.hermitedge.com/blog</loc>
  <lastmod>2026-04-13</lastmod>
  <changefreq>weekly</changefreq>
  <priority>0.9</priority>
</url>
<!-- Privacy page entry; no extension elements. -->
<url>
  <loc>https://www.hermitedge.com/privacy</loc>
  <lastmod>2025-03-13</lastmod>
  <changefreq>yearly</changefreq>
  <priority>0.3</priority>
</url>
<!-- Terms page entry; no extension elements. -->
<url>
  <loc>https://www.hermitedge.com/terms</loc>
  <lastmod>2026-04-13</lastmod>
  <changefreq>yearly</changefreq>
  <priority>0.3</priority>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/supervisor-agents-enforcing-deterministic-state-across-multi-agent-workflows</loc>
  <lastmod>2026-04-08</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/supervisor-agents-enforcing-deterministic-state-across-multi-agent-workflows/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/the-10m-token-trap-why-infinite-context-windows-do-not-replace-data-engineering</loc>
  <lastmod>2026-02-26</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/the-10m-token-trap-why-infinite-context-windows-do-not-replace-data-engineering/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/highground-building-a-backend-pipeline-for-market-intelligence</loc>
  <lastmod>2026-01-22</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/highground-building-a-backend-pipeline-for-market-intelligence/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/edtech-infrastructure-moving-ai-lesson-generation-out-of-the-chat-box</loc>
  <lastmod>2025-12-09</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/edtech-infrastructure-moving-ai-lesson-generation-out-of-the-chat-box/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/grounded-legal-ai-building-a-research-backend-around-live-case-law</loc>
  <lastmod>2025-11-12</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/grounded-legal-ai-building-a-research-backend-around-live-case-law/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/risk-compliance-ai-turning-contract-review-into-structured-audit-data</loc>
  <lastmod>2025-10-28</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/risk-compliance-ai-turning-contract-review-into-structured-audit-data/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/energy-intelligence-turning-live-telemetry-into-server-side-aggregates</loc>
  <lastmod>2025-09-25</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/energy-intelligence-turning-live-telemetry-into-server-side-aggregates/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/medical-research-synthesis-keeping-pubmed-retrieval-separate-from-llm-reasoning</loc>
  <lastmod>2025-09-09</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/medical-research-synthesis-keeping-pubmed-retrieval-separate-from-llm-reasoning/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/enterprise-sales-ai-separating-deal-strategy-from-proposal-drafting</loc>
  <lastmod>2025-08-21</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/enterprise-sales-ai-separating-deal-strategy-from-proposal-drafting/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/msme-brand-infrastructure-structuring-positioning-before-copywriting</loc>
  <lastmod>2025-07-24</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/msme-brand-infrastructure-structuring-positioning-before-copywriting/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/agentic-inventory-separating-stock-records-from-ai-decisions</loc>
  <lastmod>2025-05-22</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/agentic-inventory-separating-stock-records-from-ai-decisions/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/financial-intelligence-keeping-ai-away-from-the-ledger</loc>
  <lastmod>2025-03-20</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/financial-intelligence-keeping-ai-away-from-the-ledger/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/real-time-multimodal-pipelines-audio-video-streams</loc>
  <lastmod>2024-08-12</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/real-time-multimodal-pipelines-audio-video-streams/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/small-language-models-at-the-edge</loc>
  <lastmod>2024-05-20</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/small-language-models-at-the-edge/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/orchestrating-multi-agent-workflows-without-letting-them-run-the-system</loc>
  <lastmod>2024-02-15</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/orchestrating-multi-agent-workflows-without-letting-them-run-the-system/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/designing-a-multimodal-routing-layer-before-vision-access</loc>
  <lastmod>2023-12-15</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/designing-a-multimodal-routing-layer-before-vision-access/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/the-embedding-trap-why-default-models-need-domain-evals</loc>
  <lastmod>2023-10-12</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/the-embedding-trap-why-default-models-need-domain-evals/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/queueing-and-quantized-llama-2-on-local-hardware</loc>
  <lastmod>2023-07-28</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/queueing-and-quantized-llama-2-on-local-hardware/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/vector-storage-costs-in-document-retrieval-systems</loc>
  <lastmod>2023-05-12</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/vector-storage-costs-in-document-retrieval-systems/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/building-retrieval-augmented-generation-pipelines-from-scratch</loc>
  <lastmod>2023-03-20</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/building-retrieval-augmented-generation-pipelines-from-scratch/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/the-chatgpt-shift-conversational-state-as-a-backend-problem</loc>
  <lastmod>2022-11-30</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/the-chatgpt-shift-conversational-state-as-a-backend-problem/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/queue-isolated-stable-diffusion-on-local-gpu-hardware</loc>
  <lastmod>2022-08-25</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/queue-isolated-stable-diffusion-on-local-gpu-hardware/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/server-side-session-memory-for-llm-support-interfaces</loc>
  <lastmod>2022-06-14</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/server-side-session-memory-for-llm-support-interfaces/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/async-job-architecture-for-image-generation-apis</loc>
  <lastmod>2022-04-18</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/async-job-architecture-for-image-generation-apis/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/streaming-architecture-for-sensitive-text-generation-workloads</loc>
  <lastmod>2021-12-02</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/streaming-architecture-for-sensitive-text-generation-workloads/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/defending-backend-systems-against-probabilistic-model-outputs</loc>
  <lastmod>2021-11-18</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/defending-backend-systems-against-probabilistic-model-outputs/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/ci-cd-for-apis-handling-sensitive-data</loc>
  <lastmod>2021-09-08</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/ci-cd-for-apis-handling-sensitive-data/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/using-a-model-to-audit-label-quality-at-scale</loc>
  <lastmod>2021-02-24</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/using-a-model-to-audit-label-quality-at-scale/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/centralizing-feature-logic-for-real-time-inference</loc>
  <lastmod>2020-12-10</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/centralizing-feature-logic-for-real-time-inference/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/dynamic-batching-for-heavy-pytorch-workloads</loc>
  <lastmod>2020-09-28</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/dynamic-batching-for-heavy-pytorch-workloads/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/the-generative-trap-defending-against-probabilistic-outputs</loc>
  <lastmod>2020-06-28</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/the-generative-trap-defending-against-probabilistic-outputs/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/defensive-ingestion-for-covid-19-data-streams</loc>
  <lastmod>2020-05-14</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/defensive-ingestion-for-covid-19-data-streams/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/cold-starts-and-kubernetes-managing-latency-in-burst-traffic</loc>
  <lastmod>2020-03-11</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/cold-starts-and-kubernetes-managing-latency-in-burst-traffic/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/handling-feature-drift-in-production-fraud-pipelines</loc>
  <lastmod>2019-11-05</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/handling-feature-drift-in-production-fraud-pipelines/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/surviving-spot-interruptions-decoupling-pytorch-inference-on-aws</loc>
  <lastmod>2019-08-30</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/surviving-spot-interruptions-decoupling-pytorch-inference-on-aws/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/moving-past-flask-fastapi-async-requests-and-backend-workload-boundaries</loc>
  <lastmod>2019-04-22</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/moving-past-flask-fastapi-async-requests-and-backend-workload-boundaries/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/securing-the-data-behind-the-dashboard-flask-sql-and-backend-boundaries</loc>
  <lastmod>2019-02-18</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/securing-the-data-behind-the-dashboard-flask-sql-and-backend-boundaries/hero.jpg</image:loc>
  </image:image>
</url>
<!-- Blog post: core fields first, image extension last (sitemap 0.9 schema order). -->
<url>
  <loc>https://www.hermitedge.com/blog/a-backend-mindset-beyond-jupyter-serving-xgboost-with-flask-and-gunicorn</loc>
  <lastmod>2018-12-14</lastmod>
  <changefreq>monthly</changefreq>
  <priority>0.7</priority>
  <image:image>
    <image:loc>https://www.hermitedge.com/blog/a-backend-mindset-beyond-jupyter-serving-xgboost-with-flask-and-gunicorn/hero.jpg</image:loc>
  </image:image>
</url>
</urlset>
