{
  "activity_state": "surging",
  "boundary": "aggregate_public_panel_not_retrieval_api",
  "canonical_url": "https://hangingcontext.com/tags/topic/inference-optimization/",
  "counts": {
    "appearances_24h": 108,
    "appearances_30d": 569,
    "appearances_7d": 497,
    "source_count": 50,
    "stream_count": 22
  },
  "entity_type": "tag",
  "generated_at": "2026-06-01T12:12:42+00:00",
  "html_url": "https://hangingcontext.com/tags/topic/inference-optimization/",
  "json_url": "https://hangingcontext.com/data/tags/topic/inference-optimization.json",
  "last_observed_at": "2026-06-01T11:58:10.097989+00:00",
  "name": "Inference Optimization",
  "page_type": "tag_context_panel",
  "path_type": "topic",
  "related_tags": [
    {
      "count": 510,
      "html_url": "https://hangingcontext.com/tags/topic/artificial-intelligence/",
      "name": "Artificial Intelligence",
      "tag_id": 17723038993834764,
      "type": "topic"
    },
    {
      "count": 348,
      "html_url": "https://hangingcontext.com/tags/org/arxiv/",
      "name": "arXiv",
      "tag_id": 17723038994323052,
      "type": "organization"
    },
    {
      "count": 251,
      "html_url": "https://hangingcontext.com/tags/topic/ai-infrastructure/",
      "name": "AI Infrastructure",
      "tag_id": 17791452103823983,
      "type": "topic"
    },
    {
      "count": 176,
      "html_url": "https://hangingcontext.com/tags/topic/llm-evals/",
      "name": "LLM Evals",
      "tag_id": 17791452099123760,
      "type": "topic"
    },
    {
      "count": 92,
      "html_url": "https://hangingcontext.com/tags/topic/ai-agents/",
      "name": "AI Agents",
      "tag_id": 17791452097663640,
      "type": "topic"
    },
    {
      "count": 87,
      "html_url": "https://hangingcontext.com/tags/topic/gpu-clusters/",
      "name": "GPU Clusters",
      "tag_id": 17791452103543441,
      "type": "topic"
    },
    {
      "count": 67,
      "html_url": "https://hangingcontext.com/tags/org/baseten/",
      "name": "Baseten",
      "tag_id": 17723038994304984,
      "type": "organization"
    },
    {
      "count": 63,
      "html_url": "https://hangingcontext.com/tags/topic/multimodal-ai/",
      "name": "Multimodal AI",
      "tag_id": 17730948119041167,
      "type": "topic"
    },
    {
      "count": 56,
      "html_url": "https://hangingcontext.com/tags/topic/reasoning-models/",
      "name": "Reasoning Models",
      "tag_id": 17791452099463022,
      "type": "topic"
    },
    {
      "count": 48,
      "html_url": "https://hangingcontext.com/tags/topic/quantization/",
      "name": "Quantization",
      "tag_id": 17791452102923593,
      "type": "topic"
    },
    {
      "count": 39,
      "html_url": "https://hangingcontext.com/tags/topic/cloud-computing/",
      "name": "Cloud Computing",
      "tag_id": 17723038993835295,
      "type": "topic"
    },
    {
      "count": 35,
      "html_url": "https://hangingcontext.com/tags/org/nvidia/",
      "name": "Nvidia",
      "tag_id": 17723038993599085,
      "type": "organization"
    }
  ],
  "schema_version": 1,
  "slug": "inference-optimization",
  "source_window": "30d",
  "tag_id": 17791452102628180,
  "tag_type": "topic",
  "top_sources": [
    {
      "count": 74,
      "html_url": "https://hangingcontext.com/sources/arxiv-model-efficiency-engineering/",
      "name": "arxiv-model-efficiency-engineering",
      "source_id": 17779468839059819
    },
    {
      "count": 68,
      "html_url": "https://hangingcontext.com/sources/arxiv-ai-agents-tool-use/",
      "name": "arxiv-ai-agents-tool-use",
      "source_id": 17779468839019653
    },
    {
      "count": 67,
      "html_url": "https://hangingcontext.com/sources/baseten-blog/",
      "name": "baseten-blog",
      "source_id": 17798118836822159
    },
    {
      "count": 59,
      "html_url": "https://hangingcontext.com/sources/arxiv-multimodal-document-ai/",
      "name": "arxiv-multimodal-document-ai",
      "source_id": 17779468839050785
    },
    {
      "count": 55,
      "html_url": "https://hangingcontext.com/sources/arxiv-ai-infra-inference-ops/",
      "name": "arxiv-ai-infra-inference-ops",
      "source_id": 17779468839057179
    },
    {
      "count": 54,
      "html_url": "https://hangingcontext.com/sources/arxiv-frontier-methods-select/",
      "name": "arxiv-frontier-methods-select",
      "source_id": 17779468839061905
    },
    {
      "count": 34,
      "html_url": "https://hangingcontext.com/sources/runpod-blog-rss/",
      "name": "runpod-blog-rss",
      "source_id": 17794302146060200
    },
    {
      "count": 24,
      "html_url": "https://hangingcontext.com/sources/arxiv-rag-search-knowledge/",
      "name": "arxiv-rag-search-knowledge",
      "source_id": 17779468839053902
    },
    {
      "count": 20,
      "html_url": "https://hangingcontext.com/sources/together-ai-blog-rss/",
      "name": "together-ai-blog-rss",
      "source_id": 17794290573506052
    },
    {
      "count": 11,
      "html_url": "https://hangingcontext.com/sources/modal-labs-blog/",
      "name": "modal-labs-blog",
      "source_id": 17794308058542893
    }
  ],
  "top_streams": [
    {
      "count": 347,
      "html_url": "https://hangingcontext.com/streams/arxiv/",
      "name": "ARXIV",
      "slug": "arxiv",
      "stream_id": 17779468859058016
    },
    {
      "count": 13,
      "html_url": "https://hangingcontext.com/streams/hugging-face/",
      "name": "Hugging Face",
      "slug": "hugging-face",
      "stream_id": 17801201634780574
    },
    {
      "count": 10,
      "html_url": "https://hangingcontext.com/streams/amd/",
      "name": "Advanced Micro Devices",
      "slug": "amd",
      "stream_id": 17723038993558435
    },
    {
      "count": 8,
      "html_url": "https://hangingcontext.com/streams/amazon/",
      "name": "Amazon",
      "slug": "amazon",
      "stream_id": 17723038993544177
    },
    {
      "count": 5,
      "html_url": "https://hangingcontext.com/streams/minimax/",
      "name": "MiniMax",
      "slug": "minimax",
      "stream_id": 17801201634780573
    },
    {
      "count": 5,
      "html_url": "https://hangingcontext.com/streams/nvidia/",
      "name": "Nvidia",
      "slug": "nvidia",
      "stream_id": 17723038993561924
    },
    {
      "count": 5,
      "html_url": "https://hangingcontext.com/streams/zhipu-ai/",
      "name": "Zhipu AI",
      "slug": "zhipu-ai",
      "stream_id": 17801201634780571
    },
    {
      "count": 3,
      "html_url": "https://hangingcontext.com/streams/databricks/",
      "name": "Databricks",
      "slug": "databricks",
      "stream_id": 17723038993559506
    },
    {
      "count": 2,
      "html_url": "https://hangingcontext.com/streams/sitepoint/",
      "name": "SitePoint",
      "slug": "sitepoint",
      "stream_id": 17767097561152902
    },
    {
      "count": 1,
      "html_url": "https://hangingcontext.com/streams/ai21-labs/",
      "name": "AI21 Labs",
      "slug": "ai21-labs",
      "stream_id": 17801201634780575
    }
  ]
}
