<?xml version="1.0" encoding="UTF-8"?>
<!--generator='jetpack-15.8'-->
<!--Jetpack_Sitemap_Buffer_News_XMLWriter-->
<?xml-stylesheet type="text/xsl" href="//bibitlabs.com/news-sitemap.xsl"?>
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9" xmlns:news="http://www.google.com/schemas/sitemap-news/0.9" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.sitemaps.org/schemas/sitemap/0.9 http://www.sitemaps.org/schemas/sitemap/0.9/sitemap.xsd">
 <url>
  <loc>https://bibitlabs.com/%ec%bb%a8%ed%85%8d%ec%8a%a4%ed%8a%b8-%ea%b8%b8%ec%9d%b4%eb%a5%bc-%eb%8a%98%eb%a6%ac%eb%a9%b4-%eb%a9%94%eb%aa%a8%eb%a6%ac%ea%b0%80-%ed%8f%ad%eb%b0%9c%ed%95%98%eb%8a%94-%ec%9d%b4%ec%9c%a0-kv-c/</loc>
  <lastmod>2026-05-31T13:18:45Z</lastmod>
  <news:news>
   <news:publication>
    <news:name>bibitlabs</news:name>
    <news:language>ko</news:language>
   </news:publication>
   <news:title>컨텍스트 길이를 늘리면 메모리가 폭발하는 이유 — KV Cache의 구조와 비용</news:title>
   <news:publication_date>2026-06-01T13:10:42Z</news:publication_date>
   <news:genres>Blog</news:genres>
  </news:news>
 </url>
 <url>
  <loc>https://bibitlabs.com/%eb%a7%a5%eb%b6%81%ec%97%90%ec%84%9c-70b%eb%a5%bc-%ec%96%b5%ec%a7%80%eb%a1%9c-%eb%8f%8c%eb%a6%ac%eb%8a%94-%ea%b2%83%ea%b3%bc-27b%eb%a5%bc-%ec%be%8c%ec%a0%81%ed%95%98%ea%b2%8c-%eb%8f%8c%eb%a6%ac/</loc>
  <lastmod>2026-05-31T13:17:48Z</lastmod>
  <news:news>
   <news:publication>
    <news:name>bibitlabs</news:name>
    <news:language>ko</news:language>
   </news:publication>
   <news:title>맥북에서 70B를 억지로 돌리는 것과 27B를 쾌적하게 돌리는 것 — 어느 쪽이 실제로 더 나은가</news:title>
   <news:publication_date>2026-05-31T13:17:45Z</news:publication_date>
   <news:genres>Blog</news:genres>
  </news:news>
 </url>
 <url>
  <loc>https://bibitlabs.com/%ea%b0%99%ec%9d%80-%ed%8c%8c%eb%9d%bc%eb%af%b8%ed%84%b0-%ec%88%98%ec%9d%b8%eb%8d%b0-moe-%eb%aa%a8%eb%8d%b8%ec%9d%b4-%eb%8d%94-%eb%b9%a0%eb%a5%b8-%ec%9d%b4%ec%9c%a0/</loc>
  <lastmod>2026-05-31T13:17:14Z</lastmod>
  <news:news>
   <news:publication>
    <news:name>bibitlabs</news:name>
    <news:language>ko</news:language>
   </news:publication>
   <news:title>같은 파라미터 수인데 MoE 모델이 더 빠른 이유</news:title>
   <news:publication_date>2026-05-31T13:17:12Z</news:publication_date>
   <news:genres>Blog</news:genres>
  </news:news>
 </url>
 <url>
  <loc>https://bibitlabs.com/q4_k_m-vs-q8_0-%eb%a1%9c%ec%bb%ac-llm-%ec%96%91%ec%9e%90%ed%99%94-%ec%96%b4%eb%94%94%ec%84%9c-%ed%83%80%ed%98%91%ed%95%a0-%ea%b2%83%ec%9d%b8%ea%b0%80/</loc>
  <lastmod>2026-05-31T13:16:43Z</lastmod>
  <news:news>
   <news:publication>
    <news:name>bibitlabs</news:name>
    <news:language>ko</news:language>
   </news:publication>
   <news:title>Q4_K_M vs Q8_0: 로컬 LLM 양자화, 어디서 타협할 것인가</news:title>
   <news:publication_date>2026-05-31T13:16:41Z</news:publication_date>
   <news:genres>Blog</news:genres>
  </news:news>
 </url>
 <url>
  <loc>https://bibitlabs.com/arch-arm64-%ed%95%9c-%ec%a4%84%ec%9d%b4-%ec%b6%94%eb%a1%a0-%ec%86%8d%eb%8f%84%eb%a5%bc-%eb%b0%94%ea%be%b8%eb%8a%94-%ec%9d%b4%ec%9c%a0-rosetta-%ed%95%a8%ec%a0%95/</loc>
  <lastmod>2026-05-31T13:16:10Z</lastmod>
  <news:news>
   <news:publication>
    <news:name>bibitlabs</news:name>
    <news:language>ko</news:language>
   </news:publication>
   <news:title>`arch -arm64` 한 줄이 추론 속도를 바꾸는 이유 — Rosetta 함정</news:title>
   <news:publication_date>2026-05-31T13:16:07Z</news:publication_date>
   <news:genres>Blog</news:genres>
  </news:news>
 </url>
 <url>
  <loc>https://bibitlabs.com/ollama%ec%99%80-llama-cpp-%ea%b0%99%ec%9d%80-%ec%97%94%ec%a7%84%ec%9d%b8%eb%8d%b0-%ec%99%9c-%ec%86%8d%eb%8f%84%ea%b0%80-%eb%8b%a4%eb%a5%bc%ea%b9%8c/</loc>
  <lastmod>2026-05-31T13:15:37Z</lastmod>
  <news:news>
   <news:publication>
    <news:name>bibitlabs</news:name>
    <news:language>ko</news:language>
   </news:publication>
   <news:title>Ollama와 llama.cpp, 같은 엔진인데 왜 속도가 다를까</news:title>
   <news:publication_date>2026-05-31T13:15:19Z</news:publication_date>
   <news:genres>Blog</news:genres>
  </news:news>
 </url>
 <url>
  <loc>https://bibitlabs.com/mlx%ea%b0%80-llama-cpp%eb%b3%b4%eb%8b%a4-%eb%b9%a0%eb%a5%bc-%eb%95%8c-%ea%b7%b8%eb%a6%ac%ea%b3%a0-%eb%8a%90%eb%a6%b4-%eb%95%8c-%ec%a1%b0%ea%b1%b4%eb%b3%84%eb%a1%9c-%eb%94%b0%ec%a0%b8/</loc>
  <lastmod>2026-05-31T13:14:53Z</lastmod>
  <news:news>
   <news:publication>
    <news:name>bibitlabs</news:name>
    <news:language>ko</news:language>
   </news:publication>
   <news:title>MLX가 llama.cpp보다 빠를 때, 그리고 느릴 때 — 조건별로 따져보기</news:title>
   <news:publication_date>2026-05-31T13:14:50Z</news:publication_date>
   <news:genres>Blog</news:genres>
  </news:news>
 </url>
 <url>
  <loc>https://bibitlabs.com/%eb%a7%a5%eb%b6%81%ec%97%90%ec%84%9c-llm-%eb%8f%8c%eb%a6%b4-%eb%95%8c-ollama-llama-cpp-mlx-%ec%a4%91-%eb%ad%98-%ec%8d%a8%ec%95%bc-%ed%95%98%eb%82%98/</loc>
  <lastmod>2026-05-31T13:14:21Z</lastmod>
  <news:news>
   <news:publication>
    <news:name>bibitlabs</news:name>
    <news:language>ko</news:language>
   </news:publication>
   <news:title>맥북에서 LLM 돌릴 때 Ollama, llama.cpp, MLX 중 뭘 써야 하나</news:title>
   <news:publication_date>2026-05-31T13:14:18Z</news:publication_date>
   <news:genres>Blog</news:genres>
  </news:news>
 </url>
 <url>
  <loc>https://bibitlabs.com/apple-silicon%ec%9d%98-%ed%86%b5%ed%95%a9-%eb%a9%94%eb%aa%a8%eb%a6%ac%ea%b0%80-llm-%ec%b6%94%eb%a1%a0%ec%97%90-%ec%9c%a0%eb%a6%ac%ed%95%9c-%ec%a7%84%ec%a7%9c-%ec%9d%b4%ec%9c%a0/</loc>
  <lastmod>2026-05-31T13:13:50Z</lastmod>
  <news:news>
   <news:publication>
    <news:name>bibitlabs</news:name>
    <news:language>ko</news:language>
   </news:publication>
   <news:title>Apple Silicon의 통합 메모리가 LLM 추론에 유리한 진짜 이유</news:title>
   <news:publication_date>2026-05-31T13:13:47Z</news:publication_date>
   <news:genres>Blog</news:genres>
  </news:news>
 </url>
 <url>
  <loc>https://bibitlabs.com/m4-pro%ec%99%80-m4-max-%eb%a1%9c%ec%bb%ac-llm-%ec%b6%94%eb%a1%a0-%ec%86%8d%eb%8f%84-%ec%b0%a8%ec%9d%b4%eb%8a%94-%ec%96%b4%eb%94%94%ec%84%9c-%ec%98%a4%eb%8a%94%ea%b0%80/</loc>
  <lastmod>2026-05-31T13:13:22Z</lastmod>
  <news:news>
   <news:publication>
    <news:name>bibitlabs</news:name>
    <news:language>ko</news:language>
   </news:publication>
   <news:title>M4 Pro와 M4 Max, 로컬 LLM 추론 속도 차이는 어디서 오는가</news:title>
   <news:publication_date>2026-05-31T13:13:19Z</news:publication_date>
   <news:genres>Blog</news:genres>
  </news:news>
 </url>
 <url>
  <loc>https://bibitlabs.com/%eb%a7%a5%eb%b6%81%ec%9c%bc%eb%a1%9c-llm%ec%9d%84-%eb%8f%8c%eb%a6%b4-%eb%95%8c-gpu-%ec%bd%94%ec%96%b4%eb%b3%b4%eb%8b%a4-%eb%a9%94%eb%aa%a8%eb%a6%ac-%eb%8c%80%ec%97%ad%ed%8f%ad%ec%9d%b4-%eb%a8%bc/</loc>
  <lastmod>2026-05-31T13:12:50Z</lastmod>
  <news:news>
   <news:publication>
    <news:name>bibitlabs</news:name>
    <news:language>ko</news:language>
   </news:publication>
   <news:title>맥북으로 LLM을 돌릴 때 GPU 코어보다 메모리 대역폭이 먼저인 이유</news:title>
   <news:publication_date>2026-05-31T13:12:48Z</news:publication_date>
   <news:genres>Blog</news:genres>
  </news:news>
 </url>
 <url>
  <loc>https://bibitlabs.com/%eb%a7%a5%eb%b6%81%ec%97%90-vram%ec%9d%b4-%ec%97%86%eb%8a%94%eb%8d%b0-llm%ec%9d%b4-%eb%8f%8c%ec%95%84%ea%b0%80%eb%8a%94-%ec%9d%b4%ec%9c%a0-apple-silicon%ec%9d%98-%eb%a9%94%eb%aa%a8%eb%a6%ac/</loc>
  <lastmod>2026-05-31T13:12:15Z</lastmod>
  <news:news>
   <news:publication>
    <news:name>bibitlabs</news:name>
    <news:language>ko</news:language>
   </news:publication>
   <news:title>맥북에 VRAM이 없는데 LLM이 돌아가는 이유 — Apple Silicon의 메모리 구조</news:title>
   <news:publication_date>2026-05-31T13:12:12Z</news:publication_date>
   <news:genres>Blog</news:genres>
  </news:news>
 </url>
 <url>
  <loc>https://bibitlabs.com/anthropic-claude-opus-4-8-%ea%b3%b5%ea%b0%9c/</loc>
  <lastmod>2026-05-31T03:11:35Z</lastmod>
  <news:news>
   <news:publication>
    <news:name>bibitlabs</news:name>
    <news:language>ko</news:language>
   </news:publication>
   <news:title>Anthropic, Claude Opus 4.8 공개</news:title>
   <news:publication_date>2026-05-31T03:10:11Z</news:publication_date>
   <news:genres>Blog</news:genres>
  </news:news>
 </url>
</urlset>
