<?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.sitemaps.org/schemas/sitemap/0.9 http://www.sitemaps.org/schemas/sitemap/0.9/sitemap.xsd" xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">
<url>
<loc>https://bearbearyu1223.github.io/posts/food-qna-on-server-llm/</loc>
<lastmod>2023-07-31T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://bearbearyu1223.github.io/posts/food-qna-on-device-llm/</loc>
<lastmod>2023-08-14T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://bearbearyu1223.github.io/posts/conversation-sim/</loc>
<lastmod>2023-09-07T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://bearbearyu1223.github.io/posts/assistant-api-playground/</loc>
<lastmod>2023-11-21T00:00:00-08:00</lastmod>
</url>
<url>
<loc>https://bearbearyu1223.github.io/posts/PEFT-summarization/</loc>
<lastmod>2024-01-01T00:00:00-08:00</lastmod>
</url>
<url>
<loc>https://bearbearyu1223.github.io/posts/cs336-note-get-started/</loc>
<lastmod>2025-07-20T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://bearbearyu1223.github.io/posts/cs336-note-simple-bpe/</loc>
<lastmod>2025-07-22T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://bearbearyu1223.github.io/posts/cs336-note-train-bpe-tinystories/</loc>
<lastmod>2025-07-26T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://bearbearyu1223.github.io/posts/cs336-gpt2-regex-for-pretokenization-explaind/</loc>
<lastmod>2025-08-10T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://bearbearyu1223.github.io/posts/cs336-build-a-transformer-language-model/</loc>
<lastmod>2025-09-13T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://bearbearyu1223.github.io/posts/cs336-transformer-architecture-overview/</loc>
<lastmod>2025-09-17T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://bearbearyu1223.github.io/posts/cs336-understand-computation-cost-of-transformer-model/</loc>
<lastmod>2025-09-28T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://bearbearyu1223.github.io/posts/cs336-training-a-transformer-lm-part-1/</loc>
<lastmod>2025-10-05T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://bearbearyu1223.github.io/posts/cs336-implement-softmax-log_softmax-cross_entropy/</loc>
<lastmod>2025-10-19T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://bearbearyu1223.github.io/posts/cs336-building-a-complete-training-loop/</loc>
<lastmod>2025-11-02T00:00:00-07:00</lastmod>
</url>
<url>
<loc>https://bearbearyu1223.github.io/posts/cs336-the-complete-experiment-for-tinystories-transformer/</loc>
<lastmod>2025-11-16T00:00:00-08:00</lastmod>
</url>
<url>
<loc>https://bearbearyu1223.github.io/posts/cs336-local-to-cloud-training/</loc>
<lastmod>2026-01-11T00:00:00-08:00</lastmod>
</url>
<url>
<loc>https://bearbearyu1223.github.io/posts/cs336-sft-qwen3-for-math-reasoning/</loc>
<lastmod>2026-01-19T00:00:00-08:00</lastmod>
</url>
<url>
<loc>https://bearbearyu1223.github.io/posts/cs336-reinforcement-learning-for-language-model/</loc>
<lastmod>2026-01-25T00:00:00-08:00</lastmod>
</url>
<url>
<loc>https://bearbearyu1223.github.io/posts/grpo-math-reasoning-lambda-cloud/</loc>
<lastmod>2026-02-08T00:00:00-08:00</lastmod>
</url>
<url>
<loc>https://bearbearyu1223.github.io/posts/mcp-claude-skills-social-media-agent/</loc>
<lastmod>2026-03-28T01:00:00-07:00</lastmod>
</url>
<url>
<loc>https://bearbearyu1223.github.io/categories/</loc>
<lastmod>2026-03-28T20:06:45-07:00</lastmod>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/</loc>
<lastmod>2026-03-28T20:06:45-07:00</lastmod>
</url>
<url>
<loc>https://bearbearyu1223.github.io/archives/</loc>
<lastmod>2026-03-28T20:06:45-07:00</lastmod>
</url>
<url>
<loc>https://bearbearyu1223.github.io/about/</loc>
<lastmod>2026-03-28T20:06:45-07:00</lastmod>
</url>
<url>
<loc>https://bearbearyu1223.github.io/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/rag/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/chatbot/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/openai/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/embeddings/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/vector-database/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/langchain/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/streamlit/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/llama2/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/on-device/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/faiss/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/quantization/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/apple-silicon/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/llm-agents/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/conversation-simulation/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/multi-agent/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/assistant-api/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/text-to-speech/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/image-generation/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/peft/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/qlora/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/lora/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/fine-tuning/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/falcon-7b/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/summarization/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/llm-evaluation/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/cs336/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/setup/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/development-environment/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/python/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/uv/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/bpe/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/tokenization/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/unicode/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/utf-8/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/byte-pair-encoding/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/tinystories/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/compression/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/pretokenization/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/regex/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/gpt-2/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/multilingual/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/transformer/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/attention/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/pytorch/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/language-model/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/swiglu/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/rope/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/encoder-decoder/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/gpt/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/bert/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/t5/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/llama/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/architecture/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/flops/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/computation/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/scaling-laws/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/optimization/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/cross-entropy/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/perplexity/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/adamw/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/optimizer/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/memory/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/training/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/softmax/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/numerical-stability/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/training-loop/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/learning-rate/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/checkpointing/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/data-loading/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/end-to-end/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/text-generation/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/sft/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/cloud-training/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/colab/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/lambda-labs/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/cuda/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/qwen/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/math-reasoning/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/reinforcement-learning/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/policy-gradient/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/rlhf/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/grpo/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/ppo/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/lambda-cloud/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/h100/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/mcp/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/claude/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/xiaohongshu/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/content-creator/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/agent/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/claude-skills/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/tags/claude-code/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/categories/genai-projects/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/categories/rag/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/categories/on-device-llm/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/categories/multi-agent/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/categories/assistants/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/categories/fine-tuning/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/categories/cs336/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/categories/getting-started/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/categories/tokenization/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/categories/transformers/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/categories/training/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/categories/infrastructure/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/categories/reinforcement-learning/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/categories/mcp/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/categories/agent/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/page2/</loc>
</url>
<url>
<loc>https://bearbearyu1223.github.io/page3/</loc>
</url>
</urlset>
