<?xml version="1.0" encoding="UTF-8"?> <urlset xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:schemaLocation="http://www.sitemaps.org/schemas/sitemap/0.9 http://www.sitemaps.org/schemas/sitemap/0.9/sitemap.xsd" xmlns="http://www.sitemaps.org/schemas/sitemap/0.9"> <url> <loc>https://unknown-nlp.github.io/books/the_godfather/</loc> <lastmod>2025-10-22T01:22:42+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/news/announcement_1/</loc> <lastmod>2015-10-22T19:59:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/news/announcement_2/</loc> <lastmod>2015-11-07T20:11:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/news/announcement_3/</loc> <lastmod>2016-01-15T11:59:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/a-survey-for-in-context-learning/</loc> <lastmod>2023-01-12T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/kala-knowledge-augmented-language-model-adaptation/</loc> <lastmod>2023-01-19T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/task-aware-retrieval-with-instructions/</loc> <lastmod>2023-01-26T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/measuring-and-improving-semantic-diversity-of-dialogue-generation/</loc> <lastmod>2023-02-02T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/adapterhub-a-framework-for-adapting-transformers-parameter-efficient/</loc> <lastmod>2023-02-09T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/calibrating-factual-knowledge-in-pretrained-language-models/</loc> <lastmod>2023-03-16T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/gpt-understands-too/</loc> <lastmod>2023-03-30T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/adapterdrop-on-the-efficiency-of-adapters-in-transformers/</loc> <lastmod>2023-04-13T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/p-tuning-v2-prompt-tuning-can-be-comparable/</loc> <lastmod>2023-04-13T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/falsesum-generating-document-level-nli-examples-for-recognizing/</loc> <lastmod>2023-04-20T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/automatic-chain-of-thought-prompting-in-large-language/</loc> <lastmod>2023-04-27T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/measuring-association-between-labels-and-free-text-rationales/</loc> <lastmod>2023-05-11T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/rethinking-the-role-of-demonstrations-what-makes-in/</loc> <lastmod>2023-05-25T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/do-prompt-based-models-really-understand-the-meaning/</loc> <lastmod>2023-06-15T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/the-false-promise-of-imitating-proprietary-llms/</loc> <lastmod>2023-06-22T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/qlora-eficient-finetuning-of-quantized-llms/</loc> <lastmod>2023-06-29T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/code-llama-open-foundation-models-for-code/</loc> <lastmod>2023-08-29T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/a-systematic-study-of-knowledge-distillation-for-natural/</loc> <lastmod>2023-09-12T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/silo-language-models-isolating-legal-risk-in-a/</loc> <lastmod>2023-09-12T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/large-language-models-as-optimizers/</loc> <lastmod>2023-09-19T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/the-cringe-loss-learning-what-language-not-to/</loc> <lastmod>2023-09-19T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/dola-decoding-by-contrasting-layers-improves-factuality-in/</loc> <lastmod>2023-10-03T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/longlora-efficient-fine-tuning-of-long-context-large/</loc> <lastmod>2023-10-10T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/resolving-interference-when-merging-models/</loc> <lastmod>2023-10-17T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/a-survey-on-large-language-model-based-autonomous/</loc> <lastmod>2023-10-31T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/efficient-streaming-language-models-with-attention-sinks/</loc> <lastmod>2023-10-31T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/in-context-learning-learns-label-relationships-but-is/</loc> <lastmod>2023-10-31T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/label-words-are-anchors-an-information-flow-perspective/</loc> <lastmod>2023-12-12T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/break-the-sequential-dependency-of-llm-inference-using/</loc> <lastmod>2023-12-19T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/learning-to-tokenize-for-generative-retrieval/</loc> <lastmod>2023-12-19T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/are-emergent-abilities-of-large-language-models-a/</loc> <lastmod>2023-12-26T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/detecting-pretraining-data-from-large-language-models/</loc> <lastmod>2024-01-02T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/vllm-easy-fast-and-cheap-llm-serving-with/</loc> <lastmod>2024-01-03T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/making-large-language-models-a-better-foundation-for/</loc> <lastmod>2024-01-09T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/benchmarking-cognitive-biases-in-large-language-models-as/</loc> <lastmod>2024-01-16T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/mistral-7b-mixtral-mixtral-of-experts/</loc> <lastmod>2024-01-16T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/in-context-pretraining-language-modeling-beyond-document-boundaries/</loc> <lastmod>2024-01-23T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/overthinking-the-truth-understanding-how-language-models-process/</loc> <lastmod>2024-01-23T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/lion-adversarial-distillation-of-proprietary-large-language-models/</loc> <lastmod>2024-01-30T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/self-rewarding-language-models/</loc> <lastmod>2024-02-06T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/can-sensitive-information-be-deleted-from-llms-objectives/</loc> <lastmod>2024-02-13T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/llm-augmented-llms-expanding-capabilities-through-composition/</loc> <lastmod>2024-02-13T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/knowledge-card-filling-llms-knowledge-gaps-with-plug/</loc> <lastmod>2024-02-20T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/wikichat-stopping-the-hallucination-of-large-language-model/</loc> <lastmod>2024-02-20T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/self-rag-learning-to-retrieve-generate-and-critique/</loc> <lastmod>2024-02-27T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/beyond-memorization-violating-privacy-via-inferencing-with-llms/</loc> <lastmod>2024-03-05T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/bitnet-scaling-1-bit-transformers-for-large-language/</loc> <lastmod>2024-03-11T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/a-simple-and-effective-pruning-approach-for-large/</loc> <lastmod>2024-03-12T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/unveiling-the-generalization-power-of-fine-tuned-large/</loc> <lastmod>2024-03-19T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/search-in-the-chain-interactively-enhancing-large-language/</loc> <lastmod>2024-03-26T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/preference-free-alignment-learning-with-regularized-relevance-reward/</loc> <lastmod>2024-04-02T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/scaling-laws-for-data-filtering-data-curation-cannot/</loc> <lastmod>2024-04-13T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/understanding-emergent-abilities-of-language-models-from-the/</loc> <lastmod>2024-04-16T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/exploring-concept-depth-how-large-language-models-acquire/</loc> <lastmod>2024-04-23T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/orpo-monolithic-preference-optimization-without-reference-model/</loc> <lastmod>2024-04-23T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/many-shot-in-context-learning/</loc> <lastmod>2024-04-30T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/training-diffusion-modelse-with-reinforcement-learning/</loc> <lastmod>2024-04-30T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/how-to-inference-big-llm-using/</loc> <lastmod>2024-05-07T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/how-to-train-llm-from-data/</loc> <lastmod>2024-05-07T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/llama-pro-progressive-llama-with-block-expansion/</loc> <lastmod>2024-05-21T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/understanding-the-performance-gap-between-online-and-offline/</loc> <lastmod>2024-05-27T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/simpo-simple-preference-optimization-with-a-reference-free/</loc> <lastmod>2024-05-28T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/stacking-your-transformers-a-closer-look-at-model/</loc> <lastmod>2024-06-04T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/contextual-position-encoding-learning-to-count-whats-important/</loc> <lastmod>2024-06-11T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/does-fine-tuning-llms-on-new-knowledge-encourage/</loc> <lastmod>2024-06-11T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/scaling-monosemanticity-extracting-interpretable-features-from-claude-3/</loc> <lastmod>2024-06-11T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/llama3-tokenizer/</loc> <lastmod>2024-07-02T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/rl-jack-reinforcement-learning-powered-black-box-jailbreaking/</loc> <lastmod>2024-07-02T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/llava-visual-instruction-tuning/</loc> <lastmod>2024-07-22T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/pyspark-how-to-preprocess-large-scale/</loc> <lastmod>2024-07-23T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/step-dpo-step-wise-preference-optimization-for-long/</loc> <lastmod>2024-07-23T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/training-large-language-models-for-reasoning-through-reverse/</loc> <lastmod>2024-07-23T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/in-context-retrieval-augmented-language-models/</loc> <lastmod>2024-07-30T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/knowledge-conflict-survey/</loc> <lastmod>2024-08-13T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/physics-of-language-models-part-21-grade-school/</loc> <lastmod>2024-08-13T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/knowledge-augmented-reasoning-distillation-for-small-language-models/</loc> <lastmod>2024-08-20T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/llm2vec-large-language-models-are-secretly-powerful-text/</loc> <lastmod>2024-09-02T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/many-shot-jailbreaking/</loc> <lastmod>2024-09-02T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/jailbreak-in-pieces-compositional-adversarial-attacks-on-multi/</loc> <lastmod>2024-09-09T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/smaller-weaker-yet-better-training-llm-reasoners-via/</loc> <lastmod>2024-09-09T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/super-evaluating-agents-on-setting-up-and-executing/</loc> <lastmod>2024-09-23T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/training-language-models-to-self-correct-via-reinforcement/</loc> <lastmod>2024-09-23T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/qcrd-quality-guided-contrastive-rationale-distillation-for-large/</loc> <lastmod>2024-10-03T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/faitheval-can-your-language-model-stay-faithful-to/</loc> <lastmod>2024-10-10T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/knowledge-entropy-decay-during-language-model-pretraining-hinders/</loc> <lastmod>2024-10-17T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/rule-based-rewards-for-language-model-safety/</loc> <lastmod>2024-10-17T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/d1-scaling-reasoning-in-diffusion-large-language-models/</loc> <lastmod>2025-01-02T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/deepseek-r1/</loc> <lastmod>2025-01-02T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/diffusion-language-model-mathematical-foundations-inference-optimization/</loc> <lastmod>2025-01-02T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/inferring-from-logits-exploring-best-practices-for-decoding/</loc> <lastmod>2025-01-02T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/tracevla-visual-trace-prompting-enhances-spatial-temporal-awareness/</loc> <lastmod>2025-01-02T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/openvla-an-open-source-vision-language-action-model/</loc> <lastmod>2025-01-14T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/agent-laboratory-using-llm-agents-as-research-assistants/</loc> <lastmod>2025-01-21T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/ssm-hippo-lssl-s4-mamba-mamba2/</loc> <lastmod>2025-02-04T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/titans-learning-to-memorize-at-test-time/</loc> <lastmod>2025-02-04T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/deepseek-v3/</loc> <lastmod>2025-02-18T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/contextual-document-embeddings/</loc> <lastmod>2025-03-04T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/logic-rl-unleashing-llm-reasoning-with-rule-based/</loc> <lastmod>2025-03-04T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/swe-rl-advancing-llm-reasoning-via-reinforcement-learning/</loc> <lastmod>2025-03-04T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/cognitive-behaviors-that-enable-self-improving-reasoners-or/</loc> <lastmod>2025-03-11T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/when-is-task-vector-provably-effective-for-model/</loc> <lastmod>2025-03-11T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/reft-reasoning-with-reinforced-fine-tuning/</loc> <lastmod>2025-03-25T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/on-the-biology-of-a-large-language-model/</loc> <lastmod>2025-04-08T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/reasoning-models-dont-always-say-what-they-think/</loc> <lastmod>2025-04-08T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/model-context-protocol-mcp-provided-by-antrophic/</loc> <lastmod>2025-04-15T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/universal-and-transferable-adversarial-attacks-on-aligned-language/</loc> <lastmod>2025-04-15T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/fine-tuning-vision-language-action-models-optimizing-speed/</loc> <lastmod>2025-04-22T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/reinforcement-learning-finetunes-small-subnetworks-in-large-language/</loc> <lastmod>2025-06-03T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/textgrad-automatic-differentiation-via-text/</loc> <lastmod>2025-06-03T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/dra-grpo-exploring-diversity-aware-reward-adjustment-for/</loc> <lastmod>2025-06-10T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/towards-a-generalizable-bimanual-foundation-policy-via-flow/</loc> <lastmod>2025-06-10T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/diffusion-of-thought-chain-of-thought-reasoning-in/</loc> <lastmod>2025-06-17T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/see-what-you-are-told-visual-attention-sink/</loc> <lastmod>2025-06-24T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/between-underthinking-and-overthinking-an-empirical-study-of/</loc> <lastmod>2025-07-01T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/reasoning-models-can-be-effective-without-thinking/</loc> <lastmod>2025-07-01T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/reasoning-model-is-stubborn-diagnosing-instruction-overriding-in/</loc> <lastmod>2025-07-15T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/scaling-reasoning-losing-control-evaluating-instruction-following-in/</loc> <lastmod>2025-07-15T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/search-r1-training-llms-to-reason-and-leverage/</loc> <lastmod>2025-07-15T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/block-diffusion-interpolating-between-autoregressive-and-diffusion-language/</loc> <lastmod>2025-08-05T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/impact-of-fine-tuning-methods-on-memorization-in/</loc> <lastmod>2025-08-05T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/on-the-expressiveness-of-softmax-attention-a-recurrent/</loc> <lastmod>2025-08-12T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/the-accuracy-paradox-in-rlhf-when-better-reward/</loc> <lastmod>2025-08-12T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/what-makes-a-reward-model-a-good-teacher/</loc> <lastmod>2025-08-12T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/on-the-generalization-of-sft-a-reinforcement-learning/</loc> <lastmod>2025-08-19T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/spurious-rewards-rethinking-training-signals-in-rlvr/</loc> <lastmod>2025-08-19T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/simpo-simple-preference-optimization-with-a-reference-free/</loc> <lastmod>2025-10-17T00:00:00+00:00</lastmod> </url> <url> <loc>https://unknown-nlp.github.io/</loc> </url> <url> <loc>https://unknown-nlp.github.io/books/</loc> </url> <url> <loc>https://unknown-nlp.github.io/_pages/dropdown/</loc> </url> <url> <loc>https://unknown-nlp.github.io/news/</loc> </url> <url> <loc>https://unknown-nlp.github.io/people/</loc> </url> <url> <loc>https://unknown-nlp.github.io/publications/</loc> </url> <url> <loc>https://unknown-nlp.github.io/repositories/</loc> </url> <url> <loc>https://unknown-nlp.github.io/teaching/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/2023/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/2024/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/2025/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/fine-tuning/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/gpt/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/icl/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/language-model/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/llm/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/paper-review/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/reasoning/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/survey/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/transformer/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/bert/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/embedding/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/generative/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/knowledge/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/ner/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/pre-training/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/qa/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/vision/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/instruction-tuning/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/neural/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/nlp/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/retrieval/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/rlhf/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/dialogue/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/evaluation-metric/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/adapter/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/lm/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/attention/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/calibrating/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/prompt-tuning/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/classification/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/parameter-efficiency/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/data-augmentation/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/detection/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/text-summarization/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/sllm/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/efficient-training/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/alignment/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/knowledge-distillation/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/domain-adaptation/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/factual-consistency/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/task-vectors/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/autonomous-agents/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/in-context-learning/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/decoding/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/library/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/reinforcement-learning/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/editing/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/natural-language-generation/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/inference/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/quantization/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/pruning/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/generalization/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/reinforcement-learning/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/diffusion/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/rl/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/pre-training/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/torch/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/continual-learning/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/interpretability/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/multimodal/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/tokenizer/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/safety/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/vlm/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/machine-learning/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/spark/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/explainability/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/embeddings/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/limited-budget/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/code-generation/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/agi/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/diffusionlm/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/sft/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/robotics/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/moe/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/text-generation/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/efficient-transformer/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/reward-model/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/tag/rlvr/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/category/paper-reviews/</loc> </url> <url> <loc>https://unknown-nlp.github.io/books/2025/</loc> </url> <url> <loc>https://unknown-nlp.github.io/books/tag/top-100/</loc> </url> <url> <loc>https://unknown-nlp.github.io/books/category/classics/</loc> </url> <url> <loc>https://unknown-nlp.github.io/books/category/crime/</loc> </url> <url> <loc>https://unknown-nlp.github.io/books/category/historical-fiction/</loc> </url> <url> <loc>https://unknown-nlp.github.io/books/category/mystery/</loc> </url> <url> <loc>https://unknown-nlp.github.io/books/category/novels/</loc> </url> <url> <loc>https://unknown-nlp.github.io/books/category/thriller/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/page/2/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/page/3/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/page/4/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/page/5/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/page/6/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/page/7/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/page/8/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/page/9/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/page/10/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/page/11/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/page/12/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/page/13/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/page/14/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/page/15/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/page/16/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/page/17/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/page/18/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/page/19/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/page/20/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/page/21/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/page/22/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/page/23/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/page/24/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/page/25/</loc> </url> <url> <loc>https://unknown-nlp.github.io/blog/page/26/</loc> </url> </urlset>