<?xml version="1.0" encoding="UTF-8"?>
<!-- Sitemap for https://papers.chlience.com/ in the sitemaps.org 0.9 format. -->
<!-- The news, xhtml, image and video prefixes are declared on the root, but no element in this file uses them. -->
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9"
        xmlns:news="http://www.google.com/schemas/sitemap-news/0.9"
        xmlns:xhtml="http://www.w3.org/1999/xhtml"
        xmlns:image="http://www.google.com/schemas/sitemap-image/1.1"
        xmlns:video="http://www.google.com/schemas/sitemap-video/1.1">

  <!-- Site root and listing pages -->
  <url>
    <loc>https://papers.chlience.com/</loc>
  </url>
  <url>
    <loc>https://papers.chlience.com/archive/</loc>
  </url>
  <url>
    <loc>https://papers.chlience.com/papers/</loc>
  </url>

  <!-- Individual pages under /papers/ -->
  <url>
    <loc>https://papers.chlience.com/papers/2025-09-10-defeating-nondeterminism-llm-inference/</loc>
  </url>
  <url>
    <loc>https://papers.chlience.com/papers/2409.19256-hybridflow-rlhf-framework/</loc>
  </url>
  <url>
    <loc>https://papers.chlience.com/papers/2501.12948-deepseek-r1-rl-reasoning/</loc>
  </url>
  <url>
    <loc>https://papers.chlience.com/papers/2503.14476-dapo-long-cot-rl-system/</loc>
  </url>
  <url>
    <loc>https://papers.chlience.com/papers/2510.19315-transformers-inherently-succinct/</loc>
  </url>
  <url>
    <loc>https://papers.chlience.com/papers/2605.14220-training-inference-mismatch-llm-rl/</loc>
  </url>
  <url>
    <loc>https://papers.chlience.com/papers/2605.30290-self-trained-verification/</loc>
  </url>
  <url>
    <loc>https://papers.chlience.com/papers/2605.31514-age-of-empires-anthropomorphism/</loc>
  </url>
  <url>
    <loc>https://papers.chlience.com/papers/2606.00135-agentic-tool-calling-rl-training/</loc>
  </url>
  <url>
    <loc>https://papers.chlience.com/papers/2606.04075-llms-hack-rewards-and-society/</loc>
  </url>
  <url>
    <loc>https://papers.chlience.com/papers/2606.04101-ultraep-rack-scale-moe-load-balancing/</loc>
  </url>
  <url>
    <loc>https://papers.chlience.com/papers/2606.04662-muon-outperforms-adam-curvature/</loc>
  </url>
  <url>
    <loc>https://papers.chlience.com/papers/2606.06453-vortex-sparse-attention-serving/</loc>
  </url>

  <!-- Other top-level pages -->
  <url>
    <loc>https://papers.chlience.com/template/</loc>
  </url>
  <url>
    <loc>https://papers.chlience.com/workflow/</loc>
  </url>
</urlset>