<?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/agents/2302.04761-Toolformer-LanguageModelsCanTeachThemselvestoUseTools/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/agents/2501.06252-TRANSFORMER-SQUARED-SELF-ADAPTIVELLMS/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/agents/2501.12948-DeepSeek-R1-IncentivizingReasoningCapabilityinLLMsviaReinfor/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/agents/2506.20249-LanguageModelingbyLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/agents/2511.03773-ScalingAgentLearningviaExperienceSynthesis/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/agents/2511.15593-WhatDoesItTaketoBeaGoodAIResearchAgent%3FStudyingtheRoleofIdea/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/agents/2512.02551-CUDA-L2-Surpassing-cuBLAS-Performance-for-Matrix-Multiplication-through-Reinforc/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/agents/2512.08296-Towards-a-Science-of-Scaling-Agent-Systems/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/agents/2512.10398-Confucius-Code-Agent-Scalable-Agent-Scaffolding-for-Real-World-Codebases/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/agents/2512.12967-QwenLong-L1.5-Post-Training-Recipe-for-Long-Context-Reasoning-and-Memory-Managem/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/agents/2512.13564-Memory-in-the-Age-of-AI-Agents-A-SurveyForms-Functions-and-Dynamics/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/agents/2512.15176-Draft-with-Diffusion-Verify-with-Autoregressive-Models/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/agents/2512.20848-Nemotron-3-Nano-Open-Efficient-Mixture-of-Experts-Hybrid-Mamba-Transformer-Model/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/agents/2512.20856-NVIDIA-Nemotron-3-Efficient-and-Open-Intelligence/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/agents/2512.23236-KernelEvolve-Scaling-Agentic-Kernel-Coding-for-Heterogeneous-AI-Accelerators-at-/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/agents/2512.23676-Web-World-Models/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/agents/2603.11327-Meta-Reinforcement-Learning-with-Self-Reflection-for-Agentic-Search/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/agents/2604.08516-MolmoWeb-Open-Visual-Web-Agent-and-Open-Data-for-the-Open-Web/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/alignment/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/alignment/2409.02795-TowardsaUnifiedViewofPreferenceLearningforLargeLanguageModel/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/alignment/2501.07301-TheLessonsofDevelopingProcessRewardModelsinMathematicalReaso/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/alignment/2501.12599-KIMIK1.5-SCALINGREINFORCEMENTLEARNINGWITHLLMS/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/alignment/CamelsinaChangingClimate-EnhancingLMAdaptationwithT%C3%9CLU2/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/alignment/DeepReinforcementLearningfromHumanPreferences/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/alignment/DirectPreferenceOptimization-YourLanguageModelisSecretlyaRew/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/alignment/HERMES3TECHNICALREPORT/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/alignment/INSTRUCTIONTUNINGWITHGPT-4/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/alignment/LIMA-LessIsMoreforAlignment/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/alignment/LargeReasoningModelsLearnBetterAlignmentfromFlawedThinking/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/alignment/Learningtosummarizefromhumanfeedback/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/alignment/Let%E2%80%99sVerifyStepbyStep/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/alignment/Llama2-OpenFoundationandFine-TunedChatModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/alignment/MULTIPLAYERNASHPREFERENCEOPTIMIZATION/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/alignment/OnscalableoversightwithweakLLMsjudgingstrongLLMs/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/alignment/RLHFWorkflow-FromRewardModelingtoOnlineRLHF%E2%80%93AComprehensivePr/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/alignment/ReinforcementLearningfromHumanFeedback-AshortintroductiontoR/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/alignment/ScalingInstruction-FinetunedLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/alignment/Simplesyntheticdatareducessycophancyinlargelanguagemodels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/alignment/Traininglanguagemodelstofollowinstructionswithhumanfeedback/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/alignment/TruthRL-IncentivizingTruthfulLLMsviaReinforcementLearning/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/alignment/T%C3%BClu3-PushingFrontiersinOpenLanguageModelPost-Training/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/alignment/UFT-UnifyingFine-TuningofSFTandRLHF-DPO-UNAthroughaGeneraliz/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/2506.05200-Transformers-Meet-In-Context-Learning-A-Universal-Approximation-Theory/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/2603.02188-MULTI-HEAD-LOW-RANK-ATTENTION/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/ANIMAGEISWORTH16X16WORDS-TRANSFORMERSFORIMAGERECOGNITIONATSC/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/ASurveyonDiffusionLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/AttentionIsAllYouNeed/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/AutoregressiveUniversalVideoSegmentationModel/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/Character-levelConvolutionalNetworksforTextClassification/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/DIFFERENTIALTRANSFORMER/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/DIFFUSIONTRANSFORMERSWITHREPRESENTATIONAUTOENCODERS/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/DeepResidualLearningforImageRecognition/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/DeepSeekMoE-TowardsUltimateExpertSpecializationinMixture-of-/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/EXAONE4.0-UnifiedLargeLanguageModelsIntegratingNon-reasoning/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/EfficientNet-RethinkingModelScalingforConvolutionalNeuralNet/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/EveryAttentionMatters-AnEfficientHybridArchitectureforLong-C/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/FASTANDSIMPLEX-2-SIMPLICIALATTENTIONINTRI-TON/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/FLEXOLMO-OpenLanguageModelsforFlexibleDataUse/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/Falcon-H1-AFamilyofHybrid-HeadLanguageModelsRedefiningEffici/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/FastR-CNN/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/FullyConvolutionalNetworksforSemanticSegmentation/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/GPipe-EasyScalingwithMicro-BatchPipelineParallelism/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/Gemma3TechnicalReport/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/GeneratingLongSequenceswithSparseTransformers/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/HOWPOWERFULAREGRAPHNEURALNETWORKS%3F/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/Jamba-1.5-HybridTransformer-MambaModelsatScale/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/Jamba-AHybridTransformer-MambaLanguageModel/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/KIMILINEAR-ANEXPRESSIVE%2CEFFICIENTATTENTIONARCHITECTURE/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/LM2-LargeMemoryModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/LONGNET-ScalingTransformersto1%2C000%2C000%2C000Tokens/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/Llama-Nemotron-EfficientReasoningModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/Log-LinearAttention/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/Mamba-Linear-TimeSequenceModelingwithSelectiveStateSpaces/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/Megatron-LM-TrainingMulti-BillionParameterLanguageModelsUsin/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/MixtralofExperts/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/Mixture-of-Transformers-ASparseandScalableArchitectureforMul/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/MobileLLM-OptimizingSub-billionParameterLanguageModelsforOn-/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/MolmoAct-ActionReasoningModelsthatcanReasoninSpace/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/Multi-TokenAttention/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/NVIDIANemotronNano2-AnAccurateandEfficientHybridMamba-Transf/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/NativeSparseAttention-Hardware-AlignedandNativelyTrainableSp/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/OLMoE-OpenMixture-of-ExpertsLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/OUTRAGEOUSLYLARGENEURALNETWORKS-THESPARSELY-GATEDMIXTURE-OF-/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/PaddleOCR-VL-BoostingMultilingualDocumentParsingviaa0.9BUltr/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/PyTorch-AnImperativeStyle%2CHigh-PerformanceDeepLearningLibrar/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/QWEN2TECHNICALREPORT/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/Qwen3TechnicalReport/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/RPG-AREPOSITORYPLANNINGGRAPHFORUNIFIEDANDSCALABLECODEBASEGEN/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/RecurrentGemma-MovingPastTransformersforEfficientOpenLanguag/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/ReplacingsoftmaxwithReLUinVisionTransformers/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/SCALINGLAWSMEETMODELARCHITECTURE-TOWARDINFERENCE-EFFICIENTLL/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/ScalableDiffusionModelswithTransformers/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/ScalingLatentReasoningviaLoopedLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/SequencetoSequenceLearningwithNeuralNetworks/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/TheLlama3HerdofModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/TrainingLargeLanguageModelstoReasoninaContinuousLatentSpace/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/TransformersareSSMs-GeneralizedModelsandEfficientAlgorithmsT/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/TransformerswithoutNormalization/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/VIBEVOICETechnicalReport/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/XGBoost-AScalableTreeBoostingSystem/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/YouOnlyLookOnce-Unified%2CReal-TimeObjectDetection/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/Zero-ShotText-to-ImageGeneration/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/architecture/doi-10.1038-nature14539-Deep-learning/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/code/2511.00839-CodeClash-BenchmarkingGoal-OrientedSoftwareEngineering/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/context-optimization/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/context-optimization/2408.01367-Transformers-are-Universal-In-context-Learners/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/context-optimization/2501.08313-MiniMax-01-ScalingFoundationModelswithLightningAttention/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/context-optimization/2510.27258-Higher-orderLinearAttention/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/context-optimization/AComprehensiveSurveyonLongContextLanguageModeling/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/context-optimization/AControlledStudyonLongContextExtensionandGeneralizationinLLM/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/context-optimization/ASurveyofContextEngineeringforLargeLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/context-optimization/Deepcontextualizedwordrepresentations/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/context-optimization/LLM2Vec-LargeLanguageModelsAreSecretlyPowerfulTextEncoders/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/context-optimization/LLaVA-CoT-LetVisionLanguageModelsReasonStep-by-Step/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/context-optimization/LongCodeZip-CompressLongContextforCodeLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/context-optimization/LongRoPE-ExtendingLLMContextWindowBeyond2MillionTokens/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/context-optimization/YaRN-EfficientContextWindowExtensionofLargeLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/data/2501.08365-TowardsBestPracticesforOpenDatasetsforLLMTraining/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/diffusion/2512.15745-LLaDA2.0-Scaling-Up-Diffusion-Language-Models-to-100B/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/diffusion/2604.06916-FP4-Explore-BF16-Train-Diffusion-Reinforcement-Learning-via-Efficient-Rollout-Sc/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/distributed-training/2501.18512-StreamingDiLoCowithoverlappingcommunication-TowardsaDistribu/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/2102.12452-Probing-Classifiers-Promises-Shortcomings-and-Advances/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/2402.07841-DoMembershipInferenceAttacksWorkonLargeLanguageModels%3F/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/2406.08446-OLMES-AStandardforLanguageModelEvaluations/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/2411.05403-BenchmarkingDistributionalAlignmentofLargeLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/2501.14249-Humanity%E2%80%99sLastExam/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/2501.15654-PeoplewhofrequentlyuseChatGPTforwritingtasksareaccurateandr/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/2512.14691-MMGR-Multi-Modal-Generative-Reasoning/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/ASurveyonEvaluationofLargeLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/AttentionHeadsofLargeLanguageModels-ASurvey/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/CanLLMsGenerateNovelResearchIdeas%3FALarge-ScaleHumanStudywith/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/CarlemanEstimatesandControllabilityofForwardStochasticParabo/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/ChatbotArena-AnOpenPlatformforEvaluatingLLMsbyHumanPreferenc/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/DeepSeek-R1Thoughtology-Let%E2%80%99sthinkaboutLLMreasoning/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/DocumentParsingUnveiled-Techniques%2CChallenges%2CandProspectsfo/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/EFFICIENTLLM-EFFICIENCYINLARGELANGUAGEMODELSEVALUATIONONARCH/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/EvaluatingLargeLanguageModelsTrainedonCode/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/GENERALIZATIONV.S.MEMORIZATION-TRACINGLANGUAGEMODELS%E2%80%99CAPABIL/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/GPQA-AGraduate-LevelGoogle-ProofQ%26ABenchmark/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/HOLISTICALLYEVALUATINGTHEENVIRONMENTALIMPACTOFCREATINGLANGUA/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/HolisticEvaluationofLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/HowIsChatGPT%E2%80%99sBehaviorChangingoverTime%3F/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/ImageNetLargeScaleVisualRecognitionChallenge/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/IsChain-of-ThoughtReasoningofLLMsaMirage%3FADataDistributionLe/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/JudgingLLM-as-a-JudgewithMT-BenchandChatbotArena/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/KernelBench-CanLLMsWriteEfficientGPUKernels%3F/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/LMSYS-CHAT-1M-ALARGE-SCALEREAL-WORLDLLMCONVERSATIONDATASET/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/M3DSYNTH-ADATASETOFMEDICAL3DIMAGESWITHAI-GENERATEDLOCALMANIP/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/MMLU-Pro-AMoreRobustandChallengingMulti-TaskLanguageUndersta/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/MMMU-Pro-AMoreRobustMulti-disciplineMultimodalUnderstandingB/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/MicrosoftCOCO-CommonObjectsinContext/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/NotAllLLMReasonersAreCreatedEqual/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/PaperBench-EvaluatingAI%E2%80%99sAbilitytoReplicateAIResearch/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/PremiseOrderMattersinReasoningwithLargeLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/REASONINGGYM-ReasoningEnvironmentsforReinforcementLearningwi/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/RULER-What%E2%80%99stheRealContextSizeofYourLong-ContextLanguageMode/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/RewardBench-EvaluatingRewardModelsforLanguageModeling/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/SUMOFTHEGL%283%29FOURIERCOEFFICIENTSOVERQUADRATICSANDMIXEDPOWERS/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/SWE-Perf-CanLanguageModelsOptimizeCodePerformanceonReal-Worl/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/TheAutomatedLLMSpeedrunningBenchmark-ReproducingNanoGPTImpro/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/TheLeaderboardIllusion/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/UndesirableMemorizationinLargeLanguageModels-ASurvey/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/VibeChecker-AligningCodeEvaluationwithHumanPreference/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/WhyDoMulti-AgentLLMSystemsFail%3F/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/WhyLanguageModelsHallucinate/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/evaluation/alphafold2-2021-Unable-to-Extract---No-Paper-Content-Provided/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/1911.00172-GENERALIZATIONTHROUGHMEMORIZATION-NEARESTNEIGHBORLANGUAGEMOD/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/2512.12087-BLASST-Dynamic-BLocked-Attention-Sparsity-via-Softmax-Thresholding/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/2512.23675-End-to-End-Test-Time-Training-for-Long-Context/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/2603.05451-FlashAttention-4-Algorithm-and-Kernel-Pipelining-Co-Design-for-Asymmetric-Hardwa/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/2603.12201-IndexCache-Accelerating-Sparse-Attention-via-Cross-Layer-Index-Reuse/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/2603.28342-Kernel-Smith-A-Unified-Recipe-for-Evolutionary-Kernel-Optimization/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/2604.04921-TriAttention-Efficient-Long-Reasoning-with-Trigonometric-KV-Compression/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/2604.08302-DMax-Aggressive-Parallel-Decoding-for-dLLMs/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/ASurveyofSmallLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/AUXILIARY-LOSS-FREELOADBALANCINGSTRATEGYFORMIXTURE-OF-EXPERT/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/AcceleratingLLMInferencewithStagedSpeculativeDecoding/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/Astra-AMulti-AgentSystemforGPUKernelPerformanceOptimization/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/BreaktheSequentialDependencyofLLMInferenceUsingLOOKAHEADDECO/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/Can1BLLMSurpass405BLLM%3FRethinkingCompute-OptimalTest-TimeSca/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/Chain-of-ThoughtReasoningwithoutPrompting/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/ChunkAttention-EfficientSelf-AttentionwithPrefix-AwareKVCach/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/CompactLanguageModelsviaPruningandKnowledgeDistillation/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/ContextParallelismforScalableMillion-TokenInference/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/DoesMoreInference-TimeComputeReallyHelpRobustness%3F/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/EAGLE-SpeculativeSamplingRequiresRethinkingFeatureUncertaint/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/EFFICIENTLYSCALINGTRANSFORMERINFERENCE/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/EFFICIENTSTREAMINGLANGUAGEMODELSWITHATTENTIONSINKS/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/EfficientlyScalingLLMReasoningwithCertaindex/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/FAST-DLLMV2-EfficientBlock-DiffusionLLM/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/FLEXATTENTION-APROGRAMMINGMODELFORGENERATINGOPTIMIZEDATTENTI/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/Fast-dLLM-Training-freeAccelerationofDiffusionLLMbyEnablingK/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/FlashAttention-2-FasterAttentionwithBetterParallelismandWork/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/FlashAttention-3-FastandAccurateAttentionwithAsynchronyandLo/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/FlashAttention-FastandMemory-EfficientExactAttentionwithIO-A/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/FlashFFTConv-EfficientConvolutionsforLongSequenceswithTensor/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/FlashInfer-EfficientandCustomizableAttentionEngineforLLMInfe/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/FlexGen-High-ThroughputGenerativeInferenceofLargeLanguageMod/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/GQA-TrainingGeneralizedMulti-QueryTransformerModelsfromMulti/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/Inference-TimeScalingforGeneralistRewardModeling/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/InferenceScalingforLong-ContextRetrievalAugmentedGeneration/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/InfiniteHiP-ExtendingLanguageModelContextUpto3MillionTokenso/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/LLMinaflash-EfficientLargeLanguageModelInferencewithLimitedM/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/LargeLanguageMonkeys-ScalingInferenceComputewithRepeatedSamp/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/LearningAdaptiveParallelReasoningwithLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/Locality-awareParallelDecodingforEfficientAutoregressiveImag/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/MEDUSA-SimpleLLMInferenceAccelerationFrameworkwithMultipleDe/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/MUTUALREASONINGMAKESSMALLERLLMSSTRONGERPROBLEM-SOLVERS/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/MiniMax-M1-ScalingTest-TimeComputeEfficientlywithLightningAt/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/ParallelScalingLawforLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/RECURRENTDRAFTERFORFASTSPECULATIVEDECODINGINLARGELANGUAGEMOD/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/SLA-BEYONDSPARSITYINDIFFUSIONTRANSFORMERSVIAFINE-TUNABLESPAR/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/SageAttention2-EfficientAttentionwithThoroughOutlierSmoothin/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/ScalingLLMTest-TimeComputeOptimallycanbeMoreEffectivethanSca/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/Sleep-timeCompute-BeyondInferenceScalingatTest-time/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/SpecInfer-AcceleratingLargeLanguageModelServingwithTree-base/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/Squid-LongContextasaNewModalityforEnergy-EfficientOn-DeviceL/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/StayontopicwithClassifier-FreeGuidance/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/THEPITFALLSOFKVCACHECOMPRESSION/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/TVM-AnAutomatedEnd-to-EndOptimizingCompilerforDeepLearning/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/TheEndofManualDecoding-TowardsTrulyEnd-to-EndLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/TheMambaintheLlama-DistillingandAcceleratingHybridModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/ThunderKittens-Simple%2CFast%2CandAdorableAIKernels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/TransMLA-MLAIsAllYouNeed/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/TuningLanguageModelsbyProxy/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/inference-optimization/s1-Simpletest-timescaling/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/2204.06745-GPT-NeoX-20B-AnOpen-SourceAutoregressiveLanguageModel/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/2310.16789-DETECTINGPRETRAININGDATAFROMLARGELANGUAGEMODELS/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/2407.04620-Learningto%28LearnatTestTime%29-RNNswithExpressiveHiddenStates/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/2408.11796-LLMPruningandDistillationinPractice-TheMinitronApproach/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/2501.09891-EvolvingDeeperLLMThinking/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/2507.06261-Gemini2.5-PushingtheFrontierwithAdvancedReasoning%2CMultimodal/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/2510.27656-RDMAPOINT-TO-POINTCOMMUNICATIONFORLLMSYSTEMS/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/2512.02038-DeepResearch-ASystematicSurvey/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/2512.02556-DeepSeek-V3.2-PushingtheFrontierofOpenLargeLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/2512.11251-Insight-Miner-A-Time-Series-Analysis-Dataset-for-Cross-Domain-Alignment-with-Nat/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/2512.13961-Olmo-3/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/2512.15586-Bolmo-Byteifying-the-Next-Generation-of-Language-Models/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/2512.16093-TurboDiffusion-Accelerating-Video-Diffusion-Models-by-100-200-Times/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/2512.23165-Evaluating-Parameter-Efficient-Methods-for-RLVR/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/2601.01739-K-EXAONE-Technical-ReportJourney-to-Frontier-Level-Performance-of-Foundation-Mod/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/2601.09012-TranslateGemma-Technical-Report/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/ASURVEYOFSELF-EVOLVINGAGENTS-ONPATHTOARTIFICIALSUPERINTELLIG/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/Alpa-AutomatingInter-andIntra-OperatorParallelismforDistribu/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/Caffe-ConvolutionalArchitectureforFastFeatureEmbedding/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/ChatGLM-AFamilyofLargeLanguageModelsfromGLM-130BtoGLM-4AllTo/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/DIVERSITYEMPOWERSINTELLIGENCE-INTEGRATINGEXPERTISEOFSOFTWARE/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/DeepMMSearch-R1-EmpoweringMultimodalLLMsinMultimodalWebSearc/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/Gold-medalistPerformanceinSolvingOlympiadGeometrywithAlphaGe/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/InsightsintoDeepSeek-V3-ScalingChallengesandReflectionsonHar/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/LargeLanguageModelAgent-ASurveyonMethodology%2CApplicationsand/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/MXNet-AFlexibleandEfficientMachineLearningLibraryforHeteroge/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/Memento-Fine-tuningLLMAgentswithoutFine-tuningLLMs/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/Mixture-of-AgentsEnhancesLargeLanguageModelCapabilities/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/Mooncake-AKVCache-centricDisaggregatedArchitectureforLLMServ/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/OLMOTRACE-TracingLanguageModelOutputsBacktoTrillionsofTraini/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/OLMo-AcceleratingtheScienceofLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/PyTorchFSDP-ExperiencesonScalingFullyShardedDataParallel/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/Ray-ADistributedFrameworkforEmergingAIApplications/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/Relax-ComposableAbstractionsforEnd-to-EndDynamicMachineLearn/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/SGLang-EfficientExecutionofStructuredLanguageModelPrograms/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/TensorFlow-Asystemforlarge-scalemachinelearning/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/TensorFlow-Large-ScaleMachineLearningonHeterogeneousDistribu/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/TowardsGeneralAgenticIntelligenceviaEnvironmentScaling/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/llm-systems/UniversalDeepResearch-BringYourOwnModelandStrategy/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/low-precision/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/low-precision/2208.07339-LLM.int8%28%29-8-bitMatrixMultiplicationforTransformersatScale/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/low-precision/2510.25602-INTv.s.FP-AComprehensiveStudyofFine-GrainedLow-bitQuantizati/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/low-precision/2511.02302-FP8-Flow-MoE-A-Casting-Free-FP8-Recipe-without-Double-Quantization-Error/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/low-precision/2512.10938-StrongerNormalization-FreeTransformers/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/low-precision/AWQ-Activation-AwareWeightQuantizationforOn-DeviceLLMCompres/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/low-precision/FP8-LM-TrainingFP8LargeLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/low-precision/PretrainingLargeLanguageModelswithNVFP4/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/low-precision/SageAttention3-MicroscalingFP4AttentionforInferenceandAnExpl/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/low-precision/TheEraof1-bitLLMs-AllLargeLanguageModelsarein1.58Bits/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/low-precision/%E2%80%9CGiveMeBF16orGiveMeDeath%E2%80%9D%3FAccuracy-PerformanceTrade-OffsinLL/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/moe/2512.14080-SonicMoE-Accelerating-MoE-with-IO-and-Tile-aware-Optimizations/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/moe/2512.23447-Coupling-Experts-and-Routers-in-Mixture-of-Experts-via-an-Auxiliary-Loss/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/moe/2601.05296-MoEBlaze-Breaking-the-Memory-Wall-for-Efficient-MoE-Training-on-Modern-GPUs/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/1710.10903-GRAPH-ATTENTION-NETWORKS/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/2507.13264-Voxtral/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/2510.23095-REVISITINGMULTIMODALPOSITIONALENCODINGINVISION-LANGUAGEMODE/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/2511.10647-DepthAnything3-RecoveringtheVisualSpacefromAnyViews/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/2511.21631-Qwen3-VLTechnicalReport/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/2601.04720-Qwen3-VL-Embedding-and-Qwen3-VL-Reranker-A-Unified-Framework-for-State-of-the-Ar/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/2601.10611-Molmo2Open-Weights-and-Data-for-Vision-Language-Modelswith-Video-Understanding-a/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/2603.25040-Intern-S1-Pro-Scientific-Multimodal-Foundation-Model-at-Trillion-Scale/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/ATOKEN-AUNIFIEDTOKENIZERFORVISION/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/AnEmpiricalStudyofScalingInstruction-TunedLargeMultimodalMod/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/AnIntroductiontoVision-LanguageModeling/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/Apollo-AnExplorationofVideoUnderstandinginLargeMultimodalMod/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/Buildingandbetterunderstandingvision-languagemodels-insights/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/Cube-ARobloxViewof3DIntelligence/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/Emu3-Next-TokenPredictionisAllYouNeed/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/GLM-4.5VandGLM-4.1V-Thinking-TowardsVersatileMultimodalReaso/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/Gemini-AFamilyofHighlyCapableMultimodalModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/INTERN-S1-ASCIENTIFICMULTIMODALFOUNDATIONMODEL/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/InternVL3-ExploringAdvancedTrainingandTest-TimeRecipesforOpe/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/InternVL3.5-AdvancingOpen-SourceMultimodalModelsinVersatilit/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/KIMI-VLTECHNICALREPORT/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/LLaVA-OneVision-1.5-FullyOpenFrameworkforDemocratizedMultimo/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/MMaDA-MultimodalLargeDiffusionLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/MolmoandPixMo-OpenWeightsandOpenDataforState-of-the-ArtVisio/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/NVILA-EfficientFrontierVisualLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/NVLM-OpenFrontier-ClassMultimodalLLMs/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/NextTokenPredictionTowardsMultimodalIntelligence-AComprehens/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/Phi-4-MiniTechnicalReport-CompactyetPowerfulMultimodalLangua/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/Qwen-ImageTechnicalReport/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/Qwen2-VL-EnhancingVision-LanguageModel%E2%80%99sPerceptionoftheWorld/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/Qwen2.5-OmniTechnicalReport/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/Qwen2.5-VLTechnicalReport/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/Qwen3-OmniTechnicalReport/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/SAIL-VL2TechnicalReport/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/ScalingAutoregressiveMulti-ModalModels-PretrainingandInstruc/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/SegmentAnything/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/SmolVLM-Redefiningsmallandefficientmultimodalmodels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/multimodal/Videomodelsarezero-shotlearnersandreasoners/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/2201.02177-GROKKING-GENERALIZATION-BEYOND-OVERFITTING-ON-SMALL-ALGORITHMIC-DATASETS/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/2209.11895-In-context-Learning-and-Induction-Heads/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/2306.13891-EstimatingtheCausalEffectofEarlyArXivingonPaperAcceptance/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/2409.14254-Instruction-Following-Without-Instruction-Tuning/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/2501.00958-2.5YearsinClass-AMultimodalTextbookforVision-LanguagePretrai/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/2501.05453-AnEmpiricalStudyofAutoregressivePre-trainingfromVideos/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/2501.15383-Qwen2.5-1MTechnicalReport/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/2510.22115-EveryActivationBoosted-ScalingGeneralReasonerto1TrillionOpen/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/2512.13687-Towards-Scalable-Pre-training-of-Visual-Tokenizers-for-Generation/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/2512.22955-Diversity-or-Precision-A-Deep-Dive-into-Next-Token-Prediction/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/2603.27164-daVinci-LLM-Towards-the-Science-of-Pretraining/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/2OLMo2Furious/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/BART-DenoisingSequence-to-SequencePre-trainingforNaturalLang/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/BERT-Pre-trainingofDeepBidirectionalTransformersforLanguageU/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/BLOOM-A176B-ParameterOpen-AccessMultilingualLanguageModel/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/CLIMB-CLustering-basedIterativeDataMixtureBootstrappingforLa/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/DEMOCRATIZINGOPENANDCOMPLIANTLLMSFORGLOBALLANGUAGEENVIRONMEN/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/DINOv3/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/DataComp-LM-Insearchofthenextgenerationoftrainingsetsforlang/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/DataDecide-HowtoPredictBestPretrainingDatawithSmallExperimen/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/DeepSeek-Coder-V2-BreakingtheBarrierofClosed-SourceModelsinC/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/DeepSeek-Coder-WhentheLargeLanguageModelMeetsProgramming-The/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/DeepSeekLLM-ScalingOpen-SourceLanguageModelswithLongtermism/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/DeepSeekMath-PushingtheLimitsofMathematicalReasoninginOpenLa/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/DistributedRepresentationsofWordsandPhrasesandtheirCompositi/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/Dolma-anOpenCorpusofThreeTrillionTokensforLanguageModelPretr/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/EfficientEstimationofWordRepresentationsinVectorSpace/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/EmbeddingGemma-PowerfulandLightweightTextRepresentations/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/FantasticPretrainingOptimizersandWheretoFindThem/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/GeminiEmbedding-GeneralizableEmbeddingsfromGemini/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/Gemma2-ImprovingOpenLanguageModelsataPracticalSize/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/IN-CONTEXTPRETRAINING-LANGUAGEMODELINGBEYONDDOCUMENTBOUNDARI/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/InstructionPre-Training-LanguageModelsareSupervisedMultitask/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/LargeLanguageModelsforCompilerOptimization/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/MetaCLIP2-AWorldwideScalingRecipe/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/ModelMerginginPre-trainingofLargeLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/MultilingualE5TextEmbeddings-ATechnicalReport/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/Nemotron-415BTechnicalReport/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/ONLINEARREPRESENTATIONSANDPRETRAININGDATAFREQUENCYINLANGUAGE/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/OPENDATASYNTHESISFORDEEPRESEARCH/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/OPT-OpenPre-trainedTransformerLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/OpenCoder-TheOpenCookbookforTop-TierCodeLargeLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/PaLM2TechnicalReport/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/Phi-3TechnicalReport-AHighlyCapableLanguageModelLocallyonYou/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/Phi-4TechnicalReport/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/Pre-trainingunderinfinitecompute/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/Qwen2.5-CoderTechnicalReport/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/Qwen2.5TechnicalReport/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/Qwen3Embedding-AdvancingTextEmbeddingandRerankingThroughFoun/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/RedPajama-anOpenDatasetforTrainingLargeLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/RephrasingtheWeb-ARecipeforCompute%26Data-EfficientLanguageMod/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/RoBERTa-ARobustlyOptimizedBERTPretrainingApproach/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/ScalingAgentsviaContinualPre-training/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/ScalingLawsforNeuralLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/ScalingPre-trainingtoOneHundredBillionDataforVisionLanguageM/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/ScalingSyntheticDataCreationwith1%2C000%2C000%2C000Personas/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/SigLIP2-MultilingualVision-LanguageEncoderswithImprovedSeman/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/SmolLM2-WhenSmolGoesBig%E2%80%94Data-CentricTrainingofaSmallLanguage/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/Source2Synth-SyntheticDataGenerationandCurationGroundedinRea/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/THINKINGAUGMENTEDPRE-TRAINING/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/TextbooksAreAllYouNeed/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/TextbooksAreAllYouNeedII-phi-1.5technicalreport/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/TheCommonPilev0.1-An8TBDatasetofPublicDomainandOpenlyLicense/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/TheFineWebDatasets-DecantingtheWebfortheFinestTextDataatScal/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/ToCode%2CorNotToCode%3FExploringImpactofCodeinPre-training/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/TrainingCompute-OptimalLargeLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/UnleashingthePowerofDataTsunami-AComprehensiveSurveyonDataAs/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/pretraining/olmOCR-UnlockingTrillionsofTokensinPDFswithVisionLanguageMod/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/prompting/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/prompting/Chain-of-ThoughtPromptingElicitsReasoninginLargeLanguageMode/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/prompting/LanguageModelsareFew-ShotLearners/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/prompting/LargeLanguageModelsareZero-ShotReasoners/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/prompting/LargeLanguageModelsasOptimizers/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/prompting/Meta-Prompting-EnhancingLanguageModelswithTask-AgnosticScaff/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/prompting/RethinkingtheRoleofDemonstrations-WhatMakesIn-ContextLearnin/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/prompting/ThePromptReport-ASystematicSurveyofPromptEngineeringTechniqu/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/reasoning/2511.22570-DeepSeekMath-V2-TowardsSelf-VerifiableMathematicalReasoning/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/reasoning/2512.10739-Long-horizon-Reasoning-Agent-for-Olympiad-Level-Mathematical-Problem-Solving/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/reasoning/2512.16969-Probing-Scientific-General-Intelligence-of-LLMswith-Scientist-Aligned-Workflows/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/reasoning/2512.17901-WHEN-REASONING-MEETS-ITS-LAWS/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/reasoning/2512.23988-Fantastic-Reasoning-Behaviors-and-Where-to-Find-Them-Unsupervised-Discovery-of-t/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/retrieval/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/retrieval/2603.10913-LLM2VEC-GEN-Generative-Embeddings-from-Large-Language-Models/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/retrieval/Infini-gram-ScalingUnboundedn-gramLanguageModelstoaTrillionT/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/retrieval/OntheTheoreticalLimitationsofEmbedding-BasedRetrieval/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/retrieval/ScalingRetrieval-BasedLanguageModelswithaTrillion-TokenDatas/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/2507.14843-THEINVISIBLELEASH%3FWHYRLVRMAYORMAYNOTESCAPEITSORIGIN/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/2512.01374-StabilizingReinforcementLearningwithLLMs-FormulationandPract/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/2512.16649-JustRL-Scaling-a-1.5B-LLM-with-a-Simple-RL-Recipe/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/2601.05242-GDPO-Group-reward-Decoupled-Normalization-Policy-Optimization-for-Multi-reward-R/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/2601.08521-Your-Group-Relative-Advantage-Is-Biased/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/2603.08068-In-Context-Reinforcement-Learning-for-Tool-Use-in-Large-Language-Models/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/2603.08660-How-Far-Can-Unsupervised-RLVR-Scale-LLM-Training/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/2603.14473-AI-Can-Learn-Scientific-Taste/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/2603.18815-ProRL-Agent-Rollout-as-a-Service-for-RL-Training-of-Multi-Turn-LLM-Agents/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/2603.21383-PivotRL-High-Accuracy-Agentic-Post-Training-at-Low-Compute-Cost/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/AGENTICREINFORCEDPOLICYOPTIMIZATION/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/ASurveyofReinforcementLearningforLargeReasoningModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/CUDA-L1-ImprovingCUDAOptimizationviaContrastiveReinforcement/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/CompetitiveProgrammingwithLargeReasoningModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/DAPO-AnOpen-SourceLLMReinforcementLearningSystematScale/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/DEEPSEARCH-OVERCOMETHEBOTTLENECKOFREINFORCEMENTLEARNINGWITHV/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/DoesReinforcementLearningReallyIncentivizeReasoningCapacityi/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/GLM-4.5-Agentic%2CReasoning%2CandCoding%28ARC%29FoundationModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/GroupSequencePolicyOptimization/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/Magistral/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/NEMOTRON-CROSSTHINK-ScalingSelf-LearningbeyondMathReasoning/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/Phi-4-reasoningTechnicalReport/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/ProximalPolicyOptimizationAlgorithms/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/QERL-BEYONDEFFICIENCY%E2%80%93QUANTIZATIONENHANCEDREINFORCEMENTLEARN/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/ReinforcementLearningforReasoninginLargeLanguageModelswithOn/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/ScalingRLtoLongVideos/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/Search-R1-TrainingLLMstoReasonandLeverageSearchEngineswithRe/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/SecretsofRLHFinLargeLanguageModelsPartI-PPO/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/SharingisCaring-EfficientLMPost-TrainingwithCollectiveRLExpe/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/TheArtofScalingReinforcementLearningComputeforLLMs/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/TheLandscapeofAgenticReinforcementLearningforLLMs-ASurvey/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/TrainingLanguageModelstoSelf-CorrectviaReinforcementLearning/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/TrustRegionPolicyOptimization/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/Webscale-RL-AutomatedDataPipelineforScalingRLDatatoPretraini/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/rl-training/ZEROSEARCH-IncentivizetheSearchCapabilityofLLMswithoutSearch/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/safety/2507.05578-TheLandscapeofMemorizationinLLMs-Mechanisms%2CMeasurement%2CandM/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/serving/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/serving/DistServe-DisaggregatingPrefillandDecodingforGoodput-optimiz/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/serving/EfficientMemoryManagementforLargeLanguageModelServingwithPag/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/serving/MARCONI-PREFIXCACHINGFORTHEERAOFHYBRIDLLMS/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/serving/MegaScale-Infer-ServingMixture-of-ExpertsatScalewithDisaggre/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/serving/NanoFlow-TowardsOptimalLargeLanguageModelServingThroughput/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/serving/PUNICA-MULTI-TENANTLORASERVING/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/serving/PrefillOnly-AnInferenceEngineforPrefill-onlyWorkloadsinLarge/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/serving/S-LoRA-ServingThousandsofConcurrentLoRAAdapters/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/serving/TamingThroughput-LatencyTradeoffinLLMInferencewithSarathi-Se/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/2501.17161-SFTMemorizes%2CRLGeneralizes-AComparativeStudyofFoundationMode/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/2511.10643-Black-BoxOn-PolicyDistillationofLargeLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/2601.00417-Deep-Delta-Learning/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/2603.13985-Supervised-Fine-Tuning-versus-Reinforcement-Learning-A-Study-of-Post-Training-Me/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/2604.00626-A-Survey-of-On-Policy-Distillation-for-Large-Language-Models/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/ADAM-AMETHODFORSTOCHASTICOPTIMIZATION/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/AgentLearningviaEarlyExperience/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/Better%26FasterLargeLanguageModelsviaMulti-tokenPrediction/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/BeyondDataandModelParallelismforDeepNeuralNetworks/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/BeyondHumanData-ScalingSelf-TrainingforProblem-SolvingwithLa/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/BeyondReasoningGains-MitigatingGeneralCapabilitiesForgetting/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/CriticalBatchSizeRevisited-ASimpleEmpiricalApproachtoLarge-B/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/DCP-AddressingInputDynamismInLong-ContextTrainingviaDynamicC/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/EXAONE3.5-SeriesofLargeLanguageModelsforReal-worldUseCases/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/Eagle2.5-BoostingLong-ContextPost-TrainingforFrontierVision-/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/EfficientLarge-ScaleLanguageModelTrainingonGPUClustersUsingM/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/EfficientLong-contextLanguageModelTrainingbyCoreAttentionDis/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/Hermes4TechnicalReport/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/LIMI-LessisMoreforAgency/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/LIMO-LessisMoreforReasoning/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/LigerKernel-EfficientTritonKernelsforLLMTraining/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/LoRA-Low-RankAdaptationofLargeLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/MM1.5-Methods%2CAnalysis%26InsightsfromMultimodalLLMFine-tuning/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/MergetoLearn-EfficientlyAddingSkillstoLanguageModelswithMode/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/MuonOutperformsAdaminTail-EndAssociativeMemoryLearning/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/ON-POLICYDISTILLATIONOFLANGUAGEMODELS-LEARNINGFROMSELF-GENER/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/ONTHEGENERALIZATIONOFSFT-AREINFORCEMENTLEARNINGPERSPECTIVEWI/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/Parameter-EfficientTransferLearningforNLP/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/PipeDream-FastandEfficientPipelineParallelDNNTraining/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/Pre-trainingDistillationforLargeLanguageModels-ADesignSpaceE/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/PyTorchFSDP-ExperiencesonScalingFullyShardedDataParallel/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/RAFT-AdaptingLanguageModeltoDomainSpecificRAG/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/ROBUSTFT-RobustSupervisedFine-tuningforLargeLanguageModelsun/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/ReFT-RepresentationFinetuningforLanguageModels/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/ReinforcementPre-Training/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/SelfForcing-BridgingtheTrain-TestGapinAutoregressiveVideoDif/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/TongyiDeepResearchTechnicalReport/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/ZeRO-MemoryOptimizationsTowardTrainingTrillionParameterModel/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/doi-10.48550-arxiv.1406.2661-Generative-Adversarial-Nets/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/doi-10.5555-1953048.1953056-Random-Search-for-Hyper-Parameter-Optimization/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/training-methods/doi-10.5555-3045118.3045280-Dropout-A-Simple-Way-to-Prevent-Neural-Networks-from-Overfitting/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/uncategorized/1409.4842-Goingdeeperwithconvolutions/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
    <url>
         <loc>https://summary-of-some-paper-in-cuda.readthedocs.io/vision/2302.00294-The-geometry-of-hidden-representations-of-large-transformer-models/</loc>
         <lastmod>2026-06-01</lastmod>
    </url>
</urlset>