<?xml version="1.0" encoding="utf-8" standalone="yes"?>
<!--
  Sitemap for https://jnk234.github.io/ (sitemaps.org 0.9 protocol).
  Each <url> holds the page's canonical <loc> and, where known, its <lastmod>.
  Entries appear newest-first by <lastmod>; entries without <lastmod> come last.

  NOTE(review): several /posts/ slugs start with "cdata" and sit next to an
  otherwise identical slug without that prefix. This looks like CDATA markup
  leaking into imported post titles; confirm whether those pages should exist
  before removing them here. The "second-opinaion" project slug also looks
  like a typo, but it is kept because the URL may already be published.
-->
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9"
        xmlns:xhtml="http://www.w3.org/1999/xhtml">
  <url>
    <loc>https://jnk234.github.io/posts/sycophancy-recovery-simpo/</loc>
    <lastmod>2026-04-01T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/</loc>
    <lastmod>2026-04-01T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/</loc>
    <lastmod>2026-04-01T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/sycophancy-recovery-dpo/</loc>
    <lastmod>2026-03-29T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/deepseek-mhc-hyper-connections/</loc>
    <lastmod>2026-01-23T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/understanding-rmsnorm-my-notes-on-faster-layer-normalization/</loc>
    <lastmod>2026-01-03T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/projects/</loc>
    <lastmod>2025-12-20T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/projects/quibo-mcp-server-for-agentic-blogging/</loc>
    <lastmod>2025-12-20T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/projects/mcp-multiverse/</loc>
    <lastmod>2025-12-18T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/projects/vouchai-agent-to-agent-insurance-protocol/</loc>
    <lastmod>2025-11-15T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/projects/self-evolving-agent/</loc>
    <lastmod>2025-11-04T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/the-deadly-triad-in-reinforcement-learning-why-agents-fail-and-how-dqn-fixed-it/</loc>
    <lastmod>2025-09-22T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/projects/reinforcement-learning-algorithms/</loc>
    <lastmod>2025-09-21T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/a-deep-dive-into-q-learning-the-off-policy-td-control-algorithm/</loc>
    <lastmod>2025-09-19T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/a-deep-dive-into-on-policy-td-control-the-sarsa-algorithm/</loc>
    <lastmod>2025-09-18T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/temporal-difference-bootstrapping-in-reinforcement-learning/</loc>
    <lastmod>2025-09-17T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/monte-carlo-learning-in-rl/</loc>
    <lastmod>2025-09-15T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/model-free-rl-prediction-control-and-the-mrp-mdp-duality/</loc>
    <lastmod>2025-09-14T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/my-three-months-at-relativity-building-ai-for-legal-tech/</loc>
    <lastmod>2025-09-07T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/projects/nlp-interpretability-mechanistic-analysis-of-llms/</loc>
    <lastmod>2025-09-01T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/reinforcement-learning-essentials-mdps-optimal-control/</loc>
    <lastmod>2025-08-09T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/beyond-supervised-learning-unlocking-ais-potential-with-reinforcement-learning/</loc>
    <lastmod>2025-07-14T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/projects/lear-llm-driven-evolution-of-agent-based-rules/</loc>
    <lastmod>2025-07-01T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/projects/netlogo-llm-extension/</loc>
    <lastmod>2025-06-19T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/projects/air-insights-legal-document-intelligence/</loc>
    <lastmod>2025-06-01T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/projects/qd-lear-quality-diversity-in-llm-evolved-agents/</loc>
    <lastmod>2025-05-01T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/projects/medhastra-ai-medical-education-platform/</loc>
    <lastmod>2025-03-22T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/projects/faceswap-diffusion-model/</loc>
    <lastmod>2025-03-20T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/projects/advocate-ai-powered-ad-generator/</loc>
    <lastmod>2025-03-12T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/projects/second-opinaion-medical-diagnosis-system/</loc>
    <lastmod>2025-03-12T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/projects/agentic-blogging-assistant/</loc>
    <lastmod>2025-02-18T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/implementing-gpt-style-attention-a-step-by-step-guide-with-pytorch/</loc>
    <lastmod>2025-01-21T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/the-ultimate-guide-to-preparing-text-data-for-language-modeling-with-pytorch/</loc>
    <lastmod>2025-01-06T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/cdatapytorch-in-practice-essential-building-blocks-for-modern-deep-learning/</loc>
    <lastmod>2025-01-02T00:00:00+00:00</lastmod>
  </url>
  <!-- This URL was previously listed twice (lastmod 2025-01-02 and 2024-12-30);
       the two entries are merged here, keeping the most recent date. -->
  <url>
    <loc>https://jnk234.github.io/posts/pytorch-in-practice-essential-building-blocks-for-modern-deep-learning/</loc>
    <lastmod>2025-01-02T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/value-based-policy-training-in-reinforcement-learning/</loc>
    <lastmod>2024-09-30T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/understanding-reinforcement-learning-policy-based-and-value-based-approaches/</loc>
    <lastmod>2024-09-02T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/fast-and-efficient-finetuning-of-llms-qlora/</loc>
    <lastmod>2024-08-19T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/from-decisions-to-rewards-understanding-the-rl-decision-making-process/</loc>
    <lastmod>2024-08-14T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/reinforcement-learning-essentials-a-quick-guide/</loc>
    <lastmod>2024-08-12T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/learn-act-adapt-unveiling-reinforcement-learning/</loc>
    <lastmod>2024-08-05T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/from-perplexity-to-rouge-essential-metrics-for-evaluating-llms-easy-to-understand/</loc>
    <lastmod>2024-04-08T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/can-less-be-more-exploring-peft-for-llms/</loc>
    <lastmod>2024-03-27T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/decoding-the-art-understanding-text-generation-with-transformers-ii/</loc>
    <lastmod>2024-03-26T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/decoding-the-art-understanding-text-generation-with-transformers-i/</loc>
    <lastmod>2024-03-25T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/unlock-the-power-of-generative-ai-mastering-personalized-model-development/</loc>
    <lastmod>2024-01-22T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/projects/neuraforge-newsletter/</loc>
    <lastmod>2023-08-01T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/projects/technical-publications-automation/</loc>
    <lastmod>2022-07-01T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/cdataheres-how-you-should-train-an-intelligent-classifier-model../</loc>
    <lastmod>2021-12-02T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/heres-how-you-should-train-an-intelligent-classifier-model../</loc>
    <lastmod>2021-12-02T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/cdatawhy-multi-label-classification-should-be-used-instead-of-conventional-classifiers./</loc>
    <lastmod>2021-11-29T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/why-multi-label-classification-should-be-used-instead-of-conventional-classifiers./</loc>
    <lastmod>2021-11-29T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/cdataapproaching-data-centric-ai-using-fast.ai/</loc>
    <lastmod>2021-11-06T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/approaching-data-centric-ai-using-fast.ai/</loc>
    <lastmod>2021-11-06T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/cdatagetting-started-with-100-days-of-deep-learning/</loc>
    <lastmod>2021-10-20T00:00:00+00:00</lastmod>
  </url>
  <url>
    <loc>https://jnk234.github.io/posts/getting-started-with-100-days-of-deep-learning/</loc>
    <lastmod>2021-10-20T00:00:00+00:00</lastmod>
  </url>
  <!-- The remaining entries carry no <lastmod> in the source data. -->
  <url>
    <loc>https://jnk234.github.io/cv/</loc>
  </url>
  <url>
    <loc>https://jnk234.github.io/publications/</loc>
  </url>
</urlset>