<?xml version="1.0" encoding="UTF-8"?>
<!-- generator="wordpress.com" -->
<urlset xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns="http://www.sitemaps.org/schemas/sitemap/0.9" xmlns:image="http://www.google.com/schemas/sitemap-image/1.1" xsi:schemaLocation="http://www.sitemaps.org/schemas/sitemap/0.9 http://www.sitemaps.org/schemas/sitemap/0.9/sitemap.xsd"><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/uncertainty-under-distribution-shift/</loc><lastmod>2026-03-14T06:50:35+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/uncertainty-drift/</loc><lastmod>2026-03-14T06:48:25+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/evaluation-governance/</loc><lastmod>2026-03-14T06:46:18+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/emergent-abilities/</loc><lastmod>2026-03-14T06:44:06+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/scaling-vs-robustness/</loc><lastmod>2026-03-14T06:42:18+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/scaling-vs-generalization/</loc><lastmod>2026-03-14T06:40:36+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/scaling-laws/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/scaling-laws-in-machine-learning-neural-networks-lexicon.png</image:loc><image:title>Scaling laws in machine learning - Neural Networks Lexicon</image:title><image:caption>Scaling laws in machine learning - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-14T06:37:39+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/robustness-vs-generalization/</loc><lastmod>2026-03-13T18:16:59+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/stress-testing-vs-benchmarking/</loc><lastmod>2026-03-13T18:16:25+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/interpretability-vs-performance/</loc><lastmod>2026-03-13T18:15:43+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/masked-language-modeling/</loc><lastmod>2026-03-13T17:16:17+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/efficiency-governance/</loc><lastmod>2026-03-13T16:58:10+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/budget-constrained-inference/</loc><lastmod>2026-03-13T16:57:09+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/graceful-degradation/</loc><lastmod>2026-03-13T16:55:22+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/sla-aware-inference-policies/</loc><lastmod>2026-03-13T16:54:11+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/evaluation-metrics/</loc><lastmod>2026-03-13T16:45:22+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/confusion-matrix/</loc><lastmod>2026-03-13T16:44:28+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/precision/</loc><lastmod>2026-03-13T16:42:50+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/recall/</loc><lastmod>2026-03-13T16:40:57+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/self-supervised-learning/</loc><lastmod>2026-03-13T15:24:36+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/capability-alignment-gap/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/capabilitye28093alignment-gap-neural-networks-lexicon-1.png</image:loc><image:title>Capability–Alignment Gap - Neural Networks Lexicon</image:title><image:caption>Capability–Alignment Gap - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-13T15:01:26+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/alignment-drift/</loc><lastmod>2026-03-13T10:51:14+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generative-models/</loc><lastmod>2026-03-13T10:42:51+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/throughput-vs-latency/</loc><lastmod>2026-03-13T09:12:53+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/self-paced-learning/</loc><lastmod>2026-03-13T09:11:59+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/optimization-stability/</loc><lastmod>2026-03-13T09:10:57+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/variational-autoencoders/</loc><lastmod>2026-03-13T09:01:32+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/autoencoders/</loc><lastmod>2026-03-13T08:38:58+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/learning-rate-scaling/</loc><lastmod>2026-03-13T08:23:48+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/weight-initialization/</loc><lastmod>2026-03-13T08:21:03+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/representation-collapse/</loc><lastmod>2026-03-13T07:47:55+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/curriculum-learning/</loc><lastmod>2026-03-13T07:35:13+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/curriculum-schedules/</loc><lastmod>2026-03-13T07:29:16+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/representation-learning/</loc><lastmod>2026-03-12T19:53:16+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/latent-representations/</loc><lastmod>2026-03-12T19:22:17+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/mixup-and-cutmix/</loc><lastmod>2026-03-12T15:17:15+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/exploration-vs-exploitation/</loc><lastmod>2026-03-12T14:16:50+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/open-set-vs-closed-set-recognition/</loc><lastmod>2026-03-12T14:14:32+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/missing-data/</loc><lastmod>2026-03-12T14:10:51+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/label-noise/</loc><lastmod>2026-03-12T14:08:59+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/label-latency/</loc><lastmod>2026-03-12T14:03:56+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/prompt-conditioning/</loc><lastmod>2026-03-12T14:01:50+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/label-distribution/</loc><lastmod>2026-03-12T13:25:51+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/independent-and-identically-distributed-iid/</loc><lastmod>2026-03-12T13:02:32+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/imputation/</loc><lastmod>2026-03-12T12:57:19+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/importance-sampling/</loc><lastmod>2026-03-12T12:54:36+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/holdout-sets/</loc><lastmod>2026-03-12T12:44:37+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/learning-rate-warmup/</loc><lastmod>2026-03-12T12:37:05+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/warmup-schedules/</loc><lastmod>2026-03-12T12:36:00+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/multi-metric-optimization/</loc><lastmod>2026-03-12T10:14:23+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/goodharts-law/</loc><lastmod>2026-03-12T10:10:43+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/instruction-tuning/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/instruction-tuning-neural-networks-lexicon.png</image:loc><image:title>Instruction Tuning - Neural Networks Lexicon</image:title><image:caption>Instruction Tuning - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-12T10:06:49+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/goodharts-law-ml-context/</loc><lastmod>2026-03-12T09:22:38+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/static-vs-rolling-retraining/</loc><lastmod>2026-03-12T09:19:46+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/model-update-policies/</loc><lastmod>2026-03-12T09:11:31+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/causal-evaluation/</loc><lastmod>2026-03-12T09:02:51+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/online-vs-offline-evaluation/</loc><lastmod>2026-03-12T08:59:29+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/offline-metrics-vs-business-metrics/</loc><lastmod>2026-03-12T08:56:05+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/benchmark-performance-vs-real-world-performance/</loc><lastmod>2026-03-12T08:55:39+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/outcome-horizon/</loc><lastmod>2026-03-12T08:52:18+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/delayed-feedback-loops/</loc><lastmod>2026-03-12T08:47:18+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/long-term-outcome-auditing/</loc><lastmod>2026-03-12T08:25:25+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/metric-gaming/</loc><lastmod>2026-03-12T08:02:50+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/proxy-metrics/</loc><lastmod>2026-03-12T07:57:49+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/reward-hacking/</loc><lastmod>2026-03-12T07:49:39+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/gradient-clipping/</loc><lastmod>2026-03-11T19:06:06+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/hard-example-mining/</loc><lastmod>2026-03-11T19:05:48+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/gradient-variance/</loc><lastmod>2026-03-11T19:04:00+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/circular-padding/</loc><lastmod>2026-03-11T17:31:56+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/dilated-convolutions/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/dilated-convolutions-neural-networks-lexicon.png</image:loc><image:title>Dilated Convolutions - Neural Networks Lexicon</image:title><image:caption>Dilated Convolutions - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-11T17:31:13+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/convolution-operation/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/convolution-operation-neural-networks-lexicon.png</image:loc><image:title>Convolution Operation - Neural Networks Lexicon</image:title><image:caption>Convolution Operation - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-11T17:28:03+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/attention-mechanism/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/attention-mechanism-neural-networks-lexicon.png</image:loc><image:title>Attention Mechanism - Neural Networks Lexicon</image:title><image:caption>Attention Mechanism - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-11T17:19:25+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/multi-head-attention/</loc><lastmod>2026-03-11T15:43:16+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/scaled-dot-product-attention/</loc><lastmod>2026-03-11T15:41:35+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/feature-lineage/</loc><lastmod>2026-03-11T12:13:39+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/feature-versioning/</loc><lastmod>2026-03-11T12:10:28+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/feature-stores/</loc><lastmod>2026-03-11T12:09:45+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/feature-availability/</loc><lastmod>2026-03-11T12:07:19+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/expanding-window-sampling/</loc><lastmod>2026-03-11T12:04:24+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/event-time-sampling/</loc><lastmod>2026-03-11T12:02:09+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/dataset-shift/</loc><lastmod>2026-03-11T10:59:48+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/dataset-bias/</loc><lastmod>2026-03-11T10:58:03+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/layer-normalization-deep-dive/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/layer-normalization-deep-dive-neural-networks-lexicon.png</image:loc><image:title>Layer Normalization (deep dive) - Neural Networks Lexicon</image:title><image:caption>Layer Normalization (deep dive) - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-11T09:40:56+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/inductive-bias/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/inductive-bias-neural-networks-lexicon.png</image:loc><image:title>Inductive Bias - Neural Networks Lexicon</image:title><image:caption>Inductive Bias - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-11T09:36:41+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/in-context-learning/</loc><lastmod>2026-03-11T09:35:22+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/hidden-layers/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/hidden-layers-neural-networks-lexicon.png</image:loc><image:title>Hidden layers - Neural Networks Lexicon</image:title><image:caption>Hidden layers - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-11T09:04:17+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/hessian-spectrum/</loc><lastmod>2026-03-11T09:03:34+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/end-to-end-learning/</loc><lastmod>2026-03-11T08:54:21+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/halting-functions/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/halting-functions-neural-networks-lexicon.png</image:loc><image:title>Halting Functions - Neural Networks Lexicon</image:title><image:caption>Halting Functions - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-11T08:32:10+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/gating-mechanisms/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/gating-mechanisms-neural-networks-lexicon.png</image:loc><image:title>Gating Mechanisms - Neural Networks Lexicon</image:title><image:caption>Gating Mechanisms - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-11T08:21:04+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/gated-recurrent-unit-gru/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/gated-recurrent-unit-gru-neural-networks-lexicon.png</image:loc><image:title>Gated Recurrent Unit (GRU) - Neural Networks Lexicon</image:title><image:caption>Gated Recurrent Unit (GRU) - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-11T08:18:11+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/exploding-gradients/</loc><lastmod>2026-03-11T08:17:12+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/feedforward-networks-in-transformers/</loc><lastmod>2026-03-11T08:14:07+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/feedforward-networks/</loc><lastmod>2026-03-11T08:11:37+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/feature-reuse/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/feature-reuse-neural-networks-lexicon.png</image:loc><image:title>Feature Reuse - Neural Networks Lexicon</image:title><image:caption>Feature Reuse - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-11T07:33:23+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/feature-maps/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/feature-maps-neural-networks-lexicon.png</image:loc><image:title>Feature Maps - Neural Networks Lexicon</image:title><image:caption>Feature Maps - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-11T07:30:55+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/feature-learning/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/feature-learning-neural-networks-lexicon.png</image:loc><image:title>Feature Learning - Neural Networks Lexicon</image:title><image:caption>Feature Learning - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-11T07:26:42+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/expert-collapse/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/expert-collapse-neural-networks-lexicon.png</image:loc><image:title>Expert Collapse - Neural Networks Lexicon</image:title><image:caption>Expert Collapse - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-11T07:00:20+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/expert-routing/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/expert-routing-neural-networks-lexicon.png</image:loc><image:title>Expert Routing - Neural Networks Lexicon</image:title><image:caption>Expert Routing - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-11T06:55:44+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/activation-functions/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/activation-functions-neural-network-lexicon.png</image:loc><image:title>Activation Functions - Neural Network Lexicon</image:title><image:caption>Activation Functions - Neural Network Lexicon</image:caption></image:image><lastmod>2026-03-10T14:24:03+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/causal-masking/</loc><lastmod>2026-03-10T12:39:04+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/decoder-only-transformers/</loc><lastmod>2026-03-10T12:38:07+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/adaptive-computation-depth/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/adaptive-computation-depth-neural-networks-lexicon.png</image:loc><image:title>Adaptive Computation Depth - Neural Networks Lexicon</image:title><image:caption>Adaptive Computation Depth - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-10T11:56:15+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/</loc><lastmod>2026-03-10T11:44:38+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/generalization/</loc><lastmod>2026-03-10T11:44:21+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/calibration-drift/</loc><lastmod>2026-03-10T11:30:50+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/</loc><lastmod>2026-03-10T11:24:02+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/transformer-scaling-laws/</loc><lastmod>2026-03-10T10:09:09+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/residual-connections-conceptual/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/understanding-residual-connections-in-neural-networks-neural-networks-lexicon.png</image:loc><image:title>Understanding residual connections in neural networks - Neural Networks Lexicon</image:title><image:caption>Understanding residual connections in neural networks - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-10T09:18:36+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/accuracy-latency-trade-offs/</loc><lastmod>2026-03-09T16:17:53+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/soft-vs-hard-halting/</loc><lastmod>2026-03-09T16:16:34+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/attention-vs-convolution/</loc><lastmod>2026-03-09T16:15:22+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/pretraining-vs-fine-tuning/</loc><lastmod>2026-03-09T16:14:14+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/parameter-efficient-fine-tuning-peft/</loc><lastmod>2026-03-09T14:38:57+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/cross-attention/</loc><lastmod>2026-03-09T13:52:08+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/exposure-bias-deep-dive/</loc><lastmod>2026-03-09T12:52:10+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/encoder-only-vs-decoder-only-transformers/</loc><lastmod>2026-03-09T12:44:33+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/decoder-only-vs-encoder-decoder-trade-offs/</loc><lastmod>2026-03-09T10:39:53+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/chain-of-thought-prompting/</loc><lastmod>2026-03-09T08:29:05+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/autoregressive-models/</loc><lastmod>2026-03-08T17:58:33+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/scheduled-sampling-deep-dive/</loc><lastmod>2026-03-08T17:36:25+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/sequence-to-sequence-models-seq2seq/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/sequence-to-sequence-models-seq2seq-neural-networks-lexicon.png</image:loc><image:title>Sequence-to-Sequence Models (Seq2Seq) - Neural Networks Lexicon</image:title><image:caption>Sequence-to-Sequence Models (Seq2Seq) - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-08T17:33:38+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/early-exit-networks/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/early-exit-networks-neural-networks-lexicon.png</image:loc><image:title>Early Exit Networks - Neural Networks Lexicon</image:title><image:caption>Early Exit Networks - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-08T15:00:38+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/model-architecture/</loc><lastmod>2026-03-08T13:55:27+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/attention-mechanism-foundational/</loc><lastmod>2026-03-08T13:41:14+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/self-attention/</loc><lastmod>2026-03-08T13:20:44+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/residual-networks-resnet/</loc><lastmod>2026-03-07T20:11:35+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/skip-connections-general/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/skip-connections-general-neural-networks-lexicon.png</image:loc><image:title>Skip Connections (General) - Neural Networks Lexicon</image:title><image:caption>Skip Connections (General) - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-07T20:09:13+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/highway-networks/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/highway-networks-neural-networks-lexicon.png</image:loc><image:title>Highway Networks - Neural Networks Lexicon</image:title><image:caption>Highway Networks - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-07T20:08:41+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/normalization-layers/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/normalization-layers-neural-networks-lexicon.png</image:loc><image:title>Normalization Layers - Neural Networks Lexicon</image:title><image:caption>Normalization Layers - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-07T20:04:40+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/rms-normalization/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/rms-normalization-neural-networks-lexicon.png</image:loc><image:title>RMS Normalization - Neural Networks Lexicon</image:title><image:caption>RMS Normalization - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-07T20:03:40+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/teacher-forcing/</loc><lastmod>2026-03-07T14:48:48+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/compute-aware-evaluation/</loc><lastmod>2026-03-07T14:47:06+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/compute-data-trade-offs/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/computee28093data-trade-offs-neural-networks-lexicon.png</image:loc><image:title>Compute–Data Trade-offs - Neural Networks Lexicon</image:title><image:caption>Compute–Data Trade-offs - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-07T14:44:58+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/compute-aware-loss-functions/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/compute-aware-loss-functions-neural-networks-lexicon.png</image:loc><image:title>Compute-Aware Loss Functions - Neural Networks Lexicon</image:title><image:caption>Compute-Aware Loss Functions - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-07T14:44:29+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/mixture-of-experts/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/mixture-of-experts-neural-networks-lexicon.png</image:loc><image:title>Mixture of Experts - Neural Networks Lexicon</image:title><image:caption>Mixture of Experts - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-07T14:41:58+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/routing-entropy/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/routing-entropy-neural-networks-lexicon.png</image:loc><image:title>Routing Entropy - Neural Networks Lexicon</image:title><image:caption>Routing Entropy - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-07T14:40:39+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/load-balancing-in-moe/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/load-balancing-in-moe-neural-networks-lexicon.png</image:loc><image:title>Load Balancing in MoE - Neural Networks Lexicon</image:title><image:caption>Load Balancing in MoE - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-07T14:38:53+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/</loc><lastmod>2026-03-07T13:34:13+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/threshold-selection/</loc><lastmod>2026-03-07T13:21:22+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/receptive-fields/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/03/understanding-receptive-fields-in-neural-networks-neural-networks-lexicon.png</image:loc><image:title>Understanding receptive fields in neural networks - Neural Networks Lexicon</image:title><image:caption>Understanding receptive fields in neural networks - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-07T10:09:26+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/long-short-term-memory-lstm/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/long-short-term-memory-lstm-neural-networks-lexicon.png</image:loc><image:title>Long Short-Term Memory (LSTM) - Neural Networks Lexicon</image:title><image:caption>Long Short-Term Memory (LSTM) - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-07T10:05:48+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/recurrent-neural-network-rnn/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/03/recurrent-neural-network-infographic-neural-networks-lexicon.png</image:loc><image:title>Recurrent neural network infographic - Neural Networks Lexicon</image:title><image:caption>Recurrent neural network infographic - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-07T10:04:38+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/convolutional-neural-network-cnn/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/convolutional-neural-network-cnn-neural-networks-lexicon.png</image:loc><image:title>Convolutional Neural Network (CNN) - Neural Networks Lexicon</image:title><image:caption>Convolutional Neural Network (CNN) - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-07T10:01:48+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/causal-feature-engineering/</loc><lastmod>2026-03-07T08:20:44+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/training-serving-skew/</loc><lastmod>2026-03-07T08:17:17+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/training-drift-vs-evaluation-drift/</loc><lastmod>2026-03-06T17:48:43+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/data-drift-vs-concept-drift/</loc><lastmod>2026-03-06T17:47:07+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/covariate-shift-vs-label-shift/</loc><lastmod>2026-03-06T17:46:08+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/processing-time-leakage/</loc><lastmod>2026-03-06T15:59:06+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/temporal-feature-leakage/</loc><lastmod>2026-03-06T15:57:46+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/walk-forward-validation/</loc><lastmod>2026-03-06T15:55:21+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/bidirectional-rnns/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/bidirectional-rnns-neural-networks-lexicon.png</image:loc><image:title>Bidirectional RNNs - Neural Networks Lexicon</image:title><image:caption>Bidirectional RNNs - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-06T10:31:49+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/backpropagation-through-time-bptt/</loc><lastmod>2026-03-06T10:31:12+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/institutional-oversight-models/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/institutional-oversight-models-neural-networks-lexicon.png</image:loc><image:title>Institutional Oversight Models - Neural Networks Lexicon</image:title><image:caption>Institutional Oversight Models - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-06T10:28:41+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/robustness-benchmarks-vs-accuracy-benchmarks/</loc><lastmod>2026-03-06T10:26:36+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/in-distribution-vs-out-of-distribution/</loc><lastmod>2026-03-06T10:25:19+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/leaderboard-overfitting/</loc><lastmod>2026-03-06T10:23:50+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/resampling-techniques/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/03/resampling-techniques-for-class-imbalance-neural-network-lexicon.png</image:loc><image:title>Resampling techniques for class imbalance - Neural Network Lexicon</image:title><image:caption>Resampling techniques for class imbalance - Neural Network Lexicon</image:caption></image:image><lastmod>2026-03-06T09:03:28+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/encoder-decoder-models/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/03/encoder-decoder-models-infographic-neural-networks-lexicon.png</image:loc><image:title>Encoder-decoder models infographic - Neural Networks Lexicon</image:title><image:caption>Encoder-decoder models infographic - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-06T06:50:33+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/accuracy-vs-loss/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/03/accuracy-vs-loss-explained-visually-neural-networks-lexicon.png</image:loc><image:title>Accuracy vs Loss explained visually - Neural Networks Lexicon</image:title><image:caption>Accuracy vs Loss explained visually - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-06T06:47:54+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/underfitting/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/03/understanding-underfitting-in-machine-learning-neural-network-lexicon.png</image:loc><image:title>Understanding underfitting in machine learning - Neural Network Lexicon</image:title><image:caption>Understanding underfitting in machine learning - Neural Network Lexicon</image:caption></image:image><lastmod>2026-03-06T06:44:38+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/robustness-adversarial-threats/adversarial-attacks-overview/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/03/adversarial-attacks-in-machine-learning-overview-neural-network-lexicon.png</image:loc><image:title>Adversarial attacks in machine learning overview - Neural Network Lexicon</image:title><image:caption>Adversarial attacks in machine learning overview - Neural Network Lexicon</image:caption></image:image><lastmod>2026-03-06T06:42:23+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/robustness-adversarial-threats/adversarial-training/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/03/adversarial-training-for-robust-ai-models-neural-network-lexicon.png</image:loc><image:title>Adversarial training for robust AI models - Neural Network Lexicon</image:title><image:caption>Adversarial training for robust AI models - Neural Network Lexicon</image:caption></image:image><lastmod>2026-03-06T06:40:38+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/direct-preference-optimization-dpo/</loc><lastmod>2026-03-05T18:54:48+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/deceptive-alignment/</loc><lastmod>2026-03-05T18:50:17+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/corrigibility/</loc><lastmod>2026-03-05T18:48:13+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/constitutional-ai/</loc><lastmod>2026-03-05T18:47:21+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/instrumental-convergence/</loc><lastmod>2026-03-05T18:29:04+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/capability-governance/</loc><lastmod>2026-03-05T18:13:29+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/capability-control/</loc><lastmod>2026-03-05T18:12:49+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/alignment-tax/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/alignment-tax-neural-networks-lexicon.png</image:loc><image:title>Alignment Tax - Neural Networks Lexicon</image:title><image:caption>Alignment Tax - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-05T18:11:52+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/alignment-fragility/</loc><lastmod>2026-03-05T18:10:46+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/alignment-failures-case-studies-framework/</loc><lastmod>2026-03-05T18:10:18+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/oversight-scalability-limits/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/oversight-scalability-limits-neural-networks-lexicon.png</image:loc><image:title>Oversight Scalability Limits - Neural Networks Lexicon</image:title><image:caption>Oversight Scalability Limits - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-05T18:09:11+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/alignment-failure-cascades/</loc><lastmod>2026-03-05T18:08:31+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/safety-critical-deployment/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/safety-critical-deployment-neural-networks-lexicon.png</image:loc><image:title>Safety-Critical Deployment - Neural Networks Lexicon</image:title><image:caption>Safety-Critical Deployment - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-05T16:16:28+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/value-extrapolation/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/value-extrapolation-neural-networks-lexicon.png</image:loc><image:title>Value Extrapolation - Neural Networks Lexicon</image:title><image:caption>Value Extrapolation - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-05T16:15:46+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/superalignment/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/superalignment-neural-networks-lexicon.png</image:loc><image:title>Superalignment - Neural Networks Lexicon</image:title><image:caption>Superalignment - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-05T16:15:13+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/robustness-adversarial-threats/black-box-attacks/</loc><lastmod>2026-03-05T10:16:28+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/alignment-debt/</loc><lastmod>2026-03-05T08:49:00+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/alignment-capability-scaling/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/alignment-capability-scaling-neural-networks-lexicon.png</image:loc><image:title>Alignment Capability Scaling - Neural Networks Lexicon</image:title><image:caption>Alignment Capability Scaling - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-05T08:47:25+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/vanishing-gradients/</loc><lastmod>2026-03-05T07:50:00+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/transformer-architecture/</loc><lastmod>2026-03-05T07:46:00+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/positional-encoding/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/03/understanding-positional-encoding-in-transformers-neural-networks-lexicon.png</image:loc><image:title>Understanding positional encoding in transformers - Neural Networks Lexicon</image:title><image:caption>Understanding positional encoding in transformers - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-05T07:34:33+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/state-space-models/</loc><lastmod>2026-03-04T19:37:18+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/state-space-models-vs-rnns/</loc><lastmod>2026-03-04T17:59:09+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/deep-signal-propagation-theory/</loc><lastmod>2026-03-04T17:34:52+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/rlhf-vs-dpo/</loc><lastmod>2026-03-04T10:31:56+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/reward-model-overfitting/</loc><lastmod>2026-03-04T09:30:55+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/reward-model-collapse/</loc><lastmod>2026-03-04T09:19:28+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/reward-uncertainty-estimation/</loc><lastmod>2026-03-04T08:54:58+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/continuous-time-vs-discrete-time-optimization/</loc><lastmod>2026-03-03T17:55:53+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/stochastic-gradient-flow/</loc><lastmod>2026-03-03T17:48:08+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/entropy-sgd/</loc><lastmod>2026-03-03T17:44:30+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/loss-landscape-curvature/</loc><lastmod>2026-03-03T17:41:10+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/fisher-information-matrix-fim/</loc><lastmod>2026-03-03T17:36:46+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/natural-gradient-descent-deep-dive/</loc><lastmod>2026-03-03T17:32:16+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/trust-region-methods/</loc><lastmod>2026-03-03T17:28:40+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/proximal-policy-optimization-deep-dive/</loc><lastmod>2026-03-03T16:25:51+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/kl-penalty-in-rlhf/</loc><lastmod>2026-03-03T16:20:54+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/gradient-flow-vs-gradient-descent/</loc><lastmod>2026-03-03T12:07:10+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/ntk-regime-vs-finite-width-regime/</loc><lastmod>2026-03-03T11:44:57+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/compute-optimal-vs-data-optimal-scaling/</loc><lastmod>2026-03-03T11:04:26+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/calibration-vs-raw-accuracy/</loc><lastmod>2026-03-03T10:43:51+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/cosine-decay-vs-step-decay/</loc><lastmod>2026-03-03T10:34:36+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/safety-vs-capability/</loc><lastmod>2026-03-02T18:10:13+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/overparameterization-vs-underparameterization/</loc><lastmod>2026-03-02T18:04:37+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/rag-vs-larger-context-windows/</loc><lastmod>2026-03-02T16:53:32+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/large-batch-vs-small-batch-training/</loc><lastmod>2026-03-02T16:47:13+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/offline-vs-online-rlhf/</loc><lastmod>2026-03-02T16:07:49+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/feature-learning-vs-lazy-training/</loc><lastmod>2026-03-02T09:45:53+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/double-descent/</loc><lastmod>2026-03-02T09:09:40+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/sharp-vs-flat-minima/</loc><lastmod>2026-03-01T19:22:17+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/concept-drift/</loc><lastmod>2026-03-01T19:17:10+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/class-imbalance/</loc><lastmod>2026-03-01T19:16:31+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/blocked-sampling/</loc><lastmod>2026-03-01T19:16:02+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/active-sampling/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/active-sampling-strategies-in-machine-learning-neural-networks-lexicon.png</image:loc><image:title>Active sampling strategies in machine learning - Neural Networks Lexicon</image:title><image:caption>Active sampling strategies in machine learning - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-01T19:15:17+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/dropout-vs-weight-decay/</loc><lastmod>2026-03-01T16:13:23+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/l1-vs-l2-regularization/</loc><lastmod>2026-03-01T15:00:50+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/03/ai-alignment-and-governance-infographic-neural-networks-lexicon.png</image:loc><image:title>AI alignment and governance infographic - Neural Networks Lexicon</image:title><image:caption>AI alignment and governance infographic - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-01T14:56:59+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/momentum-vs-nesterov-momentum/</loc><lastmod>2026-03-01T14:36:28+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/adam-vs-adamw/</loc><lastmod>2026-03-01T14:22:15+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/embeddings/</loc><lastmod>2026-03-01T14:16:31+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/sgd-vs-adam-comparison/</loc><lastmod>2026-03-01T13:31:48+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/worst-case-vs-average-case-risk/</loc><lastmod>2026-03-01T13:15:19+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/adversarial-robustness-vs-natural-robustness/</loc><lastmod>2026-03-01T12:06:17+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/emergence-vs-smooth-scaling/</loc><lastmod>2026-03-01T11:12:32+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/bayesian-optimization/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/03/bayesian-optimization-neural-networks-lexicon.png</image:loc><image:title>Bayesian Optimization - Neural Networks Lexicon</image:title><image:caption>Bayesian Optimization - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-01T07:48:19+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/batch-size/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/03/understanding-batch-size-neural-networks-lexicon.png</image:loc><image:title>Understanding Batch Size - Neural Networks Lexicon</image:title><image:caption>Understanding Batch Size - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-01T07:45:30+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/backpropagation/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/03/backpropagation-neural-networks-lexicon.png</image:loc><image:title>Backpropagation - Neural Networks Lexicon</image:title><image:caption>Backpropagation - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-03-01T07:41:53+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/active-learning/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/active-learning-infographic-for-model-improvement-neural-networks-lexicon.png</image:loc><image:title>Active learning infographic for model improvement - Neural Networks Lexicon</image:title><image:caption>Active learning infographic for model improvement - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-28T17:13:21+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/stride-and-padding/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/stride-and-padding-neural-networks-lexicon.png</image:loc><image:title>Stride and Padding - Neural Networks Lexicon</image:title><image:caption>Stride and Padding - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-28T17:04:10+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/multi-objective-rewards/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/multi-objective-rewards-for-rl-agents-neural-networks-lexicon.png</image:loc><image:title>Multi-objective rewards for RL agents - Neural Networks Lexicon</image:title><image:caption>Multi-objective rewards for RL agents - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-28T16:24:29+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/robust-reward-design/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/robust-reward-design-neural-networks-lexicon.png</image:loc><image:title>Robust Reward Design - Neural Networks Lexicon</image:title><image:caption>Robust Reward Design - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-28T14:43:42+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/reward-modeling/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/reward-modeling-neural-networks-lexicon.png</image:loc><image:title>Reward Modeling - Neural Networks Lexicon</image:title><image:caption>Reward Modeling - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-28T14:41:51+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/value-learning/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/value-learning-neural-networks-lexicon.png</image:loc><image:title>Value Learning - Neural Networks Lexicon</image:title><image:caption>Value Learning - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-28T14:37:26+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/__trashed/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/model-capacity-neural-networks-lexicon.png</image:loc><image:title>Model capacity - Neural Networks Lexicon</image:title><image:caption>Model capacity - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-28T13:22:26+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/output-layers/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/types-of-output-layers-in-neural-networks-neural-networks-lexicon.png</image:loc><image:title>Types of output layers in neural networks - Neural Networks Lexicon</image:title><image:caption>Types of output layers in neural networks - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-28T13:19:45+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/residual-connections/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/residual-connections-neural-networks-lexicon.png</image:loc><image:title>Residual Connections - Neural Networks Lexicon</image:title><image:caption>Residual Connections - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-28T08:12:27+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/gradient-flow/</loc><lastmod>2026-02-28T07:04:43+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/goal-misgeneralization/</loc><lastmod>2026-02-27T20:26:47+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/ai-incident-reporting-frameworks/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/ai-incident-reporting-frameworks-neural-networks-lexicon-1.png</image:loc><image:title>AI Incident Reporting Frameworks - Neural Networks Lexicon</image:title><image:caption>AI Incident Reporting Frameworks - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-26T17:59:23+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/red-teaming-in-ai/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/red-teaming-in-ai-neural-networks-lexicon.png</image:loc><image:title>Red Teaming in AI - Neural Networks Lexicon</image:title><image:caption>Red Teaming in AI - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-26T17:58:16+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/norm-free-transformers/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/norm-free-transformers-neural-networks-lexicon.png</image:loc><image:title>Norm-Free Transformers - Neural Networks Lexicon</image:title><image:caption>Norm-Free Transformers - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-26T17:44:32+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/scalenorm/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/scalenorm-neural-networks-lexicon.png</image:loc><image:title>ScaleNorm - Neural Networks Lexicon</image:title><image:caption>ScaleNorm - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-25T16:51:02+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/neurons/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/neurons-neural-networks-lexicon.png</image:loc><image:title>Neurons - Neural Networks Lexicon</image:title><image:caption>Neurons - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-25T16:41:58+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/dense-connections-densenet/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/dense-connections-densenet-neural-networks-lexicon.png</image:loc><image:title>Dense Connections (DenseNet) - Neural Networks Lexicon</image:title><image:caption>Dense Connections (DenseNet) - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-24T16:37:38+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/conditional-computation/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/conditional-computation-neural-networks-lexicon.png</image:loc><image:title>Conditional Computation - Neural Networks Lexicon</image:title><image:caption>Conditional Computation - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-23T18:43:59+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/batch-normalization-deep-dive/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/batch-normalization-deep-dive-neural-networks-lexicon.png</image:loc><image:title>Batch Normalization (deep dive) - Neural Networks Lexicon</image:title><image:caption>Batch Normalization (deep dive) - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-23T16:55:15+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/architecture-scaling-laws/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/architecture-scaling-laws-neural-networks-lexicon.png</image:loc><image:title>Architecture Scaling Laws - Neural Networks Lexicon</image:title><image:caption>Architecture Scaling Laws - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-23T16:46:41+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/strategic-awareness-in-ai/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/strategic-awareness-in-ai-neural-networks-lexicon.png</image:loc><image:title>Strategic Awareness in AI - Neural Networks Lexicon</image:title><image:caption>Strategic Awareness in AI - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-23T15:36:04+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/scalable-oversight/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/scalable-oversight-neural-networks-lexicon.png</image:loc><image:title>Scalable Oversight - Neural Networks Lexicon</image:title><image:caption>Scalable Oversight - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-23T15:33:43+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/objective-robustness/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/objective-robustness-neural-networks-lexicon.png</image:loc><image:title>Objective Robustness - Neural Networks Lexicon</image:title><image:caption>Objective Robustness - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-23T15:26:51+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/reinforcement-learning-from-human-feedback-rlhf/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/reinforcement-learning-from-human-feedback-rlhf-neural-networks-lexicon.png</image:loc><image:title>Reinforcement Learning from Human Feedback (RLHF) - Neural Networks Lexicon</image:title><image:caption>Reinforcement Learning from Human Feedback (RLHF) - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-23T15:24:35+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/model-risk-management-mrm-in-ai/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/model-risk-management-mrm-in-ai-neural-networks-lexicon.png</image:loc><image:title>Model Risk Management (MRM) in AI - Neural Networks Lexicon</image:title><image:caption>Model Risk Management (MRM) in AI - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-23T15:22:12+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/recursive-self-improvement-risks/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/recursive-self-improvement-risks-neural-networks-lexicon.png</image:loc><image:title>Recursive Self-Improvement Risks - Neural Networks Lexicon</image:title><image:caption>Recursive Self-Improvement Risks - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-23T14:36:19+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/policy-based-routing/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/policy-based-routing-neural-networks-lexicon.png</image:loc><image:title>Policy-Based Routing - Neural Networks Lexicon</image:title><image:caption>Policy-Based Routing - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-23T14:33:59+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/institutional-alignment-drift/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/institutional-alignment-drift-neural-networks-lexicon.png</image:loc><image:title>Institutional Alignment Drift - Neural Networks Lexicon</image:title><image:caption>Institutional Alignment Drift - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-23T14:31:41+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/human-ai-co-governance/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/human-ai-co-governance-neural-networks-lexicon.png</image:loc><image:title>Human-AI Co-Governance - Neural Networks Lexicon</image:title><image:caption>Human-AI Co-Governance - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-23T14:29:14+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/governance-lag/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/governance-lag-neural-networks-lexicon.png</image:loc><image:title>Governance Lag - Neural Networks Lexicon</image:title><image:caption>Governance Lag - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-22T19:14:45+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/model-autonomy-levels/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/model-autonomy-levels-neural-networks-lexicon.png</image:loc><image:title>Model Autonomy Levels - Neural Networks Lexicon</image:title><image:caption>Model Autonomy Levels - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-22T19:12:41+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/mechanistic-interpretability/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/mechanistic-interpretability-neural-network-lexicon.png</image:loc><image:title>Mechanistic Interpretability - Neural Network Lexicon</image:title><image:caption>Mechanistic Interpretability - Neural Network Lexicon</image:caption></image:image><lastmod>2026-02-22T19:06:41+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/long-term-monitoring-systems/</loc><lastmod>2026-02-22T19:00:10+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/interpretability-tools/</loc><image:image><image:loc>https://neuralnetworklexicon.com/wp-content/uploads/2026/02/interpretability-tools-neural-networks-lexicon.png</image:loc><image:title>Interpretability Tools - Neural Networks Lexicon</image:title><image:caption>Interpretability Tools - Neural Networks Lexicon</image:caption></image:image><lastmod>2026-02-22T18:46:30+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/evaluation-governance/</loc><lastmod>2026-02-22T17:05:32+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/alignment-in-llms/</loc><lastmod>2026-02-22T16:24:57+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/alignment-and-governance/ai-safety-evaluation/</loc><lastmod>2026-02-22T14:23:04+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/calibration-vs-accuracy/</loc><lastmod>2026-02-22T14:12:35+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/outcome-aware-evaluation/</loc><lastmod>2026-02-22T14:10:04+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/feedback-loops/</loc><lastmod>2026-02-22T13:29:32+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/metric-drift/</loc><lastmod>2026-02-22T11:13:29+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/strategic-compliance-vs-alignment-2/</loc><lastmod>2026-02-22T09:29:00+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/stress-testing-models/</loc><lastmod>2026-02-22T07:02:31+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/decision-cost-functions/</loc><lastmod>2026-02-21T18:08:55+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/reward-design/</loc><lastmod>2026-02-20T19:26:59+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/depth-vs-width-in-neural-networks/</loc><lastmod>2026-02-19T13:48:46+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/state-space-models-vs-transformers/</loc><lastmod>2026-02-19T13:21:23+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/rnn-vs-transformer/</loc><lastmod>2026-02-19T12:13:09+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/gru-vs-lstm/</loc><lastmod>2026-02-19T11:14:37+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/dilated-convolutions-vs-stride/</loc><lastmod>2026-02-19T10:52:38+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/reflect-vs-zero-padding/</loc><lastmod>2026-02-19T10:32:38+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/same-vs-valid-padding/</loc><lastmod>2026-02-19T10:05:36+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/structured-vs-unstructured-pruning/</loc><lastmod>2026-02-19T09:48:00+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/outer-vs-inner-alignment-advanced-framing/</loc><lastmod>2026-02-19T09:27:03+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/pre-norm-vs-post-norm-residual-blocks/</loc><lastmod>2026-02-19T08:55:39+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/skip-connections-vs-residual-connections/</loc><lastmod>2026-02-19T08:39:41+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/strided-convolution-vs-pooling/</loc><lastmod>2026-02-19T08:36:40+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/layernorm-vs-rmsnorm/</loc><lastmod>2026-02-19T07:41:19+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/random-search/</loc><lastmod>2026-02-18T10:27:42+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/mini-batch-gradient-descent/</loc><lastmod>2026-02-18T09:27:20+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/optimizers/</loc><lastmod>2026-02-18T08:50:42+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/learning-rate/</loc><lastmod>2026-02-18T08:23:32+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/large-batch-training/</loc><lastmod>2026-02-18T08:20:24+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/sparse-vs-dense-models/</loc><lastmod>2026-02-17T14:25:27+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/pre-norm-vs-post-norm-architectures/</loc><lastmod>2026-02-17T14:24:12+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/strategic-compliance-vs-alignment/</loc><lastmod>2026-02-17T14:23:27+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/comparisons-and-tradeoffs/</loc><lastmod>2026-02-17T14:18:01+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/vision-transfer-learning/</loc><lastmod>2026-02-15T09:50:03+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/validation-curves/</loc><lastmod>2026-02-15T09:44:23+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/training-monitoring/</loc><lastmod>2026-02-15T09:42:44+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/training-instability/</loc><lastmod>2026-02-15T09:41:14+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/training-dynamics/</loc><lastmod>2026-02-15T08:53:52+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/optimization/</loc><lastmod>2026-02-15T08:41:13+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/loss-functions/</loc><lastmod>2026-02-15T08:32:36+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/learning-rate-schedules/</loc><lastmod>2026-02-15T08:31:11+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/learning-curves/</loc><lastmod>2026-02-15T08:27:08+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/hyperparameters/</loc><lastmod>2026-02-15T08:24:15+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/hyperparameter-optimization/</loc><lastmod>2026-02-15T08:21:51+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/grid-search/</loc><lastmod>2026-02-15T08:18:47+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/gradient-noise/</loc><lastmod>2026-02-15T08:14:34+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/gradient-descent/</loc><lastmod>2026-02-15T08:11:47+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/early-stopping/</loc><lastmod>2026-02-15T07:33:22+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/convergence/</loc><lastmod>2026-02-15T07:25:10+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-and-optimization/</loc><lastmod>2026-02-14T17:48:52+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/sparse-neural-networks/</loc><lastmod>2026-02-14T17:38:21+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/robustness-adversarial-threats/white-box-attacks/</loc><lastmod>2026-02-14T17:36:53+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/robustness-adversarial-threats/untargeted-attacks/</loc><lastmod>2026-02-14T17:34:29+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/robustness-adversarial-threats/transferability-of-adversarial-examples/</loc><lastmod>2026-02-14T16:23:58+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/robustness-adversarial-threats/targeted-attacks/</loc><lastmod>2026-02-14T16:17:41+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/robustness-adversarial-threats/robustness-vs-generalization/</loc><lastmod>2026-02-14T15:58:06+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/robustness-adversarial-threats/robustness-metrics/</loc><lastmod>2026-02-14T15:56:57+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/robustness-adversarial-threats/evasion-attacks/</loc><lastmod>2026-02-14T15:55:31+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/robustness-adversarial-threats/</loc><lastmod>2026-02-14T15:51:27+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/quantization/</loc><lastmod>2026-02-14T15:48:36+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/pruning/</loc><lastmod>2026-02-14T15:39:17+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/model-interpretability/</loc><lastmod>2026-02-14T15:36:58+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/utility-curves/</loc><lastmod>2026-02-14T15:27:53+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/uncertainty-estimation/</loc><lastmod>2026-02-14T15:20:55+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/train-test-split/</loc><lastmod>2026-02-14T13:59:29+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/time-series-validation/</loc><lastmod>2026-02-14T13:58:08+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/temperature-scaling/</loc><lastmod>2026-02-14T13:54:26+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/roc-curve/</loc><lastmod>2026-02-14T13:36:17+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/reproducibility-in-ml/</loc><lastmod>2026-02-14T13:21:20+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/reliability-diagrams/</loc><lastmod>2026-02-14T13:20:11+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/regularization/</loc><lastmod>2026-02-14T12:42:49+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/recall-at-k-rk/</loc><lastmod>2026-02-14T12:41:39+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/precision-recall-curve/</loc><lastmod>2026-02-14T12:33:04+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/precision-at-k-pk/</loc><lastmod>2026-02-14T12:31:58+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/overfitting/</loc><lastmod>2026-02-14T12:24:34+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/operating-point-selection/</loc><lastmod>2026-02-14T12:19:40+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/open-set-recognition/</loc><lastmod>2026-02-14T12:16:10+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/nested-cross-validation/</loc><lastmod>2026-02-14T12:10:58+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/model-robustness/</loc><lastmod>2026-02-14T12:07:52+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/model-confidence/</loc><lastmod>2026-02-14T12:06:52+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/metric-selection-under-imbalance/</loc><lastmod>2026-02-14T12:05:51+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/hidden-test-sets/</loc><lastmod>2026-02-14T11:23:33+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/f1-score/</loc><lastmod>2026-02-14T11:15:12+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/expected-cost-curves/</loc><lastmod>2026-02-14T11:12:23+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/expected-calibration-error-ece/</loc><lastmod>2026-02-14T11:11:24+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/evaluation-protocols/</loc><lastmod>2026-02-14T11:10:24+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/epistemic-uncertainty/</loc><lastmod>2026-02-14T11:07:03+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/delayed-rewards/</loc><lastmod>2026-02-14T10:24:26+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/decision-thresholding/</loc><lastmod>2026-02-14T10:22:43+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/data-leakage-validation-specific/</loc><lastmod>2026-02-14T10:17:35+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/cross-validation/</loc><lastmod>2026-02-14T10:16:40+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/cross-validation-strategies/</loc><lastmod>2026-02-14T10:16:26+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/cost-sensitive-learning/</loc><lastmod>2026-02-14T10:09:32+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/class-imbalance/</loc><lastmod>2026-02-14T10:05:10+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/capacity-headroom-planning/</loc><lastmod>2026-02-14T10:03:23+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/bias-variance-tradeoff/</loc><lastmod>2026-02-14T09:21:00+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/benchmarking-robustness/</loc><lastmod>2026-02-14T09:19:56+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/benchmarking-practices/</loc><lastmod>2026-02-14T09:09:43+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/benchmark-leakage/</loc><lastmod>2026-02-14T09:08:51+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/benchmark-datasets/</loc><lastmod>2026-02-14T09:08:01+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/baseline-performance/</loc><lastmod>2026-02-14T09:07:14+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/bandit-algorithms-overview/</loc><lastmod>2026-02-14T09:06:24+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/auc/</loc><lastmod>2026-02-14T09:05:40+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/aleatoric-uncertainty/</loc><lastmod>2026-02-14T09:04:51+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/adversarial-examples/</loc><lastmod>2026-02-14T09:03:58+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/generalization-and-evaluation/accuracy/</loc><lastmod>2026-02-14T09:00:16+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/feature-scaling/</loc><lastmod>2026-02-14T08:58:31+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/validation-data/</loc><lastmod>2026-02-14T08:54:10+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/training-data/</loc><lastmod>2026-02-14T08:53:21+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/train-test-contamination/</loc><lastmod>2026-02-14T08:52:33+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/time-aware-sampling/</loc><lastmod>2026-02-14T08:51:40+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/test-data/</loc><lastmod>2026-02-14T08:50:48+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/target-leakage/</loc><lastmod>2026-02-14T08:48:57+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/stratified-sampling/</loc><lastmod>2026-02-14T08:47:47+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/selection-bias/</loc><lastmod>2026-02-14T08:15:19+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/sampling-strategies/</loc><lastmod>2026-02-14T08:14:12+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/sampling-bias/</loc><lastmod>2026-02-14T08:13:21+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/rolling-window-sampling/</loc><lastmod>2026-02-14T08:12:27+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/rolling-retraining/</loc><lastmod>2026-02-14T08:11:33+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/rare-event-detection/</loc><lastmod>2026-02-14T08:09:53+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/out-of-distribution-test-data/</loc><lastmod>2026-02-14T08:08:23+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/out-of-distribution-data-ood/</loc><lastmod>2026-02-14T08:07:38+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/measurement-bias/</loc><lastmod>2026-02-14T08:06:05+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/forward-chaining-splits/</loc><lastmod>2026-02-13T17:45:41+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/distribution-shift/</loc><lastmod>2026-02-13T17:39:29+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/data-quality/</loc><lastmod>2026-02-13T17:36:57+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/data-preprocessing/</loc><lastmod>2026-02-13T17:36:13+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/data-leakage/</loc><lastmod>2026-02-13T17:35:18+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/data-and-distribution/data-distribution/</loc><lastmod>2026-02-13T17:34:18+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/calibration/</loc><lastmod>2026-02-13T17:24:57+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/batch-normalization/</loc><lastmod>2026-02-13T17:23:53+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/architecture-and-representation/sparse-training-dynamics/</loc><lastmod>2026-02-13T17:22:11+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/from-metrics-to-decisions/</loc><lastmod>2026-02-03T16:27:14+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/training-loop/</loc><lastmod>2026-02-02T16:22:41+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/transfer-learning/</loc><lastmod>2026-02-02T15:59:42+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/weights-and-bias/</loc><lastmod>2026-02-02T12:19:48+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/how-this-lexicon-is-organized/</loc><lastmod>2026-02-01T12:28:00+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/contact-us/</loc><lastmod>2026-02-01T10:32:11+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/disclaimer/</loc><lastmod>2026-02-01T10:26:19+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/cookie-policy/</loc><lastmod>2026-02-01T10:23:05+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/terms-conditions/</loc><lastmod>2026-02-01T10:19:56+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com/privacy-policy/</loc><lastmod>2026-02-01T10:06:35+00:00</lastmod><changefreq>weekly</changefreq><priority>0.6</priority></url><url><loc>https://neuralnetworklexicon.com</loc><changefreq>daily</changefreq><priority>1.0</priority><lastmod>2026-03-14T06:50:35+00:00</lastmod></url></urlset>
