<?xml version="1.0" encoding="UTF-8"?>
<urlset xmlns="http://www.sitemaps.org/schemas/sitemap/0.9">
  <url><loc>https://parasdahal.com/deep-clustering</loc></url>
  <url><loc>https://parasdahal.com/adversarial-attack</loc></url>
  <url><loc>https://parasdahal.com/softmax-crossentropy</loc></url>
  <url><loc>https://parasdahal.com/notes/MAP-Elites</loc></url>
  <url><loc>https://parasdahal.com/notes/Tiny+Reasoning+Model+(TRM)</loc></url>
  <url><loc>https://parasdahal.com/notes/Hierarchical+Reasoning+Model+(HRM)</loc></url>
  <url><loc>https://parasdahal.com/notes/dpo-direct-preference-optimization</loc></url>
  <url><loc>https://parasdahal.com/notes/stochastic+gradients</loc></url>
  <url><loc>https://parasdahal.com/notes/gaussian+distribution</loc></url>
  <url><loc>https://parasdahal.com/notes/activation+functions</loc></url>
  <url><loc>https://parasdahal.com/notes/alr_optimizers</loc></url>
  <url><loc>https://parasdahal.com/notes/advantage-functions</loc></url>
  <url><loc>https://parasdahal.com/notes/autoencoders</loc></url>
  <url><loc>https://parasdahal.com/notes/Autoregressive+Generation+and+KV+Caching+in+Transformers</loc></url>
  <url><loc>https://parasdahal.com/notes/autoregressive+models</loc></url>
  <url><loc>https://parasdahal.com/notes/bert</loc></url>
  <url><loc>https://parasdahal.com/notes/bleu</loc></url>
  <url><loc>https://parasdahal.com/notes/bm25</loc></url>
  <url><loc>https://parasdahal.com/notes/backpropagation+through+time</loc></url>
  <url><loc>https://parasdahal.com/notes/backpropagation</loc></url>
  <url><loc>https://parasdahal.com/notes/basis+functions</loc></url>
  <url><loc>https://parasdahal.com/notes/bayesian+estimation</loc></url>
  <url><loc>https://parasdahal.com/notes/bayesian+linear+regression</loc></url>
  <url><loc>https://parasdahal.com/notes/bayesian+model+selection+with+model+evidence</loc></url>
  <url><loc>https://parasdahal.com/notes/beam+decoding</loc></url>
  <url><loc>https://parasdahal.com/notes/bellman+equation+and+value+functions</loc></url>
  <url><loc>https://parasdahal.com/notes/bias+vs+variance+in+machine+learning</loc></url>
  <url><loc>https://parasdahal.com/notes/boltzmann+machines</loc></url>
  <url><loc>https://parasdahal.com/notes/bradley-terry-model</loc></url>
  <url><loc>https://parasdahal.com/notes/byte+pair+encoding</loc></url>
  <url><loc>https://parasdahal.com/notes/cnns+for+nlp</loc></url>
  <url><loc>https://parasdahal.com/notes/calibration</loc></url>
  <url><loc>https://parasdahal.com/notes/capsule+networks+(capsnet)</loc></url>
  <url><loc>https://parasdahal.com/notes/challenges+of+gan</loc></url>
  <url><loc>https://parasdahal.com/notes/challenges+of+optimizing+deep+models</loc></url>
  <url><loc>https://parasdahal.com/notes/class+imbalance</loc></url>
  <url><loc>https://parasdahal.com/notes/collaborative+filtering</loc></url>
  <url><loc>https://parasdahal.com/notes/compositional+semantics+and+sentence+representations</loc></url>
  <url><loc>https://parasdahal.com/notes/compressed+sensing</loc></url>
  <url><loc>https://parasdahal.com/notes/conditional+gan</loc></url>
  <url><loc>https://parasdahal.com/notes/Confident+Learning+-+Principled+Data+Cleaning</loc></url>
  <url><loc>https://parasdahal.com/notes/conformal+prediction</loc></url>
  <url><loc>https://parasdahal.com/notes/contrastive+divergence</loc></url>
  <url><loc>https://parasdahal.com/notes/control+variates</loc></url>
  <url><loc>https://parasdahal.com/notes/convolution</loc></url>
  <url><loc>https://parasdahal.com/notes/convolutional+neural+networks+(cnn)</loc></url>
  <url><loc>https://parasdahal.com/notes/coreference+resolution</loc></url>
  <url><loc>https://parasdahal.com/notes/counterfactual+evaluation+and+ltr</loc></url>
  <url><loc>https://parasdahal.com/notes/covariate-shift</loc></url>
  <url><loc>https://parasdahal.com/notes/cross+validation</loc></url>
  <url><loc>https://parasdahal.com/notes/cross+entropy</loc></url>
  <url><loc>https://parasdahal.com/notes/decision+theory</loc></url>
  <url><loc>https://parasdahal.com/notes/Deep+Q-Learning</loc></url>
  <url><loc>https://parasdahal.com/notes/Deep+Supervision+with+Recursion</loc></url>
  <url><loc>https://parasdahal.com/notes/depth+and+trainability</loc></url>
  <url><loc>https://parasdahal.com/notes/discrete+fourier+transform</loc></url>
  <url><loc>https://parasdahal.com/notes/discriminant+functions</loc></url>
  <url><loc>https://parasdahal.com/notes/disentangled+representations</loc></url>
  <url><loc>https://parasdahal.com/notes/distant+supervision</loc></url>
  <url><loc>https://parasdahal.com/notes/distribution-shift</loc></url>
  <url><loc>https://parasdahal.com/notes/dropout</loc></url>
  <url><loc>https://parasdahal.com/notes/dyna-q+-+planning+and+learning</loc></url>
  <url><loc>https://parasdahal.com/notes/dynamic+programming+(rl)</loc></url>
  <url><loc>https://parasdahal.com/notes/Eligibility+Trace</loc></url>
  <url><loc>https://parasdahal.com/notes/Emergent+Misalignment+in+LLMs</loc></url>
  <url><loc>https://parasdahal.com/notes/energy+based+models</loc></url>
  <url><loc>https://parasdahal.com/notes/ensemble+methods</loc></url>
  <url><loc>https://parasdahal.com/notes/equivalent+kernel</loc></url>
  <url><loc>https://parasdahal.com/notes/expectation+maximization</loc></url>
  <url><loc>https://parasdahal.com/notes/expected+reciprocal+rank</loc></url>
  <url><loc>https://parasdahal.com/notes/fisher-information</loc></url>
  <url><loc>https://parasdahal.com/notes/Focal+Loss</loc></url>
  <url><loc>https://parasdahal.com/notes/gru</loc></url>
  <url><loc>https://parasdahal.com/notes/gaussian+mixture+model</loc></url>
  <url><loc>https://parasdahal.com/notes/gaussian+processes</loc></url>
  <url><loc>https://parasdahal.com/notes/generalized+advantage+estimate</loc></url>
  <url><loc>https://parasdahal.com/notes/generative+adversarial+networks</loc></url>
  <url><loc>https://parasdahal.com/notes/graph+convolutional++networks+(gcn)</loc></url>
  <url><loc>https://parasdahal.com/notes/group+equivariant+convolutional+neural+networks</loc></url>
  <url><loc>https://parasdahal.com/notes/Grouped+Query+Attention+(GQA)</loc></url>
  <url><loc>https://parasdahal.com/notes/harris+corner+detection</loc></url>
  <url><loc>https://parasdahal.com/notes/dot-product-normalization</loc></url>
  <url><loc>https://parasdahal.com/notes/hopfield+networks</loc></url>
  <url><loc>https://parasdahal.com/notes/hough+transform</loc></url>
  <url><loc>https://parasdahal.com/notes/importance+sampling</loc></url>
  <url><loc>https://parasdahal.com/notes/incremental+implementation+of+estimating+action+values</loc></url>
  <url><loc>https://parasdahal.com/notes/infogan</loc></url>
  <url><loc>https://parasdahal.com/notes/inverse+reinforcement+learning</loc></url>
  <url><loc>https://parasdahal.com/notes/jensen&apos;s+inequality</loc></url>
  <url><loc>https://parasdahal.com/notes/jensen%E2%80%93shannon+divergence</loc></url>
  <url><loc>https://parasdahal.com/notes/k-means</loc></url>
  <url><loc>https://parasdahal.com/notes/kl+divergence</loc></url>
  <url><loc>https://parasdahal.com/notes/kernel+methods</loc></url>
  <url><loc>https://parasdahal.com/notes/lstm</loc></url>
  <url><loc>https://parasdahal.com/notes/lagrange+multipliers</loc></url>
  <url><loc>https://parasdahal.com/notes/lambdarank</loc></url>
  <url><loc>https://parasdahal.com/notes/latenent+variable+models</loc></url>
  <url><loc>https://parasdahal.com/notes/layer+normalization</loc></url>
  <url><loc>https://parasdahal.com/notes/learning+to+defer</loc></url>
  <url><loc>https://parasdahal.com/notes/learning+to+rank</loc></url>
  <url><loc>https://parasdahal.com/notes/least+squares+for+classification</loc></url>
  <url><loc>https://parasdahal.com/notes/listnet+and+listmle</loc></url>
  <url><loc>https://parasdahal.com/notes/logistic+regression</loc></url>
  <url><loc>https://parasdahal.com/notes/loss+functions</loc></url>
  <url><loc>https://parasdahal.com/notes/maml+-+model-agnostic+meta-learning</loc></url>
  <url><loc>https://parasdahal.com/notes/markov+decision+processes</loc></url>
  <url><loc>https://parasdahal.com/notes/markov+reward+processes</loc></url>
  <url><loc>https://parasdahal.com/notes/maximum+a+posteriori+(map)</loc></url>
  <url><loc>https://parasdahal.com/notes/Maximum+Entropy+Principle</loc></url>
  <url><loc>https://parasdahal.com/notes/maximum+likelihood+estimation</loc></url>
  <url><loc>https://parasdahal.com/notes/mmd</loc></url>
  <url><loc>https://parasdahal.com/notes/meta+learning</loc></url>
  <url><loc>https://parasdahal.com/notes/Mixture+of+Experts+in+Transformers+(MoE)</loc></url>
  <url><loc>https://parasdahal.com/notes/mixture+of+experts</loc></url>
  <url><loc>https://parasdahal.com/notes/model+based+reinforcement+learning</loc></url>
  <url><loc>https://parasdahal.com/notes/model+complexity+and+occams+razor</loc></url>
  <url><loc>https://parasdahal.com/notes/model+free+reinforcement+learning</loc></url>
  <url><loc>https://parasdahal.com/notes/monte-carlo+estimation</loc></url>
  <url><loc>https://parasdahal.com/notes/monte-carlo+rl+methods</loc></url>
  <url><loc>https://parasdahal.com/notes/monte-carlo+tree+search</loc></url>
  <url><loc>https://parasdahal.com/notes/multi-armed+bandits</loc></url>
  <url><loc>https://parasdahal.com/notes/Multi-Head+Latent+Attention+(MLA)</loc></url>
  <url><loc>https://parasdahal.com/notes/Multi-Network+Training+with+Moving+Average+Target</loc></url>
  <url><loc>https://parasdahal.com/notes/natural+policy+gradient</loc></url>
  <url><loc>https://parasdahal.com/notes/normalization</loc></url>
  <url><loc>https://parasdahal.com/notes/normalizing+flows</loc></url>
  <url><loc>https://parasdahal.com/notes/off-policy+learning+with+approximation</loc></url>
  <url><loc>https://parasdahal.com/notes/on-policy+learning+with+approximation</loc></url>
  <url><loc>https://parasdahal.com/notes/online+evaluation+and+ltr</loc></url>
  <url><loc>https://parasdahal.com/notes/pgt+actor-critic</loc></url>
  <url><loc>https://parasdahal.com/notes/partial-observability</loc></url>
  <url><loc>https://parasdahal.com/notes/pathwise+gradient+estimator</loc></url>
  <url><loc>https://parasdahal.com/notes/perceptron</loc></url>
  <url><loc>https://parasdahal.com/notes/pixelrnn</loc></url>
  <url><loc>https://parasdahal.com/notes/policy+gradient</loc></url>
  <url><loc>https://parasdahal.com/notes/polyloss</loc></url>
  <url><loc>https://parasdahal.com/notes/positional+encoding</loc></url>
  <url><loc>https://parasdahal.com/notes/principle+component+analysis+(pca)</loc></url>
  <url><loc>https://parasdahal.com/notes/prioritized+sweeping</loc></url>
  <url><loc>https://parasdahal.com/notes/probabilistic+generative+models</loc></url>
  <url><loc>https://parasdahal.com/notes/reinforce+-+monte+carlo+policy+gradient</loc></url>
  <url><loc>https://parasdahal.com/notes/reinforce+-+score+function+estimator</loc></url>
  <url><loc>https://parasdahal.com/notes/rlhf+-+reinforcement+learning+with+human+feedback</loc></url>
  <url><loc>https://parasdahal.com/notes/rmsnorm</loc></url>
  <url><loc>https://parasdahal.com/notes/ranknet</loc></url>
  <url><loc>https://parasdahal.com/notes/relu</loc></url>
  <url><loc>https://parasdahal.com/notes/recurrent+neural+networks+(rnn)</loc></url>
  <url><loc>https://parasdahal.com/notes/regularized+least+squares</loc></url>
  <url><loc>https://parasdahal.com/notes/reinforcement+learning+problem+setup</loc></url>
  <url><loc>https://parasdahal.com/notes/Rotary+Position+Embeddings+(RoPE)</loc></url>
  <url><loc>https://parasdahal.com/notes/semi-markov+decision+processes</loc></url>
  <url><loc>https://parasdahal.com/notes/sentencepiece+-+unigram+lm+encoding</loc></url>
  <url><loc>https://parasdahal.com/notes/similarity+measures</loc></url>
  <url><loc>https://parasdahal.com/notes/singular+value+decomposition</loc></url>
  <url><loc>https://parasdahal.com/notes/state+update+functions+in+partially+observable+mdp</loc></url>
  <url><loc>https://parasdahal.com/notes/stochastic+gradient+descent</loc></url>
  <url><loc>https://parasdahal.com/notes/support+vector+machines+(svm)</loc></url>
  <url><loc>https://parasdahal.com/notes/temporal+difference+learning</loc></url>
  <url><loc>https://parasdahal.com/notes/tokenization</loc></url>
  <url><loc>https://parasdahal.com/notes/transformers</loc></url>
  <url><loc>https://parasdahal.com/notes/uncertainty+in+machine+learning</loc></url>
  <url><loc>https://parasdahal.com/notes/variational+autoencoders</loc></url>
  <url><loc>https://parasdahal.com/notes/variational+inference</loc></url>
  <url><loc>https://parasdahal.com/notes/weight+initialization</loc></url>
  <url><loc>https://parasdahal.com/notes/why+generative+models</loc></url>
  <url><loc>https://parasdahal.com/notes/why+implicit+density+models</loc></url>
  <url><loc>https://parasdahal.com/notes/ppo+-+proximal+policy+optimization</loc></url>
  <url><loc>https://parasdahal.com/notes/trpo+-+trust-region+policy+optimization</loc></url>
  <url><loc>https://parasdahal.com/notes/deep-q-network</loc></url>
  <url><loc>https://parasdahal.com/notes/grpo-group-relative-policy-optimization</loc></url>
  <url><loc>https://parasdahal.com/notes/attention+mechanism</loc></url>
  <url><loc>https://parasdahal.com/notes/Scaling+Attention</loc></url>
  <url><loc>https://parasdahal.com/notes/Dreamer</loc></url>
  <url><loc>https://parasdahal.com/notes/Intrinsically-Motivated+Humans+and+Agents+in+Open-World+Exploration</loc></url>
  <url><loc>https://parasdahal.com/notes/AlphaEvolve</loc></url>
  <url><loc>https://parasdahal.com/notes/Towards+an+AI+co-scientist</loc></url>
  <url><loc>https://parasdahal.com/notes/OMNI+-+Open-endedness+via+Models+of+human+Notions+of+Interestingness</loc></url>
  <url><loc>https://parasdahal.com/notes/Darwin+Godel+Machine+(DGM)</loc></url>
  <url><loc>https://parasdahal.com/notes/Foundation+Model+Self-Play+(FMSP)</loc></url>
  <url><loc>https://parasdahal.com/notes/Automated+Design+of+Agentic+Systems+(ADAS)</loc></url>
  <url><loc>https://parasdahal.com/notes/Go-Explore</loc></url>
  <url><loc>https://parasdahal.com/notes/Better+Think+Thrice+-+Learning+to+Reason+Causally+with+Double+Counterfactual+Consistency</loc></url>
  <url><loc>https://parasdahal.com/notes/Mathematical+Exploration+and+Discovery+at+Scale+(with+AlphaEvolve)</loc></url>
  <url><loc>https://parasdahal.com/notes/Minimal+Criterion+Coevolution</loc></url>
  <url><loc>https://parasdahal.com/</loc></url>
  <url><loc>https://parasdahal.com/blog</loc></url>
  <url><loc>https://parasdahal.com/notes</loc></url>
</urlset>