<?xml version="1.0" encoding="utf-8" standalone="yes"?>
<!--
  RSS 2.0 feed listing the tag pages of mateuszpieniak.com.
  Each <item> is one tag: its title, the tag page URL (used as both <link>
  and <guid>), and a publication date. Items appear newest first.
  NOTE(review): the <generator> element names Hugo, so this file is presumably
  regenerated on every site build and hand edits may be overwritten; confirm
  before editing by hand.
-->
<rss version="2.0"
     xmlns:atom="http://www.w3.org/2005/Atom"
     xmlns:content="http://purl.org/rss/1.0/modules/content/">
  <channel>
    <title>Tags on Mateusz Pieniak</title>
    <link>https://mateuszpieniak.com/tags/</link>
    <description/>
    <generator>Hugo -- 0.163.3</generator>
    <language>en-us</language>
    <lastBuildDate>Thu, 02 Jul 2026 00:00:00 +0000</lastBuildDate>
    <atom:link href="https://mateuszpieniak.com/tags/index.xml" rel="self" type="application/rss+xml"/>
    <!--
      Every <pubDate> below is kept on a single line: the value is an RFC 822
      date-time, and a line break inside the element would become part of
      its text.
    -->
    <item>
      <title>Deep Q-Network</title>
      <link>https://mateuszpieniak.com/tags/deep-q-network/</link>
      <pubDate>Thu, 02 Jul 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/deep-q-network/</guid>
      <description/>
    </item>
    <item>
      <title>Deep Reinforcement Learning</title>
      <link>https://mateuszpieniak.com/tags/deep-reinforcement-learning/</link>
      <pubDate>Thu, 02 Jul 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/deep-reinforcement-learning/</guid>
      <description/>
    </item>
    <item>
      <title>Double DQN</title>
      <link>https://mateuszpieniak.com/tags/double-dqn/</link>
      <pubDate>Thu, 02 Jul 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/double-dqn/</guid>
      <description/>
    </item>
    <item>
      <title>DQN</title>
      <link>https://mateuszpieniak.com/tags/dqn/</link>
      <pubDate>Thu, 02 Jul 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/dqn/</guid>
      <description/>
    </item>
    <item>
      <title>Dueling DQN</title>
      <link>https://mateuszpieniak.com/tags/dueling-dqn/</link>
      <pubDate>Thu, 02 Jul 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/dueling-dqn/</guid>
      <description/>
    </item>
    <item>
      <title>Experience Replay</title>
      <link>https://mateuszpieniak.com/tags/experience-replay/</link>
      <pubDate>Thu, 02 Jul 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/experience-replay/</guid>
      <description/>
    </item>
    <item>
      <title>Overestimation Bias</title>
      <link>https://mateuszpieniak.com/tags/overestimation-bias/</link>
      <pubDate>Thu, 02 Jul 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/overestimation-bias/</guid>
      <description/>
    </item>
    <item>
      <title>Prioritized Experience Replay</title>
      <link>https://mateuszpieniak.com/tags/prioritized-experience-replay/</link>
      <pubDate>Thu, 02 Jul 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/prioritized-experience-replay/</guid>
      <description/>
    </item>
    <item>
      <title>Reinforcement Learning</title>
      <link>https://mateuszpieniak.com/tags/reinforcement-learning/</link>
      <pubDate>Thu, 02 Jul 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/reinforcement-learning/</guid>
      <description/>
    </item>
    <item>
      <title>Reward Clipping</title>
      <link>https://mateuszpieniak.com/tags/reward-clipping/</link>
      <pubDate>Thu, 02 Jul 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/reward-clipping/</guid>
      <description/>
    </item>
    <item>
      <title>Target Network</title>
      <link>https://mateuszpieniak.com/tags/target-network/</link>
      <pubDate>Thu, 02 Jul 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/target-network/</guid>
      <description/>
    </item>
    <item>
      <title>Approximate Q-Learning</title>
      <link>https://mateuszpieniak.com/tags/approximate-q-learning/</link>
      <pubDate>Tue, 23 Jun 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/approximate-q-learning/</guid>
      <description/>
    </item>
    <item>
      <title>Deadly Triad</title>
      <link>https://mateuszpieniak.com/tags/deadly-triad/</link>
      <pubDate>Tue, 23 Jun 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/deadly-triad/</guid>
      <description/>
    </item>
    <item>
      <title>Expected SARSA</title>
      <link>https://mateuszpieniak.com/tags/expected-sarsa/</link>
      <pubDate>Tue, 23 Jun 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/expected-sarsa/</guid>
      <description/>
    </item>
    <item>
      <title>Function Approximation</title>
      <link>https://mateuszpieniak.com/tags/function-approximation/</link>
      <pubDate>Tue, 23 Jun 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/function-approximation/</guid>
      <description/>
    </item>
    <item>
      <title>Model-Free Reinforcement Learning</title>
      <link>https://mateuszpieniak.com/tags/model-free-reinforcement-learning/</link>
      <pubDate>Tue, 23 Jun 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/model-free-reinforcement-learning/</guid>
      <description/>
    </item>
    <item>
      <title>Q-Learning</title>
      <link>https://mateuszpieniak.com/tags/q-learning/</link>
      <pubDate>Tue, 23 Jun 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/q-learning/</guid>
      <description/>
    </item>
    <item>
      <title>SARSA</title>
      <link>https://mateuszpieniak.com/tags/sarsa/</link>
      <pubDate>Tue, 23 Jun 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/sarsa/</guid>
      <description/>
    </item>
    <item>
      <title>Semi-Gradient Methods</title>
      <link>https://mateuszpieniak.com/tags/semi-gradient-methods/</link>
      <pubDate>Tue, 23 Jun 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/semi-gradient-methods/</guid>
      <description/>
    </item>
    <item>
      <title>Exploration</title>
      <link>https://mateuszpieniak.com/tags/exploration/</link>
      <pubDate>Sun, 21 Jun 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/exploration/</guid>
      <description/>
    </item>
    <item>
      <title>Monte Carlo</title>
      <link>https://mateuszpieniak.com/tags/monte-carlo/</link>
      <pubDate>Sun, 21 Jun 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/monte-carlo/</guid>
      <description/>
    </item>
    <item>
      <title>Temporal Difference</title>
      <link>https://mateuszpieniak.com/tags/temporal-difference/</link>
      <pubDate>Sun, 21 Jun 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/temporal-difference/</guid>
      <description/>
    </item>
    <item>
      <title>Banach Fixed-Point Theorem</title>
      <link>https://mateuszpieniak.com/tags/banach-fixed-point-theorem/</link>
      <pubDate>Wed, 17 Jun 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/banach-fixed-point-theorem/</guid>
      <description/>
    </item>
    <item>
      <title>Bellman Expectation Equation</title>
      <link>https://mateuszpieniak.com/tags/bellman-expectation-equation/</link>
      <pubDate>Wed, 17 Jun 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/bellman-expectation-equation/</guid>
      <description/>
    </item>
    <item>
      <title>Bellman Optimality Equation</title>
      <link>https://mateuszpieniak.com/tags/bellman-optimality-equation/</link>
      <pubDate>Wed, 17 Jun 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/bellman-optimality-equation/</guid>
      <description/>
    </item>
    <item>
      <title>Contraction Mapping</title>
      <link>https://mateuszpieniak.com/tags/contraction-mapping/</link>
      <pubDate>Wed, 17 Jun 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/contraction-mapping/</guid>
      <description/>
    </item>
    <item>
      <title>Generalized Policy Iteration</title>
      <link>https://mateuszpieniak.com/tags/generalized-policy-iteration/</link>
      <pubDate>Wed, 17 Jun 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/generalized-policy-iteration/</guid>
      <description/>
    </item>
    <item>
      <title>Model-Based Reinforcement Learning</title>
      <link>https://mateuszpieniak.com/tags/model-based-reinforcement-learning/</link>
      <pubDate>Wed, 17 Jun 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/model-based-reinforcement-learning/</guid>
      <description/>
    </item>
    <item>
      <title>Policy Iteration</title>
      <link>https://mateuszpieniak.com/tags/policy-iteration/</link>
      <pubDate>Wed, 17 Jun 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/policy-iteration/</guid>
      <description/>
    </item>
    <item>
      <title>Value Iteration</title>
      <link>https://mateuszpieniak.com/tags/value-iteration/</link>
      <pubDate>Wed, 17 Jun 2026 00:00:00 +0000</pubDate>
      <guid>https://mateuszpieniak.com/tags/value-iteration/</guid>
      <description/>
    </item>
  </channel>
</rss>