[ ( [ "/coin-flip"
    , "/doc/ai/1987-mcdermott.pdf"
    , "/doc/ai/nn/2013-clark.pdf"
    , "/doc/ai/tabular/2012-rintanen.pdf"
    ]
  , "heuristics"
  )
, ( [ "/coin-flip"
    , "/doc/ai/1987-mcdermott.pdf"
    , "/doc/ai/nn/2013-clark.pdf"
    , "/doc/ai/tabular/2012-rintanen.pdf"
    , "/doc/psychology/neuroscience/2023-coulter.pdf"
    , "/doc/psychology/neuroscience/2023-lai.pdf"
    , "/doc/reinforcement-learning/imitation-learning/2018-gudmundsson.pdf"
    , "/doc/reinforcement-learning/imperfect-information/diplomacy/2022-bakhtin.pdf"
    , "/doc/reinforcement-learning/model/2000-cazenave.pdf"
    , "/doc/reinforcement-learning/model/2001-cazenave.pdf"
    , "/doc/reinforcement-learning/model/2010-silver.pdf"
    , "/doc/reinforcement-learning/model/2012-lipovetzky.pdf"
    , "/doc/reinforcement-learning/model/2013-auger.pdf"
    , "/doc/reinforcement-learning/model/2015-lipovetzky.pdf"
    , "/doc/reinforcement-learning/model/2018-eslami.pdf#deepmind"
    , "/doc/reinforcement-learning/model/2018-everitt.pdf"
    ]
  , "planning"
  )
, ( [ "/coin-flip"
    , "/doc/ai/1987-mcdermott.pdf"
    , "/doc/ai/nn/2013-clark.pdf"
    , "/doc/ai/tabular/2012-rintanen.pdf"
    , "/doc/psychology/neuroscience/2023-coulter.pdf"
    , "/doc/psychology/neuroscience/2023-lai.pdf"
    , "/doc/reinforcement-learning/imitation-learning/2018-gudmundsson.pdf"
    , "/doc/reinforcement-learning/imperfect-information/diplomacy/2022-bakhtin.pdf"
    , "/doc/reinforcement-learning/model/2000-cazenave.pdf"
    , "/doc/reinforcement-learning/model/2001-cazenave.pdf"
    , "/doc/reinforcement-learning/model/2010-silver.pdf"
    , "/doc/reinforcement-learning/model/2012-lipovetzky.pdf"
    , "/doc/reinforcement-learning/model/2013-auger.pdf"
    , "/doc/reinforcement-learning/model/2015-lipovetzky.pdf"
    , "/doc/reinforcement-learning/model/2018-eslami.pdf#deepmind"
    , "/doc/reinforcement-learning/model/2018-everitt.pdf"
    , "/doc/reinforcement-learning/model/2023-gao.pdf"
    , "/doc/reinforcement-learning/model/2024-wang-2.pdf"
    , "/doc/reinforcement-learning/robot/2006-bongard.pdf"
    , "/doc/statistics/decision/2003-zadrozny.pdf"
    , "https://ai.stanford.edu/~pabbeel/pubs/AbbeelCoatesQuigleyNg_aaorltahf_nips2006.pdf"
    , "https://arxiv.org/abs/0909.0801"
    , "https://arxiv.org/abs/1301.6690"
    , "https://arxiv.org/abs/1401.5390"
    , "https://arxiv.org/abs/1411.5326#deepmind"
    , "https://arxiv.org/abs/1506.00779"
    , "https://arxiv.org/abs/1511.09249#schmidhuber"
    , "https://arxiv.org/abs/1602.02867#deepmind"
    , "https://arxiv.org/abs/1606.04442"
    , "https://arxiv.org/abs/1612.02179"
    , "https://arxiv.org/abs/1612.08810#deepmind"
    , "https://arxiv.org/abs/1702.07274"
    , "https://arxiv.org/abs/1703.04070"
    , "https://arxiv.org/abs/1704.02254"
    , "https://arxiv.org/abs/1704.07183"
    , "https://arxiv.org/abs/1704.08792"
    , "https://arxiv.org/abs/1705.02670"
    , "https://arxiv.org/abs/1705.07615"
    , "https://arxiv.org/abs/1705.08080"
    , "https://arxiv.org/abs/1706.09597"
    , "https://arxiv.org/abs/1707.03497#deepmind"
    , "https://arxiv.org/abs/1707.06170"
    , "https://arxiv.org/abs/1707.07012#google"
    , "https://arxiv.org/abs/1708.02596"
    , "https://arxiv.org/abs/1708.03871"
    , "https://arxiv.org/abs/1709.06390"
    , "https://arxiv.org/abs/1709.06917"
    , "https://arxiv.org/abs/1712.05556"
    , "https://arxiv.org/abs/1802.03676"
    , "https://arxiv.org/abs/1802.09127#google"
    , "https://arxiv.org/abs/1803.10122#google"
    , "https://arxiv.org/abs/1804.09028#ibm"
    , "https://arxiv.org/abs/1805.00909"
    , "https://arxiv.org/abs/1805.08166"
    , "https://arxiv.org/abs/1805.12114"
    , "https://arxiv.org/abs/1805.12244"
    , "https://arxiv.org/abs/1807.06763"
    , "https://arxiv.org/abs/1807.06906"
    , "https://arxiv.org/abs/1811.01458#deepmind"
    , "https://arxiv.org/abs/1811.04551#google"
    , "https://arxiv.org/abs/1903.08942"
    , "https://arxiv.org/abs/1905.10501"
    , "https://arxiv.org/abs/1906.05030"
    , "https://arxiv.org/abs/1906.08253"
    , "https://arxiv.org/abs/1910.03016"
    , "https://arxiv.org/abs/1910.06862"
    , "https://arxiv.org/abs/1912.01603#googledeepmind"
    , "https://arxiv.org/abs/1912.02807#deepmind"
    , "https://arxiv.org/abs/2001.00102"
    , "https://arxiv.org/abs/2002.07019"
    , "https://arxiv.org/abs/2003.03600"
    , "https://arxiv.org/abs/2003.08876"
    , "https://arxiv.org/abs/2004.14990"
    , "https://arxiv.org/abs/2005.05960"
    , "https://arxiv.org/abs/2005.12126#nvidia"
    , "https://arxiv.org/abs/2005.13239v6"
    , "https://arxiv.org/abs/2006.04757"
    , "https://arxiv.org/abs/2006.13888"
    , "https://arxiv.org/abs/2007.09560"
    , "https://arxiv.org/abs/2010.11895"
    , "https://arxiv.org/abs/2010.15835"
    , "https://arxiv.org/abs/2011.11751"
    , "https://arxiv.org/abs/2011.15091"
    , "https://arxiv.org/abs/2012.09812"
    , "https://arxiv.org/abs/2102.04518"
    , "https://arxiv.org/abs/2102.08363"
    , "https://arxiv.org/abs/2102.13249"
    , "https://arxiv.org/abs/2103.04909"
    , "https://arxiv.org/abs/2104.03946"
    , "https://arxiv.org/abs/2104.05336#deepmind"
    , "https://arxiv.org/abs/2106.00188"
    , "https://arxiv.org/abs/2106.04651"
    , "https://arxiv.org/abs/2106.04866"
    , "https://arxiv.org/abs/2106.13195#google"
    , "https://arxiv.org/abs/2109.08342"
    , "https://arxiv.org/abs/2109.10312"
    , "https://arxiv.org/abs/2110.01517"
    , "https://arxiv.org/abs/2111.02552"
    , "https://arxiv.org/abs/2111.07775"
    , "https://arxiv.org/abs/2111.09800"
    , "https://arxiv.org/abs/2112.05244"
    , "https://arxiv.org/abs/2201.07207#google"
    , "https://arxiv.org/abs/2201.12975"
    , "https://arxiv.org/abs/2202.01682"
    , "https://arxiv.org/abs/2202.01771"
    , "https://arxiv.org/abs/2202.02790"
    , "https://arxiv.org/abs/2203.00352"
    , "https://arxiv.org/abs/2203.08015"
    , "https://arxiv.org/abs/2203.13880"
    , "https://arxiv.org/abs/2204.01691#google"
    , "https://arxiv.org/abs/2204.05080#deepmind"
    , "https://arxiv.org/abs/2205.10712"
    , "https://arxiv.org/abs/2205.11495"
    , "https://arxiv.org/abs/2206.04114#google"
    , "https://arxiv.org/abs/2206.08332#deepmind"
    , "https://arxiv.org/abs/2206.11309#microsoft"
    , "https://arxiv.org/abs/2206.11795#openai"
    , "https://arxiv.org/abs/2206.14176"
    , "https://arxiv.org/abs/2207.04429"
    , "https://arxiv.org/abs/2207.05608#google"
    , "https://arxiv.org/abs/2207.13224#google"
    , "https://arxiv.org/abs/2207.13513"
    , "https://arxiv.org/abs/2208.02918#microsoft"
    , "https://arxiv.org/abs/2208.14928"
    , "https://arxiv.org/abs/2209.00588"
    , "https://arxiv.org/abs/2209.08466"
    , "https://arxiv.org/abs/2210.04435"
    , "https://arxiv.org/abs/2210.05805#facebook"
    , "https://arxiv.org/abs/2211.02703"
    , "https://arxiv.org/abs/2212.01508#deepmind"
    , "https://arxiv.org/abs/2212.04581"
    , "https://arxiv.org/abs/2301.04104#deepmind"
    , "https://arxiv.org/abs/2302.12422#nvidia"
    , "https://arxiv.org/abs/2305.07764#google"
    , "https://arxiv.org/abs/2306.04930#microsoft"
    , "https://arxiv.org/abs/2306.12554"
    , "https://arxiv.org/abs/2306.14079"
    , "https://arxiv.org/abs/2307.08678"
    , "https://arxiv.org/abs/2308.01399"
    , "https://arxiv.org/abs/2310.04406"
    , "https://arxiv.org/abs/2310.06089"
    , "https://arxiv.org/abs/2310.15386"
    , "https://arxiv.org/abs/2311.01017"
    , "https://arxiv.org/abs/2311.05584"
    , "https://arxiv.org/abs/2312.04657"
    , "https://arxiv.org/abs/2312.06937"
    , "https://arxiv.org/abs/2312.09056"
    , "https://arxiv.org/abs/2312.17227"
    , "https://arxiv.org/abs/2404.12358"
    , "https://arxiv.org/abs/2405.14333#deepseek"
    , "https://arxiv.org/abs/2405.15306"
    , "https://arxiv.org/abs/2405.20519"
    , "https://arxiv.org/abs/2406.03689"
    , "https://arxiv.org/abs/2406.05946"
    , "https://arxiv.org/abs/2406.06485"
    , "https://arxiv.org/abs/2406.06592#deepmind"
    , "https://arxiv.org/abs/2406.07394"
    , "https://arxiv.org/abs/2406.08404#schmidhuber"
    , "https://arxiv.org/abs/2406.10162#anthropic"
    , "https://arxiv.org/abs/2410.07166"
    , "https://arxiv.org/abs/2410.20268"
    , "https://dallasinnovates.com/exclusive-qa-john-carmacks-different-path-to-artificial-general-intelligence/"
    , "https://deepmindsafetyresearch.medium.com/designing-agent-incentives-to-avoid-reward-tampering-4380c1bb6cd"
    , "https://nv-tlabs.github.io/gameGAN/#nvidia"
    , "https://openreview.net/forum?id=YwDvofEWlEx"
    , "https://openreview.net/forum?id=psXVkKO9No#deepmind"
    , "https://research.google/blog/introducing-dreamer-scalable-reinforcement-learning-using-world-models/"
    , "https://www.biorxiv.org/content/10.1101/2021.03.15.435518.full"
    , "https://www.biorxiv.org/content/10.1101/2022.09.25.509419.full"
    , "https://www.biorxiv.org/content/10.1101/2023.04.04.535512.full"
    , "https://www.biorxiv.org/content/10.1101/2024.08.13.607810.full"
    , "https://www.nature.com/articles/s41467-022-35422-y"
    , "https://www.reuters.com/technology/artificial-intelligence/openai-co-founder-sutskevers-new-safety-focused-ai-startup-ssi-raises-1-billion-2024-09-04/"
    , "https://www.theatlantic.com/technology/archive/2023/11/openai-sam-altman-q-algorithm-breakthrough-project/676163/"
    ]
  , "imitation-learning"
  )
, ( [ "/coin-flip"
    , "/doc/ai/1987-mcdermott.pdf"
    , "/doc/ai/nn/2013-clark.pdf"
    , "/doc/ai/tabular/2012-rintanen.pdf"
    , "/doc/psychology/neuroscience/2023-coulter.pdf"
    , "/doc/psychology/neuroscience/2023-lai.pdf"
    , "/doc/reinforcement-learning/imitation-learning/2018-gudmundsson.pdf"
    , "/doc/reinforcement-learning/imperfect-information/diplomacy/2022-bakhtin.pdf"
    , "/doc/reinforcement-learning/model/2000-cazenave.pdf"
    , "/doc/reinforcement-learning/model/2001-cazenave.pdf"
    , "/doc/reinforcement-learning/model/2010-silver.pdf"
    , "/doc/reinforcement-learning/model/2012-lipovetzky.pdf"
    , "/doc/reinforcement-learning/model/2013-auger.pdf"
    , "/doc/reinforcement-learning/model/2015-lipovetzky.pdf"
    , "/doc/reinforcement-learning/model/2018-eslami.pdf#deepmind"
    , "/doc/reinforcement-learning/model/2018-everitt.pdf"
    , "/doc/reinforcement-learning/model/2023-gao.pdf"
    , "/doc/reinforcement-learning/model/2024-wang-2.pdf"
    , "/doc/reinforcement-learning/robot/2006-bongard.pdf"
    , "/doc/statistics/decision/2003-zadrozny.pdf"
    , "https://ai.stanford.edu/~pabbeel/pubs/AbbeelCoatesQuigleyNg_aaorltahf_nips2006.pdf"
    , "https://arxiv.org/abs/0909.0801"
    , "https://arxiv.org/abs/1301.6690"
    , "https://arxiv.org/abs/1401.5390"
    , "https://arxiv.org/abs/1411.5326#deepmind"
    , "https://arxiv.org/abs/1506.00779"
    , "https://arxiv.org/abs/1511.09249#schmidhuber"
    , "https://arxiv.org/abs/1602.02867#deepmind"
    , "https://arxiv.org/abs/1606.04442"
    , "https://arxiv.org/abs/1612.02179"
    , "https://arxiv.org/abs/1612.08810#deepmind"
    , "https://arxiv.org/abs/1702.07274"
    , "https://arxiv.org/abs/1703.04070"
    , "https://arxiv.org/abs/1704.02254"
    , "https://arxiv.org/abs/1704.07183"
    , "https://arxiv.org/abs/1704.08792"
    , "https://arxiv.org/abs/1705.02670"
    , "https://arxiv.org/abs/1705.07615"
    , "https://arxiv.org/abs/1705.08080"
    , "https://arxiv.org/abs/1706.09597"
    , "https://arxiv.org/abs/1707.03497#deepmind"
    , "https://arxiv.org/abs/1707.06170"
    , "https://arxiv.org/abs/1707.07012#google"
    , "https://arxiv.org/abs/1708.02596"
    , "https://arxiv.org/abs/1708.03871"
    , "https://arxiv.org/abs/1709.06390"
    , "https://arxiv.org/abs/1709.06917"
    , "https://arxiv.org/abs/1712.05556"
    , "https://arxiv.org/abs/1803.10122#google"
    , "https://arxiv.org/abs/1804.09028#ibm"
    , "https://arxiv.org/abs/1805.00909"
    , "https://arxiv.org/abs/1805.08166"
    , "https://arxiv.org/abs/1805.12114"
    , "https://arxiv.org/abs/1805.12244"
    , "https://arxiv.org/abs/1807.06763"
    , "https://arxiv.org/abs/1807.06906"
    , "https://arxiv.org/abs/1811.01458#deepmind"
    , "https://arxiv.org/abs/1811.04551#google"
    , "https://arxiv.org/abs/1812.03973#google"
    , "https://arxiv.org/abs/1905.10501"
    , "https://arxiv.org/abs/1906.05030"
    , "https://arxiv.org/abs/1906.08253"
    , "https://arxiv.org/abs/1910.03016"
    , "https://arxiv.org/abs/1910.06862"
    , "https://arxiv.org/abs/1912.01603#googledeepmind"
    , "https://arxiv.org/abs/1912.02807#deepmind"
    , "https://arxiv.org/abs/2001.00102"
    , "https://arxiv.org/abs/2002.07019"
    , "https://arxiv.org/abs/2003.03600"
    , "https://arxiv.org/abs/2003.08876"
    , "https://arxiv.org/abs/2004.14990"
    , "https://arxiv.org/abs/2005.05960"
    , "https://arxiv.org/abs/2005.12126#nvidia"
    , "https://arxiv.org/abs/2005.13239v6"
    , "https://arxiv.org/abs/2006.04757"
    , "https://arxiv.org/abs/2006.13888"
    , "https://arxiv.org/abs/2007.09560"
    , "https://arxiv.org/abs/2008.02215"
    , "https://arxiv.org/abs/2010.11895"
    , "https://arxiv.org/abs/2010.15835"
    , "https://arxiv.org/abs/2011.11751"
    , "https://arxiv.org/abs/2011.15091"
    , "https://arxiv.org/abs/2012.09812"
    , "https://arxiv.org/abs/2102.04518"
    , "https://arxiv.org/abs/2102.08363"
    , "https://arxiv.org/abs/2102.13249"
    , "https://arxiv.org/abs/2103.04909"
    , "https://arxiv.org/abs/2104.03946"
    , "https://arxiv.org/abs/2104.05336#deepmind"
    , "https://arxiv.org/abs/2104.14516"
    , "https://arxiv.org/abs/2106.00188"
    , "https://arxiv.org/abs/2106.04651"
    , "https://arxiv.org/abs/2106.04866"
    , "https://arxiv.org/abs/2106.13195#google"
    , "https://arxiv.org/abs/2109.08342"
    , "https://arxiv.org/abs/2109.09371"
    , "https://arxiv.org/abs/2109.10312"
    , "https://arxiv.org/abs/2110.01517"
    , "https://arxiv.org/abs/2111.02552"
    , "https://arxiv.org/abs/2111.07775"
    , "https://arxiv.org/abs/2111.09800"
    , "https://arxiv.org/abs/2112.05244"
    , "https://arxiv.org/abs/2112.11598"
    , "https://arxiv.org/abs/2201.07207#google"
    , "https://arxiv.org/abs/2201.12975"
    , "https://arxiv.org/abs/2202.01682"
    , "https://arxiv.org/abs/2202.01771"
    , "https://arxiv.org/abs/2202.02790"
    , "https://arxiv.org/abs/2203.00352"
    , "https://arxiv.org/abs/2203.08015"
    , "https://arxiv.org/abs/2203.13880"
    , "https://arxiv.org/abs/2204.01691#google"
    , "https://arxiv.org/abs/2204.05080#deepmind"
    , "https://arxiv.org/abs/2205.11495"
    , "https://arxiv.org/abs/2206.04114#google"
    , "https://arxiv.org/abs/2206.08332#deepmind"
    , "https://arxiv.org/abs/2206.11309#microsoft"
    , "https://arxiv.org/abs/2206.11795#openai"
    , "https://arxiv.org/abs/2206.14176"
    , "https://arxiv.org/abs/2207.04429"
    , "https://arxiv.org/abs/2207.05608#google"
    , "https://arxiv.org/abs/2207.13224#google"
    , "https://arxiv.org/abs/2207.13513"
    , "https://arxiv.org/abs/2208.02918#microsoft"
    , "https://arxiv.org/abs/2209.00588"
    , "https://arxiv.org/abs/2209.08466"
    , "https://arxiv.org/abs/2210.04435"
    , "https://arxiv.org/abs/2210.05805#facebook"
    , "https://arxiv.org/abs/2211.02703"
    , "https://arxiv.org/abs/2212.01508#deepmind"
    , "https://arxiv.org/abs/2212.04581"
    , "https://arxiv.org/abs/2301.04104#deepmind"
    , "https://arxiv.org/abs/2302.07350#deepmind"
    , "https://arxiv.org/abs/2302.12422#nvidia"
    , "https://arxiv.org/abs/2306.04930#microsoft"
    , "https://arxiv.org/abs/2310.04406"
    , "https://arxiv.org/abs/2310.06089"
    , "https://arxiv.org/abs/2311.01017"
    , "https://arxiv.org/abs/2311.05584"
    , "https://arxiv.org/abs/2312.04657"
    , "https://arxiv.org/abs/2312.09056"
    , "https://arxiv.org/abs/2312.17227"
    , "https://arxiv.org/abs/2404.12358"
    , "https://dallasinnovates.com/exclusive-qa-john-carmacks-different-path-to-artificial-general-intelligence/"
    , "https://deepmindsafetyresearch.medium.com/designing-agent-incentives-to-avoid-reward-tampering-4380c1bb6cd"
    , "https://nv-tlabs.github.io/gameGAN/#nvidia"
    , "https://openreview.net/forum?id=YwDvofEWlEx"
    , "https://openreview.net/forum?id=psXVkKO9No#deepmind"
    , "https://research.google/blog/introducing-dreamer-scalable-reinforcement-learning-using-world-models/"
    , "https://www.biorxiv.org/content/10.1101/2021.03.15.435518.full"
    , "https://www.biorxiv.org/content/10.1101/2022.09.25.509419.full"
    , "https://www.biorxiv.org/content/10.1101/2023.04.04.535512.full"
    , "https://www.nature.com/articles/s41467-022-35422-y"
    , "https://www.ncbi.nlm.nih.gov/pmc/articles/PMC3559008/"
    , "https://www.theatlantic.com/technology/archive/2023/11/openai-sam-altman-q-algorithm-breakthrough-project/676163/"
    ]
  , "latent-dynamics"
  )
, ( [ "/coin-flip"
    , "/doc/ai/1987-mcdermott.pdf"
    , "/doc/ai/nn/2013-clark.pdf"
    , "/doc/ai/tabular/2012-rintanen.pdf"
    , "/doc/psychology/neuroscience/2023-coulter.pdf"
    , "/doc/psychology/neuroscience/2023-lai.pdf"
    , "/doc/reinforcement-learning/imitation-learning/2018-gudmundsson.pdf"
    , "/doc/reinforcement-learning/imperfect-information/diplomacy/2022-bakhtin.pdf"
    , "/doc/reinforcement-learning/model/2000-cazenave.pdf"
    , "/doc/reinforcement-learning/model/2001-cazenave.pdf"
    , "/doc/reinforcement-learning/model/2010-silver.pdf"
    , "/doc/reinforcement-learning/model/2012-lipovetzky.pdf"
    , "/doc/reinforcement-learning/model/2013-auger.pdf"
    , "/doc/reinforcement-learning/model/2015-lipovetzky.pdf"
    , "/doc/reinforcement-learning/model/2018-eslami.pdf#deepmind"
    , "/doc/reinforcement-learning/model/2018-everitt.pdf"
    , "/doc/reinforcement-learning/model/2023-gao.pdf"
    , "/doc/reinforcement-learning/model/2024-wang-2.pdf"
    , "/doc/reinforcement-learning/robot/2006-bongard.pdf"
    , "/doc/statistics/decision/2003-zadrozny.pdf"
    , "https://ai.stanford.edu/~pabbeel/pubs/AbbeelCoatesQuigleyNg_aaorltahf_nips2006.pdf"
    , "https://arxiv.org/abs/0909.0801"
    , "https://arxiv.org/abs/1301.6690"
    , "https://arxiv.org/abs/1401.5390"
    , "https://arxiv.org/abs/1411.5326#deepmind"
    , "https://arxiv.org/abs/1506.00779"
    , "https://arxiv.org/abs/1511.09249#schmidhuber"
    , "https://arxiv.org/abs/1602.02867#deepmind"
    , "https://arxiv.org/abs/1606.04442"
    , "https://arxiv.org/abs/1612.02179"
    , "https://arxiv.org/abs/1612.08810#deepmind"
    , "https://arxiv.org/abs/1702.07274"
    , "https://arxiv.org/abs/1703.04070"
    , "https://arxiv.org/abs/1704.02254"
    , "https://arxiv.org/abs/1704.07183"
    , "https://arxiv.org/abs/1704.08792"
    , "https://arxiv.org/abs/1705.02670"
    , "https://arxiv.org/abs/1705.07615"
    , "https://arxiv.org/abs/1705.08080"
    , "https://arxiv.org/abs/1706.09597"
    , "https://arxiv.org/abs/1707.03497#deepmind"
    , "https://arxiv.org/abs/1707.06170"
    , "https://arxiv.org/abs/1707.07012#google"
    , "https://arxiv.org/abs/1708.02596"
    , "https://arxiv.org/abs/1709.06390"
    , "https://arxiv.org/abs/1709.06917"
    , "https://arxiv.org/abs/1712.05556"
    , "https://arxiv.org/abs/1802.03676"
    , "https://arxiv.org/abs/1802.09127#google"
    , "https://arxiv.org/abs/1803.10122#google"
    , "https://arxiv.org/abs/1804.09028#ibm"
    , "https://arxiv.org/abs/1805.00909"
    , "https://arxiv.org/abs/1805.08166"
    , "https://arxiv.org/abs/1805.12114"
    , "https://arxiv.org/abs/1805.12244"
    , "https://arxiv.org/abs/1807.06763"
    , "https://arxiv.org/abs/1807.06906"
    , "https://arxiv.org/abs/1811.01458#deepmind"
    , "https://arxiv.org/abs/1811.04551#google"
    , "https://arxiv.org/abs/1812.03973#google"
    , "https://arxiv.org/abs/1903.08942"
    , "https://arxiv.org/abs/1905.10501"
    , "https://arxiv.org/abs/1906.05030"
    , "https://arxiv.org/abs/1906.08253"
    , "https://arxiv.org/abs/1910.03016"
    , "https://arxiv.org/abs/1910.06862"
    , "https://arxiv.org/abs/1912.01603#googledeepmind"
    , "https://arxiv.org/abs/1912.02807#deepmind"
    , "https://arxiv.org/abs/2001.00102"
    , "https://arxiv.org/abs/2002.07019"
    , "https://arxiv.org/abs/2003.03600"
    , "https://arxiv.org/abs/2003.08876"
    , "https://arxiv.org/abs/2004.14990"
    , "https://arxiv.org/abs/2005.05960"
    , "https://arxiv.org/abs/2005.12126#nvidia"
    , "https://arxiv.org/abs/2005.13239v6"
    , "https://arxiv.org/abs/2006.04757"
    , "https://arxiv.org/abs/2006.13888"
    , "https://arxiv.org/abs/2007.09560"
    , "https://arxiv.org/abs/2008.02215"
    , "https://arxiv.org/abs/2010.11895"
    , "https://arxiv.org/abs/2010.15835"
    , "https://arxiv.org/abs/2011.11751"
    , "https://arxiv.org/abs/2011.15091"
    , "https://arxiv.org/abs/2012.09812"
    , "https://arxiv.org/abs/2102.04518"
    , "https://arxiv.org/abs/2102.08363"
    , "https://arxiv.org/abs/2102.13249"
    , "https://arxiv.org/abs/2103.04909"
    , "https://arxiv.org/abs/2104.03946"
    , "https://arxiv.org/abs/2104.05336#deepmind"
    , "https://arxiv.org/abs/2106.04651"
    , "https://arxiv.org/abs/2106.04866"
    , "https://arxiv.org/abs/2106.13195#google"
    , "https://arxiv.org/abs/2109.08342"
    , "https://arxiv.org/abs/2109.09371"
    , "https://arxiv.org/abs/2109.10312"
    , "https://arxiv.org/abs/2110.01517"
    , "https://arxiv.org/abs/2111.02552"
    , "https://arxiv.org/abs/2111.07775"
    , "https://arxiv.org/abs/2111.09800"
    , "https://arxiv.org/abs/2112.05244"
    , "https://arxiv.org/abs/2201.07207#google"
    , "https://arxiv.org/abs/2201.12975"
    , "https://arxiv.org/abs/2202.01682"
    , "https://arxiv.org/abs/2202.01771"
    , "https://arxiv.org/abs/2202.02790"
    , "https://arxiv.org/abs/2203.00352"
    , "https://arxiv.org/abs/2203.08015"
    , "https://arxiv.org/abs/2203.13880"
    , "https://arxiv.org/abs/2204.01691#google"
    , "https://arxiv.org/abs/2204.02863"
    , "https://arxiv.org/abs/2204.05080#deepmind"
    , "https://arxiv.org/abs/2205.11495"
    , "https://arxiv.org/abs/2206.04114#google"
    , "https://arxiv.org/abs/2206.08332#deepmind"
    , "https://arxiv.org/abs/2206.11795#openai"
    , "https://arxiv.org/abs/2206.14176"
    , "https://arxiv.org/abs/2207.04429"
    , "https://arxiv.org/abs/2207.05608#google"
    , "https://arxiv.org/abs/2207.13224#google"
    , "https://arxiv.org/abs/2207.13513"
    , "https://arxiv.org/abs/2208.02918#microsoft"
    , "https://arxiv.org/abs/2208.14928"
    , "https://arxiv.org/abs/2209.00588"
    , "https://arxiv.org/abs/2209.08466"
    , "https://arxiv.org/abs/2210.04435"
    , "https://arxiv.org/abs/2210.05805#facebook"
    , "https://arxiv.org/abs/2211.02703"
    , "https://arxiv.org/abs/2212.01508#deepmind"
    , "https://arxiv.org/abs/2212.04581"
    , "https://arxiv.org/abs/2301.04104#deepmind"
    , "https://arxiv.org/abs/2302.12422#nvidia"
    , "https://arxiv.org/abs/2305.07764#google"
    , "https://arxiv.org/abs/2306.12554"
    , "https://arxiv.org/abs/2306.14079"
    , "https://arxiv.org/abs/2307.08678"
    , "https://arxiv.org/abs/2308.01399"
    , "https://arxiv.org/abs/2310.04406"
    , "https://arxiv.org/abs/2310.06089"
    , "https://arxiv.org/abs/2310.15386"
    , "https://arxiv.org/abs/2311.01017"
    , "https://arxiv.org/abs/2311.05584"
    , "https://arxiv.org/abs/2312.04657"
    , "https://arxiv.org/abs/2312.06937"
    , "https://arxiv.org/abs/2312.09056"
    , "https://arxiv.org/abs/2312.17227"
    , "https://arxiv.org/abs/2404.12358"
    , "https://arxiv.org/abs/2405.14333#deepseek"
    , "https://arxiv.org/abs/2405.20519"
    , "https://arxiv.org/abs/2406.03689"
    , "https://arxiv.org/abs/2406.06485"
    , "https://arxiv.org/abs/2406.06592#deepmind"
    , "https://arxiv.org/abs/2406.07394"
    , "https://arxiv.org/abs/2406.08404#schmidhuber"
    , "https://arxiv.org/abs/2406.10162#anthropic"
    , "https://arxiv.org/abs/2410.07166"
    , "https://arxiv.org/abs/2410.20268"
    , "https://deepmindsafetyresearch.medium.com/designing-agent-incentives-to-avoid-reward-tampering-4380c1bb6cd"
    , "https://openreview.net/forum?id=YwDvofEWlEx"
    , "https://openreview.net/forum?id=psXVkKO9No#deepmind"
    , "https://research.google/blog/introducing-dreamer-scalable-reinforcement-learning-using-world-models/"
    , "https://www.biorxiv.org/content/10.1101/2021.03.15.435518.full"
    , "https://www.biorxiv.org/content/10.1101/2022.09.25.509419.full"
    , "https://www.biorxiv.org/content/10.1101/2023.04.04.535512.full"
    , "https://www.biorxiv.org/content/10.1101/2024.08.13.607810.full"
    , "https://www.nature.com/articles/s41467-022-35422-y"
    ]
  , "imitation-learning"
  )
, ( [ "/coin-flip"
    , "/doc/ai/1987-mcdermott.pdf"
    , "/doc/ai/nn/2013-clark.pdf"
    , "/doc/ai/tabular/2012-rintanen.pdf"
    , "/doc/psychology/neuroscience/2023-coulter.pdf"
    , "/doc/psychology/neuroscience/2023-lai.pdf"
    , "/doc/reinforcement-learning/imitation-learning/2018-gudmundsson.pdf"
    , "/doc/reinforcement-learning/imperfect-information/diplomacy/2022-bakhtin.pdf"
    , "/doc/reinforcement-learning/model/2000-cazenave.pdf"
    , "/doc/reinforcement-learning/model/2001-cazenave.pdf"
    , "/doc/reinforcement-learning/model/2010-silver.pdf"
    , "/doc/reinforcement-learning/model/2012-lipovetzky.pdf"
    , "/doc/reinforcement-learning/model/2013-auger.pdf"
    , "/doc/reinforcement-learning/model/2015-lipovetzky.pdf"
    , "/doc/reinforcement-learning/model/2018-eslami.pdf#deepmind"
    , "/doc/reinforcement-learning/model/2018-everitt.pdf"
    , "/doc/reinforcement-learning/model/2023-gao.pdf"
    , "/doc/reinforcement-learning/model/2024-wang-2.pdf"
    , "/doc/reinforcement-learning/robot/2006-bongard.pdf"
    , "/doc/statistics/decision/2003-zadrozny.pdf"
    , "https://ai.stanford.edu/~pabbeel/pubs/AbbeelCoatesQuigleyNg_aaorltahf_nips2006.pdf"
    , "https://arxiv.org/abs/0909.0801"
    , "https://arxiv.org/abs/1301.6690"
    , "https://arxiv.org/abs/1401.5390"
    , "https://arxiv.org/abs/1506.00779"
    , "https://arxiv.org/abs/1511.09249#schmidhuber"
    , "https://arxiv.org/abs/1602.02867#deepmind"
    , "https://arxiv.org/abs/1606.04442"
    , "https://arxiv.org/abs/1612.02179"
    , "https://arxiv.org/abs/1612.08810#deepmind"
    , "https://arxiv.org/abs/1702.07274"
    , "https://arxiv.org/abs/1703.04070"
    , "https://arxiv.org/abs/1704.02254"
    , "https://arxiv.org/abs/1704.07183"
    , "https://arxiv.org/abs/1704.08792"
    , "https://arxiv.org/abs/1705.02670"
    , "https://arxiv.org/abs/1705.07615"
    , "https://arxiv.org/abs/1705.08080"
    , "https://arxiv.org/abs/1706.09597"
    , "https://arxiv.org/abs/1707.03497#deepmind"
    , "https://arxiv.org/abs/1707.06170"
    , "https://arxiv.org/abs/1707.07012#google"
    , "https://arxiv.org/abs/1708.02596"
    , "https://arxiv.org/abs/1709.06390"
    , "https://arxiv.org/abs/1709.06917"
    , "https://arxiv.org/abs/1712.05556"
    , "https://arxiv.org/abs/1802.03676"
    , "https://arxiv.org/abs/1802.09127#google"
    , "https://arxiv.org/abs/1803.10122#google"
    , "https://arxiv.org/abs/1804.09028#ibm"
    , "https://arxiv.org/abs/1805.00909"
    , "https://arxiv.org/abs/1805.08166"
    , "https://arxiv.org/abs/1805.12114"
    , "https://arxiv.org/abs/1805.12244"
    , "https://arxiv.org/abs/1807.06763"
    , "https://arxiv.org/abs/1807.06906"
    , "https://arxiv.org/abs/1811.01458#deepmind"
    , "https://arxiv.org/abs/1811.04551#google"
    , "https://arxiv.org/abs/1903.08942"
    , "https://arxiv.org/abs/1905.10501"
    , "https://arxiv.org/abs/1906.05030"
    , "https://arxiv.org/abs/1906.08253"
    , "https://arxiv.org/abs/1910.03016"
    , "https://arxiv.org/abs/1910.06862"
    , "https://arxiv.org/abs/1912.01603#googledeepmind"
    , "https://arxiv.org/abs/1912.02807#deepmind"
    , "https://arxiv.org/abs/2001.00102"
    , "https://arxiv.org/abs/2002.07019"
    , "https://arxiv.org/abs/2003.03600"
    , "https://arxiv.org/abs/2003.08876"
    , "https://arxiv.org/abs/2005.05960"
    , "https://arxiv.org/abs/2005.12126#nvidia"
    , "https://arxiv.org/abs/2005.13239v6"
    , "https://arxiv.org/abs/2006.04757"
    , "https://arxiv.org/abs/2006.13888"
    , "https://arxiv.org/abs/2007.09560"
    , "https://arxiv.org/abs/2010.11895"
    , "https://arxiv.org/abs/2010.15835"
    , "https://arxiv.org/abs/2011.11751"
    , "https://arxiv.org/abs/2011.15091"
    , "https://arxiv.org/abs/2012.09812"
    , "https://arxiv.org/abs/2102.04518"
    , "https://arxiv.org/abs/2102.08363"
    , "https://arxiv.org/abs/2102.13249"
    , "https://arxiv.org/abs/2103.04909"
    , "https://arxiv.org/abs/2104.03946"
    , "https://arxiv.org/abs/2104.05336#deepmind"
    , "https://arxiv.org/abs/2104.14516"
    , "https://arxiv.org/abs/2106.00188"
    , "https://arxiv.org/abs/2106.04651"
    , "https://arxiv.org/abs/2106.04866"
    , "https://arxiv.org/abs/2106.13195#google"
    , "https://arxiv.org/abs/2109.08342"
    , "https://arxiv.org/abs/2109.09371"
    , "https://arxiv.org/abs/2109.10312"
    , "https://arxiv.org/abs/2110.01517"
    , "https://arxiv.org/abs/2111.07775"
    , "https://arxiv.org/abs/2111.09800"
    , "https://arxiv.org/abs/2112.05244"
    , "https://arxiv.org/abs/2201.07207#google"
    , "https://arxiv.org/abs/2201.12975"
    , "https://arxiv.org/abs/2202.01682"
    , "https://arxiv.org/abs/2202.01771"
    , "https://arxiv.org/abs/2202.02790"
    , "https://arxiv.org/abs/2203.00352"
    , "https://arxiv.org/abs/2203.08015"
    , "https://arxiv.org/abs/2203.13880"
    , "https://arxiv.org/abs/2204.01691#google"
    , "https://arxiv.org/abs/2204.02863"
    , "https://arxiv.org/abs/2204.05080#deepmind"
    , "https://arxiv.org/abs/2205.11495"
    , "https://arxiv.org/abs/2206.04114#google"
    , "https://arxiv.org/abs/2206.08332#deepmind"
    , "https://arxiv.org/abs/2206.11795#openai"
    , "https://arxiv.org/abs/2206.14176"
    , "https://arxiv.org/abs/2207.04429"
    , "https://arxiv.org/abs/2207.05608#google"
    , "https://arxiv.org/abs/2207.13224#google"
    , "https://arxiv.org/abs/2207.13513"
    , "https://arxiv.org/abs/2208.02918#microsoft"
    , "https://arxiv.org/abs/2208.14928"
    , "https://arxiv.org/abs/2209.00588"
    , "https://arxiv.org/abs/2209.08466"
    , "https://arxiv.org/abs/2210.04435"
    , "https://arxiv.org/abs/2210.05805#facebook"
    , "https://arxiv.org/abs/2211.02703"
    , "https://arxiv.org/abs/2212.01508#deepmind"
    , "https://arxiv.org/abs/2212.04581"
    , "https://arxiv.org/abs/2301.04104#deepmind"
    , "https://arxiv.org/abs/2302.12422#nvidia"
    , "https://arxiv.org/abs/2305.07764#google"
    , "https://arxiv.org/abs/2306.12554"
    , "https://arxiv.org/abs/2306.14079"
    , "https://arxiv.org/abs/2307.08678"
    , "https://arxiv.org/abs/2308.01399"
    , "https://arxiv.org/abs/2310.04406"
    , "https://arxiv.org/abs/2310.06089"
    , "https://arxiv.org/abs/2310.15386"
    , "https://arxiv.org/abs/2311.01017"
    , "https://arxiv.org/abs/2311.05584"
    , "https://arxiv.org/abs/2312.04657"
    , "https://arxiv.org/abs/2312.09056"
    , "https://arxiv.org/abs/2312.17227"
    , "https://arxiv.org/abs/2404.12358"
    , "https://arxiv.org/abs/2405.14333#deepseek"
    , "https://arxiv.org/abs/2405.20519"
    , "https://arxiv.org/abs/2406.03689"
    , "https://arxiv.org/abs/2406.06485"
    , "https://arxiv.org/abs/2406.06592#deepmind"
    , "https://arxiv.org/abs/2406.07394"
    , "https://arxiv.org/abs/2406.08404#schmidhuber"
    , "https://arxiv.org/abs/2406.10162#anthropic"
    , "https://arxiv.org/abs/2410.07166"
    , "https://deepmindsafetyresearch.medium.com/designing-agent-incentives-to-avoid-reward-tampering-4380c1bb6cd"
    , "https://nv-tlabs.github.io/gameGAN/#nvidia"
    , "https://openreview.net/forum?id=YwDvofEWlEx"
    , "https://openreview.net/forum?id=psXVkKO9No#deepmind"
    , "https://research.google/blog/introducing-dreamer-scalable-reinforcement-learning-using-world-models/"
    , "https://www.biorxiv.org/content/10.1101/2021.03.15.435518.full"
    , "https://www.biorxiv.org/content/10.1101/2022.09.25.509419.full"
    , "https://www.biorxiv.org/content/10.1101/2023.04.04.535512.full"
    , "https://www.biorxiv.org/content/10.1101/2024.08.13.607810.full"
    , "https://www.nature.com/articles/s41467-022-35422-y"
    ]
  , "world-models"
  )
, ( [ "/coin-flip"
    , "/doc/ai/1987-mcdermott.pdf"
    , "/doc/ai/nn/2013-clark.pdf"
    , "/doc/ai/tabular/2012-rintanen.pdf"
    , "/doc/psychology/neuroscience/2023-coulter.pdf"
    , "/doc/psychology/neuroscience/2023-lai.pdf"
    , "/doc/reinforcement-learning/imitation-learning/2018-gudmundsson.pdf"
    , "/doc/reinforcement-learning/imperfect-information/diplomacy/2022-bakhtin.pdf"
    , "/doc/reinforcement-learning/model/2000-cazenave.pdf"
    , "/doc/reinforcement-learning/model/2001-cazenave.pdf"
    , "/doc/reinforcement-learning/model/2010-silver.pdf"
    , "/doc/reinforcement-learning/model/2012-lipovetzky.pdf"
    , "/doc/reinforcement-learning/model/2013-auger.pdf"
    , "/doc/reinforcement-learning/model/2015-lipovetzky.pdf"
    , "/doc/reinforcement-learning/model/2018-eslami.pdf#deepmind"
    , "/doc/reinforcement-learning/model/2018-everitt.pdf"
    , "/doc/reinforcement-learning/model/2023-gao.pdf"
    , "/doc/reinforcement-learning/model/2024-wang-2.pdf"
    , "/doc/reinforcement-learning/robot/2006-bongard.pdf"
    , "https://ai.stanford.edu/~pabbeel/pubs/AbbeelCoatesQuigleyNg_aaorltahf_nips2006.pdf"
    , "https://arxiv.org/abs/0909.0801"
    , "https://arxiv.org/abs/1301.6690"
    , "https://arxiv.org/abs/1401.5390"
    , "https://arxiv.org/abs/1411.5326#deepmind"
    , "https://arxiv.org/abs/1506.00779"
    , "https://arxiv.org/abs/1511.09249#schmidhuber"
    , "https://arxiv.org/abs/1602.02867#deepmind"
    , "https://arxiv.org/abs/1606.04442"
    , "https://arxiv.org/abs/1612.02179"
    , "https://arxiv.org/abs/1612.08810#deepmind"
    , "https://arxiv.org/abs/1702.07274"
    , "https://arxiv.org/abs/1703.04070"
    , "https://arxiv.org/abs/1704.02254"
    , "https://arxiv.org/abs/1704.07183"
    , "https://arxiv.org/abs/1704.08792"
    , "https://arxiv.org/abs/1705.02670"
    , "https://arxiv.org/abs/1705.07615"
    , "https://arxiv.org/abs/1705.08080"
    , "https://arxiv.org/abs/1706.09597"
    , "https://arxiv.org/abs/1707.03497#deepmind"
    , "https://arxiv.org/abs/1707.06170"
    , "https://arxiv.org/abs/1707.07012#google"
    , "https://arxiv.org/abs/1708.02596"
    , "https://arxiv.org/abs/1708.03871"
    , "https://arxiv.org/abs/1709.06390"
    , "https://arxiv.org/abs/1709.06917"
    , "https://arxiv.org/abs/1712.05556"
    , "https://arxiv.org/abs/1802.03676"
    , "https://arxiv.org/abs/1802.09127#google"
    , "https://arxiv.org/abs/1803.10122#google"
    , "https://arxiv.org/abs/1804.09028#ibm"
    , "https://arxiv.org/abs/1805.00909"
    , "https://arxiv.org/abs/1805.08166"
    , "https://arxiv.org/abs/1805.12114"
    , "https://arxiv.org/abs/1805.12244"
    , "https://arxiv.org/abs/1807.06763"
    , "https://arxiv.org/abs/1807.06906"
    , "https://arxiv.org/abs/1811.01458#deepmind"
    , "https://arxiv.org/abs/1811.04551#google"
    , "https://arxiv.org/abs/1812.03973#google"
    , "https://arxiv.org/abs/1903.08942"
    , "https://arxiv.org/abs/1905.10501"
    , "https://arxiv.org/abs/1906.05030"
    , "https://arxiv.org/abs/1906.08253"
    , "https://arxiv.org/abs/1910.03016"
    , "https://arxiv.org/abs/1910.06862"
    , "https://arxiv.org/abs/1912.01603#googledeepmind"
    , "https://arxiv.org/abs/1912.02807#deepmind"
    , "https://arxiv.org/abs/2001.00102"
    , "https://arxiv.org/abs/2002.07019"
    , "https://arxiv.org/abs/2003.03600"
    , "https://arxiv.org/abs/2003.08876"
    , "https://arxiv.org/abs/2004.14990"
    , "https://arxiv.org/abs/2005.05960"
    , "https://arxiv.org/abs/2005.12126#nvidia"
    , "https://arxiv.org/abs/2005.13239v6"
    , "https://arxiv.org/abs/2006.04757"
    , "https://arxiv.org/abs/2006.13888"
    , "https://arxiv.org/abs/2007.09560"
    , "https://arxiv.org/abs/2010.11895"
    , "https://arxiv.org/abs/2010.15835"
    , "https://arxiv.org/abs/2011.11751"
    , "https://arxiv.org/abs/2011.15091"
    , "https://arxiv.org/abs/2012.09812"
    , "https://arxiv.org/abs/2102.04518"
    , "https://arxiv.org/abs/2102.08363"
    , "https://arxiv.org/abs/2102.13249"
    , "https://arxiv.org/abs/2103.04909"
    , "https://arxiv.org/abs/2104.03946"
    , "https://arxiv.org/abs/2104.05336#deepmind"
    , "https://arxiv.org/abs/2106.00188"
    , "https://arxiv.org/abs/2106.04866"
    , "https://arxiv.org/abs/2106.13195#google"
    , "https://arxiv.org/abs/2109.09371"
    , "https://arxiv.org/abs/2109.10312"
    , "https://arxiv.org/abs/2110.01517"
    , "https://arxiv.org/abs/2111.02552"
    , "https://arxiv.org/abs/2111.07775"
    , "https://arxiv.org/abs/2111.09800"
    , "https://arxiv.org/abs/2112.05244"
    , "https://arxiv.org/abs/2201.07207#google"
    , "https://arxiv.org/abs/2201.12975"
    , "https://arxiv.org/abs/2202.01682"
    , "https://arxiv.org/abs/2202.01771"
    , "https://arxiv.org/abs/2202.02790"
    , "https://arxiv.org/abs/2203.00352"
    , "https://arxiv.org/abs/2203.08015"
    , "https://arxiv.org/abs/2203.13880"
    , "https://arxiv.org/abs/2204.01691#google"
    , "https://arxiv.org/abs/2204.05080#deepmind"
    , "https://arxiv.org/abs/2205.11495"
    , "https://arxiv.org/abs/2206.04114#google"
    , "https://arxiv.org/abs/2206.08332#deepmind"
    , "https://arxiv.org/abs/2206.11795#openai"
    , "https://arxiv.org/abs/2206.14176"
    , "https://arxiv.org/abs/2207.04429"
    , "https://arxiv.org/abs/2207.05608#google"
    , "https://arxiv.org/abs/2207.13224#google"
    , "https://arxiv.org/abs/2207.13513"
    , "https://arxiv.org/abs/2208.14928"
    , "https://arxiv.org/abs/2209.00588"
    , "https://arxiv.org/abs/2209.08466"
    , "https://arxiv.org/abs/2210.04435"
    , "https://arxiv.org/abs/2210.05805#facebook"
    , "https://arxiv.org/abs/2211.02703"
    , "https://arxiv.org/abs/2212.01508#deepmind"
    , "https://arxiv.org/abs/2212.04581"
    , "https://arxiv.org/abs/2301.04104#deepmind"
    , "https://arxiv.org/abs/2302.07350#deepmind"
    , "https://arxiv.org/abs/2302.12422#nvidia"
    , "https://arxiv.org/abs/2305.07764#google"
    , "https://arxiv.org/abs/2306.04930#microsoft"
    , "https://arxiv.org/abs/2306.12554"
    , "https://arxiv.org/abs/2306.14079"
    , "https://arxiv.org/abs/2308.01399"
    , "https://arxiv.org/abs/2310.04406"
    , "https://arxiv.org/abs/2310.06089"
    , "https://arxiv.org/abs/2310.15386"
    , "https://arxiv.org/abs/2311.01017"
    , "https://arxiv.org/abs/2311.05584"
    , "https://arxiv.org/abs/2312.04657"
    , "https://arxiv.org/abs/2312.06937"
    , "https://arxiv.org/abs/2312.09056"
    , "https://arxiv.org/abs/2312.17227"
    , "https://arxiv.org/abs/2404.12358"
    , "https://arxiv.org/abs/2405.15306"
    , "https://arxiv.org/abs/2405.20519"
    , "https://arxiv.org/abs/2406.06485"
    , "https://arxiv.org/abs/2406.06592#deepmind"
    , "https://arxiv.org/abs/2406.07394"
    , "https://arxiv.org/abs/2406.08404#schmidhuber"
    , "https://arxiv.org/abs/2406.10162#anthropic"
    , "https://dallasinnovates.com/exclusive-qa-john-carmacks-different-path-to-artificial-general-intelligence/"
    , "https://deepmindsafetyresearch.medium.com/designing-agent-incentives-to-avoid-reward-tampering-4380c1bb6cd"
    , "https://nv-tlabs.github.io/gameGAN/#nvidia"
    , "https://openreview.net/forum?id=YwDvofEWlEx"
    , "https://openreview.net/forum?id=psXVkKO9No#deepmind"
    , "https://research.google/blog/introducing-dreamer-scalable-reinforcement-learning-using-world-models/"
    , "https://www.biorxiv.org/content/10.1101/2021.03.15.435518.full"
    , "https://www.biorxiv.org/content/10.1101/2022.09.25.509419.full"
    , "https://www.biorxiv.org/content/10.1101/2023.04.04.535512.full"
    , "https://www.biorxiv.org/content/10.1101/2024.08.13.607810.full"
    , "https://www.nature.com/articles/s41467-022-35422-y"
    , "https://www.reuters.com/technology/artificial-intelligence/openai-co-founder-sutskevers-new-safety-focused-ai-startup-ssi-raises-1-billion-2024-09-04/"
    , "https://www.theatlantic.com/technology/archive/2023/11/openai-sam-altman-q-algorithm-breakthrough-project/676163/"
    ]
  , "world-models"
  )
, ( [ "/coin-flip"
    , "/doc/ai/1987-mcdermott.pdf"
    , "/doc/ai/nn/2013-clark.pdf"
    , "/doc/ai/tabular/2012-rintanen.pdf"
    , "/doc/psychology/neuroscience/2023-coulter.pdf"
    , "/doc/psychology/neuroscience/2023-lai.pdf"
    , "/doc/reinforcement-learning/imitation-learning/2018-gudmundsson.pdf"
    , "/doc/reinforcement-learning/imperfect-information/diplomacy/2022-bakhtin.pdf"
    , "/doc/reinforcement-learning/model/2000-cazenave.pdf"
    , "/doc/reinforcement-learning/model/2001-cazenave.pdf"
    , "/doc/reinforcement-learning/model/2010-silver.pdf"
    , "/doc/reinforcement-learning/model/2012-lipovetzky.pdf"
    , "/doc/reinforcement-learning/model/2013-auger.pdf"
    , "/doc/reinforcement-learning/model/2015-lipovetzky.pdf"
    , "/doc/reinforcement-learning/model/2018-eslami.pdf#deepmind"
    , "/doc/reinforcement-learning/model/2018-everitt.pdf"
    , "/doc/reinforcement-learning/model/2023-gao.pdf"
    , "/doc/reinforcement-learning/model/2024-wang-2.pdf"
    , "/doc/statistics/decision/2003-zadrozny.pdf"
    , "https://ai.stanford.edu/~pabbeel/pubs/AbbeelCoatesQuigleyNg_aaorltahf_nips2006.pdf"
    , "https://arxiv.org/abs/0909.0801"
    , "https://arxiv.org/abs/1301.6690"
    , "https://arxiv.org/abs/1401.5390"
    , "https://arxiv.org/abs/1411.5326#deepmind"
    , "https://arxiv.org/abs/1506.00779"
    , "https://arxiv.org/abs/1511.09249#schmidhuber"
    , "https://arxiv.org/abs/1602.02867#deepmind"
    , "https://arxiv.org/abs/1606.04442"
    , "https://arxiv.org/abs/1612.02179"
    , "https://arxiv.org/abs/1612.08810#deepmind"
    , "https://arxiv.org/abs/1702.07274"
    , "https://arxiv.org/abs/1703.04070"
    , "https://arxiv.org/abs/1704.07183"
    , "https://arxiv.org/abs/1704.08792"
    , "https://arxiv.org/abs/1705.02670"
    , "https://arxiv.org/abs/1705.07615"
    , "https://arxiv.org/abs/1705.08080"
    , "https://arxiv.org/abs/1706.09597"
    , "https://arxiv.org/abs/1707.03497#deepmind"
    , "https://arxiv.org/abs/1707.06170"
    , "https://arxiv.org/abs/1707.07012#google"
    , "https://arxiv.org/abs/1708.02596"
    , "https://arxiv.org/abs/1708.03871"
    , "https://arxiv.org/abs/1709.06390"
    , "https://arxiv.org/abs/1709.06917"
    , "https://arxiv.org/abs/1712.05556"
    , "https://arxiv.org/abs/1802.03676"
    , "https://arxiv.org/abs/1802.09127#google"
    , "https://arxiv.org/abs/1803.10122#google"
    , "https://arxiv.org/abs/1804.09028#ibm"
    , "https://arxiv.org/abs/1805.00909"
    , "https://arxiv.org/abs/1805.08166"
    , "https://arxiv.org/abs/1805.12114"
    , "https://arxiv.org/abs/1805.12244"
    , "https://arxiv.org/abs/1807.06763"
    , "https://arxiv.org/abs/1807.06906"
    , "https://arxiv.org/abs/1811.01458#deepmind"
    , "https://arxiv.org/abs/1811.04551#google"
    , "https://arxiv.org/abs/1905.10501"
    , "https://arxiv.org/abs/1906.05030"
    , "https://arxiv.org/abs/1906.08253"
    , "https://arxiv.org/abs/1910.03016"
    , "https://arxiv.org/abs/1910.06862"
    , "https://arxiv.org/abs/1912.01603#googledeepmind"
    , "https://arxiv.org/abs/1912.02807#deepmind"
    , "https://arxiv.org/abs/2001.00102"
    , "https://arxiv.org/abs/2002.07019"
    , "https://arxiv.org/abs/2003.03600"
    , "https://arxiv.org/abs/2003.08876"
    , "https://arxiv.org/abs/2004.14990"
    , "https://arxiv.org/abs/2005.05960"
    , "https://arxiv.org/abs/2005.12126#nvidia"
    , "https://arxiv.org/abs/2005.13239v6"
    , "https://arxiv.org/abs/2006.04757"
    , "https://arxiv.org/abs/2006.13888"
    , "https://arxiv.org/abs/2008.02215"
    , "https://arxiv.org/abs/2010.11895"
    , "https://arxiv.org/abs/2010.15835"
    , "https://arxiv.org/abs/2011.11751"
    , "https://arxiv.org/abs/2011.15091"
    , "https://arxiv.org/abs/2012.09812"
    , "https://arxiv.org/abs/2102.04518"
    , "https://arxiv.org/abs/2102.08363"
    , "https://arxiv.org/abs/2102.13249"
    , "https://arxiv.org/abs/2103.04909"
    , "https://arxiv.org/abs/2104.03946"
    , "https://arxiv.org/abs/2104.05336#deepmind"
    , "https://arxiv.org/abs/2104.14516"
    , "https://arxiv.org/abs/2106.00188"
    , "https://arxiv.org/abs/2106.04866"
    , "https://arxiv.org/abs/2106.13195#google"
    , "https://arxiv.org/abs/2109.08342"
    , "https://arxiv.org/abs/2109.09371"
    , "https://arxiv.org/abs/2109.10312"
    , "https://arxiv.org/abs/2110.01517"
    , "https://arxiv.org/abs/2111.02552"
    , "https://arxiv.org/abs/2111.07775"
    , "https://arxiv.org/abs/2111.09800"
    , "https://arxiv.org/abs/2112.05244"
    , "https://arxiv.org/abs/2201.07207#google"
    , "https://arxiv.org/abs/2201.12975"
    , "https://arxiv.org/abs/2202.01682"
    , "https://arxiv.org/abs/2202.01771"
    , "https://arxiv.org/abs/2202.02790"
    , "https://arxiv.org/abs/2203.00352"
    , "https://arxiv.org/abs/2203.08015"
    , "https://arxiv.org/abs/2203.13880"
    , "https://arxiv.org/abs/2204.01691#google"
    , "https://arxiv.org/abs/2204.05080#deepmind"
    , "https://arxiv.org/abs/2205.11495"
    , "https://arxiv.org/abs/2206.04114#google"
    , "https://arxiv.org/abs/2206.08332#deepmind"
    , "https://arxiv.org/abs/2206.11309#microsoft"
    , "https://arxiv.org/abs/2206.11795#openai"
    , "https://arxiv.org/abs/2206.14176"
    , "https://arxiv.org/abs/2207.04429"
    , "https://arxiv.org/abs/2207.05608#google"
    , "https://arxiv.org/abs/2207.13224#google"
    , "https://arxiv.org/abs/2207.13513"
    , "https://arxiv.org/abs/2208.02918#microsoft"
    , "https://arxiv.org/abs/2208.14928"
    , "https://arxiv.org/abs/2209.00588"
    , "https://arxiv.org/abs/2209.08466"
    , "https://arxiv.org/abs/2210.04435"
    , "https://arxiv.org/abs/2210.05805#facebook"
    , "https://arxiv.org/abs/2211.02703"
    , "https://arxiv.org/abs/2212.01508#deepmind"
    , "https://arxiv.org/abs/2212.04581"
    , "https://arxiv.org/abs/2301.04104#deepmind"
    , "https://arxiv.org/abs/2302.07350#deepmind"
    , "https://arxiv.org/abs/2302.12422#nvidia"
    , "https://arxiv.org/abs/2305.07764#google"
    , "https://arxiv.org/abs/2306.04930#microsoft"
    , "https://arxiv.org/abs/2306.12554"
    , "https://arxiv.org/abs/2306.14079"
    , "https://arxiv.org/abs/2307.08678"
    , "https://arxiv.org/abs/2308.01399"
    , "https://arxiv.org/abs/2310.04406"
    , "https://arxiv.org/abs/2310.06089"
    , "https://arxiv.org/abs/2310.15386"
    , "https://arxiv.org/abs/2311.01017"
    , "https://arxiv.org/abs/2311.05584"
    , "https://arxiv.org/abs/2312.04657"
    , "https://arxiv.org/abs/2312.06937"
    , "https://arxiv.org/abs/2312.09056"
    , "https://arxiv.org/abs/2312.17227"
    , "https://arxiv.org/abs/2404.12358"
    , "https://arxiv.org/abs/2405.20519"
    , "https://arxiv.org/abs/2406.03689"
    , "https://arxiv.org/abs/2406.06485"
    , "https://arxiv.org/abs/2406.06592#deepmind"
    , "https://arxiv.org/abs/2406.07394"
    , "https://arxiv.org/abs/2406.08404#schmidhuber"
    , "https://arxiv.org/abs/2406.10162#anthropic"
    , "https://deepmindsafetyresearch.medium.com/designing-agent-incentives-to-avoid-reward-tampering-4380c1bb6cd"
    , "https://nv-tlabs.github.io/gameGAN/#nvidia"
    , "https://openreview.net/forum?id=YwDvofEWlEx"
    , "https://openreview.net/forum?id=psXVkKO9No#deepmind"
    , "https://research.google/blog/introducing-dreamer-scalable-reinforcement-learning-using-world-models/"
    , "https://www.biorxiv.org/content/10.1101/2021.03.15.435518.full"
    , "https://www.biorxiv.org/content/10.1101/2022.09.25.509419.full"
    , "https://www.biorxiv.org/content/10.1101/2023.04.04.535512.full"
    , "https://www.nature.com/articles/s41467-022-35422-y"
    ]
  , "exploration-strategies"
  )
, ( [ "/coin-flip"
    , "/doc/ai/1987-mcdermott.pdf"
    , "/doc/ai/nn/2013-clark.pdf"
    , "/doc/ai/tabular/2012-rintanen.pdf"
    , "/doc/psychology/neuroscience/2023-coulter.pdf"
    , "/doc/psychology/neuroscience/2023-lai.pdf"
    , "/doc/reinforcement-learning/imitation-learning/2018-gudmundsson.pdf"
    , "/doc/reinforcement-learning/imperfect-information/diplomacy/2022-bakhtin.pdf"
    , "/doc/reinforcement-learning/model/2000-cazenave.pdf"
    , "/doc/reinforcement-learning/model/2001-cazenave.pdf"
    , "/doc/reinforcement-learning/model/2010-silver.pdf"
    , "/doc/reinforcement-learning/model/2012-lipovetzky.pdf"
    , "/doc/reinforcement-learning/model/2013-auger.pdf"
    , "/doc/reinforcement-learning/model/2015-lipovetzky.pdf"
    , "/doc/reinforcement-learning/model/2018-eslami.pdf#deepmind"
    , "/doc/reinforcement-learning/model/2018-everitt.pdf"
    , "/doc/reinforcement-learning/model/2023-gao.pdf"
    , "/doc/reinforcement-learning/model/2024-wang-2.pdf"
    , "https://ai.stanford.edu/~pabbeel/pubs/AbbeelCoatesQuigleyNg_aaorltahf_nips2006.pdf"
    , "https://arxiv.org/abs/0909.0801"
    , "https://arxiv.org/abs/1301.6690"
    , "https://arxiv.org/abs/1401.5390"
    , "https://arxiv.org/abs/1411.5326#deepmind"
    , "https://arxiv.org/abs/1506.00779"
    , "https://arxiv.org/abs/1511.09249#schmidhuber"
    , "https://arxiv.org/abs/1602.02867#deepmind"
    , "https://arxiv.org/abs/1606.04442"
    , "https://arxiv.org/abs/1612.02179"
    , "https://arxiv.org/abs/1612.08810#deepmind"
    , "https://arxiv.org/abs/1702.07274"
    , "https://arxiv.org/abs/1703.04070"
    , "https://arxiv.org/abs/1704.02254"
    , "https://arxiv.org/abs/1704.07183"
    , "https://arxiv.org/abs/1704.08792"
    , "https://arxiv.org/abs/1705.02670"
    , "https://arxiv.org/abs/1705.07615"
    , "https://arxiv.org/abs/1705.08080"
    , "https://arxiv.org/abs/1706.09597"
    , "https://arxiv.org/abs/1707.03497#deepmind"
    , "https://arxiv.org/abs/1707.06170"
    , "https://arxiv.org/abs/1707.07012#google"
    , "https://arxiv.org/abs/1708.02596"
    , "https://arxiv.org/abs/1708.03871"
    , "https://arxiv.org/abs/1709.06390"
    , "https://arxiv.org/abs/1709.06917"
    , "https://arxiv.org/abs/1712.05556"
    , "https://arxiv.org/abs/1802.03676"
    , "https://arxiv.org/abs/1802.09127#google"
    , "https://arxiv.org/abs/1803.10122#google"
    , "https://arxiv.org/abs/1804.09028#ibm"
    , "https://arxiv.org/abs/1805.00909"
    , "https://arxiv.org/abs/1805.08166"
    , "https://arxiv.org/abs/1805.12114"
    , "https://arxiv.org/abs/1805.12244"
    , "https://arxiv.org/abs/1807.06763"
    , "https://arxiv.org/abs/1807.06906"
    , "https://arxiv.org/abs/1811.01458#deepmind"
    , "https://arxiv.org/abs/1811.04551#google"
    , "https://arxiv.org/abs/1812.03973#google"
    , "https://arxiv.org/abs/1903.08942"
    , "https://arxiv.org/abs/1905.10501"
    , "https://arxiv.org/abs/1906.05030"
    , "https://arxiv.org/abs/1906.08253"
    , "https://arxiv.org/abs/1910.03016"
    , "https://arxiv.org/abs/1910.06862"
    , "https://arxiv.org/abs/1912.01603#googledeepmind"
    , "https://arxiv.org/abs/1912.02807#deepmind"
    , "https://arxiv.org/abs/2001.00102"
    , "https://arxiv.org/abs/2002.07019"
    , "https://arxiv.org/abs/2003.03600"
    , "https://arxiv.org/abs/2003.08876"
    , "https://arxiv.org/abs/2004.14990"
    , "https://arxiv.org/abs/2005.05960"
    , "https://arxiv.org/abs/2005.12126#nvidia"
    , "https://arxiv.org/abs/2005.13239v6"
    , "https://arxiv.org/abs/2006.04757"
    , "https://arxiv.org/abs/2006.13888"
    , "https://arxiv.org/abs/2008.02215"
    , "https://arxiv.org/abs/2010.11895"
    , "https://arxiv.org/abs/2010.15835"
    , "https://arxiv.org/abs/2011.11751"
    , "https://arxiv.org/abs/2011.15091"
    , "https://arxiv.org/abs/2012.09812"
    , "https://arxiv.org/abs/2102.04518"
    , "https://arxiv.org/abs/2102.08363"
    , "https://arxiv.org/abs/2102.13249"
    , "https://arxiv.org/abs/2103.04909"
    , "https://arxiv.org/abs/2104.03946"
    , "https://arxiv.org/abs/2104.05336#deepmind"
    , "https://arxiv.org/abs/2106.04866"
    , "https://arxiv.org/abs/2106.13195#google"
    , "https://arxiv.org/abs/2109.08342"
    , "https://arxiv.org/abs/2109.09371"
    , "https://arxiv.org/abs/2109.10312"
    , "https://arxiv.org/abs/2110.01517"
    , "https://arxiv.org/abs/2111.02552"
    , "https://arxiv.org/abs/2111.07775"
    , "https://arxiv.org/abs/2111.09800"
    , "https://arxiv.org/abs/2112.05244"
    , "https://arxiv.org/abs/2201.07207#google"
    , "https://arxiv.org/abs/2201.12975"
    , "https://arxiv.org/abs/2202.01682"
    , "https://arxiv.org/abs/2202.01771"
    , "https://arxiv.org/abs/2202.02790"
    , "https://arxiv.org/abs/2203.00352"
    , "https://arxiv.org/abs/2203.08015"
    , "https://arxiv.org/abs/2203.13880"
    , "https://arxiv.org/abs/2204.01691#google"
    , "https://arxiv.org/abs/2204.02863"
    , "https://arxiv.org/abs/2204.05080#deepmind"
    , "https://arxiv.org/abs/2205.11495"
    , "https://arxiv.org/abs/2206.04114#google"
    , "https://arxiv.org/abs/2206.08332#deepmind"
    , "https://arxiv.org/abs/2206.11795#openai"
    , "https://arxiv.org/abs/2206.14176"
    , "https://arxiv.org/abs/2207.04429"
    , "https://arxiv.org/abs/2207.05608#google"
    , "https://arxiv.org/abs/2207.13224#google"
    , "https://arxiv.org/abs/2207.13513"
    , "https://arxiv.org/abs/2208.02918#microsoft"
    , "https://arxiv.org/abs/2208.14928"
    , "https://arxiv.org/abs/2209.00588"
    , "https://arxiv.org/abs/2209.08466"
    , "https://arxiv.org/abs/2210.04435"
    , "https://arxiv.org/abs/2210.05805#facebook"
    , "https://arxiv.org/abs/2211.02703"
    , "https://arxiv.org/abs/2212.01508#deepmind"
    , "https://arxiv.org/abs/2212.04581"
    , "https://arxiv.org/abs/2301.04104#deepmind"
    , "https://arxiv.org/abs/2302.12422#nvidia"
    , "https://arxiv.org/abs/2305.07764#google"
    , "https://arxiv.org/abs/2306.12554"
    , "https://arxiv.org/abs/2306.14079"
    , "https://arxiv.org/abs/2307.08678"
    , "https://arxiv.org/abs/2308.01399"
    , "https://arxiv.org/abs/2310.04406"
    , "https://arxiv.org/abs/2310.06089"
    , "https://arxiv.org/abs/2310.15386"
    , "https://arxiv.org/abs/2311.01017"
    , "https://arxiv.org/abs/2311.05584"
    , "https://arxiv.org/abs/2312.04657"
    , "https://arxiv.org/abs/2312.06937"
    , "https://arxiv.org/abs/2312.09056"
    , "https://arxiv.org/abs/2312.17227"
    , "https://arxiv.org/abs/2404.12358"
    , "https://arxiv.org/abs/2405.14333#deepseek"
    , "https://arxiv.org/abs/2405.20519"
    , "https://arxiv.org/abs/2406.03689"
    , "https://arxiv.org/abs/2406.05946"
    , "https://arxiv.org/abs/2406.06485"
    , "https://arxiv.org/abs/2406.06592#deepmind"
    , "https://arxiv.org/abs/2406.07394"
    , "https://arxiv.org/abs/2406.08404#schmidhuber"
    , "https://arxiv.org/abs/2406.10162#anthropic"
    , "https://arxiv.org/abs/2410.01707"
    , "https://arxiv.org/abs/2410.07166"
    , "https://deepmindsafetyresearch.medium.com/designing-agent-incentives-to-avoid-reward-tampering-4380c1bb6cd"
    , "https://nv-tlabs.github.io/gameGAN/#nvidia"
    , "https://openreview.net/forum?id=YwDvofEWlEx"
    , "https://openreview.net/forum?id=psXVkKO9No#deepmind"
    , "https://research.google/blog/introducing-dreamer-scalable-reinforcement-learning-using-world-models/"
    , "https://www.biorxiv.org/content/10.1101/2022.09.25.509419.full"
    , "https://www.biorxiv.org/content/10.1101/2023.04.04.535512.full"
    , "https://www.nature.com/articles/s41467-022-35422-y"
    ]
  , "adaptive-planning"
  )
, ( [ "/coin-flip"
    , "/doc/ai/1987-mcdermott.pdf"
    , "/doc/ai/nn/2013-clark.pdf"
    , "/doc/ai/tabular/2012-rintanen.pdf"
    , "/doc/psychology/neuroscience/2023-coulter.pdf"
    , "/doc/psychology/neuroscience/2023-lai.pdf"
    , "/doc/reinforcement-learning/imitation-learning/2018-gudmundsson.pdf"
    , "/doc/reinforcement-learning/imperfect-information/diplomacy/2022-bakhtin.pdf"
    , "/doc/reinforcement-learning/model/2000-cazenave.pdf"
    , "/doc/reinforcement-learning/model/2001-cazenave.pdf"
    , "/doc/reinforcement-learning/model/2010-silver.pdf"
    , "/doc/reinforcement-learning/model/2012-lipovetzky.pdf"
    , "/doc/reinforcement-learning/model/2013-auger.pdf"
    , "/doc/reinforcement-learning/model/2015-lipovetzky.pdf"
    , "/doc/reinforcement-learning/model/2018-eslami.pdf#deepmind"
    , "/doc/reinforcement-learning/model/2018-everitt.pdf"
    , "/doc/reinforcement-learning/model/2023-gao.pdf"
    , "/doc/reinforcement-learning/model/2024-wang-2.pdf"
    , "https://ai.stanford.edu/~pabbeel/pubs/AbbeelCoatesQuigleyNg_aaorltahf_nips2006.pdf"
    , "https://arxiv.org/abs/0909.0801"
    , "https://arxiv.org/abs/1301.6690"
    , "https://arxiv.org/abs/1401.5390"
    , "https://arxiv.org/abs/1411.5326#deepmind"
    , "https://arxiv.org/abs/1506.00779"
    , "https://arxiv.org/abs/1511.09249#schmidhuber"
    , "https://arxiv.org/abs/1602.02867#deepmind"
    , "https://arxiv.org/abs/1606.04442"
    , "https://arxiv.org/abs/1612.02179"
    , "https://arxiv.org/abs/1612.08810#deepmind"
    , "https://arxiv.org/abs/1702.07274"
    , "https://arxiv.org/abs/1703.04070"
    , "https://arxiv.org/abs/1704.07183"
    , "https://arxiv.org/abs/1704.08792"
    , "https://arxiv.org/abs/1705.02670"
    , "https://arxiv.org/abs/1705.07615"
    , "https://arxiv.org/abs/1705.08080"
    , "https://arxiv.org/abs/1706.09597"
    , "https://arxiv.org/abs/1707.03497#deepmind"
    , "https://arxiv.org/abs/1707.06170"
    , "https://arxiv.org/abs/1707.07012#google"
    , "https://arxiv.org/abs/1708.02596"
    , "https://arxiv.org/abs/1708.03871"
    , "https://arxiv.org/abs/1709.06390"
    , "https://arxiv.org/abs/1709.06917"
    , "https://arxiv.org/abs/1712.05556"
    , "https://arxiv.org/abs/1802.03676"
    , "https://arxiv.org/abs/1803.10122#google"
    , "https://arxiv.org/abs/1804.09028#ibm"
    , "https://arxiv.org/abs/1805.00909"
    , "https://arxiv.org/abs/1805.08166"
    , "https://arxiv.org/abs/1805.12114"
    , "https://arxiv.org/abs/1805.12244"
    , "https://arxiv.org/abs/1807.06763"
    , "https://arxiv.org/abs/1807.06906"
    , "https://arxiv.org/abs/1811.01458#deepmind"
    , "https://arxiv.org/abs/1811.04551#google"
    , "https://arxiv.org/abs/1812.03973#google"
    , "https://arxiv.org/abs/1905.10501"
    , "https://arxiv.org/abs/1906.05030"
    , "https://arxiv.org/abs/1906.08253"
    , "https://arxiv.org/abs/1910.03016"
    , "https://arxiv.org/abs/1910.06862"
    , "https://arxiv.org/abs/1912.01603#googledeepmind"
    , "https://arxiv.org/abs/1912.02807#deepmind"
    , "https://arxiv.org/abs/2001.00102"
    , "https://arxiv.org/abs/2002.07019"
    , "https://arxiv.org/abs/2003.03600"
    , "https://arxiv.org/abs/2003.08876"
    , "https://arxiv.org/abs/2004.14990"
    , "https://arxiv.org/abs/2005.05960"
    , "https://arxiv.org/abs/2005.12126#nvidia"
    , "https://arxiv.org/abs/2005.13239v6"
    , "https://arxiv.org/abs/2006.04757"
    , "https://arxiv.org/abs/2006.13888"
    , "https://arxiv.org/abs/2007.09560"
    , "https://arxiv.org/abs/2008.02215"
    , "https://arxiv.org/abs/2010.11895"
    , "https://arxiv.org/abs/2010.15835"
    , "https://arxiv.org/abs/2011.11751"
    , "https://arxiv.org/abs/2011.15091"
    , "https://arxiv.org/abs/2012.09812"
    , "https://arxiv.org/abs/2102.04518"
    , "https://arxiv.org/abs/2102.08363"
    , "https://arxiv.org/abs/2102.13249"
    , "https://arxiv.org/abs/2103.04909"
    , "https://arxiv.org/abs/2104.03946"
    , "https://arxiv.org/abs/2104.05336#deepmind"
    , "https://arxiv.org/abs/2106.00188"
    , "https://arxiv.org/abs/2106.04651"
    , "https://arxiv.org/abs/2106.04866"
    , "https://arxiv.org/abs/2106.13195#google"
    , "https://arxiv.org/abs/2109.08342"
    , "https://arxiv.org/abs/2109.10312"
    , "https://arxiv.org/abs/2110.01517"
    , "https://arxiv.org/abs/2111.07775"
    , "https://arxiv.org/abs/2111.09800"
    , "https://arxiv.org/abs/2112.05244"
    , "https://arxiv.org/abs/2201.07207#google"
    , "https://arxiv.org/abs/2201.12975"
    , "https://arxiv.org/abs/2202.01682"
    , "https://arxiv.org/abs/2202.01771"
    , "https://arxiv.org/abs/2202.02790"
    , "https://arxiv.org/abs/2203.00352"
    , "https://arxiv.org/abs/2203.08015"
    , "https://arxiv.org/abs/2203.13880"
    , "https://arxiv.org/abs/2204.01691#google"
    , "https://arxiv.org/abs/2204.05080#deepmind"
    , "https://arxiv.org/abs/2205.10712"
    , "https://arxiv.org/abs/2205.11495"
    , "https://arxiv.org/abs/2206.04114#google"
    , "https://arxiv.org/abs/2206.08332#deepmind"
    , "https://arxiv.org/abs/2206.11795#openai"
    , "https://arxiv.org/abs/2206.14176"
    , "https://arxiv.org/abs/2207.04429"
    , "https://arxiv.org/abs/2207.05608#google"
    , "https://arxiv.org/abs/2207.13224#google"
    , "https://arxiv.org/abs/2207.13513"
    , "https://arxiv.org/abs/2208.02918#microsoft"
    , "https://arxiv.org/abs/2208.14928"
    , "https://arxiv.org/abs/2209.00588"
    , "https://arxiv.org/abs/2209.08466"
    , "https://arxiv.org/abs/2210.04435"
    , "https://arxiv.org/abs/2210.05805#facebook"
    , "https://arxiv.org/abs/2211.02703"
    , "https://arxiv.org/abs/2212.01508#deepmind"
    , "https://arxiv.org/abs/2212.04581"
    , "https://arxiv.org/abs/2301.04104#deepmind"
    , "https://arxiv.org/abs/2302.12422#nvidia"
    , "https://arxiv.org/abs/2306.04930#microsoft"
    , "https://arxiv.org/abs/2306.12554"
    , "https://arxiv.org/abs/2306.14079"
    , "https://arxiv.org/abs/2308.01399"
    , "https://arxiv.org/abs/2310.04406"
    , "https://arxiv.org/abs/2310.06089"
    , "https://arxiv.org/abs/2310.15386"
    , "https://arxiv.org/abs/2311.01017"
    , "https://arxiv.org/abs/2311.05584"
    , "https://arxiv.org/abs/2312.04657"
    , "https://arxiv.org/abs/2312.06937"
    , "https://arxiv.org/abs/2312.09056"
    , "https://arxiv.org/abs/2312.17227"
    , "https://arxiv.org/abs/2404.12358"
    , "https://arxiv.org/abs/2405.15306"
    , "https://arxiv.org/abs/2405.20519"
    , "https://arxiv.org/abs/2406.06485"
    , "https://arxiv.org/abs/2406.06592#deepmind"
    , "https://arxiv.org/abs/2406.07394"
    , "https://arxiv.org/abs/2406.08404#schmidhuber"
    , "https://arxiv.org/abs/2406.10162#anthropic"
    , "https://deepmindsafetyresearch.medium.com/designing-agent-incentives-to-avoid-reward-tampering-4380c1bb6cd"
    , "https://nv-tlabs.github.io/gameGAN/#nvidia"
    , "https://openreview.net/forum?id=YwDvofEWlEx"
    , "https://openreview.net/forum?id=psXVkKO9No#deepmind"
    , "https://research.google/blog/introducing-dreamer-scalable-reinforcement-learning-using-world-models/"
    , "https://www.biorxiv.org/content/10.1101/2021.03.15.435518.full"
    , "https://www.biorxiv.org/content/10.1101/2022.09.25.509419.full"
    , "https://www.biorxiv.org/content/10.1101/2023.04.04.535512.full"
    , "https://www.biorxiv.org/content/10.1101/2024.08.13.607810.full"
    , "https://www.nature.com/articles/s41467-022-35422-y"
    ]
  , "model-based-control"
  )
, ( [ "/coin-flip"
    , "/doc/ai/1987-mcdermott.pdf"
    , "/doc/ai/nn/2013-clark.pdf"
    , "/doc/ai/tabular/2012-rintanen.pdf"
    , "/doc/psychology/neuroscience/2023-coulter.pdf"
    , "/doc/psychology/neuroscience/2023-lai.pdf"
    , "/doc/reinforcement-learning/imitation-learning/2018-gudmundsson.pdf"
    , "/doc/reinforcement-learning/imperfect-information/diplomacy/2022-bakhtin.pdf"
    , "/doc/reinforcement-learning/model/2000-cazenave.pdf"
    , "/doc/reinforcement-learning/model/2001-cazenave.pdf"
    , "/doc/reinforcement-learning/model/2010-silver.pdf"
    , "/doc/reinforcement-learning/model/2012-lipovetzky.pdf"
    , "/doc/reinforcement-learning/model/2013-auger.pdf"
    , "/doc/reinforcement-learning/model/2015-lipovetzky.pdf"
    , "/doc/reinforcement-learning/model/2018-eslami.pdf#deepmind"
    , "/doc/reinforcement-learning/model/2018-everitt.pdf"
    , "/doc/reinforcement-learning/model/2023-gao.pdf"
    , "/doc/reinforcement-learning/robot/2006-bongard.pdf"
    , "/doc/statistics/decision/2003-zadrozny.pdf"
    , "https://ai.stanford.edu/~pabbeel/pubs/AbbeelCoatesQuigleyNg_aaorltahf_nips2006.pdf"
    , "https://arxiv.org/abs/0909.0801"
    , "https://arxiv.org/abs/1301.6690"
    , "https://arxiv.org/abs/1401.5390"
    , "https://arxiv.org/abs/1411.5326#deepmind"
    , "https://arxiv.org/abs/1506.00779"
    , "https://arxiv.org/abs/1511.09249#schmidhuber"
    , "https://arxiv.org/abs/1602.02867#deepmind"
    , "https://arxiv.org/abs/1606.04442"
    , "https://arxiv.org/abs/1612.02179"
    , "https://arxiv.org/abs/1612.08810#deepmind"
    , "https://arxiv.org/abs/1702.07274"
    , "https://arxiv.org/abs/1703.04070"
    , "https://arxiv.org/abs/1704.02254"
    , "https://arxiv.org/abs/1704.07183"
    , "https://arxiv.org/abs/1704.08792"
    , "https://arxiv.org/abs/1705.02670"
    , "https://arxiv.org/abs/1705.07615"
    , "https://arxiv.org/abs/1705.08080"
    , "https://arxiv.org/abs/1706.09597"
    , "https://arxiv.org/abs/1707.03497#deepmind"
    , "https://arxiv.org/abs/1707.06170"
    , "https://arxiv.org/abs/1707.07012#google"
    , "https://arxiv.org/abs/1708.02596"
    , "https://arxiv.org/abs/1708.03871"
    , "https://arxiv.org/abs/1709.06390"
    , "https://arxiv.org/abs/1709.06917"
    , "https://arxiv.org/abs/1712.05556"
    , "https://arxiv.org/abs/1802.03676"
    , "https://arxiv.org/abs/1802.09127#google"
    , "https://arxiv.org/abs/1803.10122#google"
    , "https://arxiv.org/abs/1805.00909"
    , "https://arxiv.org/abs/1805.08166"
    , "https://arxiv.org/abs/1805.12114"
    , "https://arxiv.org/abs/1805.12244"
    , "https://arxiv.org/abs/1807.06763"
    , "https://arxiv.org/abs/1807.06906"
    , "https://arxiv.org/abs/1811.01458#deepmind"
    , "https://arxiv.org/abs/1811.04551#google"
    , "https://arxiv.org/abs/1903.08942"
    , "https://arxiv.org/abs/1905.10501"
    , "https://arxiv.org/abs/1906.05030"
    , "https://arxiv.org/abs/1906.08253"
    , "https://arxiv.org/abs/1910.03016"
    , "https://arxiv.org/abs/1910.06862"
    , "https://arxiv.org/abs/1912.01603#googledeepmind"
    , "https://arxiv.org/abs/1912.02807#deepmind"
    , "https://arxiv.org/abs/2001.00102"
    , "https://arxiv.org/abs/2002.07019"
    , "https://arxiv.org/abs/2003.03600"
    , "https://arxiv.org/abs/2003.08876"
    , "https://arxiv.org/abs/2005.05960"
    , "https://arxiv.org/abs/2005.12126#nvidia"
    , "https://arxiv.org/abs/2005.13239v6"
    , "https://arxiv.org/abs/2006.04757"
    , "https://arxiv.org/abs/2006.13888"
    , "https://arxiv.org/abs/2007.09560"
    , "https://arxiv.org/abs/2008.02215"
    , "https://arxiv.org/abs/2010.11895"
    , "https://arxiv.org/abs/2010.15835"
    , "https://arxiv.org/abs/2011.11751"
    , "https://arxiv.org/abs/2011.15091"
    , "https://arxiv.org/abs/2012.09812"
    , "https://arxiv.org/abs/2102.04518"
    , "https://arxiv.org/abs/2102.08363"
    , "https://arxiv.org/abs/2102.13249"
    , "https://arxiv.org/abs/2103.04909"
    , "https://arxiv.org/abs/2104.03946"
    , "https://arxiv.org/abs/2104.05336#deepmind"
    , "https://arxiv.org/abs/2106.04651"
    , "https://arxiv.org/abs/2106.04866"
    , "https://arxiv.org/abs/2109.08342"
    , "https://arxiv.org/abs/2110.01517"
    , "https://arxiv.org/abs/2111.02552"
    , "https://arxiv.org/abs/2111.07775"
    , "https://arxiv.org/abs/2111.09800"
    , "https://arxiv.org/abs/2112.05244"
    , "https://arxiv.org/abs/2201.07207#google"
    , "https://arxiv.org/abs/2201.12975"
    , "https://arxiv.org/abs/2202.01682"
    , "https://arxiv.org/abs/2202.01771"
    , "https://arxiv.org/abs/2202.02790"
    , "https://arxiv.org/abs/2203.00352"
    , "https://arxiv.org/abs/2203.08015"
    , "https://arxiv.org/abs/2203.13880"
    , "https://arxiv.org/abs/2204.01691#google"
    , "https://arxiv.org/abs/2204.05080#deepmind"
    , "https://arxiv.org/abs/2205.11495"
    , "https://arxiv.org/abs/2206.04114#google"
    , "https://arxiv.org/abs/2206.08332#deepmind"
    , "https://arxiv.org/abs/2206.11795#openai"
    , "https://arxiv.org/abs/2206.14176"
    , "https://arxiv.org/abs/2207.04429"
    , "https://arxiv.org/abs/2207.05608#google"
    , "https://arxiv.org/abs/2207.13224#google"
    , "https://arxiv.org/abs/2207.13513"
    , "https://arxiv.org/abs/2208.14928"
    , "https://arxiv.org/abs/2209.00588"
    , "https://arxiv.org/abs/2209.08466"
    , "https://arxiv.org/abs/2210.04435"
    , "https://arxiv.org/abs/2210.05805#facebook"
    , "https://arxiv.org/abs/2211.02703"
    , "https://arxiv.org/abs/2212.01508#deepmind"
    , "https://arxiv.org/abs/2212.04581"
    , "https://arxiv.org/abs/2301.04104#deepmind"
    , "https://arxiv.org/abs/2302.12422#nvidia"
    , "https://arxiv.org/abs/2305.07764#google"
    , "https://arxiv.org/abs/2306.12554"
    , "https://arxiv.org/abs/2306.14079"
    , "https://arxiv.org/abs/2307.08678"
    , "https://arxiv.org/abs/2308.01399"
    , "https://arxiv.org/abs/2310.04406"
    , "https://arxiv.org/abs/2310.06089"
    , "https://arxiv.org/abs/2310.15386"
    , "https://arxiv.org/abs/2311.01017"
    , "https://arxiv.org/abs/2311.05584"
    , "https://arxiv.org/abs/2312.04657"
    , "https://arxiv.org/abs/2312.09056"
    , "https://arxiv.org/abs/2312.17227"
    , "https://arxiv.org/abs/2404.12358"
    , "https://arxiv.org/abs/2405.14333#deepseek"
    , "https://arxiv.org/abs/2405.15306"
    , "https://arxiv.org/abs/2405.20519"
    , "https://arxiv.org/abs/2406.03689"
    , "https://arxiv.org/abs/2406.05946"
    , "https://arxiv.org/abs/2406.06485"
    , "https://arxiv.org/abs/2406.06592#deepmind"
    , "https://arxiv.org/abs/2406.07394"
    , "https://arxiv.org/abs/2406.08404#schmidhuber"
    , "https://arxiv.org/abs/2406.10162#anthropic"
    , "https://arxiv.org/abs/2410.01707"
    , "https://deepmindsafetyresearch.medium.com/designing-agent-incentives-to-avoid-reward-tampering-4380c1bb6cd"
    , "https://nv-tlabs.github.io/gameGAN/#nvidia"
    , "https://openreview.net/forum?id=YwDvofEWlEx"
    , "https://openreview.net/forum?id=psXVkKO9No#deepmind"
    , "https://research.google/blog/introducing-dreamer-scalable-reinforcement-learning-using-world-models/"
    , "https://www.biorxiv.org/content/10.1101/2021.03.15.435518.full"
    , "https://www.biorxiv.org/content/10.1101/2023.04.04.535512.full"
    , "https://www.biorxiv.org/content/10.1101/2024.08.13.607810.full"
    ]
  , "world-models"
  )
, ( [ "/coin-flip"
    , "/doc/ai/1987-mcdermott.pdf"
    , "/doc/ai/nn/2013-clark.pdf"
    , "/doc/ai/tabular/2012-rintanen.pdf"
    , "/doc/psychology/neuroscience/2023-coulter.pdf"
    , "/doc/psychology/neuroscience/2023-lai.pdf"
    , "/doc/reinforcement-learning/imitation-learning/2018-gudmundsson.pdf"
    , "/doc/reinforcement-learning/imperfect-information/diplomacy/2022-bakhtin.pdf"
    , "/doc/reinforcement-learning/model/2000-cazenave.pdf"
    , "/doc/reinforcement-learning/model/2001-cazenave.pdf"
    , "/doc/reinforcement-learning/model/2010-silver.pdf"
    , "/doc/reinforcement-learning/model/2012-lipovetzky.pdf"
    , "/doc/reinforcement-learning/model/2013-auger.pdf"
    , "/doc/reinforcement-learning/model/2015-lipovetzky.pdf"
    , "/doc/reinforcement-learning/model/2018-eslami.pdf#deepmind"
    , "/doc/reinforcement-learning/model/2018-everitt.pdf"
    , "/doc/reinforcement-learning/model/2023-gao.pdf"
    , "/doc/reinforcement-learning/robot/2006-bongard.pdf"
    , "/doc/statistics/decision/2003-zadrozny.pdf"
    , "https://ai.stanford.edu/~pabbeel/pubs/AbbeelCoatesQuigleyNg_aaorltahf_nips2006.pdf"
    , "https://arxiv.org/abs/0909.0801"
    , "https://arxiv.org/abs/1301.6690"
    , "https://arxiv.org/abs/1401.5390"
    , "https://arxiv.org/abs/1411.5326#deepmind"
    , "https://arxiv.org/abs/1511.09249#schmidhuber"
    , "https://arxiv.org/abs/1602.02867#deepmind"
    , "https://arxiv.org/abs/1606.04442"
    , "https://arxiv.org/abs/1612.02179"
    , "https://arxiv.org/abs/1612.08810#deepmind"
    , "https://arxiv.org/abs/1702.07274"
    , "https://arxiv.org/abs/1703.04070"
    , "https://arxiv.org/abs/1704.02254"
    , "https://arxiv.org/abs/1704.07183"
    , "https://arxiv.org/abs/1704.08792"
    , "https://arxiv.org/abs/1705.02670"
    , "https://arxiv.org/abs/1705.07615"
    , "https://arxiv.org/abs/1705.08080"
    , "https://arxiv.org/abs/1706.09597"
    , "https://arxiv.org/abs/1707.03497#deepmind"
    , "https://arxiv.org/abs/1707.06170"
    , "https://arxiv.org/abs/1707.07012#google"
    , "https://arxiv.org/abs/1708.02596"
    , "https://arxiv.org/abs/1708.03871"
    , "https://arxiv.org/abs/1709.06390"
    , "https://arxiv.org/abs/1709.06917"
    , "https://arxiv.org/abs/1712.05556"
    , "https://arxiv.org/abs/1803.10122#google"
    , "https://arxiv.org/abs/1804.09028#ibm"
    , "https://arxiv.org/abs/1805.00909"
    , "https://arxiv.org/abs/1805.08166"
    , "https://arxiv.org/abs/1805.12114"
    , "https://arxiv.org/abs/1805.12244"
    , "https://arxiv.org/abs/1807.06763"
    , "https://arxiv.org/abs/1807.06906"
    , "https://arxiv.org/abs/1811.01458#deepmind"
    , "https://arxiv.org/abs/1811.04551#google"
    , "https://arxiv.org/abs/1812.03973#google"
    , "https://arxiv.org/abs/1905.10501"
    , "https://arxiv.org/abs/1906.05030"
    , "https://arxiv.org/abs/1906.08253"
    , "https://arxiv.org/abs/1910.03016"
    , "https://arxiv.org/abs/1910.06862"
    , "https://arxiv.org/abs/1912.01603#googledeepmind"
    , "https://arxiv.org/abs/1912.02807#deepmind"
    , "https://arxiv.org/abs/2001.00102"
    , "https://arxiv.org/abs/2002.07019"
    , "https://arxiv.org/abs/2003.03600"
    , "https://arxiv.org/abs/2003.08876"
    , "https://arxiv.org/abs/2004.14990"
    , "https://arxiv.org/abs/2005.05960"
    , "https://arxiv.org/abs/2005.12126#nvidia"
    , "https://arxiv.org/abs/2005.13239v6"
    , "https://arxiv.org/abs/2006.04757"
    , "https://arxiv.org/abs/2006.13888"
    , "https://arxiv.org/abs/2007.09560"
    , "https://arxiv.org/abs/2008.02215"
    , "https://arxiv.org/abs/2010.11895"
    , "https://arxiv.org/abs/2010.15835"
    , "https://arxiv.org/abs/2011.11751"
    , "https://arxiv.org/abs/2011.15091"
    , "https://arxiv.org/abs/2012.09812"
    , "https://arxiv.org/abs/2102.04518"
    , "https://arxiv.org/abs/2102.08363"
    , "https://arxiv.org/abs/2102.13249"
    , "https://arxiv.org/abs/2103.04909"
    , "https://arxiv.org/abs/2104.03946"
    , "https://arxiv.org/abs/2104.05336#deepmind"
    , "https://arxiv.org/abs/2104.14516"
    , "https://arxiv.org/abs/2106.00188"
    , "https://arxiv.org/abs/2106.04651"
    , "https://arxiv.org/abs/2106.04866"
    , "https://arxiv.org/abs/2106.13195#google"
    , "https://arxiv.org/abs/2109.08342"
    , "https://arxiv.org/abs/2109.09371"
    , "https://arxiv.org/abs/2109.10312"
    , "https://arxiv.org/abs/2110.01517"
    , "https://arxiv.org/abs/2111.07775"
    , "https://arxiv.org/abs/2111.09800"
    , "https://arxiv.org/abs/2112.05244"
    , "https://arxiv.org/abs/2112.11598"
    , "https://arxiv.org/abs/2201.07207#google"
    , "https://arxiv.org/abs/2201.12975"
    , "https://arxiv.org/abs/2202.01682"
    , "https://arxiv.org/abs/2202.01771"
    , "https://arxiv.org/abs/2202.02790"
    , "https://arxiv.org/abs/2203.00352"
    , "https://arxiv.org/abs/2203.08015"
    , "https://arxiv.org/abs/2203.13880"
    , "https://arxiv.org/abs/2204.01691#google"
    , "https://arxiv.org/abs/2204.02863"
    , "https://arxiv.org/abs/2204.05080#deepmind"
    , "https://arxiv.org/abs/2205.10712"
    , "https://arxiv.org/abs/2205.11495"
    , "https://arxiv.org/abs/2206.04114#google"
    , "https://arxiv.org/abs/2206.08332#deepmind"
    , "https://arxiv.org/abs/2206.11309#microsoft"
    , "https://arxiv.org/abs/2206.11795#openai"
    , "https://arxiv.org/abs/2206.14176"
    , "https://arxiv.org/abs/2207.04429"
    , "https://arxiv.org/abs/2207.05608#google"
    , "https://arxiv.org/abs/2207.13224#google"
    , "https://arxiv.org/abs/2207.13513"
    , "https://arxiv.org/abs/2208.02918#microsoft"
    , "https://arxiv.org/abs/2209.00588"
    , "https://arxiv.org/abs/2209.08466"
    , "https://arxiv.org/abs/2210.04435"
    , "https://arxiv.org/abs/2210.05805#facebook"
    , "https://arxiv.org/abs/2211.02703"
    , "https://arxiv.org/abs/2212.01508#deepmind"
    , "https://arxiv.org/abs/2212.04581"
    , "https://arxiv.org/abs/2301.04104#deepmind"
    , "https://arxiv.org/abs/2302.07350#deepmind"
    , "https://arxiv.org/abs/2302.12422#nvidia"
    , "https://arxiv.org/abs/2306.04930#microsoft"
    , "https://arxiv.org/abs/2310.04406"
    , "https://arxiv.org/abs/2310.06089"
    , "https://arxiv.org/abs/2310.15386"
    , "https://arxiv.org/abs/2311.01017"
    , "https://arxiv.org/abs/2311.05584"
    , "https://arxiv.org/abs/2312.04657"
    , "https://arxiv.org/abs/2312.06937"
    , "https://arxiv.org/abs/2312.09056"
    , "https://arxiv.org/abs/2312.17227"
    , "https://arxiv.org/abs/2404.12358"
    , "https://deepmindsafetyresearch.medium.com/designing-agent-incentives-to-avoid-reward-tampering-4380c1bb6cd"
    , "https://nv-tlabs.github.io/gameGAN/#nvidia"
    , "https://openreview.net/forum?id=YwDvofEWlEx"
    , "https://openreview.net/forum?id=psXVkKO9No#deepmind"
    , "https://research.google/blog/introducing-dreamer-scalable-reinforcement-learning-using-world-models/"
    , "https://www.biorxiv.org/content/10.1101/2021.03.15.435518.full"
    , "https://www.biorxiv.org/content/10.1101/2022.09.25.509419.full"
    , "https://www.biorxiv.org/content/10.1101/2023.04.04.535512.full"
    , "https://www.nature.com/articles/s41467-022-35422-y"
    , "https://www.ncbi.nlm.nih.gov/pmc/articles/PMC3559008/"
    ]
  , "world-models"
  )
, ( [ "/coin-flip"
    , "/doc/ai/1987-mcdermott.pdf"
    , "/doc/ai/nn/2013-clark.pdf"
    , "/doc/ai/tabular/2012-rintanen.pdf"
    , "/doc/psychology/neuroscience/2023-coulter.pdf"
    , "/doc/psychology/neuroscience/2023-lai.pdf"
    , "/doc/reinforcement-learning/imitation-learning/2018-gudmundsson.pdf"
    , "/doc/reinforcement-learning/imperfect-information/diplomacy/2022-bakhtin.pdf"
    , "/doc/reinforcement-learning/model/2000-cazenave.pdf"
    , "/doc/reinforcement-learning/model/2001-cazenave.pdf"
    , "/doc/reinforcement-learning/model/2010-silver.pdf"
    , "/doc/reinforcement-learning/model/2012-lipovetzky.pdf"
    , "/doc/reinforcement-learning/model/2013-auger.pdf"
    , "/doc/reinforcement-learning/model/2015-lipovetzky.pdf"
    , "/doc/reinforcement-learning/model/2018-eslami.pdf#deepmind"
    , "/doc/reinforcement-learning/model/2018-everitt.pdf"
    , "/doc/reinforcement-learning/model/2023-gao.pdf"
    , "/doc/reinforcement-learning/robot/2006-bongard.pdf"
    , "https://ai.stanford.edu/~pabbeel/pubs/AbbeelCoatesQuigleyNg_aaorltahf_nips2006.pdf"
    , "https://arxiv.org/abs/0909.0801"
    , "https://arxiv.org/abs/1301.6690"
    , "https://arxiv.org/abs/1401.5390"
    , "https://arxiv.org/abs/1411.5326#deepmind"
    , "https://arxiv.org/abs/1506.00779"
    , "https://arxiv.org/abs/1511.09249#schmidhuber"
    , "https://arxiv.org/abs/1602.02867#deepmind"
    , "https://arxiv.org/abs/1606.04442"
    , "https://arxiv.org/abs/1612.02179"
    , "https://arxiv.org/abs/1612.08810#deepmind"
    , "https://arxiv.org/abs/1703.04070"
    , "https://arxiv.org/abs/1704.02254"
    , "https://arxiv.org/abs/1704.07183"
    , "https://arxiv.org/abs/1704.08792"
    , "https://arxiv.org/abs/1705.02670"
    , "https://arxiv.org/abs/1705.07615"
    , "https://arxiv.org/abs/1705.08080"
    , "https://arxiv.org/abs/1706.09597"
    , "https://arxiv.org/abs/1707.03497#deepmind"
    , "https://arxiv.org/abs/1707.06170"
    , "https://arxiv.org/abs/1708.02596"
    , "https://arxiv.org/abs/1708.03871"
    , "https://arxiv.org/abs/1709.06390"
    , "https://arxiv.org/abs/1709.06917"
    , "https://arxiv.org/abs/1712.05556"
    , "https://arxiv.org/abs/1802.03676"
    , "https://arxiv.org/abs/1802.09127#google"
    , "https://arxiv.org/abs/1803.10122#google"
    , "https://arxiv.org/abs/1804.09028#ibm"
    , "https://arxiv.org/abs/1805.00909"
    , "https://arxiv.org/abs/1805.08166"
    , "https://arxiv.org/abs/1805.12114"
    , "https://arxiv.org/abs/1805.12244"
    , "https://arxiv.org/abs/1807.06763"
    , "https://arxiv.org/abs/1807.06906"
    , "https://arxiv.org/abs/1811.01458#deepmind"
    , "https://arxiv.org/abs/1811.04551#google"
    , "https://arxiv.org/abs/1903.08942"
    , "https://arxiv.org/abs/1905.10501"
    , "https://arxiv.org/abs/1906.05030"
    , "https://arxiv.org/abs/1906.08253"
    , "https://arxiv.org/abs/1910.03016"
    , "https://arxiv.org/abs/1910.06862"
    , "https://arxiv.org/abs/1912.01603#googledeepmind"
    , "https://arxiv.org/abs/1912.02807#deepmind"
    , "https://arxiv.org/abs/2001.00102"
    , "https://arxiv.org/abs/2002.07019"
    , "https://arxiv.org/abs/2003.03600"
    , "https://arxiv.org/abs/2003.08876"
    , "https://arxiv.org/abs/2004.14990"
    , "https://arxiv.org/abs/2005.05960"
    , "https://arxiv.org/abs/2005.12126#nvidia"
    , "https://arxiv.org/abs/2005.13239v6"
    , "https://arxiv.org/abs/2006.04757"
    , "https://arxiv.org/abs/2006.13888"
    , "https://arxiv.org/abs/2007.09560"
    , "https://arxiv.org/abs/2008.02215"
    , "https://arxiv.org/abs/2010.11895"
    , "https://arxiv.org/abs/2011.11751"
    , "https://arxiv.org/abs/2011.15091"
    , "https://arxiv.org/abs/2012.09812"
    , "https://arxiv.org/abs/2102.04518"
    , "https://arxiv.org/abs/2102.08363"
    , "https://arxiv.org/abs/2102.13249"
    , "https://arxiv.org/abs/2103.04909"
    , "https://arxiv.org/abs/2104.03946"
    , "https://arxiv.org/abs/2104.05336#deepmind"
    , "https://arxiv.org/abs/2104.14516"
    , "https://arxiv.org/abs/2106.00188"
    , "https://arxiv.org/abs/2106.04866"
    , "https://arxiv.org/abs/2106.13195#google"
    , "https://arxiv.org/abs/2109.08342"
    , "https://arxiv.org/abs/2109.09371"
    , "https://arxiv.org/abs/2109.10312"
    , "https://arxiv.org/abs/2110.01517"
    , "https://arxiv.org/abs/2111.02552"
    , "https://arxiv.org/abs/2111.07775"
    , "https://arxiv.org/abs/2111.09800"
    , "https://arxiv.org/abs/2112.05244"
    , "https://arxiv.org/abs/2201.07207#google"
    , "https://arxiv.org/abs/2202.01682"
    , "https://arxiv.org/abs/2202.01771"
    , "https://arxiv.org/abs/2202.02790"
    , "https://arxiv.org/abs/2203.00352"
    , "https://arxiv.org/abs/2203.08015"
    , "https://arxiv.org/abs/2203.13880"
    , "https://arxiv.org/abs/2204.01691#google"
    , "https://arxiv.org/abs/2204.02863"
    , "https://arxiv.org/abs/2204.05080#deepmind"
    , "https://arxiv.org/abs/2205.11495"
    , "https://arxiv.org/abs/2206.04114#google"
    , "https://arxiv.org/abs/2206.08332#deepmind"
    , "https://arxiv.org/abs/2206.11795#openai"
    , "https://arxiv.org/abs/2206.14176"
    , "https://arxiv.org/abs/2207.04429"
    , "https://arxiv.org/abs/2207.05608#google"
    , "https://arxiv.org/abs/2207.13224#google"
    , "https://arxiv.org/abs/2207.13513"
    , "https://arxiv.org/abs/2208.02918#microsoft"
    , "https://arxiv.org/abs/2208.14928"
    , "https://arxiv.org/abs/2209.00588"
    , "https://arxiv.org/abs/2209.08466"
    , "https://arxiv.org/abs/2210.04435"
    , "https://arxiv.org/abs/2210.05805#facebook"
    , "https://arxiv.org/abs/2211.02703"
    , "https://arxiv.org/abs/2212.01508#deepmind"
    , "https://arxiv.org/abs/2212.04581"
    , "https://arxiv.org/abs/2301.04104#deepmind"
    , "https://arxiv.org/abs/2302.07350#deepmind"
    , "https://arxiv.org/abs/2302.12422#nvidia"
    , "https://arxiv.org/abs/2305.07764#google"
    , "https://arxiv.org/abs/2306.12554"
    , "https://arxiv.org/abs/2306.14079"
    , "https://arxiv.org/abs/2307.08678"
    , "https://arxiv.org/abs/2308.01399"
    , "https://arxiv.org/abs/2310.04406"
    , "https://arxiv.org/abs/2310.06089"
    , "https://arxiv.org/abs/2310.15386"
    , "https://arxiv.org/abs/2311.01017"
    , "https://arxiv.org/abs/2311.05584"
    , "https://arxiv.org/abs/2312.04657"
    , "https://arxiv.org/abs/2312.06937"
    , "https://arxiv.org/abs/2312.09056"
    , "https://arxiv.org/abs/2312.17227"
    , "https://arxiv.org/abs/2404.12358"
    , "https://arxiv.org/abs/2405.20519"
    , "https://arxiv.org/abs/2406.06485"
    , "https://arxiv.org/abs/2406.06592#deepmind"
    , "https://arxiv.org/abs/2406.07394"
    , "https://arxiv.org/abs/2406.08404#schmidhuber"
    , "https://arxiv.org/abs/2406.10162#anthropic"
    , "https://deepmindsafetyresearch.medium.com/designing-agent-incentives-to-avoid-reward-tampering-4380c1bb6cd"
    , "https://nv-tlabs.github.io/gameGAN/#nvidia"
    , "https://openreview.net/forum?id=YwDvofEWlEx"
    , "https://openreview.net/forum?id=psXVkKO9No#deepmind"
    , "https://research.google/blog/introducing-dreamer-scalable-reinforcement-learning-using-world-models/"
    , "https://www.biorxiv.org/content/10.1101/2021.03.15.435518.full"
    , "https://www.biorxiv.org/content/10.1101/2023.04.04.535512.full"
    , "https://www.biorxiv.org/content/10.1101/2024.08.13.607810.full"
    ]
  , "world-models"
  )
, ( [ "/coin-flip"
    , "/doc/ai/1987-mcdermott.pdf"
    , "/doc/ai/nn/2013-clark.pdf"
    , "/doc/ai/tabular/2012-rintanen.pdf"
    , "/doc/reinforcement-learning/imitation-learning/2018-gudmundsson.pdf"
    , "/doc/reinforcement-learning/imperfect-information/diplomacy/2022-bakhtin.pdf"
    , "/doc/reinforcement-learning/model/2010-silver.pdf"
    , "/doc/reinforcement-learning/model/2013-auger.pdf"
    , "/doc/reinforcement-learning/model/2018-eslami.pdf#deepmind"
    , "/doc/reinforcement-learning/model/2018-everitt.pdf"
    , "/doc/reinforcement-learning/model/2023-gao.pdf"
    , "/doc/reinforcement-learning/model/2024-wang-2.pdf"
    , "/doc/reinforcement-learning/robot/2006-bongard.pdf"
    , "/doc/statistics/decision/2003-zadrozny.pdf"
    , "https://ai.stanford.edu/~pabbeel/pubs/AbbeelCoatesQuigleyNg_aaorltahf_nips2006.pdf"
    , "https://arxiv.org/abs/0909.0801"
    , "https://arxiv.org/abs/1301.6690"
    , "https://arxiv.org/abs/1401.5390"
    , "https://arxiv.org/abs/1411.5326#deepmind"
    , "https://arxiv.org/abs/1511.09249#schmidhuber"
    , "https://arxiv.org/abs/1602.02867#deepmind"
    , "https://arxiv.org/abs/1606.04442"
    , "https://arxiv.org/abs/1612.02179"
    , "https://arxiv.org/abs/1612.08810#deepmind"
    , "https://arxiv.org/abs/1702.07274"
    , "https://arxiv.org/abs/1703.04070"
    , "https://arxiv.org/abs/1704.02254"
    , "https://arxiv.org/abs/1704.07183"
    , "https://arxiv.org/abs/1704.08792"
    , "https://arxiv.org/abs/1705.02670"
    , "https://arxiv.org/abs/1705.07615"
    , "https://arxiv.org/abs/1705.08080"
    , "https://arxiv.org/abs/1706.09597"
    , "https://arxiv.org/abs/1707.03497#deepmind"
    , "https://arxiv.org/abs/1707.06170"
    , "https://arxiv.org/abs/1707.07012#google"
    , "https://arxiv.org/abs/1708.02596"
    , "https://arxiv.org/abs/1709.06390"
    , "https://arxiv.org/abs/1709.06917"
    , "https://arxiv.org/abs/1712.05556"
    , "https://arxiv.org/abs/1803.10122#google"
    , "https://arxiv.org/abs/1804.09028#ibm"
    , "https://arxiv.org/abs/1805.00909"
    , "https://arxiv.org/abs/1805.08166"
    , "https://arxiv.org/abs/1805.12114"
    , "https://arxiv.org/abs/1805.12244"
    , "https://arxiv.org/abs/1807.06906"
    , "https://arxiv.org/abs/1811.01458#deepmind"
    , "https://arxiv.org/abs/1811.04551#google"
    , "https://arxiv.org/abs/1812.03973#google"
    , "https://arxiv.org/abs/1905.10501"
    , "https://arxiv.org/abs/1906.05030"
    , "https://arxiv.org/abs/1906.08253"
    , "https://arxiv.org/abs/1910.03016"
    , "https://arxiv.org/abs/1910.06862"
    , "https://arxiv.org/abs/1912.01603#googledeepmind"
    , "https://arxiv.org/abs/1912.02807#deepmind"
    , "https://arxiv.org/abs/2001.00102"
    , "https://arxiv.org/abs/2002.07019"
    , "https://arxiv.org/abs/2003.08876"
    , "https://arxiv.org/abs/2004.14990"
    , "https://arxiv.org/abs/2005.05960"
    , "https://arxiv.org/abs/2005.12126#nvidia"
    , "https://arxiv.org/abs/2005.13239v6"
    , "https://arxiv.org/abs/2006.04757"
    , "https://arxiv.org/abs/2006.13888"
    , "https://arxiv.org/abs/2008.02215"
    , "https://arxiv.org/abs/2010.11895"
    , "https://arxiv.org/abs/2010.15835"
    , "https://arxiv.org/abs/2011.11751"
    , "https://arxiv.org/abs/2012.09812"
    , "https://arxiv.org/abs/2102.04518"
    , "https://arxiv.org/abs/2102.08363"
    , "https://arxiv.org/abs/2102.13249"
    , "https://arxiv.org/abs/2103.04909"
    , "https://arxiv.org/abs/2104.03946"
    , "https://arxiv.org/abs/2104.05336#deepmind"
    , "https://arxiv.org/abs/2104.14516"
    , "https://arxiv.org/abs/2106.00188"
    , "https://arxiv.org/abs/2106.04651"
    , "https://arxiv.org/abs/2106.13195#google"
    , "https://arxiv.org/abs/2109.08342"
    , "https://arxiv.org/abs/2109.09371"
    , "https://arxiv.org/abs/2109.10312"
    , "https://arxiv.org/abs/2110.01517"
    , "https://arxiv.org/abs/2111.02552"
    , "https://arxiv.org/abs/2111.07775"
    , "https://arxiv.org/abs/2111.09800"
    , "https://arxiv.org/abs/2112.05244"
    , "https://arxiv.org/abs/2112.11598"
    , "https://arxiv.org/abs/2201.07207#google"
    , "https://arxiv.org/abs/2201.12975"
    , "https://arxiv.org/abs/2202.01682"
    , "https://arxiv.org/abs/2202.01771"
    , "https://arxiv.org/abs/2202.02790"
    , "https://arxiv.org/abs/2203.00352"
    , "https://arxiv.org/abs/2203.08015"
    , "https://arxiv.org/abs/2203.13880"
    , "https://arxiv.org/abs/2204.01691#google"
    , "https://arxiv.org/abs/2204.05080#deepmind"
    , "https://arxiv.org/abs/2205.10712"
    , "https://arxiv.org/abs/2205.11495"
    , "https://arxiv.org/abs/2206.04114#google"
    , "https://arxiv.org/abs/2206.08332#deepmind"
    , "https://arxiv.org/abs/2206.11309#microsoft"
    , "https://arxiv.org/abs/2206.11795#openai"
    , "https://arxiv.org/abs/2206.14176"
    , "https://arxiv.org/abs/2207.04429"
    , "https://arxiv.org/abs/2207.05608#google"
    , "https://arxiv.org/abs/2207.13224#google"
    , "https://arxiv.org/abs/2207.13513"
    , "https://arxiv.org/abs/2208.02918#microsoft"
    , "https://arxiv.org/abs/2209.00588"
    , "https://arxiv.org/abs/2209.08466"
    , "https://arxiv.org/abs/2210.04435"
    , "https://arxiv.org/abs/2210.05805#facebook"
    , "https://arxiv.org/abs/2211.02703"
    , "https://arxiv.org/abs/2212.01508#deepmind"
    , "https://arxiv.org/abs/2212.04581"
    , "https://arxiv.org/abs/2301.04104#deepmind"
    , "https://arxiv.org/abs/2302.07350#deepmind"
    , "https://arxiv.org/abs/2302.12422#nvidia"
    , "https://arxiv.org/abs/2306.04930#microsoft"
    , "https://arxiv.org/abs/2310.04406"
    , "https://arxiv.org/abs/2310.06089"
    , "https://arxiv.org/abs/2310.15386"
    , "https://arxiv.org/abs/2311.01017"
    , "https://arxiv.org/abs/2311.05584"
    , "https://arxiv.org/abs/2312.04657"
    , "https://arxiv.org/abs/2312.06937"
    , "https://arxiv.org/abs/2312.09056"
    , "https://arxiv.org/abs/2312.17227"
    , "https://arxiv.org/abs/2404.12358"
    , "https://dallasinnovates.com/exclusive-qa-john-carmacks-different-path-to-artificial-general-intelligence/"
    , "https://deepmindsafetyresearch.medium.com/designing-agent-incentives-to-avoid-reward-tampering-4380c1bb6cd"
    , "https://nv-tlabs.github.io/gameGAN/#nvidia"
    , "https://openreview.net/forum?id=YwDvofEWlEx"
    , "https://openreview.net/forum?id=psXVkKO9No#deepmind"
    , "https://research.google/blog/introducing-dreamer-scalable-reinforcement-learning-using-world-models/"
    , "https://www.biorxiv.org/content/10.1101/2021.03.15.435518.full"
    , "https://www.biorxiv.org/content/10.1101/2022.09.25.509419.full"
    , "https://www.nature.com/articles/s41467-022-35422-y"
    , "https://www.theatlantic.com/technology/archive/2023/11/openai-sam-altman-q-algorithm-breakthrough-project/676163/"
    ]
  , "strategy-adaptation"
  )
, ( [ "/coin-flip"
    , "/doc/ai/1987-mcdermott.pdf"
    , "/doc/ai/nn/2013-clark.pdf"
    , "/doc/ai/tabular/2012-rintanen.pdf"
    , "/doc/reinforcement-learning/imitation-learning/2018-gudmundsson.pdf"
    , "/doc/reinforcement-learning/imperfect-information/diplomacy/2022-bakhtin.pdf"
    , "/doc/reinforcement-learning/model/2010-silver.pdf"
    , "/doc/reinforcement-learning/model/2013-auger.pdf"
    , "/doc/reinforcement-learning/model/2018-eslami.pdf#deepmind"
    , "/doc/reinforcement-learning/model/2018-everitt.pdf"
    , "/doc/reinforcement-learning/model/2023-gao.pdf"
    , "/doc/statistics/decision/2003-zadrozny.pdf"
    , "https://ai.stanford.edu/~pabbeel/pubs/AbbeelCoatesQuigleyNg_aaorltahf_nips2006.pdf"
    , "https://arxiv.org/abs/0909.0801"
    , "https://arxiv.org/abs/1301.6690"

…[File truncated due to length; see original file]…