Physics of Language Models: Part 2.2,
How to Learn From Mistakes on Grade-School Math Problems

Slide show (best viewed on a computer)

@article{YXLA2024-gsm2,
  author = {Ye, Tian and Xu, Zicheng and Li, Yuanzhi and {Allen-Zhu}, Zeyuan},
  title = {{Physics of Language Models: Part 2.2, How to Learn From Mistakes on Grade-School Math Problems}},
  journal = {ArXiv e-prints},
  year = 2024,
  month = aug,
  volume = {abs/2408.16293},
  note = {Full version available at \url{http://arxiv.org/abs/2408.16293}}
}