Skip to content

Latest commit

 

History

History
146 lines (94 loc) · 3.76 KB

math.md

File metadata and controls

146 lines (94 loc) · 3.76 KB

LLMs for Math

Here are some resources about LLMs for mathematics.

Method

Llemma: An Open Language Model For Mathematics

tag: Llemma | Proof-Pile-2

paper link: here

github link: here

dataset link: here

citation:

@misc{azerbayev2023llemma,
  title         = {{Llemma}: An Open Language Model For Mathematics},
  author        = {Azerbayev, Zhangir and Schoelkopf, Hailey and Paster, Keiran and Dos Santos, Marco and McAleer, Stephen and Jiang, Albert Q. and Deng, Jia and Biderman, Stella and Welleck, Sean},
  year          = {2023},
  eprint        = {2310.10631},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL}
}

MetaMath: Bootstrap Your Own Mathematical Questions for Large Language Models

tag: MetaMath | MetaMathQA

paper link: here

github link: here

dataset link: here

citation:

@misc{yu2023metamath,
  title         = {{MetaMath}: Bootstrap Your Own Mathematical Questions for Large Language Models},
  author        = {Yu, Longhui and Jiang, Weisen and Shi, Han and Yu, Jincheng and Liu, Zhengying and Zhang, Yu and Kwok, James T. and Li, Zhenguo and Weller, Adrian and Liu, Weiyang},
  year          = {2023},
  eprint        = {2309.12284},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL}
}

LeanDojo: Theorem Proving with Retrieval-Augmented Language Models

tag: LeanDojo

paper link: here

github link: here

citation:

@inproceedings{yang2023leandojo,
  author    = {Yang, Kaiyu and Swope, Aidan and Gu, Alex and Chalamala, Rahul and Song, Peiyang and Yu, Shixing and Godil, Saad and Prenger, Ryan and Anandkumar, Anima},
  title     = {{LeanDojo}: Theorem Proving with Retrieval-Augmented Language Models},
  booktitle = {Neural Information Processing Systems (NeurIPS)},
  year      = 2023
}

Let's Verify Step by Step

tag: PRM800K

paper link: here

github link: here

citation:

@misc{lightman2023lets,
  title         = {Let's Verify Step by Step},
  author        = {Lightman, Hunter and Kosaraju, Vineet and Burda, Yura and Edwards, Harri and Baker, Bowen and Lee, Teddy and Leike, Jan and Schulman, John and Sutskever, Ilya and Cobbe, Karl},
  year          = {2023},
  eprint        = {2305.20050},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG}
}

Corpus

Generative AI for Math: Part I -- MathPile: A Billion-Token-Scale Pretraining Corpus for Math

tag: MathPile

paper link: here

github link: here

dataset link: here

citation:

@misc{wang2023generative,
  title         = {Generative {AI} for Math: Part {I} -- {MathPile}: A Billion-Token-Scale Pretraining Corpus for Math},
  author        = {Wang, Zengzhi and Xia, Rui and Liu, Pengfei},
  year          = {2023},
  eprint        = {2312.17120},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL}
}

OpenWebMath: An Open Dataset of High-Quality Mathematical Web Text

tag: OpenWebMath

paper link: here

github link: here

dataset link: here

citation:

@misc{paster2023openwebmath,
  title         = {{OpenWebMath}: An Open Dataset of High-Quality Mathematical Web Text},
  author        = {Paster, Keiran and Dos Santos, Marco and Azerbayev, Zhangir and Ba, Jimmy},
  year          = {2023},
  eprint        = {2310.06786},
  archivePrefix = {arXiv},
  primaryClass  = {cs.AI}
}