This project is inspired by the blog post scaling-test-time-compute and its accompanying GitHub code.
This is purely beginner-level code, aimed specifically at people with limited GPU resources; at least, that is what I intend it to be.
@misc{beeching2024scalingtesttimecompute,
  author = {Beeching, Edward and Tunstall, Lewis and Rush, Sasha},
  title  = {Scaling test-time compute with open models},
  year   = {2024},
  url    = {https://huggingface.co/spaces/HuggingFaceH4/blogpost-scaling-test-time-compute},
}
@misc{snell2024scalingllmtesttimecompute,
  author        = {Snell, Charlie and Lee, Jaehoon and Xu, Kelvin and Kumar, Aviral},
  title         = {Scaling {LLM} Test-Time Compute Optimally can be More Effective than Scaling Model Parameters},
  year          = {2024},
  eprint        = {2408.03314},
  archivePrefix = {arXiv},
  primaryClass  = {cs.LG},
  url           = {https://arxiv.org/abs/2408.03314},
}