# Python dependencies, installed with `pip install -r <this file>`.
# pip expects one requirement specifier per line.
# Entries with `==X.Y.*` accept any release within that X.Y series.
# Entries without a version specifier are unpinned and resolve to whatever
# version pip selects at install time.
fastapi==0.74.*
requests==2.27.*
sentencepiece==0.1.*
torch
transformers
uvicorn[standard]==0.17.*
peft
optimum
auto-gptq