# Python dependencies for this project, in pip requirements-file format.
# pip expects one requirement specifier per line; install with:
#   pip install -r <this file>
docx2txt==0.8
langchain==0.2.1
langchain_community==0.2.1
langchain_huggingface==0.0.3
sentencepiece==0.2.0
# NOTE(review): PyPDF2 is the only entry without a version pin, so installs
# resolve to whatever release is newest at install time. Consider pinning it
# to the version this project is tested against for reproducible builds.
PyPDF2