# Python dependencies, one requirement specifier per line as required by
# pip's requirements file format (install with `pip install -r <this file>`).

# Pinned to exact versions.
docx2txt==0.8
langchain==0.2.1
langchain-community==0.2.1
langchain-huggingface==0.0.3
sentencepiece==0.2.0
langdetect==1.0.9

# NOTE(review): the two packages below carry no version pin, so pip resolves
# whatever release is current at install time. Consider pinning them like the
# entries above for reproducible installs -- confirm known-good versions first.
PyMuPDF
protobuf