# Python dependencies, one requirement per line (pip requirements file format).
# Install with: pip install -r <this file>
gensim
hdbscan
nltk
numpy
openai>=1.0.0
pandas
plotly
regex
scikit-learn
seaborn
sentence-transformers
tiktoken
tokenizers
tqdm
# The [plot] extra installs umap-learn itself plus its plotting dependencies,
# so this single entry replaces the separate bare `umap-learn` requirement.
umap-learn[plot]