kafka-python python-dotenv tweepy==3.9.0 pyspark==3.0.2 spacy scikit-learn cassandra-driver nltk