mmh3 pandas simhash scikit-learn torch transformers[torch]