3 files changed, 1058 insertions, 0 deletions
diff --git a/.gitignore b/.gitignore
index e69de29..cdd4086 100644
--- a/.gitignore
+++ b/.gitignore
@@ -0,0 +1 @@
+/textdistance-4.5.0.tar.gz
diff --git a/python-textdistance.spec b/python-textdistance.spec
new file mode 100644
index 0000000..2648353
--- /dev/null
+++ b/python-textdistance.spec
@@ -0,0 +1,1056 @@
+%global _empty_manifest_terminate_build 0
+Name:		python-textdistance
+Version:	4.5.0
+Release:	1
+Summary:	Compute distance between the two texts.
+License:	MIT
+URL:		https://github.com/orsinium/textdistance
+Source0:	https://mirrors.nju.edu.cn/pypi/web/packages/85/1e/2a567b5ad7ca6d2c0edce788e72a7ae6da088c3f8b7ffd20041e873518ee/textdistance-4.5.0.tar.gz
+BuildArch:	noarch
+
+Requires:	python3-jellyfish
+Requires:	python3-pyxDamerauLevenshtein
+Requires:	python3-rapidfuzz
+Requires:	python3-abydos
+Requires:	python3-distance
+Requires:	python3-jellyfish
+Requires:	python3-Levenshtein
+Requires:	python3-rapidfuzz
+Requires:	python3-Levenshtein
+Requires:	python3-rapidfuzz
+Requires:	python3-jellyfish
+Requires:	python3-rapidfuzz
+Requires:	python3-Levenshtein
+Requires:	python3-rapidfuzz
+Requires:	python3-abydos
+Requires:	python3-distance
+Requires:	python3-jellyfish
+Requires:	python3-numpy
+Requires:	python3-py-stringmatching
+Requires:	python3-pylev
+Requires:	python3-Levenshtein
+Requires:	python3-pyxDamerauLevenshtein
+Requires:	python3-rapidfuzz
+Requires:	python3-tabulate
+Requires:	python3-abydos
+Requires:	python3-distance
+Requires:	python3-jellyfish
+Requires:	python3-numpy
+Requires:	python3-py-stringmatching
+Requires:	python3-pylev
+Requires:	python3-Levenshtein
+Requires:	python3-pyxDamerauLevenshtein
+Requires:	python3-rapidfuzz
+Requires:	python3-tabulate
+Requires:	python3-abydos
+Requires:	python3-distance
+Requires:	python3-jellyfish
+Requires:	python3-numpy
+Requires:	python3-py-stringmatching
+Requires:	python3-pylev
+Requires:	python3-Levenshtein
+Requires:	python3-pyxDamerauLevenshtein
+Requires:	python3-rapidfuzz
+Requires:	python3-tabulate
+Requires:	python3-abydos
+Requires:	python3-jellyfish
+Requires:	python3-numpy
+Requires:	python3-Levenshtein
+Requires:	python3-pyxDamerauLevenshtein
+Requires:	python3-rapidfuzz
+Requires:	python3-abydos
+Requires:	python3-jellyfish
+Requires:	python3-numpy
+Requires:	python3-Levenshtein
+Requires:	python3-pyxDamerauLevenshtein
+Requires:	python3-rapidfuzz
+Requires:	python3-abydos
+Requires:	python3-jellyfish
+Requires:	python3-numpy
+Requires:	python3-Levenshtein
+Requires:	python3-pyxDamerauLevenshtein
+Requires:	python3-rapidfuzz
+Requires:	python3-flake8
+Requires:	python3-flake8-blind-except
+Requires:	python3-flake8-bugbear
+Requires:	python3-flake8-commas
+Requires:	python3-flake8-logging-format
+Requires:	python3-flake8-mutable
+Requires:	python3-flake8-pep3101
+Requires:	python3-flake8-quotes
+Requires:	python3-flake8-string-format
+Requires:	python3-flake8-tidy-imports
+Requires:	python3-isort
+Requires:	python3-mypy
+Requires:	python3-pep8-naming
+Requires:	python3-twine
+Requires:	python3-types-tabulate
+Requires:	python3-hypothesis
+Requires:	python3-isort
+Requires:	python3-numpy
+Requires:	python3-pytest
+
+%description
+# TextDistance
+
+![TextDistance logo](logo.png)
+
+[![Build Status](https://travis-ci.org/life4/textdistance.svg?branch=master)](https://travis-ci.org/life4/textdistance) [![PyPI version](https://img.shields.io/pypi/v/textdistance.svg)](https://pypi.python.org/pypi/textdistance) [![Status](https://img.shields.io/pypi/status/textdistance.svg)](https://pypi.python.org/pypi/textdistance) [![License](https://img.shields.io/pypi/l/textdistance.svg)](LICENSE)
+
+**TextDistance** -- python library for comparing distance between two or more sequences by many algorithms.
+
+Features:
+
+- 30+ algorithms
+- Pure python implementation
+- Simple usage
+- More than two sequences comparing
+- Some algorithms have more than one implementation in one class.
+- Optional numpy usage for maximum speed.
+
+## Algorithms
+
+### Edit based
+
+| Algorithm                                                                                 | Class                | Functions              |
+|-------------------------------------------------------------------------------------------|----------------------|------------------------|
+| [Hamming](https://en.wikipedia.org/wiki/Hamming_distance)                                 | `Hamming`            | `hamming`              |
+| [MLIPNS](http://www.sial.iias.spb.su/files/386-386-1-PB.pdf)                              | `Mlipns`             | `mlipns`               |
+| [Levenshtein](https://en.wikipedia.org/wiki/Levenshtein_distance)                         | `Levenshtein`        | `levenshtein`          |
+| [Damerau-Levenshtein](https://en.wikipedia.org/wiki/Damerau%E2%80%93Levenshtein_distance) | `DamerauLevenshtein` | `damerau_levenshtein`  |
+| [Jaro-Winkler](https://en.wikipedia.org/wiki/Jaro%E2%80%93Winkler_distance)               | `JaroWinkler`        | `jaro_winkler`, `jaro` |
+| [Strcmp95](http://cpansearch.perl.org/src/SCW/Text-JaroWinkler-0.1/strcmp95.c)            | `StrCmp95`           | `strcmp95`             |
+| [Needleman-Wunsch](https://en.wikipedia.org/wiki/Needleman%E2%80%93Wunsch_algorithm)      | `NeedlemanWunsch`    | `needleman_wunsch`     |
+| [Gotoh](http://bioinfo.ict.ac.cn/~dbu/AlgorithmCourses/Lectures/LOA/Lec6-Sequence-Alignment-Affine-Gaps-Gotoh1982.pdf) | `Gotoh`              | `gotoh`                |
+| [Smith-Waterman](https://en.wikipedia.org/wiki/Smith%E2%80%93Waterman_algorithm)          | `SmithWaterman`      | `smith_waterman`       |
+
+### Token based
+
+| Algorithm                                                                                 | Class                | Functions     |
+|-------------------------------------------------------------------------------------------|----------------------|---------------|
+| [Jaccard index](https://en.wikipedia.org/wiki/Jaccard_index)                              | `Jaccard`            | `jaccard`     |
+| [Sørensen–Dice coefficient](https://en.wikipedia.org/wiki/S%C3%B8rensen%E2%80%93Dice_coefficient) | `Sorensen`   | `sorensen`, `sorensen_dice`, `dice` |
+| [Tversky index](https://en.wikipedia.org/wiki/Tversky_index)                              | `Tversky`            | `tversky`    |
+| [Overlap coefficient](https://en.wikipedia.org/wiki/Overlap_coefficient)                  | `Overlap`            | `overlap`    |
+| [Tanimoto distance](https://en.wikipedia.org/wiki/Jaccard_index#Tanimoto_similarity_and_distance) | `Tanimoto`   | `tanimoto`   |
+| [Cosine similarity](https://en.wikipedia.org/wiki/Cosine_similarity)                      | `Cosine`             | `cosine`     |
+| [Monge-Elkan](https://www.academia.edu/200314/Generalized_Monge-Elkan_Method_for_Approximate_Text_String_Comparison) | `MongeElkan` | `monge_elkan` |
+| [Bag distance](https://github.com/Yomguithereal/talisman/blob/master/src/metrics/bag.js) | `Bag`        | `bag`        |
+
+### Sequence based
+
+| Algorithm | Class | Functions |
+|-----------|-------|-----------|
+| [longest common subsequence similarity](https://en.wikipedia.org/wiki/Longest_common_subsequence_problem)          | `LCSSeq` | `lcsseq` |
+| [longest common substring similarity](https://docs.python.org/2/library/difflib.html#difflib.SequenceMatcher)      | `LCSStr` | `lcsstr` |
+| [Ratcliff-Obershelp similarity](https://en.wikipedia.org/wiki/Gestalt_Pattern_Matching) | `RatcliffObershelp` | `ratcliff_obershelp` |
+
+### Compression based
+
+[Normalized compression distance](https://en.wikipedia.org/wiki/Normalized_compression_distance#Normalized_compression_distance) with different compression algorithms.
+
+Classic compression algorithms:
+
+| Algorithm                                                                  | Class       | Function     |
+|----------------------------------------------------------------------------|-------------|--------------|
+| [Arithmetic coding](https://en.wikipedia.org/wiki/Arithmetic_coding)       | `ArithNCD`  | `arith_ncd`  |
+| [RLE](https://en.wikipedia.org/wiki/Run-length_encoding)                   | `RLENCD`    | `rle_ncd`    |
+| [BWT RLE](https://en.wikipedia.org/wiki/Burrows%E2%80%93Wheeler_transform) | `BWTRLENCD` | `bwtrle_ncd` |
+
+Normal compression algorithms:
+
+| Algorithm                                                                  | Class        | Function      |
+|----------------------------------------------------------------------------|--------------|---------------|
+| Square Root                                                                | `SqrtNCD`    | `sqrt_ncd`    |
+| [Entropy](https://en.wikipedia.org/wiki/Entropy_(information_theory))      | `EntropyNCD` | `entropy_ncd` |
+
+Work in progress algorithms that compare two strings as array of bits:
+
+| Algorithm                                  | Class     | Function   |
+|--------------------------------------------|-----------|------------|
+| [BZ2](https://en.wikipedia.org/wiki/Bzip2) | `BZ2NCD`  | `bz2_ncd`  |
+| [LZMA](https://en.wikipedia.org/wiki/LZMA) | `LZMANCD` | `lzma_ncd` |
+| [ZLib](https://en.wikipedia.org/wiki/Zlib) | `ZLIBNCD` | `zlib_ncd` |
+
+See [blog post](https://articles.life4web.ru/other/ncd/) for more details about NCD.
+
+### Phonetic
+
+| Algorithm                                                                    | Class    | Functions |
+|------------------------------------------------------------------------------|----------|-----------|
+| [MRA](https://en.wikipedia.org/wiki/Match_rating_approach)                   | `MRA`    | `mra`     |
+| [Editex](https://anhaidgroup.github.io/py_stringmatching/v0.3.x/Editex.html) | `Editex` | `editex`  |
+
+### Simple
+
+| Algorithm           | Class      | Functions  |
+|---------------------|------------|------------|
+| Prefix similarity   | `Prefix`   | `prefix`   |
+| Postfix similarity  | `Postfix`  | `postfix`  |
+| Length distance     | `Length`   | `length`   |
+| Identity similarity | `Identity` | `identity` |
+| Matrix similarity   | `Matrix`   | `matrix`   |
+
+## Installation
+
+### Stable
+
+Only pure python implementation:
+
+```bash
+pip install textdistance
+```
+
+With extra libraries for maximum speed:
+
+```bash
+pip install "textdistance[extras]"
+```
+
+With all libraries (required for [benchmarking](#benchmarks) and [testing](#running-tests)):
+
+```bash
+pip install "textdistance[benchmark]"
+```
+
+With algorithm specific extras:
+
+```bash
+pip install "textdistance[Hamming]"
+```
+
+Algorithms with available extras: `DamerauLevenshtein`, `Hamming`, `Jaro`, `JaroWinkler`, `Levenshtein`.
+
+### Dev
+
+Via pip:
+
+```bash
+pip install -e git+https://github.com/life4/textdistance.git#egg=textdistance
+```
+
+Or clone repo and install with some extras:
+
+```bash
+git clone https://github.com/life4/textdistance.git
+pip install -e ".[benchmark]"
+```
+
+## Usage
+
+All algorithms have 2 interfaces:
+
+1. Class with algorithm-specific params for customizing.
+2. Class instance with default params for quick and simple usage.
+
+All algorithms have some common methods:
+
+1. `.distance(*sequences)` -- calculate distance between sequences.
+2. `.similarity(*sequences)` -- calculate similarity for sequences.
+3. `.maximum(*sequences)` -- maximum possible value for distance and similarity. For any sequence: `distance + similarity == maximum`.
+4. `.normalized_distance(*sequences)` -- normalized distance between sequences. The return value is a float between 0 and 1, where 0 means equal, and 1 totally different.
+5. `.normalized_similarity(*sequences)` -- normalized similarity for sequences. The return value is a float between 0 and 1, where 0 means totally different, and 1 equal.
+
+Most common init arguments:
+
+1. `qval` -- q-value for split sequences into q-grams. Possible values:
+    - 1 (default) -- compare sequences by chars.
+    - 2 or more -- transform sequences to q-grams.
+    - None -- split sequences by words.
+2. `as_set` -- for token-based algorithms:
+    - True -- `t` and `ttt` is equal.
+    - False (default) -- `t` and `ttt` is different.
+
+## Examples
+
+For example, [Hamming distance](https://en.wikipedia.org/wiki/Hamming_distance):
+
+```python
+import textdistance
+
+textdistance.hamming('test', 'text')
+# 1
+
+textdistance.hamming.distance('test', 'text')
+# 1
+
+textdistance.hamming.similarity('test', 'text')
+# 3
+
+textdistance.hamming.normalized_distance('test', 'text')
+# 0.25
+
+textdistance.hamming.normalized_similarity('test', 'text')
+# 0.75
+
+textdistance.Hamming(qval=2).distance('test', 'text')
+# 2
+
+```
+
+Any other algorithms have same interface.
+
+## Articles
+
+A few articles with examples how to use textdistance in the real world:
+
+- [Guide to Fuzzy Matching with Python](http://theautomatic.net/2019/11/13/guide-to-fuzzy-matching-with-python/)
+- [String similarity — the basic know your algorithms guide!](https://itnext.io/string-similarity-the-basic-know-your-algorithms-guide-3de3d7346227)
+- [Normalized compression distance](https://articles.life4web.ru/other/ncd/)
+
+## Extra libraries
+
+For main algorithms textdistance try to call known external libraries (fastest first) if available (installed in your system) and possible (this implementation can compare this type of sequences). [Install](#installation) textdistance with extras for this feature.
+
+You can disable this by passing `external=False` argument on init:
+
+```python3
+import textdistance
+hamming = textdistance.Hamming(external=False)
+hamming('text', 'testit')
+# 3
+```
+
+Supported libraries:
+
+1. [abydos](https://github.com/chrislit/abydos)
+1. [Distance](https://github.com/doukremt/distance)
+1. [jellyfish](https://github.com/jamesturk/jellyfish)
+1. [py_stringmatching](https://github.com/anhaidgroup/py_stringmatching)
+1. [pylev](https://github.com/toastdriven/pylev)
+1. [python-Levenshtein](https://github.com/ztane/python-Levenshtein)
+1. [pyxDamerauLevenshtein](https://github.com/gfairchild/pyxDamerauLevenshtein)
+
+Algorithms:
+
+1. DamerauLevenshtein
+1. Hamming
+1. Jaro
+1. JaroWinkler
+1. Levenshtein
+
+## Benchmarks
+
+Without extras installation:
+
+| algorithm          | library               |    time |
+|--------------------|-----------------------|---------|
+| DamerauLevenshtein | rapidfuzz             | 0.00312 |
+| DamerauLevenshtein | jellyfish             | 0.00591 |
+| DamerauLevenshtein | pyxdameraulevenshtein | 0.03335 |
+| DamerauLevenshtein | abydos                | 0.63278 |
+| DamerauLevenshtein | **textdistance**      | 0.83524 |
+| Hamming            | Levenshtein           | 0.00038 |
+| Hamming            | rapidfuzz             | 0.00044 |
+| Hamming            | jellyfish             | 0.00091 |
+| Hamming            | distance              | 0.00812 |
+| Hamming            | abydos                | 0.00902 |
+| Hamming            | **textdistance**      | 0.03531 |
+| Jaro               | rapidfuzz             | 0.00092 |
+| Jaro               | jellyfish             | 0.00191 |
+| Jaro               | **textdistance**      | 0.07365 |
+| JaroWinkler        | rapidfuzz             | 0.00094 |
+| JaroWinkler        | jellyfish             | 0.00195 |
+| JaroWinkler        | **textdistance**      | 0.07501 |
+| Levenshtein        | rapidfuzz             | 0.00099 |
+| Levenshtein        | Levenshtein           | 0.00122 |
+| Levenshtein        | jellyfish             | 0.00254 |
+| Levenshtein        | pylev                 | 0.15688 |
+| Levenshtein        | distance              | 0.28669 |
+| Levenshtein        | **textdistance**      | 0.53902 |
+| Levenshtein        | abydos                | 1.25783 |
+
+Total: 24 libs.
+
+Yeah, so slow. Use TextDistance on production only with extras.
+
+Textdistance use benchmark's results for algorithm's optimization and try to call fastest external lib first (if possible).
+
+You can run benchmark manually on your system:
+
+```bash
+pip install textdistance[benchmark]
+python3 -m textdistance.benchmark
+```
+
+TextDistance show benchmarks results table for your system and save libraries priorities into `libraries.json` file in TextDistance's folder. This file will be used by textdistance for calling fastest algorithm implementation. Default [libraries.json](textdistance/libraries.json) already included in package.
+
+## Running tests
+
+All you need is [task](https://taskfile.dev/). See [Taskfile.yml](./Taskfile.yml) for the list of available commands. For example, to run tests including third-party libraries usage, execute `task pytest-external:run`.
+
+## Contributing
+
+PRs are welcome!
+
+- Found a bug? Fix it!
+- Want to add more algorithms? Sure! Just make it with the same interface as other algorithms in the lib and add some tests.
+- Can make something faster? Great! Just avoid external dependencies and remember that everything should work not only with strings.
+- Something else that do you think is good? Do it! Just make sure that CI passes and everything from the README is still applicable (interface, features, and so on).
+- Have no time to code? Tell your friends and subscribers about `textdistance`. More users, more contributions, more amazing features.
+
+Thank you :heart:
+
+
+
+
+%package -n python3-textdistance
+Summary:	Compute distance between the two texts.
+Provides:	python-textdistance
+BuildRequires:	python3-devel
+BuildRequires:	python3-setuptools
+BuildRequires:	python3-pip
+%description -n python3-textdistance
+# TextDistance
+
+![TextDistance logo](logo.png)
+
+[![Build Status](https://travis-ci.org/life4/textdistance.svg?branch=master)](https://travis-ci.org/life4/textdistance) [![PyPI version](https://img.shields.io/pypi/v/textdistance.svg)](https://pypi.python.org/pypi/textdistance) [![Status](https://img.shields.io/pypi/status/textdistance.svg)](https://pypi.python.org/pypi/textdistance) [![License](https://img.shields.io/pypi/l/textdistance.svg)](LICENSE)
+
+**TextDistance** -- python library for comparing distance between two or more sequences by many algorithms.
+
+Features:
+
+- 30+ algorithms
+- Pure python implementation
+- Simple usage
+- More than two sequences comparing
+- Some algorithms have more than one implementation in one class.
+- Optional numpy usage for maximum speed.
+
+## Algorithms
+
+### Edit based
+
+| Algorithm                                                                                 | Class                | Functions              |
+|-------------------------------------------------------------------------------------------|----------------------|------------------------|
+| [Hamming](https://en.wikipedia.org/wiki/Hamming_distance)                                 | `Hamming`            | `hamming`              |
+| [MLIPNS](http://www.sial.iias.spb.su/files/386-386-1-PB.pdf)                              | `Mlipns`             | `mlipns`               |
+| [Levenshtein](https://en.wikipedia.org/wiki/Levenshtein_distance)                         | `Levenshtein`        | `levenshtein`          |
+| [Damerau-Levenshtein](https://en.wikipedia.org/wiki/Damerau%E2%80%93Levenshtein_distance) | `DamerauLevenshtein` | `damerau_levenshtein`  |
+| [Jaro-Winkler](https://en.wikipedia.org/wiki/Jaro%E2%80%93Winkler_distance)               | `JaroWinkler`        | `jaro_winkler`, `jaro` |
+| [Strcmp95](http://cpansearch.perl.org/src/SCW/Text-JaroWinkler-0.1/strcmp95.c)            | `StrCmp95`           | `strcmp95`             |
+| [Needleman-Wunsch](https://en.wikipedia.org/wiki/Needleman%E2%80%93Wunsch_algorithm)      | `NeedlemanWunsch`    | `needleman_wunsch`     |
+| [Gotoh](http://bioinfo.ict.ac.cn/~dbu/AlgorithmCourses/Lectures/LOA/Lec6-Sequence-Alignment-Affine-Gaps-Gotoh1982.pdf) | `Gotoh`              | `gotoh`                |
+| [Smith-Waterman](https://en.wikipedia.org/wiki/Smith%E2%80%93Waterman_algorithm)          | `SmithWaterman`      | `smith_waterman`       |
+
+### Token based
+
+| Algorithm                                                                                 | Class                | Functions     |
+|-------------------------------------------------------------------------------------------|----------------------|---------------|
+| [Jaccard index](https://en.wikipedia.org/wiki/Jaccard_index)                              | `Jaccard`            | `jaccard`     |
+| [Sørensen–Dice coefficient](https://en.wikipedia.org/wiki/S%C3%B8rensen%E2%80%93Dice_coefficient) | `Sorensen`   | `sorensen`, `sorensen_dice`, `dice` |
+| [Tversky index](https://en.wikipedia.org/wiki/Tversky_index)                              | `Tversky`            | `tversky`    |
+| [Overlap coefficient](https://en.wikipedia.org/wiki/Overlap_coefficient)                  | `Overlap`            | `overlap`    |
+| [Tanimoto distance](https://en.wikipedia.org/wiki/Jaccard_index#Tanimoto_similarity_and_distance) | `Tanimoto`   | `tanimoto`   |
+| [Cosine similarity](https://en.wikipedia.org/wiki/Cosine_similarity)                      | `Cosine`             | `cosine`     |
+| [Monge-Elkan](https://www.academia.edu/200314/Generalized_Monge-Elkan_Method_for_Approximate_Text_String_Comparison) | `MongeElkan` | `monge_elkan` |
+| [Bag distance](https://github.com/Yomguithereal/talisman/blob/master/src/metrics/bag.js) | `Bag`        | `bag`        |
+
+### Sequence based
+
+| Algorithm | Class | Functions |
+|-----------|-------|-----------|
+| [longest common subsequence similarity](https://en.wikipedia.org/wiki/Longest_common_subsequence_problem)          | `LCSSeq` | `lcsseq` |
+| [longest common substring similarity](https://docs.python.org/2/library/difflib.html#difflib.SequenceMatcher)      | `LCSStr` | `lcsstr` |
+| [Ratcliff-Obershelp similarity](https://en.wikipedia.org/wiki/Gestalt_Pattern_Matching) | `RatcliffObershelp` | `ratcliff_obershelp` |
+
+### Compression based
+
+[Normalized compression distance](https://en.wikipedia.org/wiki/Normalized_compression_distance#Normalized_compression_distance) with different compression algorithms.
+
+Classic compression algorithms:
+
+| Algorithm                                                                  | Class       | Function     |
+|----------------------------------------------------------------------------|-------------|--------------|
+| [Arithmetic coding](https://en.wikipedia.org/wiki/Arithmetic_coding)       | `ArithNCD`  | `arith_ncd`  |
+| [RLE](https://en.wikipedia.org/wiki/Run-length_encoding)                   | `RLENCD`    | `rle_ncd`    |
+| [BWT RLE](https://en.wikipedia.org/wiki/Burrows%E2%80%93Wheeler_transform) | `BWTRLENCD` | `bwtrle_ncd` |
+
+Normal compression algorithms:
+
+| Algorithm                                                                  | Class        | Function      |
+|----------------------------------------------------------------------------|--------------|---------------|
+| Square Root                                                                | `SqrtNCD`    | `sqrt_ncd`    |
+| [Entropy](https://en.wikipedia.org/wiki/Entropy_(information_theory))      | `EntropyNCD` | `entropy_ncd` |
+
+Work in progress algorithms that compare two strings as array of bits:
+
+| Algorithm                                  | Class     | Function   |
+|--------------------------------------------|-----------|------------|
+| [BZ2](https://en.wikipedia.org/wiki/Bzip2) | `BZ2NCD`  | `bz2_ncd`  |
+| [LZMA](https://en.wikipedia.org/wiki/LZMA) | `LZMANCD` | `lzma_ncd` |
+| [ZLib](https://en.wikipedia.org/wiki/Zlib) | `ZLIBNCD` | `zlib_ncd` |
+
+See [blog post](https://articles.life4web.ru/other/ncd/) for more details about NCD.
+
+### Phonetic
+
+| Algorithm                                                                    | Class    | Functions |
+|------------------------------------------------------------------------------|----------|-----------|
+| [MRA](https://en.wikipedia.org/wiki/Match_rating_approach)                   | `MRA`    | `mra`     |
+| [Editex](https://anhaidgroup.github.io/py_stringmatching/v0.3.x/Editex.html) | `Editex` | `editex`  |
+
+### Simple
+
+| Algorithm           | Class      | Functions  |
+|---------------------|------------|------------|
+| Prefix similarity   | `Prefix`   | `prefix`   |
+| Postfix similarity  | `Postfix`  | `postfix`  |
+| Length distance     | `Length`   | `length`   |
+| Identity similarity | `Identity` | `identity` |
+| Matrix similarity   | `Matrix`   | `matrix`   |
+
+## Installation
+
+### Stable
+
+Only pure python implementation:
+
+```bash
+pip install textdistance
+```
+
+With extra libraries for maximum speed:
+
+```bash
+pip install "textdistance[extras]"
+```
+
+With all libraries (required for [benchmarking](#benchmarks) and [testing](#running-tests)):
+
+```bash
+pip install "textdistance[benchmark]"
+```
+
+With algorithm specific extras:
+
+```bash
+pip install "textdistance[Hamming]"
+```
+
+Algorithms with available extras: `DamerauLevenshtein`, `Hamming`, `Jaro`, `JaroWinkler`, `Levenshtein`.
+
+### Dev
+
+Via pip:
+
+```bash
+pip install -e git+https://github.com/life4/textdistance.git#egg=textdistance
+```
+
+Or clone repo and install with some extras:
+
+```bash
+git clone https://github.com/life4/textdistance.git
+pip install -e ".[benchmark]"
+```
+
+## Usage
+
+All algorithms have 2 interfaces:
+
+1. Class with algorithm-specific params for customizing.
+2. Class instance with default params for quick and simple usage.
+
+All algorithms have some common methods:
+
+1. `.distance(*sequences)` -- calculate distance between sequences.
+2. `.similarity(*sequences)` -- calculate similarity for sequences.
+3. `.maximum(*sequences)` -- maximum possible value for distance and similarity. For any sequence: `distance + similarity == maximum`.
+4. `.normalized_distance(*sequences)` -- normalized distance between sequences. The return value is a float between 0 and 1, where 0 means equal, and 1 totally different.
+5. `.normalized_similarity(*sequences)` -- normalized similarity for sequences. The return value is a float between 0 and 1, where 0 means totally different, and 1 equal.
+
+Most common init arguments:
+
+1. `qval` -- q-value for split sequences into q-grams. Possible values:
+    - 1 (default) -- compare sequences by chars.
+    - 2 or more -- transform sequences to q-grams.
+    - None -- split sequences by words.
+2. `as_set` -- for token-based algorithms:
+    - True -- `t` and `ttt` is equal.
+    - False (default) -- `t` and `ttt` is different.
+
+## Examples
+
+For example, [Hamming distance](https://en.wikipedia.org/wiki/Hamming_distance):
+
+```python
+import textdistance
+
+textdistance.hamming('test', 'text')
+# 1
+
+textdistance.hamming.distance('test', 'text')
+# 1
+
+textdistance.hamming.similarity('test', 'text')
+# 3
+
+textdistance.hamming.normalized_distance('test', 'text')
+# 0.25
+
+textdistance.hamming.normalized_similarity('test', 'text')
+# 0.75
+
+textdistance.Hamming(qval=2).distance('test', 'text')
+# 2
+
+```
+
+Any other algorithms have same interface.
+
+## Articles
+
+A few articles with examples how to use textdistance in the real world:
+
+- [Guide to Fuzzy Matching with Python](http://theautomatic.net/2019/11/13/guide-to-fuzzy-matching-with-python/)
+- [String similarity — the basic know your algorithms guide!](https://itnext.io/string-similarity-the-basic-know-your-algorithms-guide-3de3d7346227)
+- [Normalized compression distance](https://articles.life4web.ru/other/ncd/)
+
+## Extra libraries
+
+For main algorithms textdistance try to call known external libraries (fastest first) if available (installed in your system) and possible (this implementation can compare this type of sequences). [Install](#installation) textdistance with extras for this feature.
+
+You can disable this by passing `external=False` argument on init:
+
+```python3
+import textdistance
+hamming = textdistance.Hamming(external=False)
+hamming('text', 'testit')
+# 3
+```
+
+Supported libraries:
+
+1. [abydos](https://github.com/chrislit/abydos)
+1. [Distance](https://github.com/doukremt/distance)
+1. [jellyfish](https://github.com/jamesturk/jellyfish)
+1. [py_stringmatching](https://github.com/anhaidgroup/py_stringmatching)
+1. [pylev](https://github.com/toastdriven/pylev)
+1. [python-Levenshtein](https://github.com/ztane/python-Levenshtein)
+1. [pyxDamerauLevenshtein](https://github.com/gfairchild/pyxDamerauLevenshtein)
+
+Algorithms:
+
+1. DamerauLevenshtein
+1. Hamming
+1. Jaro
+1. JaroWinkler
+1. Levenshtein
+
+## Benchmarks
+
+Without extras installation:
+
+| algorithm          | library               |    time |
+|--------------------|-----------------------|---------|
+| DamerauLevenshtein | rapidfuzz             | 0.00312 |
+| DamerauLevenshtein | jellyfish             | 0.00591 |
+| DamerauLevenshtein | pyxdameraulevenshtein | 0.03335 |
+| DamerauLevenshtein | abydos                | 0.63278 |
+| DamerauLevenshtein | **textdistance**      | 0.83524 |
+| Hamming            | Levenshtein           | 0.00038 |
+| Hamming            | rapidfuzz             | 0.00044 |
+| Hamming            | jellyfish             | 0.00091 |
+| Hamming            | distance              | 0.00812 |
+| Hamming            | abydos                | 0.00902 |
+| Hamming            | **textdistance**      | 0.03531 |
+| Jaro               | rapidfuzz             | 0.00092 |
+| Jaro               | jellyfish             | 0.00191 |
+| Jaro               | **textdistance**      | 0.07365 |
+| JaroWinkler        | rapidfuzz             | 0.00094 |
+| JaroWinkler        | jellyfish             | 0.00195 |
+| JaroWinkler        | **textdistance**      | 0.07501 |
+| Levenshtein        | rapidfuzz             | 0.00099 |
+| Levenshtein        | Levenshtein           | 0.00122 |
+| Levenshtein        | jellyfish             | 0.00254 |
+| Levenshtein        | pylev                 | 0.15688 |
+| Levenshtein        | distance              | 0.28669 |
+| Levenshtein        | **textdistance**      | 0.53902 |
+| Levenshtein        | abydos                | 1.25783 |
+
+Total: 24 libs.
+
+Yeah, so slow. Use TextDistance on production only with extras.
+
+Textdistance use benchmark's results for algorithm's optimization and try to call fastest external lib first (if possible).
+
+You can run benchmark manually on your system:
+
+```bash
+pip install textdistance[benchmark]
+python3 -m textdistance.benchmark
+```
+
+TextDistance show benchmarks results table for your system and save libraries priorities into `libraries.json` file in TextDistance's folder. This file will be used by textdistance for calling fastest algorithm implementation. Default [libraries.json](textdistance/libraries.json) already included in package.
+
+## Running tests
+
+All you need is [task](https://taskfile.dev/). See [Taskfile.yml](./Taskfile.yml) for the list of available commands. For example, to run tests including third-party libraries usage, execute `task pytest-external:run`.
+
+## Contributing
+
+PRs are welcome!
+
+- Found a bug? Fix it!
+- Want to add more algorithms? Sure! Just make it with the same interface as other algorithms in the lib and add some tests.
+- Can make something faster? Great! Just avoid external dependencies and remember that everything should work not only with strings.
+- Something else that do you think is good? Do it! Just make sure that CI passes and everything from the README is still applicable (interface, features, and so on).
+- Have no time to code? Tell your friends and subscribers about `textdistance`. More users, more contributions, more amazing features.
+
+Thank you :heart:
+
+
+
+
+%package help
+Summary:	Development documents and examples for textdistance
+Provides:	python3-textdistance-doc
+%description help
+# TextDistance
+
+![TextDistance logo](logo.png)
+
+[![Build Status](https://travis-ci.org/life4/textdistance.svg?branch=master)](https://travis-ci.org/life4/textdistance) [![PyPI version](https://img.shields.io/pypi/v/textdistance.svg)](https://pypi.python.org/pypi/textdistance) [![Status](https://img.shields.io/pypi/status/textdistance.svg)](https://pypi.python.org/pypi/textdistance) [![License](https://img.shields.io/pypi/l/textdistance.svg)](LICENSE)
+
+**TextDistance** -- python library for comparing distance between two or more sequences by many algorithms.
+
+Features:
+
+- 30+ algorithms
+- Pure python implementation
+- Simple usage
+- More than two sequences comparing
+- Some algorithms have more than one implementation in one class.
+- Optional numpy usage for maximum speed.
+
+## Algorithms
+
+### Edit based
+
+| Algorithm                                                                                 | Class                | Functions              |
+|-------------------------------------------------------------------------------------------|----------------------|------------------------|
+| [Hamming](https://en.wikipedia.org/wiki/Hamming_distance)                                 | `Hamming`            | `hamming`              |
+| [MLIPNS](http://www.sial.iias.spb.su/files/386-386-1-PB.pdf)                              | `Mlipns`             | `mlipns`               |
+| [Levenshtein](https://en.wikipedia.org/wiki/Levenshtein_distance)                         | `Levenshtein`        | `levenshtein`          |
+| [Damerau-Levenshtein](https://en.wikipedia.org/wiki/Damerau%E2%80%93Levenshtein_distance) | `DamerauLevenshtein` | `damerau_levenshtein`  |
+| [Jaro-Winkler](https://en.wikipedia.org/wiki/Jaro%E2%80%93Winkler_distance)               | `JaroWinkler`        | `jaro_winkler`, `jaro` |
+| [Strcmp95](http://cpansearch.perl.org/src/SCW/Text-JaroWinkler-0.1/strcmp95.c)            | `StrCmp95`           | `strcmp95`             |
+| [Needleman-Wunsch](https://en.wikipedia.org/wiki/Needleman%E2%80%93Wunsch_algorithm)      | `NeedlemanWunsch`    | `needleman_wunsch`     |
+| [Gotoh](http://bioinfo.ict.ac.cn/~dbu/AlgorithmCourses/Lectures/LOA/Lec6-Sequence-Alignment-Affine-Gaps-Gotoh1982.pdf) | `Gotoh`              | `gotoh`                |
+| [Smith-Waterman](https://en.wikipedia.org/wiki/Smith%E2%80%93Waterman_algorithm)          | `SmithWaterman`      | `smith_waterman`       |
+
+### Token based
+
+| Algorithm                                                                                 | Class                | Functions     |
+|-------------------------------------------------------------------------------------------|----------------------|---------------|
+| [Jaccard index](https://en.wikipedia.org/wiki/Jaccard_index)                              | `Jaccard`            | `jaccard`     |
+| [Sørensen–Dice coefficient](https://en.wikipedia.org/wiki/S%C3%B8rensen%E2%80%93Dice_coefficient) | `Sorensen`   | `sorensen`, `sorensen_dice`, `dice` |
+| [Tversky index](https://en.wikipedia.org/wiki/Tversky_index)                              | `Tversky`            | `tversky`    |
+| [Overlap coefficient](https://en.wikipedia.org/wiki/Overlap_coefficient)                  | `Overlap`            | `overlap`    |
+| [Tanimoto distance](https://en.wikipedia.org/wiki/Jaccard_index#Tanimoto_similarity_and_distance) | `Tanimoto`   | `tanimoto`   |
+| [Cosine similarity](https://en.wikipedia.org/wiki/Cosine_similarity)                      | `Cosine`             | `cosine`     |
+| [Monge-Elkan](https://www.academia.edu/200314/Generalized_Monge-Elkan_Method_for_Approximate_Text_String_Comparison) | `MongeElkan` | `monge_elkan` |
+| [Bag distance](https://github.com/Yomguithereal/talisman/blob/master/src/metrics/bag.js) | `Bag`        | `bag`        |
+
+### Sequence based
+
+| Algorithm | Class | Functions |
+|-----------|-------|-----------|
+| [longest common subsequence similarity](https://en.wikipedia.org/wiki/Longest_common_subsequence_problem)          | `LCSSeq` | `lcsseq` |
+| [longest common substring similarity](https://docs.python.org/2/library/difflib.html#difflib.SequenceMatcher)      | `LCSStr` | `lcsstr` |
+| [Ratcliff-Obershelp similarity](https://en.wikipedia.org/wiki/Gestalt_Pattern_Matching) | `RatcliffObershelp` | `ratcliff_obershelp` |
+
+### Compression based
+
+[Normalized compression distance](https://en.wikipedia.org/wiki/Normalized_compression_distance#Normalized_compression_distance) with different compression algorithms.
+
+Classic compression algorithms:
+
+| Algorithm                                                                  | Class       | Function     |
+|----------------------------------------------------------------------------|-------------|--------------|
+| [Arithmetic coding](https://en.wikipedia.org/wiki/Arithmetic_coding)       | `ArithNCD`  | `arith_ncd`  |
+| [RLE](https://en.wikipedia.org/wiki/Run-length_encoding)                   | `RLENCD`    | `rle_ncd`    |
+| [BWT RLE](https://en.wikipedia.org/wiki/Burrows%E2%80%93Wheeler_transform) | `BWTRLENCD` | `bwtrle_ncd` |
+
+Normal compression algorithms:
+
+| Algorithm                                                                  | Class        | Function      |
+|----------------------------------------------------------------------------|--------------|---------------|
+| Square Root                                                                | `SqrtNCD`    | `sqrt_ncd`    |
+| [Entropy](https://en.wikipedia.org/wiki/Entropy_(information_theory))      | `EntropyNCD` | `entropy_ncd` |
+
+Work in progress algorithms that compare two strings as array of bits:
+
+| Algorithm                                  | Class     | Function   |
+|--------------------------------------------|-----------|------------|
+| [BZ2](https://en.wikipedia.org/wiki/Bzip2) | `BZ2NCD`  | `bz2_ncd`  |
+| [LZMA](https://en.wikipedia.org/wiki/LZMA) | `LZMANCD` | `lzma_ncd` |
+| [ZLib](https://en.wikipedia.org/wiki/Zlib) | `ZLIBNCD` | `zlib_ncd` |
+
+See [blog post](https://articles.life4web.ru/other/ncd/) for more details about NCD.
+
+### Phonetic
+
+| Algorithm                                                                    | Class    | Functions |
+|------------------------------------------------------------------------------|----------|-----------|
+| [MRA](https://en.wikipedia.org/wiki/Match_rating_approach)                   | `MRA`    | `mra`     |
+| [Editex](https://anhaidgroup.github.io/py_stringmatching/v0.3.x/Editex.html) | `Editex` | `editex`  |
+
+### Simple
+
+| Algorithm           | Class      | Functions  |
+|---------------------|------------|------------|
+| Prefix similarity   | `Prefix`   | `prefix`   |
+| Postfix similarity  | `Postfix`  | `postfix`  |
+| Length distance     | `Length`   | `length`   |
+| Identity similarity | `Identity` | `identity` |
+| Matrix similarity   | `Matrix`   | `matrix`   |
+
+## Installation
+
+### Stable
+
+Only pure python implementation:
+
+```bash
+pip install textdistance
+```
+
+With extra libraries for maximum speed:
+
+```bash
+pip install "textdistance[extras]"
+```
+
+With all libraries (required for [benchmarking](#benchmarks) and [testing](#running-tests)):
+
+```bash
+pip install "textdistance[benchmark]"
+```
+
+With algorithm specific extras:
+
+```bash
+pip install "textdistance[Hamming]"
+```
+
+Algorithms with available extras: `DamerauLevenshtein`, `Hamming`, `Jaro`, `JaroWinkler`, `Levenshtein`.
+
+### Dev
+
+Via pip:
+
+```bash
+pip install -e git+https://github.com/life4/textdistance.git#egg=textdistance
+```
+
+Or clone repo and install with some extras:
+
+```bash
+git clone https://github.com/life4/textdistance.git
+pip install -e ".[benchmark]"
+```
+
+## Usage
+
+All algorithms have 2 interfaces:
+
+1. Class with algorithm-specific params for customizing.
+2. Class instance with default params for quick and simple usage.
+
+All algorithms have some common methods:
+
+1. `.distance(*sequences)` -- calculate distance between sequences.
+2. `.similarity(*sequences)` -- calculate similarity for sequences.
+3. `.maximum(*sequences)` -- maximum possible value for distance and similarity. For any sequence: `distance + similarity == maximum`.
+4. `.normalized_distance(*sequences)` -- normalized distance between sequences. The return value is a float between 0 and 1, where 0 means equal, and 1 totally different.
+5. `.normalized_similarity(*sequences)` -- normalized similarity for sequences. The return value is a float between 0 and 1, where 0 means totally different, and 1 equal.
+
+Most common init arguments:
+
+1. `qval` -- q-value for split sequences into q-grams. Possible values:
+    - 1 (default) -- compare sequences by chars.
+    - 2 or more -- transform sequences to q-grams.
+    - None -- split sequences by words.
+2. `as_set` -- for token-based algorithms:
+    - True -- `t` and `ttt` is equal.
+    - False (default) -- `t` and `ttt` is different.
+
+## Examples
+
+For example, [Hamming distance](https://en.wikipedia.org/wiki/Hamming_distance):
+
+```python
+import textdistance
+
+textdistance.hamming('test', 'text')
+# 1
+
+textdistance.hamming.distance('test', 'text')
+# 1
+
+textdistance.hamming.similarity('test', 'text')
+# 3
+
+textdistance.hamming.normalized_distance('test', 'text')
+# 0.25
+
+textdistance.hamming.normalized_similarity('test', 'text')
+# 0.75
+
+textdistance.Hamming(qval=2).distance('test', 'text')
+# 2
+
+```
+
+Any other algorithms have same interface.
+
+## Articles
+
+A few articles with examples how to use textdistance in the real world:
+
+- [Guide to Fuzzy Matching with Python](http://theautomatic.net/2019/11/13/guide-to-fuzzy-matching-with-python/)
+- [String similarity — the basic know your algorithms guide!](https://itnext.io/string-similarity-the-basic-know-your-algorithms-guide-3de3d7346227)
+- [Normalized compression distance](https://articles.life4web.ru/other/ncd/)
+
+## Extra libraries
+
+For main algorithms textdistance try to call known external libraries (fastest first) if available (installed in your system) and possible (this implementation can compare this type of sequences). [Install](#installation) textdistance with extras for this feature.
+
+You can disable this by passing `external=False` argument on init:
+
+```python3
+import textdistance
+hamming = textdistance.Hamming(external=False)
+hamming('text', 'testit')
+# 3
+```
+
+Supported libraries:
+
+1. [abydos](https://github.com/chrislit/abydos)
+1. [Distance](https://github.com/doukremt/distance)
+1. [jellyfish](https://github.com/jamesturk/jellyfish)
+1. [py_stringmatching](https://github.com/anhaidgroup/py_stringmatching)
+1. [pylev](https://github.com/toastdriven/pylev)
+1. [python-Levenshtein](https://github.com/ztane/python-Levenshtein)
+1. [pyxDamerauLevenshtein](https://github.com/gfairchild/pyxDamerauLevenshtein)
+
+Algorithms:
+
+1. DamerauLevenshtein
+1. Hamming
+1. Jaro
+1. JaroWinkler
+1. Levenshtein
+
+## Benchmarks
+
+Without extras installation:
+
+| algorithm          | library               |    time |
+|--------------------|-----------------------|---------|
+| DamerauLevenshtein | rapidfuzz             | 0.00312 |
+| DamerauLevenshtein | jellyfish             | 0.00591 |
+| DamerauLevenshtein | pyxdameraulevenshtein | 0.03335 |
+| DamerauLevenshtein | abydos                | 0.63278 |
+| DamerauLevenshtein | **textdistance**      | 0.83524 |
+| Hamming            | Levenshtein           | 0.00038 |
+| Hamming            | rapidfuzz             | 0.00044 |
+| Hamming            | jellyfish             | 0.00091 |
+| Hamming            | distance              | 0.00812 |
+| Hamming            | abydos                | 0.00902 |
+| Hamming            | **textdistance**      | 0.03531 |
+| Jaro               | rapidfuzz             | 0.00092 |
+| Jaro               | jellyfish             | 0.00191 |
+| Jaro               | **textdistance**      | 0.07365 |
+| JaroWinkler        | rapidfuzz             | 0.00094 |
+| JaroWinkler        | jellyfish             | 0.00195 |
+| JaroWinkler        | **textdistance**      | 0.07501 |
+| Levenshtein        | rapidfuzz             | 0.00099 |
+| Levenshtein        | Levenshtein           | 0.00122 |
+| Levenshtein        | jellyfish             | 0.00254 |
+| Levenshtein        | pylev                 | 0.15688 |
+| Levenshtein        | distance              | 0.28669 |
+| Levenshtein        | **textdistance**      | 0.53902 |
+| Levenshtein        | abydos                | 1.25783 |
+
+Total: 24 libs.
+
+Yeah, so slow. Use TextDistance on production only with extras.
+
+Textdistance use benchmark's results for algorithm's optimization and try to call fastest external lib first (if possible).
+
+You can run benchmark manually on your system:
+
+```bash
+pip install textdistance[benchmark]
+python3 -m textdistance.benchmark
+```
+
+TextDistance show benchmarks results table for your system and save libraries priorities into `libraries.json` file in TextDistance's folder. This file will be used by textdistance for calling fastest algorithm implementation. Default [libraries.json](textdistance/libraries.json) already included in package.
+
+## Running tests
+
+All you need is [task](https://taskfile.dev/). See [Taskfile.yml](./Taskfile.yml) for the list of available commands. For example, to run tests including third-party libraries usage, execute `task pytest-external:run`.
+
+## Contributing
+
+PRs are welcome!
+
+- Found a bug? Fix it!
+- Want to add more algorithms? Sure! Just make it with the same interface as other algorithms in the lib and add some tests.
+- Can make something faster? Great! Just avoid external dependencies and remember that everything should work not only with strings.
+- Something else that do you think is good? Do it! Just make sure that CI passes and everything from the README is still applicable (interface, features, and so on).
+- Have no time to code? Tell your friends and subscribers about `textdistance`. More users, more contributions, more amazing features.
+
+Thank you :heart:
+
+
+
+
+%prep
+%autosetup -n textdistance-4.5.0
+
+%build
+%py3_build
+
+%install
+%py3_install
+install -d -m755 %{buildroot}/%{_pkgdocdir}
+if [ -d doc ]; then cp -arf doc %{buildroot}/%{_pkgdocdir}; fi
+if [ -d docs ]; then cp -arf docs %{buildroot}/%{_pkgdocdir}; fi
+if [ -d example ]; then cp -arf example %{buildroot}/%{_pkgdocdir}; fi
+if [ -d examples ]; then cp -arf examples %{buildroot}/%{_pkgdocdir}; fi
+pushd %{buildroot}
+if [ -d usr/lib ]; then
+	find usr/lib -type f -printf "/%h/%f\n" >> filelist.lst
+fi
+if [ -d usr/lib64 ]; then
+	find usr/lib64 -type f -printf "/%h/%f\n" >> filelist.lst
+fi
+if [ -d usr/bin ]; then
+	find usr/bin -type f -printf "/%h/%f\n" >> filelist.lst
+fi
+if [ -d usr/sbin ]; then
+	find usr/sbin -type f -printf "/%h/%f\n" >> filelist.lst
+fi
+touch doclist.lst
+if [ -d usr/share/man ]; then
+	find usr/share/man -type f -printf "/%h/%f.gz\n" >> doclist.lst
+fi
+popd
+mv %{buildroot}/filelist.lst .
+mv %{buildroot}/doclist.lst .
+
+%files -n python3-textdistance -f filelist.lst
+%dir %{python3_sitelib}/*
+
+%files help -f doclist.lst
+%{_docdir}/*
+
+%changelog
+* Mon Apr 10 2023 Python_Bot <Python_Bot@openeuler.org> - 4.5.0-1
+- Package Spec generated
diff --git a/sources b/sources
new file mode 100644
index 0000000..aa6f5a8
--- /dev/null
+++ b/sources
@@ -0,0 +1 @@
+e389e6ce47721071688f3ae989139f06  textdistance-4.5.0.tar.gz