d3ec733c425e7d9d066380b95e04605843339bd0,dirty_cat/similarity_encoder.py,,get_prototype_sorted_by_frequencies,#,47
Before Change
Returns a numpy array of the values without their frequencies
uniques, counts = np.unique(prototypes, return_counts=True)
frequencies = list(zip(uniques, counts))
frequencies, _ = sorted(frequencies, key=lambda elt: elt[1], reverse=True)
return np.array([f for f in frequencies])
_VECTORIZED_EDIT_DISTANCES = {
"levenshtein-ratio": np.vectorize(string_distances.levenshtein_ratio),
After Change
Returns a numpy array of the values without their frequencies
uniques, counts = np.unique(prototypes, return_counts=True)
sorted_indexes = np.argsort(counts)[::-1]
return uniques[sorted_indexes], counts[sorted_indexes]
_VECTORIZED_EDIT_DISTANCES = {
"levenshtein-ratio": np.vectorize(string_distances.levenshtein_ratio),
In pattern: SUPERPATTERN
Frequency: 3
Non-data size: 7
Instances Project Name: dirty-cat/dirty_cat
Commit Name: d3ec733c425e7d9d066380b95e04605843339bd0
Time: 2018-11-08
Author: maxime.cuny@inria.fr
File Name: dirty_cat/similarity_encoder.py
Class Name:
Method Name: get_prototype_sorted_by_frequencies
Project Name: robertmartin8/PyPortfolioOpt
Commit Name: 5e56bcc41a7d147c710e57c4c764651c7e148581
Time: 2020-04-30
Author: thomas.schmlezer@gmail.com
File Name: pypfopt/hierarchical_portfolio.py
Class Name: HRPOpt
Method Name: _get_quasi_diag
Project Name: robertmartin8/PyPortfolioOpt
Commit Name: 70b08e1d2e703b4e3d16da9aaa04706dd4413232
Time: 2020-05-01
Author: thomas.schmlezer@gmail.com
File Name: pypfopt/hierarchical_portfolio.py
Class Name: HRPOpt
Method Name: _get_quasi_diag