@@ -74,7 +74,7 @@ function overlap_join(db_collection::AbstractSimStringDB, features, τ, candidat
7474 results = String[]
7575
7676 for (candidate, match_count) in candidate_match_counts
77- for i in (query_feature_length - τ + 1 ) : query_feature_length # TODO : Verify
77+ for i in (query_feature_length - τ + 1 ) : query_feature_length
7878 if candidate in lookup_feature_set_by_size_feature (db_collection, candidate_size, features[i])
7979 match_count += 1
8080 end
@@ -103,16 +103,16 @@ function search!(measure::AbstractSimilarityMeasure, db_collection::DictDB, quer
103103 features = extract_features (db_collection. feature_extractor, query)
104104
105105 # Metadata from the generated features (length, min & max sizes)
106- length_of_features = length (features)
107- min_feature_size = minimum_feature_size (measure, length_of_features, α)
108- max_feature_size = maximum_feature_size (measure, db_collection, length_of_features, α)
106+ # length_of_features = length(features)
107+ # min_feature_size = minimum_feature_size(measure, length_of_features, α)
108+ # max_feature_size = maximum_feature_size(measure, db_collection, length_of_features, α)
109109
110110 results = String[]
111111
112112 # Generate and return results from the potential candidate size pool
113- @inbounds for candidate_size in min_feature_size : max_feature_size
113+ @inbounds for candidate_size in minimum_feature_size (measure, length (features), α) : maximum_feature_size (measure, db_collection, length (features), α)
114114 # Minimum overlap
115- τ = minimum_overlap (measure, length_of_features , candidate_size, α)
115+ τ = minimum_overlap (measure, length (features) , candidate_size, α)
116116
117117 # Generate approximate candidates from the overlap join
118118 append! (results, overlap_join (db_collection, features, τ, candidate_size))
0 commit comments