@@ -74,7 +74,7 @@ function overlap_join(db_collection::AbstractSimStringDB, features, τ, candidat
74
74
results = String[]
75
75
76
76
for (candidate, match_count) in candidate_match_counts
77
- for i in (query_feature_length - τ + 1 ) : query_feature_length# TODO : Verify
77
+ for i in (query_feature_length - τ + 1 ) : query_feature_length
78
78
if candidate in lookup_feature_set_by_size_feature (db_collection, candidate_size, features[i])
79
79
match_count += 1
80
80
end
@@ -103,16 +103,16 @@ function search!(measure::AbstractSimilarityMeasure, db_collection::DictDB, quer
103
103
features = extract_features (db_collection. feature_extractor, query)
104
104
105
105
# Metadata from the generated features (length, min & max sizes)
106
- length_of_features = length (features)
107
- min_feature_size = minimum_feature_size (measure, length_of_features, α)
108
- max_feature_size = maximum_feature_size (measure, db_collection, length_of_features, α)
106
+ # length_of_features = length(features)
107
+ # min_feature_size = minimum_feature_size(measure, length_of_features, α)
108
+ # max_feature_size = maximum_feature_size(measure, db_collection, length_of_features, α)
109
109
110
110
results = String[]
111
111
112
112
# Generate and return results from the potential candidate size pool
113
- @inbounds for candidate_size in min_feature_size : max_feature_size
113
+ @inbounds for candidate_size in minimum_feature_size (measure, length (features), α) : maximum_feature_size (measure, db_collection, length (features), α)
114
114
# Minimum overlap
115
- τ = minimum_overlap (measure, length_of_features , candidate_size, α)
115
+ τ = minimum_overlap (measure, length (features) , candidate_size, α)
116
116
117
117
# Generate approximate candidates from the overlap join
118
118
append! (results, overlap_join (db_collection, features, τ, candidate_size))
0 commit comments