summaryrefslogtreecommitdiffstats
path: root/container-search/src/main/java/com/yahoo/search/ranking/ResultReranker.java
diff options
context:
space:
mode:
Diffstat (limited to 'container-search/src/main/java/com/yahoo/search/ranking/ResultReranker.java')
-rw-r--r--container-search/src/main/java/com/yahoo/search/ranking/ResultReranker.java98
1 files changed, 46 insertions, 52 deletions
diff --git a/container-search/src/main/java/com/yahoo/search/ranking/ResultReranker.java b/container-search/src/main/java/com/yahoo/search/ranking/ResultReranker.java
index d92068cd8d9..2d54e58daa2 100644
--- a/container-search/src/main/java/com/yahoo/search/ranking/ResultReranker.java
+++ b/container-search/src/main/java/com/yahoo/search/ranking/ResultReranker.java
@@ -14,80 +14,74 @@ class ResultReranker {
private static final Logger logger = Logger.getLogger(ResultReranker.class.getName());
- // scale and adjust the score according to the range
- // of the original and final score values to avoid that
- // a score from the backend is larger than finalScores_low
- static class Ranges {
- private double initialScores_high = -Double.MAX_VALUE;
- private double initialScores_low = Double.MAX_VALUE;
- private double finalScores_high = -Double.MAX_VALUE;
- private double finalScores_low = Double.MAX_VALUE;
+ private final HitRescorer hitRescorer;
+ private final int rerankCount;
+ private final List<WrappedHit> hitsToRescore = new ArrayList<>();
+ private final RangeAdjuster ranges = new RangeAdjuster();
- boolean rescaleNeeded() {
- return (initialScores_low > finalScores_low
- &&
- initialScores_high >= initialScores_low
- &&
- finalScores_high >= finalScores_low);
- }
- void withInitialScore(double score) {
- if (score < initialScores_low) initialScores_low = score;
- if (score > initialScores_high) initialScores_high = score;
- }
- void withFinalScore(double score) {
- if (score < finalScores_low) finalScores_low = score;
- if (score > finalScores_high) finalScores_high = score;
- }
- private double initialRange() {
- double r = initialScores_high - initialScores_low;
- if (r < 1.0) r = 1.0;
- return r;
- }
- private double finalRange() {
- double r = finalScores_high - finalScores_low;
- if (r < 1.0) r = 1.0;
- return r;
- }
- double scale() { return finalRange() / initialRange(); }
- double bias() { return finalScores_low - initialScores_low * scale(); }
+ ResultReranker(HitRescorer hitRescorer, int rerankCount) {
+ this.hitRescorer = hitRescorer;
+ this.rerankCount = rerankCount;
}
- static void rerankHits(Result result, HitRescorer hitRescorer, int rerankCount) {
- List<Hit> hitsToRescore = new ArrayList<>();
- // consider doing recursive iteration explicitly instead of using deepIterator?
+ void rerankHits(Result result) {
+ gatherHits(result);
+ runPreProcessing();
+ hitRescorer.runNormalizers();
+ runProcessing();
+ runPostProcessing();
+ result.hits().sort();
+ }
+
+ private void gatherHits(Result result) {
for (var iterator = result.hits().deepIterator(); iterator.hasNext();) {
Hit hit = iterator.next();
if (hit.isMeta() || hit instanceof HitGroup) {
continue;
}
// what about hits inside grouping results?
- // they are inside GroupingListHit, we won't recurse into it; so we won't see them.
- hitsToRescore.add(hit);
+ // they did not show up here during manual testing.
+ var wrapped = WrappedHit.from(hit);
+ if (wrapped != null) hitsToRescore.add(wrapped);
}
+ }
+
+ private void runPreProcessing() {
// we can't be 100% certain that hits were sorted according to relevance:
hitsToRescore.sort(Comparator.naturalOrder());
- var ranges = new Ranges();
- for (var iterator = hitsToRescore.iterator(); rerankCount > 0 && iterator.hasNext(); ) {
- Hit hit = iterator.next();
- double oldScore = hit.getRelevance().getScore();
- boolean didRerank = hitRescorer.rescoreHit(hit);
+ int count = 0;
+ for (WrappedHit hit : hitsToRescore) {
+ if (count == rerankCount) break;
+ hitRescorer.preprocess(hit);
+ ++count;
+ }
+ }
+
+ private void runProcessing() {
+ int count = 0;
+ for (var iterator = hitsToRescore.iterator(); count < rerankCount && iterator.hasNext(); ) {
+ WrappedHit wrapped = iterator.next();
+ double oldScore = wrapped.getScore();
+ boolean didRerank = hitRescorer.rescoreHit(wrapped);
if (didRerank) {
ranges.withInitialScore(oldScore);
- ranges.withFinalScore(hit.getRelevance().getScore());
- --rerankCount;
+ ranges.withFinalScore(wrapped.getScore());
+ ++count;
iterator.remove();
}
}
+ }
+
+ private void runPostProcessing() {
// if any hits are left in the list, they may need rescaling:
- if (ranges.rescaleNeeded()) {
+ if (ranges.rescaleNeeded() && ! hitsToRescore.isEmpty()) {
double scale = ranges.scale();
double bias = ranges.bias();
- for (Hit hit : hitsToRescore) {
- double oldScore = hit.getRelevance().getScore();
- hit.setRelevance(oldScore * scale + bias);
+ for (WrappedHit wrapped : hitsToRescore) {
+ double oldScore = wrapped.getScore();
+ wrapped.setScore(oldScore * scale + bias);
}
}
- result.hits().sort();
}
}