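// File: disjunctionsumscorer.cs
// (The "Font size:" label that followed the file name was code-viewer page residue, not part of the source.)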
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
using System;
using ScorerDocQueue = Lucene.Net.Util.ScorerDocQueue;
namespace Lucene.Net.Search
{
/// <summary>A Scorer for OR-like queries, counterpart of <c>ConjunctionScorer</c>.
/// This Scorer implements <see cref="Scorer.SkipTo(int)"/> and uses SkipTo() on the given subscorers.
/// </summary>
/// <remarks>
/// Original TODO: "Implement score(HitCollector, int)". A range-limited
/// <c>Score(HitCollector, int)</c> overload is present in this class, so that note may be stale.
/// </remarks>
class DisjunctionSumScorer : Scorer
{
    /// <summary>The number of subscorers, captured from <c>subScorers.Count</c> at construction. </summary>
    private readonly int nrScorers;

    /// <summary>The subscorers. </summary>
    protected internal System.Collections.IList subScorers;

    /// <summary>The minimum number of scorers that should match. </summary>
    private readonly int minimumNrMatchers;

    /// <summary>The scorerDocQueue contains all subscorers ordered by their current Doc(),
    /// with the minimum at the top.
    /// <br/>The scorerDocQueue is initialized the first time Next() or SkipTo() is called.
    /// <br/>An exhausted scorer is immediately removed from the scorerDocQueue.
    /// <br/>If fewer than <c>minimumNrMatchers</c> scorers
    /// remain in the scorerDocQueue, Next() and SkipTo() return false.
    /// <para>
    /// After each call to Next() or SkipTo() that returns true,
    /// <c>currentScore</c> is the total score of the current matching doc,
    /// <c>nrMatchers</c> is the number of matching scorers,
    /// and all scorers are after the matching doc, or are exhausted.
    /// </para>
    /// </summary>
    private ScorerDocQueue scorerDocQueue = null;

    /// <summary>Locally tracked number of scorers in <c>scorerDocQueue</c>;
    /// used to avoid Size() method calls on the queue. -1 until the queue is initialized.
    /// </summary>
    private int queueSize = -1;

    /// <summary>The document number of the current match. </summary>
    private int currentDoc = -1;

    /// <summary>The number of subscorers that provide the current match. </summary>
    protected internal int nrMatchers = -1;

    /// <summary>The summed score of the subscorers that provide the current match;
    /// NaN until the first match has been found.
    /// </summary>
    private float currentScore = System.Single.NaN;

    /// <summary>Construct a <c>DisjunctionSumScorer</c>.</summary>
    /// <param name="subScorers">A collection of at least two subscorers.
    /// </param>
    /// <param name="minimumNrMatchers">The positive minimum number of subscorers that should
    /// match to match this query.
    /// <br/>When <c>minimumNrMatchers</c> is bigger than
    /// the number of <c>subScorers</c>,
    /// no matches will be produced.
    /// <br/>When <c>minimumNrMatchers</c> equals the number of subScorers,
    /// it is more efficient to use <c>ConjunctionScorer</c>.
    /// </param>
    /// <exception cref="System.ArgumentNullException">When <paramref name="subScorers"/> is null.</exception>
    /// <exception cref="System.ArgumentException">When <paramref name="minimumNrMatchers"/> is not positive,
    /// or fewer than two subscorers are given.</exception>
    public DisjunctionSumScorer(System.Collections.IList subScorers, int minimumNrMatchers) : base(null)
    {
        // Fail with a descriptive argument exception instead of a NullReferenceException
        // on the Count access below.
        if (subScorers == null)
        {
            throw new System.ArgumentNullException("subScorers");
        }

        nrScorers = subScorers.Count;

        if (minimumNrMatchers <= 0)
        {
            throw new System.ArgumentException("Minimum nr of matchers must be positive");
        }
        if (nrScorers <= 1)
        {
            throw new System.ArgumentException("There must be at least 2 subScorers");
        }

        this.minimumNrMatchers = minimumNrMatchers;
        this.subScorers = subScorers;
    }

    /// <summary>Construct a <c>DisjunctionSumScorer</c>, using one as the minimum number
    /// of matching subscorers.
    /// </summary>
    /// <param name="subScorers">A collection of at least two subscorers.</param>
    public DisjunctionSumScorer(System.Collections.IList subScorers) : this(subScorers, 1)
    {
    }

    /// <summary>Called the first time Next() or SkipTo() is called to
    /// initialize <c>scorerDocQueue</c>.
    /// Each subscorer is advanced once with Next(); only those that report a document
    /// are inserted into the queue, and <c>queueSize</c> counts the successful inserts.
    /// </summary>
    private void InitScorerDocQueue()
    {
        scorerDocQueue = new ScorerDocQueue(nrScorers);
        queueSize = 0;
        foreach (Scorer se in subScorers)
        {
            if (se.Next())
            {
                // Doc() method will be used in scorerDocQueue.
                if (scorerDocQueue.Insert(se))
                {
                    queueSize++;
                }
            }
        }
    }

    /// <summary>Scores and collects all matching documents.</summary>
    /// <param name="hc">The collector to which all matching documents are passed through
    /// <see cref="HitCollector.Collect(int, float)"/>.
    /// <br/>When this method is used the <see cref="Explain(int)"/> method should not be used.
    /// </param>
    public override void Score(HitCollector hc)
    {
        while (Next())
        {
            hc.Collect(currentDoc, currentScore);
        }
    }

    /// <summary>Expert: Collects matching documents in a range. Hook for optimization.
    /// Note that <see cref="Next()"/> must be called once before this method is called
    /// for the first time.
    /// </summary>
    /// <param name="hc">The collector to which all matching documents are passed through
    /// <see cref="HitCollector.Collect(int, float)"/>.
    /// </param>
    /// <param name="max">Do not score documents past this; documents with a number
    /// greater than or equal to <c>max</c> are not collected.
    /// </param>
    /// <returns> true if more matching documents may remain.
    /// </returns>
    protected internal override bool Score(HitCollector hc, int max)
    {
        while (currentDoc < max)
        {
            // The current match is collected first, which is why Next() must
            // already have been called before the first invocation.
            hc.Collect(currentDoc, currentScore);
            if (!Next())
            {
                return false;
            }
        }
        return true;
    }

    /// <summary>Advances to the next matching document, initializing the queue on first use.</summary>
    /// <returns> true iff there is a next match; the match is then described by
    /// <see cref="Doc()"/>, <see cref="Score()"/> and <see cref="NrMatchers()"/>.
    /// </returns>
    public override bool Next()
    {
        if (scorerDocQueue == null)
        {
            InitScorerDocQueue();
        }
        // No match is possible once fewer scorers remain than are required.
        return (scorerDocQueue.Size() >= minimumNrMatchers) && AdvanceAfterCurrent();
    }

    /// <summary>Advance all subscorers after the current document determined by the
    /// top of the <c>scorerDocQueue</c>.
    /// Repeat until at least the minimum number of subscorers match on the same
    /// document and all subscorers are after that document or are exhausted.
    /// <br/>On entry the <c>scorerDocQueue</c> has at least <c>minimumNrMatchers</c>
    /// available. At least the scorer with the minimum document number will be advanced.
    /// </summary>
    /// <returns> true iff there is a match.
    /// <br/>In case there is a match, <c>currentDoc</c>, <c>currentScore</c>,
    /// and <c>nrMatchers</c> describe the match.
    /// </returns>
    /// <remarks>
    /// TODO: Investigate whether it is possible to use SkipTo() when
    /// the minimum number of matchers is bigger than one, i.e. try and use the
    /// character of ConjunctionScorer for the minimum number of matchers.
    /// Also delay calling Score() on the sub scorers until the minimum number of
    /// matchers is reached.
    /// <br/>For this, a Scorer array with minimumNrMatchers elements might
    /// hold Scorers at currentDoc that are temporarily popped from the scorer queue.
    /// </remarks>
    protected internal virtual bool AdvanceAfterCurrent()
    {
        do
        {
            // Repeat until the minimum nr of matchers is reached.
            // Start a candidate match at the smallest document currently in the queue.
            currentDoc = scorerDocQueue.TopDoc();
            currentScore = scorerDocQueue.TopScore();
            nrMatchers = 1;
            do
            {
                // Until all subscorers are after currentDoc.
                // A false result is treated as "top scorer was removed from the queue",
                // so the locally tracked size is decremented.
                if (!scorerDocQueue.TopNextAndAdjustElsePop())
                {
                    if (--queueSize == 0)
                    {
                        break; // nothing more to advance, check for last match.
                    }
                }
                if (scorerDocQueue.TopDoc() != currentDoc)
                {
                    break; // All remaining subscorers are after currentDoc.
                }
                // Another subscorer is on currentDoc: accumulate its score.
                currentScore += scorerDocQueue.TopScore();
                nrMatchers++;
            }
            while (true);

            if (nrMatchers >= minimumNrMatchers)
            {
                return true;
            }
            else if (queueSize < minimumNrMatchers)
            {
                // Too few scorers remain for any later document to match.
                return false;
            }
        }
        while (true);
    }

    /// <summary>Returns the score of the current document matching the query.
    /// Initially invalid (NaN), until <see cref="Next()"/> is called the first time.
    /// </summary>
    public override float Score()
    {
        return currentScore;
    }

    /// <summary>Returns the document number of the current match.
    /// Initially -1, until a match has been found.
    /// </summary>
    public override int Doc()
    {
        return currentDoc;
    }

    /// <summary>Returns the number of subscorers matching the current document.
    /// Initially invalid (-1), until <see cref="Next()"/> is called the first time.
    /// </summary>
    public virtual int NrMatchers()
    {
        return nrMatchers;
    }

    /// <summary>Skips to the first match beyond the current whose document number is
    /// greater than or equal to a given target.
    /// <br/>When this method is used the <see cref="Explain(int)"/> method should not be used.
    /// <br/>The implementation uses the SkipTo() method on the subscorers.
    /// <br/>Note: when <paramref name="target"/> is not beyond the current document and enough
    /// scorers remain, the scorer is not advanced and true is returned.
    /// </summary>
    /// <param name="target">The target document number.
    /// </param>
    /// <returns> true iff there is such a match.
    /// </returns>
    public override bool SkipTo(int target)
    {
        if (scorerDocQueue == null)
        {
            InitScorerDocQueue();
        }
        if (queueSize < minimumNrMatchers)
        {
            return false;
        }
        if (target <= currentDoc)
        {
            return true;
        }
        do
        {
            if (scorerDocQueue.TopDoc() >= target)
            {
                // Every queued scorer is at or beyond the target: look for a match from here.
                return AdvanceAfterCurrent();
            }
            else if (!scorerDocQueue.TopSkipToAndAdjustElsePop(target))
            {
                // A false result is treated as "top scorer was removed from the queue".
                if (--queueSize < minimumNrMatchers)
                {
                    return false;
                }
            }
        }
        while (true);
    }

    /// <summary>Builds an explanation by asking every subscorer to explain the document
    /// and summing the values of those whose explanation value is positive.
    /// </summary>
    /// <param name="doc">The document number to explain.</param>
    /// <returns> An explanation for the score of a given document.
    /// </returns>
    public override Explanation Explain(int doc)
    {
        Explanation res = new Explanation();
        float sumScore = 0.0f;
        int nrMatches = 0;
        foreach (Scorer subScorer in subScorers)
        {
            Explanation es = subScorer.Explain(doc);
            if (es.GetValue() > 0.0f)
            {
                // indicates match
                sumScore += es.GetValue();
                nrMatches++;
            }
            res.AddDetail(es);
        }

        // Decide on the matches counted for THIS document (the local nrMatches),
        // not on the nrMatchers field, which reflects the scorer's iteration state.
        if (nrMatches >= minimumNrMatchers)
        {
            res.SetValue(sumScore);
            res.SetDescription("sum over at least " + minimumNrMatchers + " of " + subScorers.Count + ":");
        }
        else
        {
            res.SetValue(0.0f);
            res.SetDescription(nrMatches + " match(es) but at least " + minimumNrMatchers + " of " + subScorers.Count + " needed");
        }
        return res;
    }
}
}
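// Code-viewer page residue (not part of the source), translated:
// Keyboard shortcuts: copy code = Ctrl + C; search code = Ctrl + F; full screen = F11;
// toggle theme = Ctrl + Shift + D; show shortcuts = ?; increase font size = Ctrl + =;
// decrease font size = Ctrl + -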