public WeightedSpanTerm this[K key] { get { return(wrapped[key]); } set { WeightedSpanTerm prev = null; wrapped.TryGetValue(key, out prev); wrapped[key] = value; if (prev == null) { return; } WeightedSpanTerm prevTerm = prev; WeightedSpanTerm newTerm = value; if (!prevTerm.IsPositionSensitive) { newTerm.IsPositionSensitive = false; } } }
/// <summary> /// Fills a <see cref="T:IDictionary{string, WeightedSpanTerm}"/> with <see cref="WeightedSpanTerm"/>s using the terms from /// the supplied <see cref="Search.Spans.SpanQuery"/>. /// </summary> /// <param name="terms"><see cref="T:IDictionary{string, WeightedSpanTerm}"/> to place created <see cref="WeightedSpanTerm"/>s in</param> /// <param name="query"><see cref="Query"/> to extract Terms from</param> /// <exception cref="System.IO.IOException">If there is a low-level I/O error</exception> protected virtual void ExtractWeightedTerms(IDictionary <string, WeightedSpanTerm> terms, Query query) { var nonWeightedTerms = new JCG.HashSet <Term>(); query.ExtractTerms(nonWeightedTerms); foreach (Term queryTerm in nonWeightedTerms) { if (FieldNameComparer(queryTerm.Field)) { WeightedSpanTerm weightedSpanTerm = new WeightedSpanTerm(query.Boost, queryTerm.Text()); terms[queryTerm.Text()] = weightedSpanTerm; } } }
/// <summary> /// Constructs a new <see cref="QueryScorer"/> instance /// </summary> /// <param name="weightedTerms">an array of pre-created <see cref="WeightedSpanTerm"/>s</param> public QueryScorer(WeightedSpanTerm[] weightedTerms) { this.fieldWeightedSpanTerms = new HashMap <string, WeightedSpanTerm>(weightedTerms.Length); foreach (WeightedSpanTerm t in weightedTerms) { WeightedSpanTerm existingTerm = fieldWeightedSpanTerms[t.Term]; if ((existingTerm == null) || (existingTerm.Weight < t.Weight)) { // if a term is defined more than once, always use the highest // scoring Weight fieldWeightedSpanTerms[t.Term] = t; maxTermWeight = Math.Max(maxTermWeight, t.Weight); } } skipInitExtractor = true; }
/// <seealso cref="IFragmenter.IsNewFragment()"/> public virtual bool IsNewFragment() { position += posIncAtt.PositionIncrement; if (waitForPos == position) { waitForPos = -1; } else if (waitForPos != -1) { return(false); } WeightedSpanTerm wSpanTerm = queryScorer.GetWeightedSpanTerm(termAtt.ToString()); if (wSpanTerm != null) { IList <PositionSpan> positionSpans = wSpanTerm.PositionSpans; for (int i = 0; i < positionSpans.Count; i++) { if (positionSpans[i].Start == position) { waitForPos = positionSpans[i].End + 1; break; } } } bool isNewFrag = offsetAtt.EndOffset >= (fragmentSize * currentNumFrags) && (textSize - offsetAtt.EndOffset) >= fragmentSize.TripleShift(1); if (isNewFrag) { currentNumFrags++; } return(isNewFrag); }
public bool TryGetValue(K key, out WeightedSpanTerm value) { return(wrapped.TryGetValue(key, out value)); }
public void Add(K key, WeightedSpanTerm value) { this[key] = value; }
/// <summary> /// Fills a <see cref="T:IDictionary{string, WeightedSpanTerm}"/> with <see cref="WeightedSpanTerm"/>s using the terms from the supplied <see cref="SpanQuery"/>. /// </summary> /// <param name="terms"><see cref="T:IDictionary{string, WeightedSpanTerm}"/> to place created <see cref="WeightedSpanTerm"/>s in</param> /// <param name="spanQuery"><see cref="SpanQuery"/> to extract Terms from</param> /// <exception cref="System.IO.IOException">If there is a low-level I/O error</exception> protected virtual void ExtractWeightedSpanTerms(IDictionary <string, WeightedSpanTerm> terms, SpanQuery spanQuery) { ISet <string> fieldNames; if (fieldName == null) { fieldNames = new JCG.HashSet <string>(); CollectSpanQueryFields(spanQuery, fieldNames); } else { fieldNames = new JCG.HashSet <string> { fieldName }; } // To support the use of the default field name if (defaultField != null) { fieldNames.Add(defaultField); } IDictionary <string, SpanQuery> queries = new JCG.Dictionary <string, SpanQuery>(); var nonWeightedTerms = new JCG.HashSet <Term>(); bool mustRewriteQuery = MustRewriteQuery(spanQuery); if (mustRewriteQuery) { foreach (string field in fieldNames) { SpanQuery rewrittenQuery = (SpanQuery)spanQuery.Rewrite(GetLeafContext().Reader); queries[field] = rewrittenQuery; rewrittenQuery.ExtractTerms(nonWeightedTerms); } } else { spanQuery.ExtractTerms(nonWeightedTerms); } List <PositionSpan> spanPositions = new List <PositionSpan>(); foreach (string field in fieldNames) { SpanQuery q; q = mustRewriteQuery ? queries[field] : spanQuery; AtomicReaderContext context = GetLeafContext(); var termContexts = new JCG.Dictionary <Term, TermContext>(); ISet <Term> extractedTerms = new JCG.SortedSet <Term>(); q.ExtractTerms(extractedTerms); foreach (Term term in extractedTerms) { termContexts[term] = TermContext.Build(context, term); } IBits acceptDocs = context.AtomicReader.LiveDocs; Spans.Spans spans = q.GetSpans(context, acceptDocs, termContexts); // collect span positions while (spans.Next()) { spanPositions.Add(new PositionSpan(spans.Start, spans.End - 1)); } } if (spanPositions.Count == 0) { // no spans found return; } foreach (Term queryTerm in nonWeightedTerms) { if (FieldNameComparer(queryTerm.Field)) { WeightedSpanTerm weightedSpanTerm; if (!terms.TryGetValue(queryTerm.Text(), out weightedSpanTerm) || weightedSpanTerm == null) { weightedSpanTerm = new WeightedSpanTerm(spanQuery.Boost, queryTerm.Text()); weightedSpanTerm.AddPositionSpans(spanPositions); weightedSpanTerm.IsPositionSensitive = true; terms[queryTerm.Text()] = weightedSpanTerm; } else { if (spanPositions.Count > 0) { weightedSpanTerm.AddPositionSpans(spanPositions); } } } } }