233 lines
8.1 KiB
C#
233 lines
8.1 KiB
C#
/*
|
|
* Licensed to the Apache Software Foundation (ASF) under one or more
|
|
* contributor license agreements. See the NOTICE file distributed with
|
|
* this work for additional information regarding copyright ownership.
|
|
* The ASF licenses this file to You under the Apache License, Version 2.0
|
|
* (the "License"); you may not use this file except in compliance with
|
|
* the License. You may obtain a copy of the License at
|
|
*
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
*
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
* See the License for the specific language governing permissions and
|
|
* limitations under the License.
|
|
*/
|
|
|
|
using System;
|
|
using System.Collections.Generic;
|
|
using NUnit.Framework;
|
|
|
|
using SimpleAnalyzer = Lucene.Net.Analysis.SimpleAnalyzer;
|
|
using StandardAnalyzer = Lucene.Net.Analysis.Standard.StandardAnalyzer;
|
|
using Document = Lucene.Net.Documents.Document;
|
|
using Field = Lucene.Net.Documents.Field;
|
|
using IndexReader = Lucene.Net.Index.IndexReader;
|
|
using IndexWriter = Lucene.Net.Index.IndexWriter;
|
|
using Term = Lucene.Net.Index.Term;
|
|
using TermEnum = Lucene.Net.Index.TermEnum;
|
|
using RAMDirectory = Lucene.Net.Store.RAMDirectory;
|
|
using LuceneTestCase = Lucene.Net.Util.LuceneTestCase;
|
|
|
|
namespace Lucene.Net.Search
|
|
{
|
|
|
|
/// <summary>This class tests the MultiPhraseQuery class.</summary>
|
|
[TestFixture]
|
|
public class TestMultiPhraseQuery:LuceneTestCase
|
|
{
|
|
|
|
[Test]
|
|
public virtual void TestPhrasePrefix()
|
|
{
|
|
RAMDirectory indexStore = new RAMDirectory();
|
|
IndexWriter writer = new IndexWriter(indexStore, new SimpleAnalyzer(), true, IndexWriter.MaxFieldLength.LIMITED);
|
|
Add("blueberry pie", writer);
|
|
Add("blueberry strudel", writer);
|
|
Add("blueberry pizza", writer);
|
|
Add("blueberry chewing gum", writer);
|
|
Add("bluebird pizza", writer);
|
|
Add("bluebird foobar pizza", writer);
|
|
Add("piccadilly circus", writer);
|
|
writer.Optimize();
|
|
writer.Close();
|
|
|
|
IndexSearcher searcher = new IndexSearcher(indexStore, true);
|
|
|
|
// search for "blueberry pi*":
|
|
MultiPhraseQuery query1 = new MultiPhraseQuery();
|
|
// search for "strawberry pi*":
|
|
MultiPhraseQuery query2 = new MultiPhraseQuery();
|
|
query1.Add(new Term("body", "blueberry"));
|
|
query2.Add(new Term("body", "strawberry"));
|
|
|
|
System.Collections.ArrayList termsWithPrefix = new System.Collections.ArrayList();
|
|
IndexReader ir = IndexReader.Open(indexStore, true);
|
|
|
|
// this TermEnum gives "piccadilly", "pie" and "pizza".
|
|
System.String prefix = "pi";
|
|
TermEnum te = ir.Terms(new Term("body", prefix));
|
|
do
|
|
{
|
|
if (te.Term.Text.StartsWith(prefix))
|
|
{
|
|
termsWithPrefix.Add(te.Term);
|
|
}
|
|
}
|
|
while (te.Next());
|
|
|
|
query1.Add((Term[]) termsWithPrefix.ToArray(typeof(Term)));
|
|
Assert.AreEqual("body:\"blueberry (piccadilly pie pizza)\"", query1.ToString());
|
|
query2.Add((Term[]) termsWithPrefix.ToArray(typeof(Term)));
|
|
Assert.AreEqual("body:\"strawberry (piccadilly pie pizza)\"", query2.ToString());
|
|
|
|
ScoreDoc[] result;
|
|
result = searcher.Search(query1, null, 1000).ScoreDocs;
|
|
Assert.AreEqual(2, result.Length);
|
|
result = searcher.Search(query2, null, 1000).ScoreDocs;
|
|
Assert.AreEqual(0, result.Length);
|
|
|
|
// search for "blue* pizza":
|
|
MultiPhraseQuery query3 = new MultiPhraseQuery();
|
|
termsWithPrefix.Clear();
|
|
prefix = "blue";
|
|
te = ir.Terms(new Term("body", prefix));
|
|
do
|
|
{
|
|
if (te.Term.Text.StartsWith(prefix))
|
|
{
|
|
termsWithPrefix.Add(te.Term);
|
|
}
|
|
}
|
|
while (te.Next());
|
|
query3.Add((Term[]) termsWithPrefix.ToArray(typeof(Term)));
|
|
query3.Add(new Term("body", "pizza"));
|
|
|
|
result = searcher.Search(query3, null, 1000).ScoreDocs;
|
|
Assert.AreEqual(2, result.Length); // blueberry pizza, bluebird pizza
|
|
Assert.AreEqual("body:\"(blueberry bluebird) pizza\"", query3.ToString());
|
|
|
|
// test slop:
|
|
query3.Slop = 1;
|
|
result = searcher.Search(query3, null, 1000).ScoreDocs;
|
|
Assert.AreEqual(3, result.Length); // blueberry pizza, bluebird pizza, bluebird foobar pizza
|
|
|
|
MultiPhraseQuery query4 = new MultiPhraseQuery();
|
|
|
|
// okay, all terms must belong to the same field
|
|
Assert.Throws<ArgumentException>(() =>
|
|
{
|
|
query4.Add(new Term("field1", "foo"));
|
|
query4.Add(new Term("field2", "foobar"));
|
|
});
|
|
|
|
searcher.Close();
|
|
indexStore.Close();
|
|
}
|
|
|
|
private void Add(System.String s, IndexWriter writer)
|
|
{
|
|
Document doc = new Document();
|
|
doc.Add(new Field("body", s, Field.Store.YES, Field.Index.ANALYZED));
|
|
writer.AddDocument(doc);
|
|
}
|
|
|
|
[Test]
|
|
public virtual void TestBooleanQueryContainingSingleTermPrefixQuery()
|
|
{
|
|
// this tests against bug 33161 (now fixed)
|
|
// In order to cause the bug, the outer query must have more than one term
|
|
// and all terms required.
|
|
// The contained PhraseMultiQuery must contain exactly one term array.
|
|
|
|
RAMDirectory indexStore = new RAMDirectory();
|
|
IndexWriter writer = new IndexWriter(indexStore, new SimpleAnalyzer(), true, IndexWriter.MaxFieldLength.LIMITED);
|
|
Add("blueberry pie", writer);
|
|
Add("blueberry chewing gum", writer);
|
|
Add("blue raspberry pie", writer);
|
|
writer.Optimize();
|
|
writer.Close();
|
|
|
|
IndexSearcher searcher = new IndexSearcher(indexStore, true);
|
|
// This query will be equivalent to +body:pie +body:"blue*"
|
|
BooleanQuery q = new BooleanQuery();
|
|
q.Add(new TermQuery(new Term("body", "pie")), Occur.MUST);
|
|
|
|
MultiPhraseQuery trouble = new MultiPhraseQuery();
|
|
trouble.Add(new Term[]{new Term("body", "blueberry"), new Term("body", "blue")});
|
|
q.Add(trouble, Occur.MUST);
|
|
|
|
// exception will be thrown here without fix
|
|
ScoreDoc[] hits = searcher.Search(q, null, 1000).ScoreDocs;
|
|
|
|
Assert.AreEqual(2, hits.Length, "Wrong number of hits");
|
|
searcher.Close();
|
|
}
|
|
|
|
[Test]
|
|
public virtual void TestPhrasePrefixWithBooleanQuery()
|
|
{
|
|
RAMDirectory indexStore = new RAMDirectory();
|
|
IndexWriter writer = new IndexWriter(indexStore, new StandardAnalyzer(Util.Version.LUCENE_CURRENT, Support.Compatibility.SetFactory.CreateHashSet<string>()), true, IndexWriter.MaxFieldLength.LIMITED);
|
|
Add("This is a test", "object", writer);
|
|
Add("a note", "note", writer);
|
|
writer.Close();
|
|
|
|
IndexSearcher searcher = new IndexSearcher(indexStore, true);
|
|
|
|
// This query will be equivalent to +type:note +body:"a t*"
|
|
BooleanQuery q = new BooleanQuery();
|
|
q.Add(new TermQuery(new Term("type", "note")), Occur.MUST);
|
|
|
|
MultiPhraseQuery trouble = new MultiPhraseQuery();
|
|
trouble.Add(new Term("body", "a"));
|
|
trouble.Add(new Term[]{new Term("body", "test"), new Term("body", "this")});
|
|
q.Add(trouble, Occur.MUST);
|
|
|
|
// exception will be thrown here without fix for #35626:
|
|
ScoreDoc[] hits = searcher.Search(q, null, 1000).ScoreDocs;
|
|
Assert.AreEqual(0, hits.Length, "Wrong number of hits");
|
|
searcher.Close();
|
|
}
|
|
|
|
[Test]
|
|
public virtual void TestHashCodeAndEquals()
|
|
{
|
|
MultiPhraseQuery query1 = new MultiPhraseQuery();
|
|
MultiPhraseQuery query2 = new MultiPhraseQuery();
|
|
|
|
Assert.AreEqual(query1.GetHashCode(), query2.GetHashCode());
|
|
Assert.AreEqual(query1, query2);
|
|
|
|
Term term1 = new Term("someField", "someText");
|
|
|
|
query1.Add(term1);
|
|
query2.Add(term1);
|
|
|
|
Assert.AreEqual(query1.GetHashCode(), query2.GetHashCode());
|
|
Assert.AreEqual(query1, query2);
|
|
|
|
Term term2 = new Term("someField", "someMoreText");
|
|
|
|
query1.Add(term2);
|
|
|
|
Assert.IsFalse(query1.GetHashCode() == query2.GetHashCode());
|
|
Assert.IsFalse(query1.Equals(query2));
|
|
|
|
query2.Add(term2);
|
|
|
|
Assert.AreEqual(query1.GetHashCode(), query2.GetHashCode());
|
|
Assert.AreEqual(query1, query2);
|
|
}
|
|
|
|
|
|
private void Add(System.String s, System.String type, IndexWriter writer)
|
|
{
|
|
Document doc = new Document();
|
|
doc.Add(new Field("body", s, Field.Store.YES, Field.Index.ANALYZED));
|
|
doc.Add(new Field("type", type, Field.Store.YES, Field.Index.NOT_ANALYZED));
|
|
writer.AddDocument(doc);
|
|
}
|
|
}
|
|
} |