LUCENE-2548: don't intern field names

git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1138058 13f79535-47bb-0310-9956-ffa450edef68
This commit is contained in:
Michael McCandless 2011-06-21 15:42:54 +00:00
parent 9d469e5111
commit c039e210b0
68 changed files with 212 additions and 542 deletions

View File

@ -149,6 +149,9 @@ Changes in backwards compatibility policy
files holding stored fields and term vectors) while flushing a files holding stored fields and term vectors) while flushing a
segment. (Mike McCandless) segment. (Mike McCandless)
* LUCENE-2548: Field names (eg in Term, FieldInfo) are no longer
interned. (Mike McCandless)
Changes in Runtime Behavior Changes in Runtime Behavior
* LUCENE-2846: omitNorms now behaves like omitTermFrequencyAndPositions, if you * LUCENE-2846: omitNorms now behaves like omitTermFrequencyAndPositions, if you

View File

@ -31,7 +31,6 @@ import org.apache.lucene.index.IndexReader;
import org.apache.lucene.index.memory.MemoryIndex; import org.apache.lucene.index.memory.MemoryIndex;
import org.apache.lucene.search.Query; import org.apache.lucene.search.Query;
import org.apache.lucene.search.spans.SpanQuery; import org.apache.lucene.search.spans.SpanQuery;
import org.apache.lucene.util.StringHelper;
/** /**
* {@link Scorer} implementation which scores text fragments by the number of * {@link Scorer} implementation which scores text fragments by the number of
@ -88,7 +87,7 @@ public class QueryScorer implements Scorer {
* @param defaultField * @param defaultField
*/ */
public QueryScorer(Query query, IndexReader reader, String field, String defaultField) { public QueryScorer(Query query, IndexReader reader, String field, String defaultField) {
this.defaultField = StringHelper.intern(defaultField); this.defaultField = defaultField;
init(query, field, reader, true); init(query, field, reader, true);
} }
@ -96,7 +95,7 @@ public class QueryScorer implements Scorer {
* @param defaultField - The default field for queries with the field name unspecified * @param defaultField - The default field for queries with the field name unspecified
*/ */
public QueryScorer(Query query, String field, String defaultField) { public QueryScorer(Query query, String field, String defaultField) {
this.defaultField = StringHelper.intern(defaultField); this.defaultField = defaultField;
init(query, field, null, true); init(query, field, null, true);
} }

View File

@ -26,7 +26,6 @@ import org.apache.lucene.search.BooleanClause;
import org.apache.lucene.search.BooleanQuery; import org.apache.lucene.search.BooleanQuery;
import org.apache.lucene.search.FilteredQuery; import org.apache.lucene.search.FilteredQuery;
import org.apache.lucene.search.Query; import org.apache.lucene.search.Query;
import org.apache.lucene.util.StringHelper;
/** /**
* Utility class used to extract the terms used in a query, plus any weights. * Utility class used to extract the terms used in a query, plus any weights.
@ -94,10 +93,6 @@ public final class QueryTermExtractor
public static final WeightedTerm[] getTerms(Query query, boolean prohibited, String fieldName) public static final WeightedTerm[] getTerms(Query query, boolean prohibited, String fieldName)
{ {
HashSet<WeightedTerm> terms=new HashSet<WeightedTerm>(); HashSet<WeightedTerm> terms=new HashSet<WeightedTerm>();
if(fieldName!=null)
{
fieldName= StringHelper.intern(fieldName);
}
getTerms(query,terms,prohibited,fieldName); getTerms(query,terms,prohibited,fieldName);
return terms.toArray(new WeightedTerm[0]); return terms.toArray(new WeightedTerm[0]);
} }
@ -114,7 +109,6 @@ public final class QueryTermExtractor
return getTerms(query,prohibited,null); return getTerms(query,prohibited,null);
} }
//fieldname MUST be interned prior to this call
private static final void getTerms(Query query, HashSet<WeightedTerm> terms,boolean prohibited, String fieldName) private static final void getTerms(Query query, HashSet<WeightedTerm> terms,boolean prohibited, String fieldName)
{ {
try try
@ -131,7 +125,7 @@ public final class QueryTermExtractor
for (Iterator<Term> iter = nonWeightedTerms.iterator(); iter.hasNext();) for (Iterator<Term> iter = nonWeightedTerms.iterator(); iter.hasNext();)
{ {
Term term = iter.next(); Term term = iter.next();
if((fieldName==null)||(term.field()==fieldName)) if((fieldName==null)||(term.field().equals(fieldName)))
{ {
terms.add(new WeightedTerm(query.getBoost(),term.text())); terms.add(new WeightedTerm(query.getBoost(),term.text()));
} }

View File

@ -41,7 +41,6 @@ import org.apache.lucene.search.spans.SpanOrQuery;
import org.apache.lucene.search.spans.SpanQuery; import org.apache.lucene.search.spans.SpanQuery;
import org.apache.lucene.search.spans.SpanTermQuery; import org.apache.lucene.search.spans.SpanTermQuery;
import org.apache.lucene.search.spans.Spans; import org.apache.lucene.search.spans.Spans;
import org.apache.lucene.util.StringHelper;
/** /**
* Class used to extract {@link WeightedSpanTerm}s from a {@link Query} based on whether * Class used to extract {@link WeightedSpanTerm}s from a {@link Query} based on whether
@ -63,7 +62,7 @@ public class WeightedSpanTermExtractor {
public WeightedSpanTermExtractor(String defaultField) { public WeightedSpanTermExtractor(String defaultField) {
if (defaultField != null) { if (defaultField != null) {
this.defaultField = StringHelper.intern(defaultField); this.defaultField = defaultField;
} }
} }
@ -314,8 +313,8 @@ public class WeightedSpanTermExtractor {
* Necessary to implement matches for queries against <code>defaultField</code> * Necessary to implement matches for queries against <code>defaultField</code>
*/ */
private boolean fieldNameComparator(String fieldNameToCheck) { private boolean fieldNameComparator(String fieldNameToCheck) {
boolean rv = fieldName == null || fieldNameToCheck == fieldName boolean rv = fieldName == null || fieldName.equals(fieldNameToCheck)
|| fieldNameToCheck == defaultField; || (defaultField != null && defaultField.equals(fieldNameToCheck));
return rv; return rv;
} }
@ -372,7 +371,7 @@ public class WeightedSpanTermExtractor {
public Map<String,WeightedSpanTerm> getWeightedSpanTerms(Query query, TokenStream tokenStream, public Map<String,WeightedSpanTerm> getWeightedSpanTerms(Query query, TokenStream tokenStream,
String fieldName) throws IOException { String fieldName) throws IOException {
if (fieldName != null) { if (fieldName != null) {
this.fieldName = StringHelper.intern(fieldName); this.fieldName = fieldName;
} else { } else {
this.fieldName = null; this.fieldName = null;
} }
@ -408,7 +407,7 @@ public class WeightedSpanTermExtractor {
public Map<String,WeightedSpanTerm> getWeightedSpanTermsWithScores(Query query, TokenStream tokenStream, String fieldName, public Map<String,WeightedSpanTerm> getWeightedSpanTermsWithScores(Query query, TokenStream tokenStream, String fieldName,
IndexReader reader) throws IOException { IndexReader reader) throws IOException {
if (fieldName != null) { if (fieldName != null) {
this.fieldName = StringHelper.intern(fieldName); this.fieldName = fieldName;
} else { } else {
this.fieldName = null; this.fieldName = null;
} }

View File

@ -400,7 +400,7 @@ public class InstantiatedIndexReader extends IndexReader {
if (i < 0) { if (i < 0) {
i = -i - 1; i = -i - 1;
} }
if (i >= orderedTerms.length || orderedTerms[i].field() != field) { if (i >= orderedTerms.length || !orderedTerms[i].field().equals(field)) {
// field does not exist // field does not exist
return null; return null;
} }

View File

@ -44,7 +44,6 @@ import org.apache.lucene.index.Term;
import org.apache.lucene.index.TermVectorOffsetInfo; import org.apache.lucene.index.TermVectorOffsetInfo;
import org.apache.lucene.search.IndexSearcher; import org.apache.lucene.search.IndexSearcher;
import org.apache.lucene.search.SimilarityProvider; import org.apache.lucene.search.SimilarityProvider;
import org.apache.lucene.util.StringHelper;
import org.apache.lucene.util.ArrayUtil; import org.apache.lucene.util.ArrayUtil;
import org.apache.lucene.util.CollectionUtil; import org.apache.lucene.util.CollectionUtil;
import org.apache.lucene.util.AttributeImpl; import org.apache.lucene.util.AttributeImpl;
@ -475,7 +474,7 @@ public class InstantiatedIndexWriter implements Closeable {
FieldSetting fieldSetting = fieldSettingsByFieldName.get(field.name()); FieldSetting fieldSetting = fieldSettingsByFieldName.get(field.name());
if (fieldSetting == null) { if (fieldSetting == null) {
fieldSetting = new FieldSetting(); fieldSetting = new FieldSetting();
fieldSetting.fieldName = StringHelper.intern(field.name()); fieldSetting.fieldName = field.name();
fieldSettingsByFieldName.put(fieldSetting.fieldName, fieldSetting); fieldSettingsByFieldName.put(fieldSetting.fieldName, fieldSetting);
fieldNameBuffer.add(fieldSetting.fieldName); fieldNameBuffer.add(fieldSetting.fieldName);
} }

View File

@ -69,11 +69,9 @@ public class InstantiatedTermsEnum extends TermsEnum {
return SeekStatus.END; return SeekStatus.END;
} }
if (terms[upto].field() == field) { if (terms[upto].field().equals(field)) {
return SeekStatus.FOUND; return SeekStatus.FOUND;
} else { } else {
// make sure field was interned
assert !terms[upto].field().equals(field);
return SeekStatus.END; return SeekStatus.END;
} }
} }
@ -84,12 +82,10 @@ public class InstantiatedTermsEnum extends TermsEnum {
if (upto >= terms.length) { if (upto >= terms.length) {
return null; return null;
} }
if (terms[upto].field() == field) { if (terms[upto].field().equals(field)) {
br.copy(terms[upto].getTerm().text()); br.copy(terms[upto].getTerm().text());
return br; return br;
} else { } else {
// make sure field was interned
assert !terms[upto].field().equals(field);
return null; return null;
} }
} }

View File

@ -27,7 +27,6 @@ import org.apache.lucene.search.Similarity;
import org.apache.lucene.search.SimilarityProvider; import org.apache.lucene.search.SimilarityProvider;
import org.apache.lucene.store.Directory; import org.apache.lucene.store.Directory;
import org.apache.lucene.store.FSDirectory; import org.apache.lucene.store.FSDirectory;
import org.apache.lucene.util.StringHelper;
import org.apache.lucene.util.Bits; import org.apache.lucene.util.Bits;
import org.apache.lucene.util.ReaderUtil; import org.apache.lucene.util.ReaderUtil;
@ -111,7 +110,6 @@ public class FieldNormModifier {
* @param field the field whose norms should be reset * @param field the field whose norms should be reset
*/ */
public void reSetNorms(String field) throws IOException { public void reSetNorms(String field) throws IOException {
String fieldName = StringHelper.intern(field);
Similarity fieldSim = sim.get(field); Similarity fieldSim = sim.get(field);
IndexReader reader = null; IndexReader reader = null;
try { try {
@ -149,7 +147,7 @@ public class FieldNormModifier {
for (int d = 0; d < termCounts.length; d++) { for (int d = 0; d < termCounts.length; d++) {
if (delDocs == null || !delDocs.get(d)) { if (delDocs == null || !delDocs.get(d)) {
invertState.setLength(termCounts[d]); invertState.setLength(termCounts[d]);
subReader.setNorm(d, fieldName, fieldSim.encodeNormValue(fieldSim.computeNorm(invertState))); subReader.setNorm(d, field, fieldSim.encodeNormValue(fieldSim.computeNorm(invertState)));
} }
} }
} }

View File

@ -15,7 +15,6 @@ package org.apache.lucene.index;
* *
*/ */
import org.apache.lucene.util.StringHelper;
import org.apache.lucene.util.Bits; import org.apache.lucene.util.Bits;
import org.apache.lucene.util.BytesRef; import org.apache.lucene.util.BytesRef;
@ -54,9 +53,6 @@ public class TermVectorAccessor {
* @throws IOException * @throws IOException
*/ */
public void accept(IndexReader indexReader, int documentNumber, String fieldName, TermVectorMapper mapper) throws IOException { public void accept(IndexReader indexReader, int documentNumber, String fieldName, TermVectorMapper mapper) throws IOException {
fieldName = StringHelper.intern(fieldName);
decoratedMapper.decorated = mapper; decoratedMapper.decorated = mapper;
decoratedMapper.termVectorStored = false; decoratedMapper.termVectorStored = false;

View File

@ -190,7 +190,6 @@ public class FuzzyLikeThisQuery extends Query
CharTermAttribute termAtt = ts.addAttribute(CharTermAttribute.class); CharTermAttribute termAtt = ts.addAttribute(CharTermAttribute.class);
int corpusNumDocs=reader.numDocs(); int corpusNumDocs=reader.numDocs();
Term internSavingTemplateTerm =new Term(f.fieldName); //optimization to avoid constructing new Term() objects
HashSet<String> processedTerms=new HashSet<String>(); HashSet<String> processedTerms=new HashSet<String>();
ts.reset(); ts.reset();
while (ts.incrementToken()) while (ts.incrementToken())
@ -201,7 +200,7 @@ public class FuzzyLikeThisQuery extends Query
processedTerms.add(term); processedTerms.add(term);
ScoreTermQueue variantsQ=new ScoreTermQueue(MAX_VARIANTS_PER_TERM); //maxNum variants considered for any one term ScoreTermQueue variantsQ=new ScoreTermQueue(MAX_VARIANTS_PER_TERM); //maxNum variants considered for any one term
float minScore=0; float minScore=0;
Term startTerm=internSavingTemplateTerm.createTerm(term); Term startTerm=new Term(f.fieldName, term);
AttributeSource atts = new AttributeSource(); AttributeSource atts = new AttributeSource();
MaxNonCompetitiveBoostAttribute maxBoostAtt = MaxNonCompetitiveBoostAttribute maxBoostAtt =
atts.addAttribute(MaxNonCompetitiveBoostAttribute.class); atts.addAttribute(MaxNonCompetitiveBoostAttribute.class);

View File

@ -71,7 +71,7 @@ public class TermsFilter extends Filter
DocsEnum docs = null; DocsEnum docs = null;
for (Iterator<Term> iter = terms.iterator(); iter.hasNext();) { for (Iterator<Term> iter = terms.iterator(); iter.hasNext();) {
Term term = iter.next(); Term term = iter.next();
if (term.field() != lastField) { if (!term.field().equals(lastField)) {
termsC = fields.terms(term.field()); termsC = fields.terms(term.field());
termsEnum = termsC.iterator(); termsEnum = termsC.iterator();
lastField = term.field(); lastField = term.field();

View File

@ -67,14 +67,7 @@ public class TermsFilterBuilder implements FilterBuilder
ts.reset(); ts.reset();
while (ts.incrementToken()) { while (ts.incrementToken()) {
termAtt.fillBytesRef(); termAtt.fillBytesRef();
if (term == null)
{
term = new Term(fieldName, new BytesRef(bytes)); term = new Term(fieldName, new BytesRef(bytes));
} else
{
// create from previous to save fieldName.intern overhead
term = term.createTerm(new BytesRef(bytes));
}
tf.addTerm(term); tf.addTerm(term);
} }
ts.end(); ts.end();

View File

@ -64,14 +64,7 @@ public class TermsQueryBuilder implements QueryBuilder {
ts.reset(); ts.reset();
while (ts.incrementToken()) { while (ts.incrementToken()) {
termAtt.fillBytesRef(); termAtt.fillBytesRef();
if (term == null)
{
term = new Term(fieldName, new BytesRef(bytes)); term = new Term(fieldName, new BytesRef(bytes));
} else
{
// create from previous to save fieldName.intern overhead
term = term.createTerm(new BytesRef(bytes));
}
bq.add(new BooleanClause(new TermQuery(term),BooleanClause.Occur.SHOULD)); bq.add(new BooleanClause(new TermQuery(term),BooleanClause.Occur.SHOULD));
} }
ts.end(); ts.end();

View File

@ -21,7 +21,6 @@ import org.apache.lucene.analysis.TokenStream;
import org.apache.lucene.index.FieldInvertState; // for javadocs import org.apache.lucene.index.FieldInvertState; // for javadocs
import org.apache.lucene.index.values.PerDocFieldValues; import org.apache.lucene.index.values.PerDocFieldValues;
import org.apache.lucene.index.values.ValueType; import org.apache.lucene.index.values.ValueType;
import org.apache.lucene.util.StringHelper; // for javadocs
/** /**
@ -59,7 +58,7 @@ public abstract class AbstractField implements Fieldable {
protected AbstractField(String name, Field.Store store, Field.Index index, Field.TermVector termVector) { protected AbstractField(String name, Field.Store store, Field.Index index, Field.TermVector termVector) {
if (name == null) if (name == null)
throw new NullPointerException("name cannot be null"); throw new NullPointerException("name cannot be null");
this.name = StringHelper.intern(name); // field names are interned this.name = name;
this.isStored = store.isStored(); this.isStored = store.isStored();
this.isIndexed = index.isIndexed(); this.isIndexed = index.isIndexed();
@ -109,7 +108,7 @@ public abstract class AbstractField implements Fieldable {
return boost; return boost;
} }
/** Returns the name of the field as an interned string. /** Returns the name of the field.
* For example "date", "title", "body", ... * For example "date", "title", "body", ...
*/ */
public String name() { return name; } public String name() { return name; }

View File

@ -21,7 +21,6 @@ import java.io.Reader;
import org.apache.lucene.analysis.TokenStream; import org.apache.lucene.analysis.TokenStream;
import org.apache.lucene.index.IndexWriter; import org.apache.lucene.index.IndexWriter;
import org.apache.lucene.util.StringHelper;
/** /**
A field is a section of a Document. Each field has two parts, a name and a A field is a section of a Document. Each field has two parts, a name and a
@ -367,28 +366,6 @@ public final class Field extends AbstractField implements Fieldable {
* </ul> * </ul>
*/ */
public Field(String name, String value, Store store, Index index, TermVector termVector) { public Field(String name, String value, Store store, Index index, TermVector termVector) {
this(name, true, value, store, index, termVector);
}
/**
* Create a field by specifying its name, value and how it will
* be saved in the index.
*
* @param name The name of the field
* @param internName Whether to .intern() name or not
* @param value The string to process
* @param store Whether <code>value</code> should be stored in the index
* @param index Whether the field should be indexed, and if so, if it should
* be tokenized before indexing
* @param termVector Whether term vector should be stored
* @throws NullPointerException if name or value is <code>null</code>
* @throws IllegalArgumentException in any of the following situations:
* <ul>
* <li>the field is neither stored nor indexed</li>
* <li>the field is not indexed but termVector is <code>TermVector.YES</code></li>
* </ul>
*/
public Field(String name, boolean internName, String value, Store store, Index index, TermVector termVector) {
if (name == null) if (name == null)
throw new NullPointerException("name cannot be null"); throw new NullPointerException("name cannot be null");
if (value == null) if (value == null)
@ -402,9 +379,6 @@ public final class Field extends AbstractField implements Fieldable {
throw new IllegalArgumentException("cannot store term vector information " throw new IllegalArgumentException("cannot store term vector information "
+ "for a field that is not indexed"); + "for a field that is not indexed");
if (internName) // field names are optionally interned
name = StringHelper.intern(name);
this.name = name; this.name = name;
this.fieldsData = value; this.fieldsData = value;
@ -454,7 +428,7 @@ public final class Field extends AbstractField implements Fieldable {
if (reader == null) if (reader == null)
throw new NullPointerException("reader cannot be null"); throw new NullPointerException("reader cannot be null");
this.name = StringHelper.intern(name); // field names are interned this.name = name;
this.fieldsData = reader; this.fieldsData = reader;
this.isStored = false; this.isStored = false;
@ -500,7 +474,7 @@ public final class Field extends AbstractField implements Fieldable {
if (tokenStream == null) if (tokenStream == null)
throw new NullPointerException("tokenStream cannot be null"); throw new NullPointerException("tokenStream cannot be null");
this.name = StringHelper.intern(name); // field names are interned this.name = name;
this.fieldsData = null; this.fieldsData = null;
this.tokenStream = tokenStream; this.tokenStream = tokenStream;
@ -540,7 +514,7 @@ public final class Field extends AbstractField implements Fieldable {
if (value == null) if (value == null)
throw new IllegalArgumentException("value cannot be null"); throw new IllegalArgumentException("value cannot be null");
this.name = StringHelper.intern(name); // field names are interned this.name = name;
fieldsData = value; fieldsData = value;
isStored = true; isStored = true;

View File

@ -71,7 +71,7 @@ public interface Fieldable {
*/ */
float getBoost(); float getBoost();
/** Returns the name of the field as an interned string. /** Returns the name of the field.
* For example "date", "title", "body", ... * For example "date", "title", "body", ...
*/ */
String name(); String name();

View File

@ -47,11 +47,12 @@ class BufferedDeletes {
key, Integer val, int hash, Entry next key, Integer val, int hash, Entry next
(OBJ_HEADER + 3*POINTER + INT). Term is object w/ (OBJ_HEADER + 3*POINTER + INT). Term is object w/
String field and String text (OBJ_HEADER + 2*POINTER). String field and String text (OBJ_HEADER + 2*POINTER).
We don't count Term's field since it's interned. Term's field is String (OBJ_HEADER + 4*INT + POINTER +
OBJ_HEADER + string.length*CHAR).
Term's text is String (OBJ_HEADER + 4*INT + POINTER + Term's text is String (OBJ_HEADER + 4*INT + POINTER +
OBJ_HEADER + string.length*CHAR). Integer is OBJ_HEADER + string.length*CHAR). Integer is
OBJ_HEADER + INT. */ OBJ_HEADER + INT. */
final static int BYTES_PER_DEL_TERM = 8*RamUsageEstimator.NUM_BYTES_OBJECT_REF + 5*RamUsageEstimator.NUM_BYTES_OBJECT_HEADER + 6*RamUsageEstimator.NUM_BYTES_INT; final static int BYTES_PER_DEL_TERM = 9*RamUsageEstimator.NUM_BYTES_OBJECT_REF + 7*RamUsageEstimator.NUM_BYTES_OBJECT_HEADER + 10*RamUsageEstimator.NUM_BYTES_INT;
/* Rough logic: del docIDs are List<Integer>. Say list /* Rough logic: del docIDs are List<Integer>. Say list
allocates ~2X size (2*POINTER). Integer is OBJ_HEADER allocates ~2X size (2*POINTER). Integer is OBJ_HEADER
@ -189,7 +190,7 @@ class BufferedDeletes {
terms.put(term, Integer.valueOf(docIDUpto)); terms.put(term, Integer.valueOf(docIDUpto));
numTermDeletes.incrementAndGet(); numTermDeletes.incrementAndGet();
if (current == null) { if (current == null) {
bytesUsed.addAndGet(BYTES_PER_DEL_TERM + term.bytes.length); bytesUsed.addAndGet(BYTES_PER_DEL_TERM + term.bytes.length + (RamUsageEstimator.NUM_BYTES_CHAR * term.field().length()));
} }
} }

View File

@ -380,7 +380,7 @@ class BufferedDeletesStream {
// Since we visit terms sorted, we gain performance // Since we visit terms sorted, we gain performance
// by re-using the same TermsEnum and seeking only // by re-using the same TermsEnum and seeking only
// forwards // forwards
if (term.field() != currentField) { if (!term.field().equals(currentField)) {
assert currentField == null || currentField.compareTo(term.field()) < 0; assert currentField == null || currentField.compareTo(term.field()) < 0;
currentField = term.field(); currentField = term.field();
Terms terms = fields.terms(currentField); Terms terms = fields.terms(currentField);

View File

@ -36,7 +36,6 @@ import org.apache.lucene.store.Directory;
import org.apache.lucene.store.IndexInput; import org.apache.lucene.store.IndexInput;
import org.apache.lucene.store.IndexOutput; import org.apache.lucene.store.IndexOutput;
import org.apache.lucene.util.CodecUtil; import org.apache.lucene.util.CodecUtil;
import org.apache.lucene.util.StringHelper;
/** Access to the Fieldable Info file that describes document fields and whether or /** Access to the Fieldable Info file that describes document fields and whether or
* not they are indexed. Each segment has a separate Fieldable Info file. Objects * not they are indexed. Each segment has a separate Fieldable Info file. Objects
@ -475,7 +474,6 @@ public final class FieldInfos implements Iterable<FieldInfo> {
boolean storeTermVector, boolean storePositionWithTermVector, boolean storeTermVector, boolean storePositionWithTermVector,
boolean storeOffsetWithTermVector, boolean omitNorms, boolean storePayloads, boolean omitTermFreqAndPositions, ValueType docValuesType) { boolean storeOffsetWithTermVector, boolean omitNorms, boolean storePayloads, boolean omitTermFreqAndPositions, ValueType docValuesType) {
// don't check modifiable here since we use that to initially build up FIs // don't check modifiable here since we use that to initially build up FIs
name = StringHelper.intern(name);
if (globalFieldNumbers != null) { if (globalFieldNumbers != null) {
globalFieldNumbers.setIfNotSet(fieldNumber, name); globalFieldNumbers.setIfNotSet(fieldNumber, name);
} }
@ -659,7 +657,7 @@ public final class FieldInfos implements Iterable<FieldInfo> {
final int size = input.readVInt(); //read in the size final int size = input.readVInt(); //read in the size
for (int i = 0; i < size; i++) { for (int i = 0; i < size; i++) {
String name = StringHelper.intern(input.readString()); String name = input.readString();
// if this is a previous format codec 0 will be preflex! // if this is a previous format codec 0 will be preflex!
final int fieldNumber = format <= FORMAT_PER_FIELD_CODEC? input.readInt():i; final int fieldNumber = format <= FORMAT_PER_FIELD_CODEC? input.readInt():i;
final int codecId = format <= FORMAT_PER_FIELD_CODEC? input.readInt():0; final int codecId = format <= FORMAT_PER_FIELD_CODEC? input.readInt():0;

View File

@ -43,10 +43,8 @@ public abstract class FieldsEnum {
return atts; return atts;
} }
/** Increments the enumeration to the next field. The /** Increments the enumeration to the next field. Returns
* returned field is always interned, so simple == * null when there are no more fields.*/
* comparison is allowed. Returns null when there are no
* more fields.*/
public abstract String next() throws IOException; public abstract String next() throws IOException;
/** Get {@link TermsEnum} for the current field. You /** Get {@link TermsEnum} for the current field. You

View File

@ -364,7 +364,6 @@ public final class FieldsReader implements Cloneable {
Field.Index index = Field.Index.toIndex(fi.isIndexed, tokenize); Field.Index index = Field.Index.toIndex(fi.isIndexed, tokenize);
Field.TermVector termVector = Field.TermVector.toTermVector(fi.storeTermVector, fi.storeOffsetWithTermVector, fi.storePositionWithTermVector); Field.TermVector termVector = Field.TermVector.toTermVector(fi.storeTermVector, fi.storeOffsetWithTermVector, fi.storePositionWithTermVector);
f = new Field(fi.name, // name f = new Field(fi.name, // name
false,
fieldsStream.readString(), // read value fieldsStream.readString(), // read value
Field.Store.YES, Field.Store.YES,
index, index,

View File

@ -234,8 +234,6 @@ final class FreqProxTermsWriterPerField extends TermsHashConsumerPerField implem
final TermsConsumer termsConsumer = consumer.addField(fieldInfo); final TermsConsumer termsConsumer = consumer.addField(fieldInfo);
final Comparator<BytesRef> termComp = termsConsumer.getComparator(); final Comparator<BytesRef> termComp = termsConsumer.getComparator();
final Term protoTerm = new Term(fieldName);
final boolean currentFieldOmitTermFreqAndPositions = fieldInfo.omitTermFreqAndPositions; final boolean currentFieldOmitTermFreqAndPositions = fieldInfo.omitTermFreqAndPositions;
final Map<Term,Integer> segDeletes; final Map<Term,Integer> segDeletes;
@ -274,7 +272,7 @@ final class FreqProxTermsWriterPerField extends TermsHashConsumerPerField implem
final int delDocLimit; final int delDocLimit;
if (segDeletes != null) { if (segDeletes != null) {
final Integer docIDUpto = segDeletes.get(protoTerm.createTerm(text)); final Integer docIDUpto = segDeletes.get(new Term(fieldName, text));
if (docIDUpto != null) { if (docIDUpto != null) {
delDocLimit = docIDUpto; delDocLimit = docIDUpto;
} else { } else {

View File

@ -33,10 +33,11 @@ class FrozenBufferedDeletes {
/* Rough logic: Term is object w/ /* Rough logic: Term is object w/
String field and String text (OBJ_HEADER + 2*POINTER). String field and String text (OBJ_HEADER + 2*POINTER).
We don't count Term's field since it's interned.
Term's text is String (OBJ_HEADER + 4*INT + POINTER + Term's text is String (OBJ_HEADER + 4*INT + POINTER +
OBJ_HEADER + string.length*CHAR). */ OBJ_HEADER + text.length*CHAR).
final static int BYTES_PER_DEL_TERM = 3*RamUsageEstimator.NUM_BYTES_OBJECT_REF + 3*RamUsageEstimator.NUM_BYTES_OBJECT_HEADER + 4*RamUsageEstimator.NUM_BYTES_INT; Term's field is String (OBJ_HEADER + 4*INT + POINTER +
OBJ_HEADER + field.length*CHAR). */
final static int BYTES_PER_DEL_TERM = 4*RamUsageEstimator.NUM_BYTES_OBJECT_REF + 4*RamUsageEstimator.NUM_BYTES_OBJECT_HEADER + 8*RamUsageEstimator.NUM_BYTES_INT;
/* Query we often undercount (say 24 bytes), plus int. */ /* Query we often undercount (say 24 bytes), plus int. */
final static int BYTES_PER_DEL_QUERY = RamUsageEstimator.NUM_BYTES_OBJECT_REF + RamUsageEstimator.NUM_BYTES_INT + 24; final static int BYTES_PER_DEL_QUERY = RamUsageEstimator.NUM_BYTES_OBJECT_REF + RamUsageEstimator.NUM_BYTES_INT + 24;

View File

@ -94,7 +94,7 @@ public final class MultiFieldsEnum extends FieldsEnum {
if (queue.size() > 0) { if (queue.size() > 0) {
while(true) { while(true) {
top[numTop++] = queue.pop(); top[numTop++] = queue.pop();
if (queue.size() == 0 || (queue.top()).current != top[0].current) { if (queue.size() == 0 || !(queue.top()).current.equals(top[0].current)) {
break; break;
} }
} }

View File

@ -17,15 +17,12 @@ package org.apache.lucene.index;
* limitations under the License. * limitations under the License.
*/ */
import java.util.Comparator;
import org.apache.lucene.util.BytesRef; import org.apache.lucene.util.BytesRef;
import org.apache.lucene.util.StringHelper;
/** /**
A Term represents a word from text. This is the unit of search. It is A Term represents a word from text. This is the unit of search. It is
composed of two elements, the text of the word, as a string, and the name of composed of two elements, the text of the word, as a string, and the name of
the field that the text occurred in, an interned string. the field that the text occurred in.
Note that terms may represent more than words from text fields, but also Note that terms may represent more than words from text fields, but also
things like dates, email addresses, urls, etc. */ things like dates, email addresses, urls, etc. */
@ -37,13 +34,14 @@ public final class Term implements Comparable<Term> {
/** Constructs a Term with the given field and bytes. /** Constructs a Term with the given field and bytes.
* <p>Note that a null field or null bytes value results in undefined * <p>Note that a null field or null bytes value results in undefined
* behavior for most Lucene APIs that accept a Term parameter. * behavior for most Lucene APIs that accept a Term parameter.
*
* <p>WARNING: the provided BytesRef is not copied, but used directly. * <p>WARNING: the provided BytesRef is not copied, but used directly.
* Therefore the bytes should not be modified after construction, for * Therefore the bytes should not be modified after construction, for
* example, you should clone a copy rather than pass reused bytes from * example, you should clone a copy rather than pass reused bytes from
* a TermsEnum. * a TermsEnum.
*/ */
public Term(String fld, BytesRef bytes) { public Term(String fld, BytesRef bytes) {
field = fld == null ? null : StringHelper.intern(fld); field = fld;
this.bytes = bytes; this.bytes = bytes;
} }
@ -61,28 +59,10 @@ public final class Term implements Comparable<Term> {
* @param fld * @param fld
*/ */
public Term(String fld) { public Term(String fld) {
this(fld, new BytesRef(), true); this(fld, new BytesRef());
} }
/** /** Returns the field of this term. The field indicates
* WARNING: the provided BytesRef is not copied, but used directly.
* Therefore the bytes should not be modified after construction, for
* example, you should clone a copy rather than pass reused bytes from
* a TermsEnum.
*
* @lucene.experimental
*/
public Term(String fld, BytesRef bytes, boolean intern) {
field = intern ? StringHelper.intern(fld) : fld; // field names are interned
this.bytes = bytes; // unless already known to be
}
/** @lucene.experimental */
public Term(String fld, String text, boolean intern) {
this(fld, new BytesRef(text), intern);
}
/** Returns the field of this term, an interned string. The field indicates
the part of a document which this term came from. */ the part of a document which this term came from. */
public final String field() { return field; } public final String field() { return field; }
@ -94,32 +74,6 @@ public final class Term implements Comparable<Term> {
/** Returns the bytes of this term. */ /** Returns the bytes of this term. */
public final BytesRef bytes() { return bytes; } public final BytesRef bytes() { return bytes; }
/**
* Optimized construction of new Terms by reusing same field as this Term
* - avoids field.intern() overhead
* <p>WARNING: the provided BytesRef is not copied, but used directly.
* Therefore the bytes should not be modified after construction, for
* example, you should clone a copy rather than pass reused bytes from
* a TermsEnum.
* @param bytes The bytes of the new term (field is implicitly same as this Term instance)
* @return A new Term
*/
public Term createTerm(BytesRef bytes)
{
return new Term(field,bytes,false);
}
/**
* Optimized construction of new Terms by reusing same field as this Term
* - avoids field.intern() overhead
* @param text The text of the new term (field is implicitly same as this Term instance)
* @return A new Term
*/
public Term createTerm(String text)
{
return new Term(field,text,false);
}
@Override @Override
public boolean equals(Object obj) { public boolean equals(Object obj) {
if (this == obj) if (this == obj)
@ -157,26 +111,11 @@ public final class Term implements Comparable<Term> {
The ordering of terms is first by field, then by text.*/ The ordering of terms is first by field, then by text.*/
public final int compareTo(Term other) { public final int compareTo(Term other) {
if (field == other.field) // fields are interned if (field.equals(other.field)) {
return bytes.compareTo(other.bytes); return bytes.compareTo(other.bytes);
else } else {
return field.compareTo(other.field); return field.compareTo(other.field);
} }
@Deprecated
private static final Comparator<BytesRef> legacyComparator =
BytesRef.getUTF8SortedAsUTF16Comparator();
/**
* @deprecated (4.0) For internal backwards compatibility use only
* @lucene.internal
*/
@Deprecated
public final int compareToUTF16(Term other) {
if (field == other.field) // fields are interned
return legacyComparator.compare(this.bytes, other.bytes);
else
return field.compareTo(other.field);
} }
/** /**

View File

@ -91,7 +91,7 @@ public class BlockTermsReader extends FieldsProducer {
@Override @Override
public boolean equals(Object _other) { public boolean equals(Object _other) {
FieldAndTerm other = (FieldAndTerm) _other; FieldAndTerm other = (FieldAndTerm) _other;
return other.field == field && term.bytesEquals(other.term); return other.field.equals(field) && term.bytesEquals(other.term);
} }
@Override @Override

View File

@ -270,11 +270,11 @@ public class PreFlexFields extends FieldsProducer {
private class PreTermsEnum extends TermsEnum { private class PreTermsEnum extends TermsEnum {
private SegmentTermEnum termEnum; private SegmentTermEnum termEnum;
private FieldInfo fieldInfo; private FieldInfo fieldInfo;
private String internedFieldName;
private boolean skipNext; private boolean skipNext;
private BytesRef current; private BytesRef current;
private SegmentTermEnum seekTermEnum; private SegmentTermEnum seekTermEnum;
private Term protoTerm;
private static final byte UTF8_NON_BMP_LEAD = (byte) 0xf0; private static final byte UTF8_NON_BMP_LEAD = (byte) 0xf0;
private static final byte UTF8_HIGH_BMP_LEAD = (byte) 0xee; private static final byte UTF8_HIGH_BMP_LEAD = (byte) 0xee;
@ -334,7 +334,7 @@ public class PreFlexFields extends FieldsProducer {
} }
// Seek "back": // Seek "back":
getTermsDict().seekEnum(te, protoTerm.createTerm(term), true); getTermsDict().seekEnum(te, new Term(fieldInfo.name, term), true);
// Test if the term we seek'd to in fact found a // Test if the term we seek'd to in fact found a
// surrogate pair at the same position as the E: // surrogate pair at the same position as the E:
@ -343,7 +343,7 @@ public class PreFlexFields extends FieldsProducer {
// Cannot be null (or move to next field) because at // Cannot be null (or move to next field) because at
// "worst" it'd seek to the same term we are on now, // "worst" it'd seek to the same term we are on now,
// unless we are being called from seek // unless we are being called from seek
if (t2 == null || t2.field() != fieldInfo.name) { if (t2 == null || t2.field() != internedFieldName) {
return false; return false;
} }
@ -461,13 +461,13 @@ public class PreFlexFields extends FieldsProducer {
// TODO: more efficient seek? can we simply swap // TODO: more efficient seek? can we simply swap
// the enums? // the enums?
getTermsDict().seekEnum(termEnum, protoTerm.createTerm(scratchTerm), true); getTermsDict().seekEnum(termEnum, new Term(fieldInfo.name, scratchTerm), true);
final Term t2 = termEnum.term(); final Term t2 = termEnum.term();
// We could hit EOF or different field since this // We could hit EOF or different field since this
// was a seek "forward": // was a seek "forward":
if (t2 != null && t2.field() == fieldInfo.name) { if (t2 != null && t2.field() == internedFieldName) {
if (DEBUG_SURROGATES) { if (DEBUG_SURROGATES) {
System.out.println(" got term=" + UnicodeUtil.toHexString(t2.text()) + " " + t2.bytes()); System.out.println(" got term=" + UnicodeUtil.toHexString(t2.text()) + " " + t2.bytes());
@ -552,7 +552,7 @@ public class PreFlexFields extends FieldsProducer {
// current term. // current term.
// TODO: can we avoid this copy? // TODO: can we avoid this copy?
if (termEnum.term() == null || termEnum.term().field() != fieldInfo.name) { if (termEnum.term() == null || termEnum.term().field() != internedFieldName) {
scratchTerm.length = 0; scratchTerm.length = 0;
} else { } else {
scratchTerm.copy(termEnum.term().bytes()); scratchTerm.copy(termEnum.term().bytes());
@ -637,7 +637,7 @@ public class PreFlexFields extends FieldsProducer {
// Seek "forward": // Seek "forward":
// TODO: more efficient seek? // TODO: more efficient seek?
getTermsDict().seekEnum(seekTermEnum, protoTerm.createTerm(scratchTerm), true); getTermsDict().seekEnum(seekTermEnum, new Term(fieldInfo.name, scratchTerm), true);
scratchTerm.bytes[upTo] = scratch[0]; scratchTerm.bytes[upTo] = scratch[0];
scratchTerm.bytes[upTo+1] = scratch[1]; scratchTerm.bytes[upTo+1] = scratch[1];
@ -659,7 +659,7 @@ public class PreFlexFields extends FieldsProducer {
// EOF or a different field: // EOF or a different field:
boolean matches; boolean matches;
if (t2 != null && t2.field() == fieldInfo.name) { if (t2 != null && t2.field() == internedFieldName) {
final BytesRef b2 = t2.bytes(); final BytesRef b2 = t2.bytes();
assert b2.offset == 0; assert b2.offset == 0;
if (b2.length >= upTo+3 && isHighBMPChar(b2.bytes, upTo)) { if (b2.length >= upTo+3 && isHighBMPChar(b2.bytes, upTo)) {
@ -713,20 +713,21 @@ public class PreFlexFields extends FieldsProducer {
void reset(FieldInfo fieldInfo) throws IOException { void reset(FieldInfo fieldInfo) throws IOException {
//System.out.println("pff.reset te=" + termEnum); //System.out.println("pff.reset te=" + termEnum);
this.fieldInfo = fieldInfo; this.fieldInfo = fieldInfo;
protoTerm = new Term(fieldInfo.name); internedFieldName = fieldInfo.name.intern();
final Term term = new Term(internedFieldName);
if (termEnum == null) { if (termEnum == null) {
termEnum = getTermsDict().terms(protoTerm); termEnum = getTermsDict().terms(term);
seekTermEnum = getTermsDict().terms(protoTerm); seekTermEnum = getTermsDict().terms(term);
//System.out.println(" term=" + termEnum.term()); //System.out.println(" term=" + termEnum.term());
} else { } else {
getTermsDict().seekEnum(termEnum, protoTerm, true); getTermsDict().seekEnum(termEnum, term, true);
} }
skipNext = true; skipNext = true;
unicodeSortOrder = sortTermsByUnicode(); unicodeSortOrder = sortTermsByUnicode();
final Term t = termEnum.term(); final Term t = termEnum.term();
if (t != null && t.field() == fieldInfo.name) { if (t != null && t.field() == internedFieldName) {
newSuffixStart = 0; newSuffixStart = 0;
prevTerm.length = 0; prevTerm.length = 0;
surrogateDance(); surrogateDance();
@ -761,7 +762,7 @@ public class PreFlexFields extends FieldsProducer {
} }
skipNext = false; skipNext = false;
final TermInfosReader tis = getTermsDict(); final TermInfosReader tis = getTermsDict();
final Term t0 = protoTerm.createTerm(term); final Term t0 = new Term(fieldInfo.name, term);
assert termEnum != null; assert termEnum != null;
@ -769,7 +770,7 @@ public class PreFlexFields extends FieldsProducer {
final Term t = termEnum.term(); final Term t = termEnum.term();
if (t != null && t.field() == fieldInfo.name && term.bytesEquals(t.bytes())) { if (t != null && t.field() == internedFieldName && term.bytesEquals(t.bytes())) {
// If we found an exact match, no need to do the // If we found an exact match, no need to do the
// surrogate dance // surrogate dance
if (DEBUG_SURROGATES) { if (DEBUG_SURROGATES) {
@ -777,7 +778,7 @@ public class PreFlexFields extends FieldsProducer {
} }
current = t.bytes(); current = t.bytes();
return SeekStatus.FOUND; return SeekStatus.FOUND;
} else if (t == null || t.field() != fieldInfo.name) { } else if (t == null || t.field() != internedFieldName) {
// TODO: maybe we can handle this like the next() // TODO: maybe we can handle this like the next()
// into null? set term as prevTerm then dance? // into null? set term as prevTerm then dance?
@ -840,8 +841,9 @@ public class PreFlexFields extends FieldsProducer {
surrogateDance(); surrogateDance();
final Term t2 = termEnum.term(); final Term t2 = termEnum.term();
if (t2 == null || t2.field() != fieldInfo.name) { if (t2 == null || t2.field() != internedFieldName) {
assert t2 == null || !t2.field().equals(fieldInfo.name); // make sure fields are in fact interned // PreFlex codec interns field names; verify:
assert t2 == null || !t2.field().equals(internedFieldName);
current = null; current = null;
return SeekStatus.END; return SeekStatus.END;
} else { } else {
@ -885,7 +887,8 @@ public class PreFlexFields extends FieldsProducer {
skipNext = false; skipNext = false;
if (termEnum.term() == null) { if (termEnum.term() == null) {
return null; return null;
} else if (termEnum.term().field() != fieldInfo.name) { // PreFlex codec interns field names:
} else if (termEnum.term().field() != internedFieldName) {
return null; return null;
} else { } else {
return current = termEnum.term().bytes(); return current = termEnum.term().bytes();
@ -895,15 +898,16 @@ public class PreFlexFields extends FieldsProducer {
// TODO: can we use STE's prevBuffer here? // TODO: can we use STE's prevBuffer here?
prevTerm.copy(termEnum.term().bytes()); prevTerm.copy(termEnum.term().bytes());
if (termEnum.next() && termEnum.term().field() == fieldInfo.name) { if (termEnum.next() && termEnum.term().field() == internedFieldName) {
newSuffixStart = termEnum.newSuffixStart; newSuffixStart = termEnum.newSuffixStart;
if (DEBUG_SURROGATES) { if (DEBUG_SURROGATES) {
System.out.println(" newSuffixStart=" + newSuffixStart); System.out.println(" newSuffixStart=" + newSuffixStart);
} }
surrogateDance(); surrogateDance();
final Term t = termEnum.term(); final Term t = termEnum.term();
if (t == null || t.field() != fieldInfo.name) { if (t == null || t.field() != internedFieldName) {
assert t == null || !t.field().equals(fieldInfo.name); // make sure fields are in fact interned // PreFlex codec interns field names; verify:
assert t == null || !t.field().equals(internedFieldName);
current = null; current = null;
} else { } else {
current = t.bytes(); current = t.bytes();
@ -920,8 +924,9 @@ public class PreFlexFields extends FieldsProducer {
surrogateDance(); surrogateDance();
final Term t = termEnum.term(); final Term t = termEnum.term();
if (t == null || t.field() != fieldInfo.name) { if (t == null || t.field() != internedFieldName) {
assert t == null || !t.field().equals(fieldInfo.name); // make sure fields are in fact interned // PreFlex codec interns field names; verify:
assert t == null || !t.field().equals(internedFieldName);
return null; return null;
} else { } else {
current = t.bytes(); current = t.bytes();

View File

@ -37,12 +37,17 @@ final class TermBuffer implements Cloneable {
private BytesRef bytes = new BytesRef(10); private BytesRef bytes = new BytesRef(10);
// Cannot be -1 since (strangely) we write that
// fieldNumber into index for first indexed term:
private int currentFieldNumber = -2;
private static final Comparator<BytesRef> utf8AsUTF16Comparator = BytesRef.getUTF8SortedAsUTF16Comparator(); private static final Comparator<BytesRef> utf8AsUTF16Comparator = BytesRef.getUTF8SortedAsUTF16Comparator();
int newSuffixStart; // only valid right after .read is called int newSuffixStart; // only valid right after .read is called
public int compareTo(TermBuffer other) { public int compareTo(TermBuffer other) {
if (field == other.field) // fields are interned if (field == other.field) // fields are interned
// (only by PreFlex codec)
return utf8AsUTF16Comparator.compare(bytes, other.bytes); return utf8AsUTF16Comparator.compare(bytes, other.bytes);
else else
return field.compareTo(other.field); return field.compareTo(other.field);
@ -59,7 +64,13 @@ final class TermBuffer implements Cloneable {
} }
bytes.length = totalLength; bytes.length = totalLength;
input.readBytes(bytes.bytes, newSuffixStart, length); input.readBytes(bytes.bytes, newSuffixStart, length);
this.field = fieldInfos.fieldName(input.readVInt()); final int fieldNumber = input.readVInt();
if (fieldNumber != currentFieldNumber) {
currentFieldNumber = fieldNumber;
field = fieldInfos.fieldName(currentFieldNumber).intern();
} else {
assert field.equals(fieldInfos.fieldName(fieldNumber)): "currentFieldNumber=" + currentFieldNumber + " field=" + field + " vs " + fieldInfos.fieldName(fieldNumber);
}
} }
public void set(Term term) { public void set(Term term) {
@ -68,12 +79,14 @@ final class TermBuffer implements Cloneable {
return; return;
} }
bytes.copy(term.bytes()); bytes.copy(term.bytes());
field = term.field(); field = term.field().intern();
currentFieldNumber = -1;
this.term = term; this.term = term;
} }
public void set(TermBuffer other) { public void set(TermBuffer other) {
field = other.field; field = other.field;
currentFieldNumber = other.currentFieldNumber;
// dangerous to copy Term over, since the underlying // dangerous to copy Term over, since the underlying
// BytesRef could subsequently be modified: // BytesRef could subsequently be modified:
term = null; term = null;
@ -83,6 +96,7 @@ final class TermBuffer implements Cloneable {
public void reset() { public void reset() {
field = null; field = null;
term = null; term = null;
currentFieldNumber= -1;
} }
public Term toTerm() { public Term toTerm() {
@ -90,8 +104,7 @@ final class TermBuffer implements Cloneable {
return null; return null;
if (term == null) { if (term == null) {
term = new Term(field, new BytesRef(bytes), false); term = new Term(field, new BytesRef(bytes));
//term = new Term(field, bytes, false);
} }
return term; return term;

View File

@ -18,12 +18,14 @@ package org.apache.lucene.index.codecs.preflex;
*/ */
import java.io.IOException; import java.io.IOException;
import java.util.Comparator;
import org.apache.lucene.index.CorruptIndexException; import org.apache.lucene.index.CorruptIndexException;
import org.apache.lucene.index.FieldInfos; import org.apache.lucene.index.FieldInfos;
import org.apache.lucene.index.Term;
import org.apache.lucene.index.IndexFileNames; import org.apache.lucene.index.IndexFileNames;
import org.apache.lucene.index.Term;
import org.apache.lucene.store.Directory; import org.apache.lucene.store.Directory;
import org.apache.lucene.util.BytesRef;
import org.apache.lucene.util.CloseableThreadLocal; import org.apache.lucene.util.CloseableThreadLocal;
import org.apache.lucene.util.DoubleBarrelLRUCache; import org.apache.lucene.util.DoubleBarrelLRUCache;
@ -189,6 +191,16 @@ public final class TermInfosReader {
return resources; return resources;
} }
private static final Comparator<BytesRef> legacyComparator =
BytesRef.getUTF8SortedAsUTF16Comparator();
private final int compareAsUTF16(Term term1, Term term2) {
if (term1.field().equals(term2.field())) {
return legacyComparator.compare(term1.bytes(), term2.bytes());
} else {
return term1.field().compareTo(term2.field());
}
}
/** Returns the offset of the greatest index entry which is less than or equal to term.*/ /** Returns the offset of the greatest index entry which is less than or equal to term.*/
private int getIndexOffset(Term term) { private int getIndexOffset(Term term) {
@ -198,7 +210,7 @@ public final class TermInfosReader {
while (hi >= lo) { while (hi >= lo) {
int mid = (lo + hi) >>> 1; int mid = (lo + hi) >>> 1;
assert indexTerms[mid] != null : "indexTerms = " + indexTerms.length + " mid=" + mid; assert indexTerms[mid] != null : "indexTerms = " + indexTerms.length + " mid=" + mid;
int delta = term.compareToUTF16(indexTerms[mid]); int delta = compareAsUTF16(term, indexTerms[mid]);
if (delta < 0) if (delta < 0)
hi = mid - 1; hi = mid - 1;
else if (delta > 0) else if (delta > 0)
@ -256,16 +268,16 @@ public final class TermInfosReader {
// optimize sequential access: first try scanning cached enum w/o seeking // optimize sequential access: first try scanning cached enum w/o seeking
if (enumerator.term() != null // term is at or past current if (enumerator.term() != null // term is at or past current
&& ((enumerator.prev() != null && term.compareToUTF16(enumerator.prev())> 0) && ((enumerator.prev() != null && compareAsUTF16(term, enumerator.prev())> 0)
|| term.compareToUTF16(enumerator.term()) >= 0)) { || compareAsUTF16(term, enumerator.term()) >= 0)) {
int enumOffset = (int)(enumerator.position/totalIndexInterval)+1; int enumOffset = (int)(enumerator.position/totalIndexInterval)+1;
if (indexTerms.length == enumOffset // but before end of block if (indexTerms.length == enumOffset // but before end of block
|| term.compareToUTF16(indexTerms[enumOffset]) < 0) { || compareAsUTF16(term, indexTerms[enumOffset]) < 0) {
// no need to seek // no need to seek
final TermInfo ti; final TermInfo ti;
int numScans = enumerator.scanTo(term); int numScans = enumerator.scanTo(term);
if (enumerator.term() != null && term.compareToUTF16(enumerator.term()) == 0) { if (enumerator.term() != null && compareAsUTF16(term, enumerator.term()) == 0) {
ti = enumerator.termInfo; ti = enumerator.termInfo;
if (numScans > 1) { if (numScans > 1) {
// we only want to put this TermInfo into the cache if // we only want to put this TermInfo into the cache if
@ -303,7 +315,7 @@ public final class TermInfosReader {
enumerator.scanTo(term); enumerator.scanTo(term);
final TermInfo ti; final TermInfo ti;
if (enumerator.term() != null && term.compareToUTF16(enumerator.term()) == 0) { if (enumerator.term() != null && compareAsUTF16(term, enumerator.term()) == 0) {
ti = enumerator.termInfo; ti = enumerator.termInfo;
if (tiOrd == null) { if (tiOrd == null) {
if (useCache) { if (useCache) {
@ -360,9 +372,9 @@ public final class TermInfosReader {
SegmentTermEnum enumerator = getThreadResources().termEnum; SegmentTermEnum enumerator = getThreadResources().termEnum;
seekEnum(enumerator, indexOffset); seekEnum(enumerator, indexOffset);
while(term.compareToUTF16(enumerator.term()) > 0 && enumerator.next()) {} while(compareAsUTF16(term, enumerator.term()) > 0 && enumerator.next()) {}
if (term.compareToUTF16(enumerator.term()) == 0) if (compareAsUTF16(term, enumerator.term()) == 0)
return enumerator.position; return enumerator.position;
else else
return -1; return -1;

View File

@ -30,7 +30,6 @@ import org.apache.lucene.store.IndexInput;
import org.apache.lucene.util.ArrayUtil; import org.apache.lucene.util.ArrayUtil;
import org.apache.lucene.util.Bits; import org.apache.lucene.util.Bits;
import org.apache.lucene.util.CharsRef; import org.apache.lucene.util.CharsRef;
import org.apache.lucene.util.StringHelper;
import org.apache.lucene.util.UnicodeUtil; import org.apache.lucene.util.UnicodeUtil;
import org.apache.lucene.util.fst.Builder; import org.apache.lucene.util.fst.Builder;
import org.apache.lucene.util.fst.BytesRefFSTEnum; import org.apache.lucene.util.fst.BytesRefFSTEnum;
@ -102,9 +101,7 @@ class SimpleTextFieldsReader extends FieldsProducer {
return null; return null;
} }
if (scratch.startsWith(FIELD)) { if (scratch.startsWith(FIELD)) {
String field = StringHelper.intern(new String(scratch.bytes, scratch.offset + FIELD.length, scratch.length - FIELD.length, "UTF-8")); return current = new String(scratch.bytes, scratch.offset + FIELD.length, scratch.length - FIELD.length, "UTF-8");
current = field;
return field;
} }
} }
} }

View File

@ -117,7 +117,7 @@ public class AutomatonQuery extends MultiTermQuery {
factory = new TermsEnumFactory() { factory = new TermsEnumFactory() {
@Override @Override
protected TermsEnum getTermsEnum(Terms terms, AttributeSource atts) throws IOException { protected TermsEnum getTermsEnum(Terms terms, AttributeSource atts) throws IOException {
return new SingleTermsEnum(terms.iterator(), term.createTerm(singleton)); return new SingleTermsEnum(terms.iterator(), new Term(field, singleton));
} }
}; };
} else if (BasicOperations.sameLanguage(automaton, BasicOperations.concatenate( } else if (BasicOperations.sameLanguage(automaton, BasicOperations.concatenate(
@ -126,7 +126,7 @@ public class AutomatonQuery extends MultiTermQuery {
factory = new TermsEnumFactory() { factory = new TermsEnumFactory() {
@Override @Override
protected TermsEnum getTermsEnum(Terms terms, AttributeSource atts) throws IOException { protected TermsEnum getTermsEnum(Terms terms, AttributeSource atts) throws IOException {
return new PrefixTermsEnum(terms.iterator(), term.createTerm(commonPrefix)); return new PrefixTermsEnum(terms.iterator(), new Term(field, commonPrefix));
} }
}; };
} else { } else {

View File

@ -100,14 +100,13 @@ class ConstantScoreAutoRewrite extends TermCollectingRewrite<BooleanQuery> {
return getTopLevelQuery(); return getTopLevelQuery();
} else { } else {
final BooleanQuery bq = getTopLevelQuery(); final BooleanQuery bq = getTopLevelQuery();
final Term placeholderTerm = new Term(query.field);
final BytesRefHash pendingTerms = col.pendingTerms; final BytesRefHash pendingTerms = col.pendingTerms;
final int sort[] = pendingTerms.sort(col.termsEnum.getComparator()); final int sort[] = pendingTerms.sort(col.termsEnum.getComparator());
for(int i = 0; i < size; i++) { for(int i = 0; i < size; i++) {
final int pos = sort[i]; final int pos = sort[i];
// docFreq is not used for constant score here, we pass 1 // docFreq is not used for constant score here, we pass 1
// to explicitely set a fake value, so it's not calculated // to explicitely set a fake value, so it's not calculated
addClause(bq, placeholderTerm.createTerm(pendingTerms.get(pos, new BytesRef())), 1, 1.0f, col.array.termState[pos]); addClause(bq, new Term(query.field, pendingTerms.get(pos, new BytesRef())), 1, 1.0f, col.array.termState[pos]);
} }
// Strip scores // Strip scores
final Query result = new ConstantScoreQuery(bq); final Query result = new ConstantScoreQuery(bq);

View File

@ -42,7 +42,6 @@ import org.apache.lucene.search.cache.CachedArray.IntValues;
import org.apache.lucene.search.cache.CachedArray.LongValues; import org.apache.lucene.search.cache.CachedArray.LongValues;
import org.apache.lucene.search.cache.CachedArray.ShortValues; import org.apache.lucene.search.cache.CachedArray.ShortValues;
import org.apache.lucene.util.FieldCacheSanityChecker; import org.apache.lucene.util.FieldCacheSanityChecker;
import org.apache.lucene.util.StringHelper;
/** /**
* Expert: The default cache implementation, storing all values in memory. * Expert: The default cache implementation, storing all values in memory.
@ -246,7 +245,7 @@ public class FieldCacheImpl implements FieldCache { // Made Public so that
/** Creates one of these objects for a custom comparator/parser. */ /** Creates one of these objects for a custom comparator/parser. */
Entry (String field, EntryCreator<T> custom) { Entry (String field, EntryCreator<T> custom) {
this.field = StringHelper.intern(field); this.field = field;
this.creator = custom; this.creator = custom;
} }
@ -255,7 +254,7 @@ public class FieldCacheImpl implements FieldCache { // Made Public so that
public boolean equals (Object o) { public boolean equals (Object o) {
if (o instanceof Entry) { if (o instanceof Entry) {
Entry other = (Entry) o; Entry other = (Entry) o;
if (other.field == field) { if (other.field.equals(field)) {
if (other.creator == null) { if (other.creator == null) {
if (creator == null) return true; if (creator == null) return true;
} else if (other.creator.equals (creator)) { } else if (other.creator.equals (creator)) {

View File

@ -88,7 +88,7 @@ public class MultiPhraseQuery extends Query {
field = terms[0].field(); field = terms[0].field();
for (int i = 0; i < terms.length; i++) { for (int i = 0; i < terms.length; i++) {
if (terms[i].field() != field) { if (!terms[i].field().equals(field)) {
throw new IllegalArgumentException( throw new IllegalArgumentException(
"All phrase terms must be in the same field (" + field + "): " "All phrase terms must be in the same field (" + field + "): "
+ terms[i]); + terms[i]);

View File

@ -85,10 +85,11 @@ public class PhraseQuery extends Query {
* @param position * @param position
*/ */
public void add(Term term, int position) { public void add(Term term, int position) {
if (terms.size() == 0) if (terms.size() == 0) {
field = term.field(); field = term.field();
else if (term.field() != field) } else if (!term.field().equals(field)) {
throw new IllegalArgumentException("All phrase terms must be in the same field: " + term); throw new IllegalArgumentException("All phrase terms must be in the same field: " + term);
}
terms.add(term); terms.add(term);
positions.add(Integer.valueOf(position)); positions.add(Integer.valueOf(position));

View File

@ -113,7 +113,6 @@ public abstract class ScoringRewrite<Q extends Query> extends TermCollectingRewr
final ParallelArraysTermCollector col = new ParallelArraysTermCollector(); final ParallelArraysTermCollector col = new ParallelArraysTermCollector();
collectTerms(reader, query, col); collectTerms(reader, query, col);
final Term placeholderTerm = new Term(query.field);
final int size = col.terms.size(); final int size = col.terms.size();
if (size > 0) { if (size > 0) {
final int sort[] = col.terms.sort(col.termsEnum.getComparator()); final int sort[] = col.terms.sort(col.termsEnum.getComparator());
@ -121,7 +120,7 @@ public abstract class ScoringRewrite<Q extends Query> extends TermCollectingRewr
final PerReaderTermState[] termStates = col.array.termState; final PerReaderTermState[] termStates = col.array.termState;
for (int i = 0; i < size; i++) { for (int i = 0; i < size; i++) {
final int pos = sort[i]; final int pos = sort[i];
final Term term = placeholderTerm.createTerm(col.terms.get(pos, new BytesRef())); final Term term = new Term(query.getField(), col.terms.get(pos, new BytesRef()));
assert reader.docFreq(term) == termStates[pos].docFreq(); assert reader.docFreq(term) == termStates[pos].docFreq();
addClause(result, term, termStates[pos].docFreq(), query.getBoost() * boost[pos], termStates[pos]); addClause(result, term, termStates[pos].docFreq(), query.getBoost() * boost[pos], termStates[pos]);
} }

View File

@ -21,8 +21,8 @@ import java.io.IOException;
import java.util.Comparator; import java.util.Comparator;
import org.apache.lucene.search.cache.*; import org.apache.lucene.search.cache.*;
import org.apache.lucene.util.StringHelper;
import org.apache.lucene.util.BytesRef; import org.apache.lucene.util.BytesRef;
import org.apache.lucene.util.StringHelper;
// TODO(simonw) -- for cleaner transition, maybe we should make // TODO(simonw) -- for cleaner transition, maybe we should make
// a new SortField that subclasses this one and always uses // a new SortField that subclasses this one and always uses
@ -166,7 +166,7 @@ public class SortField {
if (field == null) { if (field == null) {
throw new IllegalArgumentException("field can only be null when type is SCORE or DOC"); throw new IllegalArgumentException("field can only be null when type is SCORE or DOC");
} }
this.field = StringHelper.intern(field); this.field = field;
this.reverse = reverse; this.reverse = reverse;
if (parser instanceof FieldCache.IntParser) { if (parser instanceof FieldCache.IntParser) {
@ -205,7 +205,7 @@ public class SortField {
*/ */
public SortField( CachedArrayCreator<?> creator, boolean reverse ) public SortField( CachedArrayCreator<?> creator, boolean reverse )
{ {
this.field = StringHelper.intern(creator.field); this.field = creator.field;
this.reverse = reverse; this.reverse = reverse;
this.creator = creator; this.creator = creator;
this.type = creator.getSortTypeID(); this.type = creator.getSortTypeID();
@ -253,7 +253,7 @@ public class SortField {
if (type != SCORE && type != DOC) if (type != SCORE && type != DOC)
throw new IllegalArgumentException("field can only be null when type is SCORE or DOC"); throw new IllegalArgumentException("field can only be null when type is SCORE or DOC");
} else { } else {
this.field = StringHelper.intern(field); this.field = field;
} }
if( creator != null ) { if( creator != null ) {
@ -381,7 +381,7 @@ public class SortField {
if (!(o instanceof SortField)) return false; if (!(o instanceof SortField)) return false;
final SortField other = (SortField)o; final SortField other = (SortField)o;
return ( return (
other.field == this.field // field is always interned StringHelper.equals(other.field, this.field)
&& other.type == this.type && other.type == this.type
&& other.reverse == this.reverse && other.reverse == this.reverse
&& (other.comparatorSource == null ? this.comparatorSource == null : other.comparatorSource.equals(this.comparatorSource)) && (other.comparatorSource == null ? this.comparatorSource == null : other.comparatorSource.equals(this.comparatorSource))

View File

@ -131,12 +131,11 @@ public abstract class TopTermsRewrite<Q extends Query> extends TermCollectingRew
} }
}); });
final Term placeholderTerm = new Term(query.field);
final Q q = getTopLevelQuery(); final Q q = getTopLevelQuery();
final ScoreTerm[] scoreTerms = stQueue.toArray(new ScoreTerm[stQueue.size()]); final ScoreTerm[] scoreTerms = stQueue.toArray(new ScoreTerm[stQueue.size()]);
ArrayUtil.mergeSort(scoreTerms, scoreTermSortByTermComp); ArrayUtil.mergeSort(scoreTerms, scoreTermSortByTermComp);
for (final ScoreTerm st : scoreTerms) { for (final ScoreTerm st : scoreTerms) {
final Term term = placeholderTerm.createTerm(st.bytes); final Term term = new Term(query.field, st.bytes);
assert reader.docFreq(term) == st.termState.docFreq() : "reader DF is " + reader.docFreq(term) + " vs " + st.termState.docFreq(); assert reader.docFreq(term) == st.termState.docFreq() : "reader DF is " + reader.docFreq(term) + " vs " + st.termState.docFreq();
addClause(q, term, st.termState.docFreq(), query.getBoost() * st.boost, st.termState); // add to query addClause(q, term, st.termState.docFreq(), query.getBoost() * st.boost, st.termState); // add to query
} }

View File

@ -29,7 +29,6 @@ import org.apache.lucene.search.FieldCache.DocTerms;
import org.apache.lucene.util.Bits; import org.apache.lucene.util.Bits;
import org.apache.lucene.util.BytesRef; import org.apache.lucene.util.BytesRef;
import org.apache.lucene.util.PagedBytes; import org.apache.lucene.util.PagedBytes;
import org.apache.lucene.util.StringHelper;
import org.apache.lucene.util.packed.GrowableWriter; import org.apache.lucene.util.packed.GrowableWriter;
import org.apache.lucene.util.packed.PackedInts; import org.apache.lucene.util.packed.PackedInts;
@ -66,7 +65,6 @@ public class DocTermsCreator extends EntryCreatorWithOptions<DocTerms>
@Override @Override
public DocTerms create(IndexReader reader) throws IOException { public DocTerms create(IndexReader reader) throws IOException {
String field = StringHelper.intern(this.field); // TODO?? necessary?
Terms terms = MultiFields.getTerms(reader, field); Terms terms = MultiFields.getTerms(reader, field);
final boolean fasterButMoreRAM = hasOption( FASTER_BUT_MORE_RAM ); final boolean fasterButMoreRAM = hasOption( FASTER_BUT_MORE_RAM );

View File

@ -34,7 +34,6 @@ import org.apache.lucene.util.ArrayUtil;
import org.apache.lucene.util.Bits; import org.apache.lucene.util.Bits;
import org.apache.lucene.util.BytesRef; import org.apache.lucene.util.BytesRef;
import org.apache.lucene.util.PagedBytes; import org.apache.lucene.util.PagedBytes;
import org.apache.lucene.util.StringHelper;
import org.apache.lucene.util.packed.GrowableWriter; import org.apache.lucene.util.packed.GrowableWriter;
import org.apache.lucene.util.packed.PackedInts; import org.apache.lucene.util.packed.PackedInts;
@ -70,7 +69,6 @@ public class DocTermsIndexCreator extends EntryCreatorWithOptions<DocTermsIndex>
@Override @Override
public DocTermsIndex create(IndexReader reader) throws IOException public DocTermsIndex create(IndexReader reader) throws IOException
{ {
String field = StringHelper.intern(this.field); // TODO?? necessary?
Terms terms = MultiFields.getTerms(reader, field); Terms terms = MultiFields.getTerms(reader, field);
final boolean fasterButMoreRAM = hasOption(FASTER_BUT_MORE_RAM); final boolean fasterButMoreRAM = hasOption(FASTER_BUT_MORE_RAM);

View File

@ -208,7 +208,7 @@ public final class FieldCacheSanityChecker {
if (seen.contains(rf)) continue; if (seen.contains(rf)) continue;
List<Object> kids = getAllDecendentReaderKeys(rf.readerKey); List<Object> kids = getAllDescendentReaderKeys(rf.readerKey);
for (Object kidKey : kids) { for (Object kidKey : kids) {
ReaderField kid = new ReaderField(kidKey, rf.fieldName); ReaderField kid = new ReaderField(kidKey, rf.fieldName);
@ -252,7 +252,7 @@ public final class FieldCacheSanityChecker {
badness = badEntries.toArray(badness); badness = badEntries.toArray(badness);
insanity.add(new Insanity(InsanityType.SUBREADER, insanity.add(new Insanity(InsanityType.SUBREADER,
"Found caches for decendents of " + "Found caches for descendants of " +
parent.toString(), parent.toString(),
badness)); badness));
} }
@ -266,7 +266,7 @@ public final class FieldCacheSanityChecker {
* the hierarchy of subReaders building up a list of the objects * the hierarchy of subReaders building up a list of the objects
* returned by obj.getFieldCacheKey() * returned by obj.getFieldCacheKey()
*/ */
private List<Object> getAllDecendentReaderKeys(Object seed) { private List<Object> getAllDescendentReaderKeys(Object seed) {
List<Object> all = new ArrayList<Object>(17); // will grow as we iter List<Object> all = new ArrayList<Object>(17); // will grow as we iter
all.add(seed); all.add(seed);
for (int i = 0; i < all.size(); i++) { for (int i = 0; i < all.size(); i++) {

View File

@ -1,85 +0,0 @@
package org.apache.lucene.util;
/**
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
/**
* Simple lockless and memory barrier free String intern cache that is guaranteed
* to return the same String instance as String.intern()
* does.
*
* @lucene.internal
*/
public class SimpleStringInterner extends StringInterner {
private static class Entry {
final private String str;
final private int hash;
private Entry next;
private Entry(String str, int hash, Entry next) {
this.str = str;
this.hash = hash;
this.next = next;
}
}
private final Entry[] cache;
private final int maxChainLength;
/**
* @param tableSize Size of the hash table, should be a power of two.
* @param maxChainLength Maximum length of each bucket, after which the oldest item inserted is dropped.
*/
public SimpleStringInterner(int tableSize, int maxChainLength) {
cache = new Entry[Math.max(1,BitUtil.nextHighestPowerOfTwo(tableSize))];
this.maxChainLength = Math.max(2,maxChainLength);
}
@Override
public String intern(String s) {
int h = s.hashCode();
// In the future, it may be worth augmenting the string hash
// if the lower bits need better distribution.
int slot = h & (cache.length-1);
Entry first = this.cache[slot];
Entry nextToLast = null;
int chainLength = 0;
for(Entry e=first; e!=null; e=e.next) {
if (e.hash == h && (e.str == s || e.str.compareTo(s)==0)) {
// if (e.str == s || (e.hash == h && e.str.compareTo(s)==0)) {
return e.str;
}
chainLength++;
if (e.next != null) {
nextToLast = e;
}
}
// insertion-order cache: add new entry at head
s = s.intern();
this.cache[slot] = new Entry(s, h, first);
if (chainLength >= maxChainLength) {
// prune last entry
nextToLast.next = null;
}
return s;
}
}

View File

@ -27,17 +27,6 @@ import java.util.StringTokenizer;
* @lucene.internal * @lucene.internal
*/ */
public abstract class StringHelper { public abstract class StringHelper {
/**
* Expert:
* The StringInterner implementation used by Lucene.
* This shouldn't be changed to an incompatible implementation after other Lucene APIs have been used.
*/
public static StringInterner interner = new SimpleStringInterner(1024,8);
/** Return the same string object for all equal strings */
public static String intern(String s) {
return interner.intern(s);
}
/** /**
* Compares two byte[] arrays, element by element, and returns the * Compares two byte[] arrays, element by element, and returns the
@ -95,4 +84,12 @@ public abstract class StringHelper {
return 0; return 0;
} }
}; };
public static boolean equals(String s1, String s2) {
if (s1 == null) {
return s2 == null;
} else {
return s1.equals(s2);
}
}
} }

View File

@ -1,37 +0,0 @@
package org.apache.lucene.util;
/**
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
/**
* Subclasses of StringInterner are required to
* return the same single String object for all equal strings.
* Depending on the implementation, this may not be
* the same object returned as String.intern().
*
* This StringInterner base class simply delegates to String.intern().
*/
public class StringInterner {
/** Returns a single object instance for each equal string. */
public String intern(String s) {
return s.intern();
}
/** Returns a single object instance for each equal string. */
public String intern(char[] arr, int offset, int len) {
return intern(new String(arr, offset, len));
}
}

View File

@ -713,6 +713,10 @@ public abstract class LuceneTestCase extends Assert {
throw e; throw e;
} }
if (insanity.length != 0) {
reportAdditionalFailureInfo();
}
assertEquals(msg + ": Insane FieldCache usage(s) found", assertEquals(msg + ": Insane FieldCache usage(s) found",
0, insanity.length); 0, insanity.length);
insanity = null; insanity = null;
@ -1104,11 +1108,17 @@ public abstract class LuceneTestCase extends Assert {
/** Returns a new field instance, using the specified random. /** Returns a new field instance, using the specified random.
* See {@link #newField(String, String, Field.Store, Field.Index, Field.TermVector)} for more information */ * See {@link #newField(String, String, Field.Store, Field.Index, Field.TermVector)} for more information */
public static Field newField(Random random, String name, String value, Store store, Index index, TermVector tv) { public static Field newField(Random random, String name, String value, Store store, Index index, TermVector tv) {
if (usually(random)) { if (usually(random)) {
// most of the time, don't modify the params // most of the time, don't modify the params
return new Field(name, value, store, index, tv); return new Field(name, value, store, index, tv);
} }
if (random.nextBoolean()) {
// tickle any code still relying on field names being interned:
name = new String(name);
}
if (!index.isIndexed()) if (!index.isIndexed())
return new Field(name, value, store, index, tv); return new Field(name, value, store, index, tv);

View File

@ -39,7 +39,6 @@ public class TestDocumentsWriterDeleteQueue extends LuceneTestCase {
for (int i = 0; i < ids.length; i++) { for (int i = 0; i < ids.length; i++) {
ids[i] = random.nextInt(); ids[i] = random.nextInt();
} }
Term template = new Term("id");
DeleteSlice slice1 = queue.newSlice(); DeleteSlice slice1 = queue.newSlice();
DeleteSlice slice2 = queue.newSlice(); DeleteSlice slice2 = queue.newSlice();
BufferedDeletes bd1 = new BufferedDeletes(false); BufferedDeletes bd1 = new BufferedDeletes(false);
@ -50,7 +49,7 @@ public class TestDocumentsWriterDeleteQueue extends LuceneTestCase {
for (int j = 0; j < ids.length; j++) { for (int j = 0; j < ids.length; j++) {
Integer i = ids[j]; Integer i = ids[j];
// create an array here since we compare identity below against tailItem // create an array here since we compare identity below against tailItem
Term[] term = new Term[] {template.createTerm(i.toString())}; Term[] term = new Term[] {new Term("id", i.toString())};
uniqueValues.add(term[0]); uniqueValues.add(term[0]);
queue.addDelete(term); queue.addDelete(term);
if (random.nextInt(20) == 0 || j == ids.length - 1) { if (random.nextInt(20) == 0 || j == ids.length - 1) {
@ -79,16 +78,14 @@ public class TestDocumentsWriterDeleteQueue extends LuceneTestCase {
private void assertAllBetween(int start, int end, BufferedDeletes deletes, private void assertAllBetween(int start, int end, BufferedDeletes deletes,
Integer[] ids) { Integer[] ids) {
Term template = new Term("id");
for (int i = start; i <= end; i++) { for (int i = start; i <= end; i++) {
assertEquals(Integer.valueOf(end), deletes.terms.get(template assertEquals(Integer.valueOf(end), deletes.terms.get(new Term("id",
.createTerm(ids[i].toString()))); ids[i].toString())));
} }
} }
public void testClear() { public void testClear() {
DocumentsWriterDeleteQueue queue = new DocumentsWriterDeleteQueue(); DocumentsWriterDeleteQueue queue = new DocumentsWriterDeleteQueue();
Term template = new Term("id");
assertFalse(queue.anyChanges()); assertFalse(queue.anyChanges());
queue.clear(); queue.clear();
assertFalse(queue.anyChanges()); assertFalse(queue.anyChanges());
@ -96,7 +93,7 @@ public class TestDocumentsWriterDeleteQueue extends LuceneTestCase {
int termsSinceFreeze = 0; int termsSinceFreeze = 0;
int queriesSinceFreeze = 0; int queriesSinceFreeze = 0;
for (int i = 0; i < size; i++) { for (int i = 0; i < size; i++) {
Term term = template.createTerm("" + i); Term term = new Term("id", "" + i);
if (random.nextInt(10) == 0) { if (random.nextInt(10) == 0) {
queue.addDelete(new TermQuery(term)); queue.addDelete(new TermQuery(term));
queriesSinceFreeze++; queriesSinceFreeze++;
@ -116,12 +113,11 @@ public class TestDocumentsWriterDeleteQueue extends LuceneTestCase {
public void testAnyChanges() { public void testAnyChanges() {
DocumentsWriterDeleteQueue queue = new DocumentsWriterDeleteQueue(); DocumentsWriterDeleteQueue queue = new DocumentsWriterDeleteQueue();
Term template = new Term("id");
final int size = 200 + random.nextInt(500) * RANDOM_MULTIPLIER; final int size = 200 + random.nextInt(500) * RANDOM_MULTIPLIER;
int termsSinceFreeze = 0; int termsSinceFreeze = 0;
int queriesSinceFreeze = 0; int queriesSinceFreeze = 0;
for (int i = 0; i < size; i++) { for (int i = 0; i < size; i++) {
Term term = template.createTerm("" + i); Term term = new Term("id", "" + i);
if (random.nextInt(10) == 0) { if (random.nextInt(10) == 0) {
queue.addDelete(new TermQuery(term)); queue.addDelete(new TermQuery(term));
queriesSinceFreeze++; queriesSinceFreeze++;
@ -147,10 +143,9 @@ public class TestDocumentsWriterDeleteQueue extends LuceneTestCase {
Set<Term> uniqueValues = new HashSet<Term>(); Set<Term> uniqueValues = new HashSet<Term>();
final int size = 10000 + random.nextInt(500) * RANDOM_MULTIPLIER; final int size = 10000 + random.nextInt(500) * RANDOM_MULTIPLIER;
Integer[] ids = new Integer[size]; Integer[] ids = new Integer[size];
Term template = new Term("id");
for (int i = 0; i < ids.length; i++) { for (int i = 0; i < ids.length; i++) {
ids[i] = random.nextInt(); ids[i] = random.nextInt();
uniqueValues.add(template.createTerm(ids[i].toString())); uniqueValues.add(new Term("id", ids[i].toString()));
} }
CountDownLatch latch = new CountDownLatch(1); CountDownLatch latch = new CountDownLatch(1);
AtomicInteger index = new AtomicInteger(0); AtomicInteger index = new AtomicInteger(0);
@ -204,10 +199,9 @@ public class TestDocumentsWriterDeleteQueue extends LuceneTestCase {
} catch (InterruptedException e) { } catch (InterruptedException e) {
throw new ThreadInterruptedException(e); throw new ThreadInterruptedException(e);
} }
Term template = new Term("id");
int i = 0; int i = 0;
while ((i = index.getAndIncrement()) < ids.length) { while ((i = index.getAndIncrement()) < ids.length) {
Term term = template.createTerm(ids[i].toString()); Term term = new Term("id", ids[i].toString());
queue.add(term, slice); queue.add(term, slice);
assertTrue(slice.isTailItem(term)); assertTrue(slice.isTailItem(term));
slice.apply(deletes, BufferedDeletes.MAX_INT); slice.apply(deletes, BufferedDeletes.MAX_INT);

View File

@ -30,9 +30,6 @@ import org.apache.lucene.analysis.MockTokenizer;
import org.apache.lucene.analysis.TokenStream; import org.apache.lucene.analysis.TokenStream;
import org.apache.lucene.document.Document; import org.apache.lucene.document.Document;
import org.apache.lucene.document.Field; import org.apache.lucene.document.Field;
import org.apache.lucene.document.Field.Index;
import org.apache.lucene.document.Field.Store;
import org.apache.lucene.document.Field.TermVector;
import org.apache.lucene.search.IndexSearcher; import org.apache.lucene.search.IndexSearcher;
import org.apache.lucene.search.ScoreDoc; import org.apache.lucene.search.ScoreDoc;
import org.apache.lucene.search.TermQuery; import org.apache.lucene.search.TermQuery;
@ -940,7 +937,7 @@ public class TestIndexWriterDelete extends LuceneTestCase {
count++; count++;
} }
} }
assertTrue("flush happened too quickly during " + (doIndexing ? "indexing" : "deleting") + " count=" + count, count > 3000); assertTrue("flush happened too quickly during " + (doIndexing ? "indexing" : "deleting") + " count=" + count, count > 2500);
} }
w.close(); w.close();
dir.close(); dir.close();

View File

@ -40,13 +40,12 @@ public class TestRollback extends LuceneTestCase {
// If buffer size is small enough to cause a flush, errors ensue... // If buffer size is small enough to cause a flush, errors ensue...
IndexWriter w = new IndexWriter(dir, newIndexWriterConfig( TEST_VERSION_CURRENT, new MockAnalyzer(random)).setMaxBufferedDocs(2).setOpenMode(IndexWriterConfig.OpenMode.APPEND)); IndexWriter w = new IndexWriter(dir, newIndexWriterConfig( TEST_VERSION_CURRENT, new MockAnalyzer(random)).setMaxBufferedDocs(2).setOpenMode(IndexWriterConfig.OpenMode.APPEND));
Term pkTerm = new Term("pk", "");
for (int i = 0; i < 3; i++) { for (int i = 0; i < 3; i++) {
Document doc = new Document(); Document doc = new Document();
String value = Integer.toString(i); String value = Integer.toString(i);
doc.add(newField("pk", value, Store.YES, Index.ANALYZED_NO_NORMS)); doc.add(newField("pk", value, Store.YES, Index.ANALYZED_NO_NORMS));
doc.add(newField("text", "foo", Store.YES, Index.ANALYZED_NO_NORMS)); doc.add(newField("text", "foo", Store.YES, Index.ANALYZED_NO_NORMS));
w.updateDocument(pkTerm.createTerm(value), doc); w.updateDocument(new Term("pk", value), doc);
} }
w.rollback(); w.rollback();

View File

@ -312,7 +312,6 @@ public class TestStressIndexing2 extends LuceneTestCase {
int[] r2r1 = new int[r2.maxDoc()]; // r2 id to r1 id mapping int[] r2r1 = new int[r2.maxDoc()]; // r2 id to r1 id mapping
// create mapping from id2 space to id2 based on idField // create mapping from id2 space to id2 based on idField
idField = StringHelper.intern(idField);
final Fields f1 = MultiFields.getFields(r1); final Fields f1 = MultiFields.getFields(r1);
if (f1 == null) { if (f1 == null) {
// make sure r2 is empty // make sure r2 is empty
@ -669,7 +668,7 @@ public class TestStressIndexing2 extends LuceneTestCase {
ArrayList<Field> fields = new ArrayList<Field>(); ArrayList<Field> fields = new ArrayList<Field>();
String idString = getIdString(); String idString = getIdString();
Field idField = newField(idTerm.field(), idString, Field.Store.YES, Field.Index.NOT_ANALYZED_NO_NORMS); Field idField = newField("id", idString, Field.Store.YES, Field.Index.NOT_ANALYZED_NO_NORMS);
fields.add(idField); fields.add(idField);
int nFields = nextInt(maxFields); int nFields = nextInt(maxFields);
@ -720,7 +719,7 @@ public class TestStressIndexing2 extends LuceneTestCase {
if (VERBOSE) { if (VERBOSE) {
System.out.println(Thread.currentThread().getName() + ": indexing id:" + idString); System.out.println(Thread.currentThread().getName() + ": indexing id:" + idString);
} }
w.updateDocument(idTerm.createTerm(idString), d); w.updateDocument(new Term("id", idString), d);
//System.out.println(Thread.currentThread().getName() + ": indexing "+d); //System.out.println(Thread.currentThread().getName() + ": indexing "+d);
docs.put(idString, d); docs.put(idString, d);
} }
@ -730,7 +729,7 @@ public class TestStressIndexing2 extends LuceneTestCase {
if (VERBOSE) { if (VERBOSE) {
System.out.println(Thread.currentThread().getName() + ": del id:" + idString); System.out.println(Thread.currentThread().getName() + ": del id:" + idString);
} }
w.deleteDocuments(idTerm.createTerm(idString)); w.deleteDocuments(new Term("id", idString));
docs.remove(idString); docs.remove(idString);
} }
@ -739,7 +738,7 @@ public class TestStressIndexing2 extends LuceneTestCase {
if (VERBOSE) { if (VERBOSE) {
System.out.println(Thread.currentThread().getName() + ": del query id:" + idString); System.out.println(Thread.currentThread().getName() + ": del query id:" + idString);
} }
w.deleteDocuments(new TermQuery(idTerm.createTerm(idString))); w.deleteDocuments(new TermQuery(new Term("id", idString)));
docs.remove(idString); docs.remove(idString);
} }

View File

@ -75,8 +75,15 @@ public class TestSurrogates extends LuceneTestCase {
} }
private static class SortTermAsUTF16Comparator implements Comparator<Term> { private static class SortTermAsUTF16Comparator implements Comparator<Term> {
public int compare(Term o1, Term o2) { private static final Comparator<BytesRef> legacyComparator =
return o1.compareToUTF16(o2); BytesRef.getUTF8SortedAsUTF16Comparator();
public int compare(Term term1, Term term2) {
if (term1.field().equals(term2.field())) {
return legacyComparator.compare(term1.bytes(), term2.bytes());
} else {
return term1.field().compareTo(term2.field());
}
} }
} }
@ -171,7 +178,7 @@ public class TestSurrogates extends LuceneTestCase {
break; break;
} }
term = fieldTerms.get(1+spot+i); term = fieldTerms.get(1+spot+i);
if (term.field() != field) { if (!term.field().equals(field)) {
assertNull(te.next()); assertNull(te.next());
break; break;
} else { } else {
@ -224,7 +231,7 @@ public class TestSurrogates extends LuceneTestCase {
spot = -spot - 1; spot = -spot - 1;
if (spot == fieldTerms.size() || fieldTerms.get(spot).field() != field) { if (spot == fieldTerms.size() || !fieldTerms.get(spot).field().equals(field)) {
assertEquals(TermsEnum.SeekStatus.END, te.seek(tx.bytes())); assertEquals(TermsEnum.SeekStatus.END, te.seek(tx.bytes()));
} else { } else {
assertEquals(TermsEnum.SeekStatus.NOT_FOUND, te.seek(tx.bytes())); assertEquals(TermsEnum.SeekStatus.NOT_FOUND, te.seek(tx.bytes()));
@ -247,7 +254,7 @@ public class TestSurrogates extends LuceneTestCase {
break; break;
} }
Term term = fieldTerms.get(1+spot+i); Term term = fieldTerms.get(1+spot+i);
if (term.field() != field) { if (!term.field().equals(field)) {
assertNull(te.next()); assertNull(te.next());
break; break;
} else { } else {

View File

@ -1,89 +0,0 @@
/**
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.lucene.util;
import java.util.Random;
public class TestStringIntern extends LuceneTestCase {
String[] testStrings;
String[] internedStrings;
private String randStr(int len) {
char[] arr = new char[len];
for (int i=0; i<len; i++) {
arr[i] = (char)('a' + random.nextInt(26));
}
return new String(arr);
}
private void makeStrings(int sz) {
testStrings = new String[sz];
internedStrings = new String[sz];
for (int i=0; i<sz; i++) {
testStrings[i] = randStr(random.nextInt(8)+3);
}
}
public void testStringIntern() throws InterruptedException {
makeStrings(1024*10); // something greater than the capacity of the default cache size
// makeStrings(100); // realistic for perf testing
int nThreads = 20;
// final int iter=100000;
final int iter = atLeast(100000);
// try native intern
// StringHelper.interner = new StringInterner();
Thread[] threads = new Thread[nThreads];
for (int i=0; i<nThreads; i++) {
final int seed = i;
threads[i] = new Thread() {
@Override
public void run() {
Random rand = new Random(seed);
String[] myInterned = new String[testStrings.length];
for (int j=0; j<iter; j++) {
int idx = rand.nextInt(testStrings.length);
String s = testStrings[idx];
if (rand.nextBoolean()) s = new String(s); // make a copy half of the time
String interned = StringHelper.intern(s);
String prevInterned = myInterned[idx];
String otherInterned = internedStrings[idx];
// test against other threads
if (otherInterned != null && otherInterned != interned) {
fail();
}
internedStrings[idx] = interned;
// test against local copy
if (prevInterned != null && prevInterned != interned) {
fail();
}
myInterned[idx] = interned;
}
}
};
threads[i].start();
}
for (int i=0; i<nThreads; i++) {
threads[i].join();
}
}
}

View File

@ -481,7 +481,7 @@ public class TestPerfTasksLogic extends BenchmarkTestCase {
FieldsEnum fields = MultiFields.getFields(reader).iterator(); FieldsEnum fields = MultiFields.getFields(reader).iterator();
String fieldName = null; String fieldName = null;
while((fieldName = fields.next()) != null) { while((fieldName = fields.next()) != null) {
if (fieldName == DocMaker.ID_FIELD || fieldName == DocMaker.DATE_MSEC_FIELD || fieldName == DocMaker.TIME_SEC_FIELD) { if (fieldName.equals(DocMaker.ID_FIELD) || fieldName.equals(DocMaker.DATE_MSEC_FIELD) || fieldName.equals(DocMaker.TIME_SEC_FIELD)) {
continue; continue;
} }
TermsEnum terms = fields.terms(); TermsEnum terms = fields.terms();

View File

@ -328,8 +328,9 @@ public class DirectSpellChecker {
if (minQueryLength > 0 && text.codePointCount(0, text.length()) < minQueryLength) if (minQueryLength > 0 && text.codePointCount(0, text.length()) < minQueryLength)
return new SuggestWord[0]; return new SuggestWord[0];
if (lowerCaseTerms) if (lowerCaseTerms) {
term = term.createTerm(text.toLowerCase(Locale.ENGLISH)); term = new Term(term.field(), text.toLowerCase(Locale.ENGLISH));
}
int docfreq = ir.docFreq(term); int docfreq = ir.docFreq(term);

View File

@ -26,7 +26,6 @@ import org.apache.lucene.index.Terms;
import org.apache.lucene.index.MultiFields; import org.apache.lucene.index.MultiFields;
import org.apache.lucene.search.spell.Dictionary; import org.apache.lucene.search.spell.Dictionary;
import org.apache.lucene.util.CharsRef; import org.apache.lucene.util.CharsRef;
import org.apache.lucene.util.StringHelper;
import org.apache.lucene.util.BytesRef; import org.apache.lucene.util.BytesRef;
/** /**
@ -47,7 +46,7 @@ public class HighFrequencyDictionary implements Dictionary {
public HighFrequencyDictionary(IndexReader reader, String field, float thresh) { public HighFrequencyDictionary(IndexReader reader, String field, float thresh) {
this.reader = reader; this.reader = reader;
this.field = StringHelper.intern(field); this.field = field;
this.thresh = thresh; this.thresh = thresh;
} }

View File

@ -26,7 +26,6 @@ import org.apache.lucene.util.BytesRef;
import org.apache.lucene.util.CharsRef; import org.apache.lucene.util.CharsRef;
import org.apache.lucene.index.Terms; import org.apache.lucene.index.Terms;
import org.apache.lucene.index.MultiFields; import org.apache.lucene.index.MultiFields;
import org.apache.lucene.util.StringHelper;
import java.io.*; import java.io.*;
@ -46,7 +45,7 @@ public class LuceneDictionary implements Dictionary {
public LuceneDictionary(IndexReader reader, String field) { public LuceneDictionary(IndexReader reader, String field) {
this.reader = reader; this.reader = reader;
this.field = StringHelper.intern(field); this.field = field;
} }
public final Iterator<String> getWordsIterator() { public final Iterator<String> getWordsIterator() {

View File

@ -77,8 +77,6 @@ public class SpellChecker implements java.io.Closeable {
*/ */
public static final String F_WORD = "word"; public static final String F_WORD = "word";
private static final Term F_WORD_TERM = new Term(F_WORD);
/** /**
* the spell index * the spell index
*/ */
@ -486,7 +484,7 @@ public class SpellChecker implements java.io.Closeable {
// obtainSearcher calls ensureOpen // obtainSearcher calls ensureOpen
final IndexSearcher indexSearcher = obtainSearcher(); final IndexSearcher indexSearcher = obtainSearcher();
try{ try{
return indexSearcher.docFreq(F_WORD_TERM.createTerm(word)) > 0; return indexSearcher.docFreq(new Term(F_WORD, word)) > 0;
} finally { } finally {
releaseSearcher(indexSearcher); releaseSearcher(indexSearcher);
} }

View File

@ -46,7 +46,6 @@ import org.apache.lucene.index.IndexReader;
import org.apache.lucene.index.IndexReader.AtomicReaderContext; import org.apache.lucene.index.IndexReader.AtomicReaderContext;
import org.apache.lucene.index.Term; import org.apache.lucene.index.Term;
import org.apache.lucene.search.*; import org.apache.lucene.search.*;
import org.apache.lucene.util.StringHelper;
import org.apache.solr.cloud.ZkController; import org.apache.solr.cloud.ZkController;
import org.apache.lucene.util.BytesRef; import org.apache.lucene.util.BytesRef;
import org.apache.solr.common.SolrException; import org.apache.solr.common.SolrException;
@ -161,7 +160,7 @@ public class QueryElevationComponent extends SearchComponent implements SolrCore
throw new SolrException( SolrException.ErrorCode.SERVER_ERROR, throw new SolrException( SolrException.ErrorCode.SERVER_ERROR,
"QueryElevationComponent requires the schema to have a uniqueKeyField implemented using StrField" ); "QueryElevationComponent requires the schema to have a uniqueKeyField implemented using StrField" );
} }
idField = StringHelper.intern(sf.getName()); idField = sf.getName();
forceElevation = initArgs.getBool( QueryElevationParams.FORCE_ELEVATION, forceElevation ); forceElevation = initArgs.getBool( QueryElevationParams.FORCE_ELEVATION, forceElevation );
try { try {

View File

@ -296,7 +296,7 @@ public class TermVectorComponent extends SearchComponent implements SolrCoreAwar
private boolean useOffsets, usePositions; private boolean useOffsets, usePositions;
//private Map<String, Integer> idfCache; //private Map<String, Integer> idfCache;
private NamedList<Object> fieldNL; private NamedList<Object> fieldNL;
private Term currentTerm; private String field;
public TVMapper(IndexReader reader) { public TVMapper(IndexReader reader) {
@ -337,9 +337,8 @@ public class TermVectorComponent extends SearchComponent implements SolrCoreAwar
private int getDocFreq(BytesRef term) { private int getDocFreq(BytesRef term) {
int result = 1; int result = 1;
currentTerm = currentTerm.createTerm(term);
try { try {
Terms terms = MultiFields.getTerms(reader, currentTerm.field()); Terms terms = MultiFields.getTerms(reader, field);
if (terms != null) { if (terms != null) {
TermsEnum termsEnum = terms.iterator(); TermsEnum termsEnum = terms.iterator();
if (termsEnum.seek(term) == TermsEnum.SeekStatus.FOUND) { if (termsEnum.seek(term) == TermsEnum.SeekStatus.FOUND) {
@ -354,10 +353,7 @@ public class TermVectorComponent extends SearchComponent implements SolrCoreAwar
@Override @Override
public void setExpectations(String field, int numTerms, boolean storeOffsets, boolean storePositions) { public void setExpectations(String field, int numTerms, boolean storeOffsets, boolean storePositions) {
this.field = field;
if (fieldOptions.docFreq == true && reader != null) {
this.currentTerm = new Term(field);
}
useOffsets = storeOffsets && fieldOptions.offsets; useOffsets = storeOffsets && fieldOptions.offsets;
usePositions = storePositions && fieldOptions.positions; usePositions = storePositions && fieldOptions.positions;
fieldNL = new NamedList<Object>(); fieldNL = new NamedList<Object>();

View File

@ -22,7 +22,6 @@ import org.apache.lucene.queryParser.ParseException;
import org.apache.lucene.search.*; import org.apache.lucene.search.*;
import org.apache.lucene.util.BytesRef; import org.apache.lucene.util.BytesRef;
import org.apache.lucene.util.CharsRef; import org.apache.lucene.util.CharsRef;
import org.apache.lucene.util.StringHelper;
import org.apache.lucene.util.UnicodeUtil; import org.apache.lucene.util.UnicodeUtil;
import org.apache.lucene.util.packed.Direct16; import org.apache.lucene.util.packed.Direct16;
import org.apache.lucene.util.packed.Direct32; import org.apache.lucene.util.packed.Direct32;
@ -371,10 +370,9 @@ public class SimpleFacets {
FieldType ft = searcher.getSchema().getFieldType(field); FieldType ft = searcher.getSchema().getFieldType(field);
List<String> terms = StrUtils.splitSmart(termList, ",", true); List<String> terms = StrUtils.splitSmart(termList, ",", true);
NamedList<Integer> res = new NamedList<Integer>(); NamedList<Integer> res = new NamedList<Integer>();
Term t = new Term(field);
for (String term : terms) { for (String term : terms) {
String internal = ft.toInternal(term); String internal = ft.toInternal(term);
int count = searcher.numDocs(new TermQuery(t.createTerm(internal)), base); int count = searcher.numDocs(new TermQuery(new Term(field, internal)), base);
res.add(term, count); res.add(term, count);
} }
return res; return res;
@ -674,7 +672,7 @@ public class SimpleFacets {
if (deState==null) { if (deState==null) {
deState = new SolrIndexSearcher.DocsEnumState(); deState = new SolrIndexSearcher.DocsEnumState();
deState.fieldName = StringHelper.intern(field); deState.fieldName = field;
deState.deletedDocs = MultiFields.getDeletedDocs(r); deState.deletedDocs = MultiFields.getDeletedDocs(r);
deState.termsEnum = termsEnum; deState.termsEnum = termsEnum;
deState.docsEnum = docsEnum; deState.docsEnum = docsEnum;

View File

@ -23,7 +23,6 @@ import org.apache.lucene.index.Term;
import org.apache.lucene.index.TermsEnum; import org.apache.lucene.index.TermsEnum;
import org.apache.lucene.search.TermQuery; import org.apache.lucene.search.TermQuery;
import org.apache.lucene.search.TermRangeQuery; import org.apache.lucene.search.TermRangeQuery;
import org.apache.lucene.util.StringHelper;
import org.apache.solr.common.params.FacetParams; import org.apache.solr.common.params.FacetParams;
import org.apache.solr.common.util.NamedList; import org.apache.solr.common.util.NamedList;
import org.apache.solr.common.SolrException; import org.apache.solr.common.SolrException;
@ -123,7 +122,7 @@ public class UnInvertedField extends DocTermOrds {
if (deState == null) { if (deState == null) {
deState = new SolrIndexSearcher.DocsEnumState(); deState = new SolrIndexSearcher.DocsEnumState();
deState.fieldName = StringHelper.intern(field); deState.fieldName = field;
// deState.termsEnum = te.tenum; // deState.termsEnum = te.tenum;
deState.termsEnum = te; // TODO: check for MultiTermsEnum in SolrIndexSearcher could now fail? deState.termsEnum = te; // TODO: check for MultiTermsEnum in SolrIndexSearcher could now fail?
deState.docsEnum = docsEnum; deState.docsEnum = docsEnum;

View File

@ -27,7 +27,6 @@ import java.util.Map;
import java.util.Set; import java.util.Set;
import org.apache.lucene.document.Fieldable; import org.apache.lucene.document.Fieldable;
import org.apache.lucene.util.StringHelper;
import org.apache.solr.common.SolrDocument; import org.apache.solr.common.SolrDocument;
import org.apache.solr.common.params.CommonParams; import org.apache.solr.common.params.CommonParams;
import org.apache.solr.common.util.NamedList; import org.apache.solr.common.util.NamedList;
@ -75,7 +74,7 @@ class JSONWriter extends TextResponseWriter {
public JSONWriter(Writer writer, SolrQueryRequest req, SolrQueryResponse rsp) { public JSONWriter(Writer writer, SolrQueryRequest req, SolrQueryResponse rsp) {
super(writer, req, rsp); super(writer, req, rsp);
namedListStyle = StringHelper.intern(req.getParams().get(JSON_NL_STYLE, JSON_NL_FLAT)); namedListStyle = req.getParams().get(JSON_NL_STYLE, JSON_NL_FLAT).intern();
wrapperFunction = req.getParams().get(JSON_WRAPPER_FUNCTION); wrapperFunction = req.getParams().get(JSON_WRAPPER_FUNCTION);
} }

View File

@ -22,7 +22,6 @@ import org.apache.lucene.search.*;
import org.apache.lucene.util.Bits; import org.apache.lucene.util.Bits;
import org.apache.lucene.util.BytesRef; import org.apache.lucene.util.BytesRef;
import org.apache.lucene.util.OpenBitSet; import org.apache.lucene.util.OpenBitSet;
import org.apache.lucene.util.StringHelper;
import org.apache.solr.common.SolrException; import org.apache.solr.common.SolrException;
import org.apache.solr.common.params.SolrParams; import org.apache.solr.common.params.SolrParams;
import org.apache.solr.common.util.NamedList; import org.apache.solr.common.util.NamedList;
@ -290,14 +289,14 @@ class JoinQuery extends Query {
Bits toDeletedDocs = fromSearcher == toSearcher ? fromDeletedDocs : MultiFields.getDeletedDocs(toSearcher.getIndexReader()); Bits toDeletedDocs = fromSearcher == toSearcher ? fromDeletedDocs : MultiFields.getDeletedDocs(toSearcher.getIndexReader());
fromDeState = new SolrIndexSearcher.DocsEnumState(); fromDeState = new SolrIndexSearcher.DocsEnumState();
fromDeState.fieldName = StringHelper.intern(fromField); fromDeState.fieldName = fromField;
fromDeState.deletedDocs = fromDeletedDocs; fromDeState.deletedDocs = fromDeletedDocs;
fromDeState.termsEnum = termsEnum; fromDeState.termsEnum = termsEnum;
fromDeState.docsEnum = null; fromDeState.docsEnum = null;
fromDeState.minSetSizeCached = minDocFreqFrom; fromDeState.minSetSizeCached = minDocFreqFrom;
toDeState = new SolrIndexSearcher.DocsEnumState(); toDeState = new SolrIndexSearcher.DocsEnumState();
toDeState.fieldName = StringHelper.intern(toField); toDeState.fieldName = toField;
toDeState.deletedDocs = toDeletedDocs; toDeState.deletedDocs = toDeletedDocs;
toDeState.termsEnum = toTermsEnum; toDeState.termsEnum = toTermsEnum;
toDeState.docsEnum = null; toDeState.docsEnum = null;

View File

@ -715,7 +715,7 @@ public class SolrIndexSearcher extends IndexSearcher implements SolrInfoMBean {
TermQuery key = null; TermQuery key = null;
if (useCache) { if (useCache) {
key = new TermQuery(new Term(deState.fieldName, new BytesRef(deState.termsEnum.term()), false)); key = new TermQuery(new Term(deState.fieldName, new BytesRef(deState.termsEnum.term())));
DocSet result = filterCache.get(key); DocSet result = filterCache.get(key);
if (result != null) return result; if (result != null) return result;
} }

View File

@ -35,7 +35,6 @@ import org.apache.lucene.index.IndexReader.AtomicReaderContext;
import org.apache.lucene.index.IndexReader.ReaderContext; import org.apache.lucene.index.IndexReader.ReaderContext;
import org.apache.lucene.util.BytesRef; import org.apache.lucene.util.BytesRef;
import org.apache.lucene.util.ReaderUtil; import org.apache.lucene.util.ReaderUtil;
import org.apache.lucene.util.StringHelper;
import org.apache.solr.core.SolrCore; import org.apache.solr.core.SolrCore;
import org.apache.solr.handler.RequestHandlerBase; import org.apache.solr.handler.RequestHandlerBase;
import org.apache.solr.handler.RequestHandlerUtils; import org.apache.solr.handler.RequestHandlerUtils;
@ -224,7 +223,7 @@ public class FileFloatSource extends ValueSource {
BufferedReader r = new BufferedReader(new InputStreamReader(is)); BufferedReader r = new BufferedReader(new InputStreamReader(is));
String idName = StringHelper.intern(ffs.keyField.getName()); String idName = ffs.keyField.getName();
FieldType idType = ffs.keyField.getType(); FieldType idType = ffs.keyField.getType();
// warning: lucene's termEnum.skipTo() is not optimized... it simply does a next() // warning: lucene's termEnum.skipTo() is not optimized... it simply does a next()

View File

@ -181,13 +181,13 @@ public abstract class AbstractLuceneSpellChecker extends SolrSpellChecker {
} }
if (options.extendedResults == true && reader != null && field != null) { if (options.extendedResults == true && reader != null && field != null) {
term = term.createTerm(tokenText); term = new Term(field, tokenText);
result.addFrequency(token, reader.docFreq(term)); result.addFrequency(token, reader.docFreq(term));
int countLimit = Math.min(options.count, suggestions.length); int countLimit = Math.min(options.count, suggestions.length);
if(countLimit>0) if(countLimit>0)
{ {
for (int i = 0; i < countLimit; i++) { for (int i = 0; i < countLimit; i++) {
term = term.createTerm(suggestions[i]); term = new Term(field, suggestions[i]);
result.add(token, suggestions[i], reader.docFreq(term)); result.add(token, suggestions[i], reader.docFreq(term));
} }
} else if(shardRequest) { } else if(shardRequest) {

View File

@ -169,7 +169,7 @@ public class DirectUpdateHandler2 extends UpdateHandler {
if (cmd.indexedId == null) { if (cmd.indexedId == null) {
cmd.indexedId = getIndexedId(cmd.doc); cmd.indexedId = getIndexedId(cmd.doc);
} }
Term idTerm = this.idTerm.createTerm(cmd.indexedId); Term idTerm = new Term(idField.getName(), cmd.indexedId);
boolean del = false; boolean del = false;
if (cmd.updateTerm == null) { if (cmd.updateTerm == null) {
updateTerm = idTerm; updateTerm = idTerm;
@ -214,7 +214,7 @@ public class DirectUpdateHandler2 extends UpdateHandler {
iwCommit.lock(); iwCommit.lock();
try { try {
openWriter(); openWriter();
writer.deleteDocuments(idTerm.createTerm(idFieldType.toInternal(cmd.id))); writer.deleteDocuments(new Term(idField.getName(), idFieldType.toInternal(cmd.id)));
} finally { } finally {
iwCommit.unlock(); iwCommit.unlock();
} }

View File

@ -54,7 +54,6 @@ public abstract class UpdateHandler implements SolrInfoMBean {
protected final SchemaField idField; protected final SchemaField idField;
protected final FieldType idFieldType; protected final FieldType idFieldType;
protected final Term idTerm; // prototype term to avoid interning fieldname
protected Vector<SolrEventListener> commitCallbacks = new Vector<SolrEventListener>(); protected Vector<SolrEventListener> commitCallbacks = new Vector<SolrEventListener>();
protected Vector<SolrEventListener> optimizeCallbacks = new Vector<SolrEventListener>(); protected Vector<SolrEventListener> optimizeCallbacks = new Vector<SolrEventListener>();
@ -93,7 +92,6 @@ public abstract class UpdateHandler implements SolrInfoMBean {
schema = core.getSchema(); schema = core.getSchema();
idField = schema.getUniqueKeyField(); idField = schema.getUniqueKeyField();
idFieldType = idField!=null ? idField.getType() : null; idFieldType = idField!=null ? idField.getType() : null;
idTerm = idField!=null ? new Term(idField.getName(),"") : null;
parseEventListeners(); parseEventListeners();
} }

View File

@ -61,8 +61,6 @@ public class SignatureUpdateProcessorFactory
signatureField = params.get("signatureField", "signatureField"); signatureField = params.get("signatureField", "signatureField");
signatureTerm = new Term(signatureField, "");
signatureClass = params.get("signatureClass", signatureClass = params.get("signatureClass",
"org.apache.solr.update.processor.Lookup3Signature"); "org.apache.solr.update.processor.Lookup3Signature");
this.params = params; this.params = params;
@ -173,7 +171,7 @@ public class SignatureUpdateProcessorFactory
doc.addField(signatureField, sigString); doc.addField(signatureField, sigString);
if (overwriteDupes) { if (overwriteDupes) {
cmd.updateTerm = signatureTerm.createTerm(sigString); cmd.updateTerm = new Term(signatureField, sigString);
} }
} }