Don't allow negatives in the positions file

git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1371961 13f79535-47bb-0310-9956-ffa450edef68
This commit is contained in:
Robert Muir 2012-08-11 14:31:56 +00:00
parent c97774fb5e
commit d0dd5fadcc
2 changed files with 9 additions and 13 deletions

View File

@ -31,6 +31,11 @@ Bug Fixes
had a custom Similarity where coord(1,1) != 1F, then the rewritten had a custom Similarity where coord(1,1) != 1F, then the rewritten
query would be scored differently. (Robert Muir) query would be scored differently. (Robert Muir)
* Don't allow negatives in the positions file. If you have an index
from 2.4.0 or earlier with such negative positions, and you already
upgraded to 3.x, then to Lucene 4.0-ALPHA or -BETA, you should run
CheckIndex. If it fails, then you need to upgrade again to 4.0 (Robert Muir)
======================= Lucene 4.0.0-BETA ======================= ======================= Lucene 4.0.0-BETA =======================
New features New features

View File

@ -822,11 +822,8 @@ public class CheckIndex {
if (hasPositions) { if (hasPositions) {
for(int j=0;j<freq;j++) { for(int j=0;j<freq;j++) {
final int pos = postings.nextPosition(); final int pos = postings.nextPosition();
// NOTE: pos=-1 is allowed because of ancient bug
// (LUCENE-1542) whereby IndexWriter could
// write pos=-1 when first token's posInc is 0
if (pos < -1) { if (pos < 0) {
throw new RuntimeException("term " + term + ": doc " + doc + ": pos " + pos + " is out of bounds"); throw new RuntimeException("term " + term + ": doc " + doc + ": pos " + pos + " is out of bounds");
} }
if (pos < lastPos) { if (pos < lastPos) {
@ -919,14 +916,8 @@ public class CheckIndex {
int lastOffset = 0; int lastOffset = 0;
for(int posUpto=0;posUpto<freq;posUpto++) { for(int posUpto=0;posUpto<freq;posUpto++) {
final int pos = postings.nextPosition(); final int pos = postings.nextPosition();
// NOTE: pos=-1 is allowed because of ancient bug
// (LUCENE-1542) whereby IndexWriter could if (pos < 0) {
// write pos=-1 when first token's posInc is 0
// (separately: analyzers should not give
// posInc=0 to first token); also, term
// vectors are allowed to return pos=-1 if
// they indexed offset but not positions:
if (pos < -1) {
throw new RuntimeException("position " + pos + " is out of bounds"); throw new RuntimeException("position " + pos + " is out of bounds");
} }
if (pos < lastPosition) { if (pos < lastPosition) {
@ -1498,7 +1489,7 @@ public class CheckIndex {
int pos = postings.nextPosition(); int pos = postings.nextPosition();
if (postingsPostings != null) { if (postingsPostings != null) {
int postingsPos = postingsPostings.nextPosition(); int postingsPos = postingsPostings.nextPosition();
if (pos != -1 && postingsPos != -1 && pos != postingsPos) { if (terms.hasPositions() && pos != postingsPos) {
throw new RuntimeException("vector term=" + term + " field=" + field + " doc=" + j + ": pos=" + pos + " differs from postings pos=" + postingsPos); throw new RuntimeException("vector term=" + term + " field=" + field + " doc=" + j + ": pos=" + pos + " differs from postings pos=" + postingsPos);
} }
} }