LUCENE-2728: fix id handling in EnwikiContentSource

git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1028386 13f79535-47bb-0310-9956-ffa450edef68
This commit is contained in:
Grant Ingersoll 2010-10-28 17:04:26 +00:00
parent e5aa5c8e89
commit dd42b928c7
1 changed file with 4 additions and 1 deletion

View File

@@ -152,7 +152,10 @@ public class EnwikiContentSource extends ContentSource {
title = contents.toString();
break;
case ID:
id = contents.toString();
//the doc id is the first one in the page. All other ids after that one can be ignored according to the schema
if (id == null) {
id = contents.toString();
}
break;
default:
// this element should be discarded.