mirror of https://github.com/apache/lucene.git
- This is not a unit test class, so it should not be here.
git-svn-id: https://svn.apache.org/repos/asf/lucene/java/trunk@149883 13f79535-47bb-0310-9956-ffa450edef68
This commit is contained in:
parent
748fdb1b96
commit
d0a577e1bd
|
@ -1,113 +0,0 @@
|
|||
package org.apache.lucene;
|
||||
|
||||
/* ====================================================================
|
||||
* The Apache Software License, Version 1.1
|
||||
*
|
||||
* Copyright (c) 2001 The Apache Software Foundation. All rights
|
||||
* reserved.
|
||||
*
|
||||
* Redistribution and use in source and binary forms, with or without
|
||||
* modification, are permitted provided that the following conditions
|
||||
* are met:
|
||||
*
|
||||
* 1. Redistributions of source code must retain the above copyright
|
||||
* notice, this list of conditions and the following disclaimer.
|
||||
*
|
||||
* 2. Redistributions in binary form must reproduce the above copyright
|
||||
* notice, this list of conditions and the following disclaimer in
|
||||
* the documentation and/or other materials provided with the
|
||||
* distribution.
|
||||
*
|
||||
* 3. The end-user documentation included with the redistribution,
|
||||
* if any, must include the following acknowledgment:
|
||||
* "This product includes software developed by the
|
||||
* Apache Software Foundation (http://www.apache.org/)."
|
||||
* Alternately, this acknowledgment may appear in the software itself,
|
||||
* if and wherever such third-party acknowledgments normally appear.
|
||||
*
|
||||
* 4. The names "Apache" and "Apache Software Foundation" and
|
||||
* "Apache Lucene" must not be used to endorse or promote products
|
||||
* derived from this software without prior written permission. For
|
||||
* written permission, please contact apache@apache.org.
|
||||
*
|
||||
* 5. Products derived from this software may not be called "Apache",
|
||||
* "Apache Lucene", nor may "Apache" appear in their name, without
|
||||
* prior written permission of the Apache Software Foundation.
|
||||
*
|
||||
* THIS SOFTWARE IS PROVIDED ``AS IS'' AND ANY EXPRESSED OR IMPLIED
|
||||
* WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
|
||||
* OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE
|
||||
* DISCLAIMED. IN NO EVENT SHALL THE APACHE SOFTWARE FOUNDATION OR
|
||||
* ITS CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
|
||||
* SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
|
||||
* LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF
|
||||
* USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND
|
||||
* ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,
|
||||
* OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT
|
||||
* OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF
|
||||
* SUCH DAMAGE.
|
||||
* ====================================================================
|
||||
*
|
||||
* This software consists of voluntary contributions made by many
|
||||
* individuals on behalf of the Apache Software Foundation. For more
|
||||
* information on the Apache Software Foundation, please see
|
||||
* <http://www.apache.org/>.
|
||||
*/
|
||||
|
||||
import org.apache.lucene.util.PriorityQueue;
|
||||
import org.apache.lucene.store.Directory;
|
||||
import org.apache.lucene.store.FSDirectory;
|
||||
import org.apache.lucene.index.IndexReader;
|
||||
import org.apache.lucene.index.Term;
|
||||
import org.apache.lucene.index.TermEnum;
|
||||
|
||||
class HighFreqTerms {
|
||||
public static int numTerms = 100;
|
||||
|
||||
public static void main(String[] args) throws Exception {
|
||||
IndexReader reader = IndexReader.open("index");
|
||||
|
||||
TermInfoQueue tiq = new TermInfoQueue(numTerms);
|
||||
TermEnum terms = reader.terms();
|
||||
|
||||
int minFreq = 0;
|
||||
while (terms.next()) {
|
||||
if (terms.docFreq() > minFreq) {
|
||||
tiq.put(new TermInfo(terms.term(), terms.docFreq()));
|
||||
if (tiq.size() > numTerms) { // if tiq overfull
|
||||
tiq.pop(); // remove lowest in tiq
|
||||
minFreq = ((TermInfo)tiq.top()).docFreq; // reset minFreq
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
while (tiq.size() != 0) {
|
||||
TermInfo termInfo = (TermInfo)tiq.pop();
|
||||
System.out.println(termInfo.term + " " + termInfo.docFreq);
|
||||
}
|
||||
|
||||
reader.close();
|
||||
|
||||
}
|
||||
}
|
||||
|
||||
final class TermInfo {
|
||||
TermInfo(Term t, int df) {
|
||||
term = t;
|
||||
docFreq = df;
|
||||
}
|
||||
int docFreq;
|
||||
Term term;
|
||||
}
|
||||
|
||||
final class TermInfoQueue extends PriorityQueue {
|
||||
TermInfoQueue(int size) {
|
||||
initialize(size);
|
||||
}
|
||||
protected final boolean lessThan(Object a, Object b) {
|
||||
TermInfo termInfoA = (TermInfo)a;
|
||||
TermInfo termInfoB = (TermInfo)b;
|
||||
return termInfoA.docFreq < termInfoB.docFreq;
|
||||
}
|
||||
}
|
||||
|
Loading…
Reference in New Issue