mirror of
https://github.com/apache/lucene.git
synced 2025-02-08 02:58:58 +00:00
Use HTMLStripCharFilter instead of deprecated HTMLStripReader
git-svn-id: https://svn.apache.org/repos/asf/lucene/solr/trunk@819638 13f79535-47bb-0310-9956-ffa450edef68
This commit is contained in:
parent
36a99b82fc
commit
fae44c8c06
@ -16,10 +16,12 @@
|
|||||||
*/
|
*/
|
||||||
package org.apache.solr.handler.dataimport;
|
package org.apache.solr.handler.dataimport;
|
||||||
|
|
||||||
import org.apache.solr.analysis.HTMLStripReader;
|
import org.apache.solr.analysis.HTMLStripCharFilter;
|
||||||
|
import org.apache.lucene.analysis.CharReader;
|
||||||
|
|
||||||
import java.io.IOException;
|
import java.io.IOException;
|
||||||
import java.io.StringReader;
|
import java.io.StringReader;
|
||||||
|
import java.io.BufferedReader;
|
||||||
import java.util.ArrayList;
|
import java.util.ArrayList;
|
||||||
import java.util.List;
|
import java.util.List;
|
||||||
import java.util.Map;
|
import java.util.Map;
|
||||||
@ -29,7 +31,7 @@ import java.util.Map;
|
|||||||
* in case you don't need this HTML anyway.
|
* in case you don't need this HTML anyway.
|
||||||
*
|
*
|
||||||
* @version $Id$
|
* @version $Id$
|
||||||
* @see org.apache.solr.analysis.HTMLStripReader
|
* @see org.apache.solr.analysis.HTMLStripCharFilter
|
||||||
* @since solr 1.4
|
* @since solr 1.4
|
||||||
*/
|
*/
|
||||||
public class HTMLStripTransformer extends Transformer {
|
public class HTMLStripTransformer extends Transformer {
|
||||||
@ -73,7 +75,7 @@ public class HTMLStripTransformer extends Transformer {
|
|||||||
StringBuilder out = new StringBuilder();
|
StringBuilder out = new StringBuilder();
|
||||||
StringReader strReader = new StringReader(value);
|
StringReader strReader = new StringReader(value);
|
||||||
try {
|
try {
|
||||||
HTMLStripReader html = new HTMLStripReader(strReader);
|
HTMLStripCharFilter html = new HTMLStripCharFilter(CharReader.get(strReader.markSupported() ? strReader : new BufferedReader(strReader)));
|
||||||
char[] cbuf = new char[1024 * 10];
|
char[] cbuf = new char[1024 * 10];
|
||||||
while (true) {
|
while (true) {
|
||||||
int count = html.read(cbuf);
|
int count = html.read(cbuf);
|
||||||
|
Loading…
x
Reference in New Issue
Block a user