improve compressed string construction, allow to construct it from utf8 bytes and use it where applicable

This commit is contained in:
Shay Banon 2012-01-30 21:23:15 +02:00
parent 639a03fbe0
commit 9194d36a64
4 changed files with 27 additions and 3 deletions

View File

@ -168,7 +168,8 @@ public class AliasMetaData {
return this; return this;
} }
try { try {
this.filter = new CompressedString(XContentFactory.jsonBuilder().map(filter).string()); XContentBuilder builder = XContentFactory.jsonBuilder().map(filter);
this.filter = new CompressedString(builder.underlyingBytes(), 0, builder.underlyingBytesLength());
return this; return this;
} catch (IOException e) { } catch (IOException e) {
throw new ElasticSearchGenerationException("Failed to build json for alias request", e); throw new ElasticSearchGenerationException("Failed to build json for alias request", e);

View File

@ -28,6 +28,7 @@ import org.elasticsearch.common.io.stream.StreamInput;
import org.elasticsearch.common.io.stream.StreamOutput; import org.elasticsearch.common.io.stream.StreamOutput;
import org.elasticsearch.common.joda.FormatDateTimeFormatter; import org.elasticsearch.common.joda.FormatDateTimeFormatter;
import org.elasticsearch.common.joda.Joda; import org.elasticsearch.common.joda.Joda;
import org.elasticsearch.common.xcontent.XContentBuilder;
import org.elasticsearch.common.xcontent.XContentFactory; import org.elasticsearch.common.xcontent.XContentFactory;
import org.elasticsearch.common.xcontent.XContentHelper; import org.elasticsearch.common.xcontent.XContentHelper;
import org.elasticsearch.common.xcontent.XContentParser; import org.elasticsearch.common.xcontent.XContentParser;
@ -279,7 +280,8 @@ public class MappingMetaData {
public MappingMetaData(String type, Map<String, Object> mapping) throws IOException { public MappingMetaData(String type, Map<String, Object> mapping) throws IOException {
this.type = type; this.type = type;
this.source = new CompressedString(XContentFactory.jsonBuilder().map(mapping).string()); XContentBuilder mappingBuilder = XContentFactory.jsonBuilder().map(mapping);
this.source = new CompressedString(mappingBuilder.underlyingBytes(), 0, mappingBuilder.underlyingBytesLength());
Map<String, Object> withoutType = mapping; Map<String, Object> withoutType = mapping;
if (mapping.size() == 1 && mapping.containsKey(type)) { if (mapping.size() == 1 && mapping.containsKey(type)) {
withoutType = (Map<String, Object>) mapping.get(type); withoutType = (Map<String, Object>) mapping.get(type);

View File

@ -21,6 +21,7 @@ package org.elasticsearch.common.compress;
import org.apache.lucene.util.UnicodeUtil; import org.apache.lucene.util.UnicodeUtil;
import org.elasticsearch.common.Unicode; import org.elasticsearch.common.Unicode;
import org.elasticsearch.common.compress.lzf.LZF;
import org.elasticsearch.common.compress.lzf.LZFDecoder; import org.elasticsearch.common.compress.lzf.LZFDecoder;
import org.elasticsearch.common.compress.lzf.LZFEncoder; import org.elasticsearch.common.compress.lzf.LZFEncoder;
import org.elasticsearch.common.io.stream.StreamInput; import org.elasticsearch.common.io.stream.StreamInput;
@ -40,10 +41,30 @@ public class CompressedString implements Streamable {
CompressedString() { CompressedString() {
} }
/**
* Constructor assuming the data provided is compressed (UTF8). It uses the provided
* array without copying it.
*/
public CompressedString(byte[] compressed) { public CompressedString(byte[] compressed) {
this.bytes = compressed; this.bytes = compressed;
} }
/**
* Constructs a new compressed string, assuming the bytes are UTF8, by copying it over.
*
* @param data The byte array
* @param offset Offset into the byte array
* @param length The length of the data
* @throws IOException
*/
public CompressedString(byte[] data, int offset, int length) throws IOException {
if (LZF.isCompressed(data, offset, length)) {
this.bytes = Arrays.copyOfRange(data, offset, offset + length);
} else {
this.bytes = LZFEncoder.encode(data, offset, length);
}
}
public CompressedString(String str) throws IOException { public CompressedString(String str) throws IOException {
UnicodeUtil.UTF8Result result = Unicode.unsafeFromStringAsUtf8(str); UnicodeUtil.UTF8Result result = Unicode.unsafeFromStringAsUtf8(str);
this.bytes = LZFEncoder.encode(result.result, result.length); this.bytes = LZFEncoder.encode(result.result, result.length);

View File

@ -573,7 +573,7 @@ public class DocumentMapper implements ToXContent {
builder.startObject(); builder.startObject();
toXContent(builder, ToXContent.EMPTY_PARAMS); toXContent(builder, ToXContent.EMPTY_PARAMS);
builder.endObject(); builder.endObject();
this.mappingSource = new CompressedString(builder.string()); this.mappingSource = new CompressedString(builder.underlyingBytes(), 0, builder.underlyingBytesLength());
} catch (Exception e) { } catch (Exception e) {
throw new FailedToGenerateSourceMapperException(e.getMessage(), e); throw new FailedToGenerateSourceMapperException(e.getMessage(), e);
} }