mirror of https://github.com/apache/lucene.git
LUCENE-7239: Use interval tree to speed up LatLonPoint.newPolygonQuery
This commit is contained in:
parent
f3de223774
commit
4fd5d88080
|
@ -48,9 +48,6 @@ Optimizations
|
||||||
* LUCENE-7105, LUCENE-7215: Optimize LatLonPoint's newDistanceQuery.
|
* LUCENE-7105, LUCENE-7215: Optimize LatLonPoint's newDistanceQuery.
|
||||||
(Robert Muir)
|
(Robert Muir)
|
||||||
|
|
||||||
* LUCENE-7109: LatLonPoint's newPolygonQuery supports two-phase
|
|
||||||
iteration. (Robert Muir)
|
|
||||||
|
|
||||||
* LUCENE-7097: IntroSorter now recurses to 2 * log_2(count) quicksort
|
* LUCENE-7097: IntroSorter now recurses to 2 * log_2(count) quicksort
|
||||||
stack depth before switching to heapsort (Adrien Grand, Mike McCandless)
|
stack depth before switching to heapsort (Adrien Grand, Mike McCandless)
|
||||||
|
|
||||||
|
@ -64,8 +61,8 @@ Optimizations
|
||||||
multiple polygons and holes, with memory usage independent of
|
multiple polygons and holes, with memory usage independent of
|
||||||
polygon complexity. (Karl Wright, Mike McCandless, Robert Muir)
|
polygon complexity. (Karl Wright, Mike McCandless, Robert Muir)
|
||||||
|
|
||||||
* LUCENE-7159, LUCENE-7222, LUCENE-7229: Speed up LatLonPoint polygon performance for complex
|
* LUCENE-7159, LUCENE-7222, LUCENE-7229, LUCENE-7239: Speed up LatLonPoint
|
||||||
polygons. (Robert Muir)
|
polygon performance. (Robert Muir)
|
||||||
|
|
||||||
* LUCENE-7211: Reduce memory & GC for spatial RPT Intersects when the number of
|
* LUCENE-7211: Reduce memory & GC for spatial RPT Intersects when the number of
|
||||||
matching docs is small. (Jeff Wartes, David Smiley)
|
matching docs is small. (Jeff Wartes, David Smiley)
|
||||||
|
|
|
@ -60,14 +60,14 @@ final class LatLonGrid {
|
||||||
final long latPerCell;
|
final long latPerCell;
|
||||||
final long lonPerCell;
|
final long lonPerCell;
|
||||||
|
|
||||||
final Polygon[] polygons;
|
final LatLonTree[] tree;
|
||||||
|
|
||||||
LatLonGrid(int minLat, int maxLat, int minLon, int maxLon, Polygon... polygons) {
|
LatLonGrid(int minLat, int maxLat, int minLon, int maxLon, Polygon... polygons) {
|
||||||
this.minLat = minLat;
|
this.minLat = minLat;
|
||||||
this.maxLat = maxLat;
|
this.maxLat = maxLat;
|
||||||
this.minLon = minLon;
|
this.minLon = minLon;
|
||||||
this.maxLon = maxLon;
|
this.maxLon = maxLon;
|
||||||
this.polygons = polygons;
|
this.tree = LatLonTree.build(polygons);
|
||||||
if (minLon > maxLon) {
|
if (minLon > maxLon) {
|
||||||
// maybe make 2 grids if you want this?
|
// maybe make 2 grids if you want this?
|
||||||
throw new IllegalArgumentException("Grid cannot cross the dateline");
|
throw new IllegalArgumentException("Grid cannot cross the dateline");
|
||||||
|
@ -88,12 +88,12 @@ final class LatLonGrid {
|
||||||
// but it prevents edge case bugs.
|
// but it prevents edge case bugs.
|
||||||
latPerCell = latitudeRange / (GRID_SIZE - 1);
|
latPerCell = latitudeRange / (GRID_SIZE - 1);
|
||||||
lonPerCell = longitudeRange / (GRID_SIZE - 1);
|
lonPerCell = longitudeRange / (GRID_SIZE - 1);
|
||||||
fill(polygons, 0, GRID_SIZE, 0, GRID_SIZE);
|
fill(0, GRID_SIZE, 0, GRID_SIZE);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
/** fills a 2D range of grid cells [minLatIndex .. maxLatIndex) X [minLonIndex .. maxLonIndex) */
|
/** fills a 2D range of grid cells [minLatIndex .. maxLatIndex) X [minLonIndex .. maxLonIndex) */
|
||||||
void fill(Polygon[] polygons, int minLatIndex, int maxLatIndex, int minLonIndex, int maxLonIndex) {
|
void fill(int minLatIndex, int maxLatIndex, int minLonIndex, int maxLonIndex) {
|
||||||
// grid cells at the edge of the bounding box are typically smaller than normal, because we spill over.
|
// grid cells at the edge of the bounding box are typically smaller than normal, because we spill over.
|
||||||
long cellMinLat = minLat + (minLatIndex * latPerCell);
|
long cellMinLat = minLat + (minLatIndex * latPerCell);
|
||||||
long cellMaxLat = Math.min(maxLat, minLat + (maxLatIndex * latPerCell) - 1);
|
long cellMaxLat = Math.min(maxLat, minLat + (maxLatIndex * latPerCell) - 1);
|
||||||
|
@ -104,10 +104,10 @@ final class LatLonGrid {
|
||||||
assert cellMaxLat >= cellMinLat;
|
assert cellMaxLat >= cellMinLat;
|
||||||
assert cellMaxLon >= cellMinLon;
|
assert cellMaxLon >= cellMinLon;
|
||||||
|
|
||||||
Relation relation = Polygon.relate(polygons, decodeLatitude((int) cellMinLat),
|
Relation relation = LatLonTree.relate(tree, decodeLatitude((int) cellMinLat),
|
||||||
decodeLatitude((int) cellMaxLat),
|
decodeLatitude((int) cellMaxLat),
|
||||||
decodeLongitude((int) cellMinLon),
|
decodeLongitude((int) cellMinLon),
|
||||||
decodeLongitude((int) cellMaxLon));
|
decodeLongitude((int) cellMaxLon));
|
||||||
if (relation != Relation.CELL_CROSSES_QUERY) {
|
if (relation != Relation.CELL_CROSSES_QUERY) {
|
||||||
// we know the answer for this region, fill the cell range
|
// we know the answer for this region, fill the cell range
|
||||||
for (int i = minLatIndex; i < maxLatIndex; i++) {
|
for (int i = minLatIndex; i < maxLatIndex; i++) {
|
||||||
|
@ -127,10 +127,10 @@ final class LatLonGrid {
|
||||||
// grid range crosses our polygon, keep recursing.
|
// grid range crosses our polygon, keep recursing.
|
||||||
int midLatIndex = (minLatIndex + maxLatIndex) >>> 1;
|
int midLatIndex = (minLatIndex + maxLatIndex) >>> 1;
|
||||||
int midLonIndex = (minLonIndex + maxLonIndex) >>> 1;
|
int midLonIndex = (minLonIndex + maxLonIndex) >>> 1;
|
||||||
fill(polygons, minLatIndex, midLatIndex, minLonIndex, midLonIndex);
|
fill(minLatIndex, midLatIndex, minLonIndex, midLonIndex);
|
||||||
fill(polygons, minLatIndex, midLatIndex, midLonIndex, maxLonIndex);
|
fill(minLatIndex, midLatIndex, midLonIndex, maxLonIndex);
|
||||||
fill(polygons, midLatIndex, maxLatIndex, minLonIndex, midLonIndex);
|
fill(midLatIndex, maxLatIndex, minLonIndex, midLonIndex);
|
||||||
fill(polygons, midLatIndex, maxLatIndex, midLonIndex, maxLonIndex);
|
fill(midLatIndex, maxLatIndex, midLonIndex, maxLonIndex);
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
@ -147,7 +147,7 @@ final class LatLonGrid {
|
||||||
// the grid is unsure (boundary): do a real test.
|
// the grid is unsure (boundary): do a real test.
|
||||||
double docLatitude = decodeLatitude(latitude);
|
double docLatitude = decodeLatitude(latitude);
|
||||||
double docLongitude = decodeLongitude(longitude);
|
double docLongitude = decodeLongitude(longitude);
|
||||||
return Polygon.contains(polygons, docLatitude, docLongitude);
|
return LatLonTree.contains(tree, docLatitude, docLongitude);
|
||||||
}
|
}
|
||||||
|
|
||||||
/** Returns grid index of lat/lon, or -1 if the value is outside of the bounding box. */
|
/** Returns grid index of lat/lon, or -1 if the value is outside of the bounding box. */
|
||||||
|
|
|
@ -29,19 +29,13 @@ import org.apache.lucene.search.DocIdSetIterator;
|
||||||
import org.apache.lucene.search.IndexSearcher;
|
import org.apache.lucene.search.IndexSearcher;
|
||||||
import org.apache.lucene.search.Query;
|
import org.apache.lucene.search.Query;
|
||||||
import org.apache.lucene.search.Scorer;
|
import org.apache.lucene.search.Scorer;
|
||||||
import org.apache.lucene.search.TwoPhaseIterator;
|
|
||||||
import org.apache.lucene.search.Weight;
|
import org.apache.lucene.search.Weight;
|
||||||
import org.apache.lucene.index.PointValues;
|
import org.apache.lucene.index.PointValues;
|
||||||
import org.apache.lucene.index.SortedNumericDocValues;
|
|
||||||
import org.apache.lucene.index.DocValues;
|
|
||||||
import org.apache.lucene.index.FieldInfo;
|
import org.apache.lucene.index.FieldInfo;
|
||||||
import org.apache.lucene.index.LeafReader;
|
import org.apache.lucene.index.LeafReader;
|
||||||
import org.apache.lucene.index.LeafReaderContext;
|
import org.apache.lucene.index.LeafReaderContext;
|
||||||
import org.apache.lucene.util.BitSet;
|
|
||||||
import org.apache.lucene.util.DocIdSetBuilder;
|
import org.apache.lucene.util.DocIdSetBuilder;
|
||||||
import org.apache.lucene.util.FixedBitSet;
|
|
||||||
import org.apache.lucene.util.NumericUtils;
|
import org.apache.lucene.util.NumericUtils;
|
||||||
import org.apache.lucene.util.SparseFixedBitSet;
|
|
||||||
import org.apache.lucene.util.StringHelper;
|
import org.apache.lucene.util.StringHelper;
|
||||||
import org.apache.lucene.geo.Polygon;
|
import org.apache.lucene.geo.Polygon;
|
||||||
|
|
||||||
|
@ -98,13 +92,6 @@ final class LatLonPointInPolygonQuery extends Query {
|
||||||
NumericUtils.intToSortableBytes(encodeLongitude(box.minLon), minLon, 0);
|
NumericUtils.intToSortableBytes(encodeLongitude(box.minLon), minLon, 0);
|
||||||
NumericUtils.intToSortableBytes(encodeLongitude(box.maxLon), maxLon, 0);
|
NumericUtils.intToSortableBytes(encodeLongitude(box.maxLon), maxLon, 0);
|
||||||
|
|
||||||
// TODO: make this fancier, but currently linear with number of vertices
|
|
||||||
float cumulativeCost = 0;
|
|
||||||
for (Polygon polygon : polygons) {
|
|
||||||
cumulativeCost += 20 * (polygon.getPolyLats().length + polygon.getHoles().length);
|
|
||||||
}
|
|
||||||
final float matchCost = cumulativeCost;
|
|
||||||
|
|
||||||
final LatLonGrid grid = new LatLonGrid(encodeLatitude(box.minLat),
|
final LatLonGrid grid = new LatLonGrid(encodeLatitude(box.minLat),
|
||||||
encodeLatitude(box.maxLat),
|
encodeLatitude(box.maxLat),
|
||||||
encodeLongitude(box.minLon),
|
encodeLongitude(box.minLon),
|
||||||
|
@ -127,22 +114,14 @@ final class LatLonPointInPolygonQuery extends Query {
|
||||||
}
|
}
|
||||||
LatLonPoint.checkCompatible(fieldInfo);
|
LatLonPoint.checkCompatible(fieldInfo);
|
||||||
|
|
||||||
// approximation (postfiltering has not yet been applied)
|
// matching docids
|
||||||
DocIdSetBuilder result = new DocIdSetBuilder(reader.maxDoc());
|
DocIdSetBuilder result = new DocIdSetBuilder(reader.maxDoc());
|
||||||
// subset of documents that need no postfiltering, this is purely an optimization
|
|
||||||
final BitSet preApproved;
|
|
||||||
// dumb heuristic: if the field is really sparse, use a sparse impl
|
|
||||||
if (values.getDocCount(field) * 100L < reader.maxDoc()) {
|
|
||||||
preApproved = new SparseFixedBitSet(reader.maxDoc());
|
|
||||||
} else {
|
|
||||||
preApproved = new FixedBitSet(reader.maxDoc());
|
|
||||||
}
|
|
||||||
values.intersect(field,
|
values.intersect(field,
|
||||||
new IntersectVisitor() {
|
new IntersectVisitor() {
|
||||||
@Override
|
@Override
|
||||||
public void visit(int docID) {
|
public void visit(int docID) {
|
||||||
result.add(docID);
|
result.add(docID);
|
||||||
preApproved.set(docID);
|
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
|
@ -156,7 +135,10 @@ final class LatLonPointInPolygonQuery extends Query {
|
||||||
// outside of global bounding box range
|
// outside of global bounding box range
|
||||||
return;
|
return;
|
||||||
}
|
}
|
||||||
result.add(docID);
|
if (grid.contains(NumericUtils.sortableBytesToInt(packedValue, 0),
|
||||||
|
NumericUtils.sortableBytesToInt(packedValue, Integer.BYTES))) {
|
||||||
|
result.add(docID);
|
||||||
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
@Override
|
@Override
|
||||||
|
@ -184,36 +166,7 @@ final class LatLonPointInPolygonQuery extends Query {
|
||||||
return null;
|
return null;
|
||||||
}
|
}
|
||||||
|
|
||||||
// return two-phase iterator using docvalues to postfilter candidates
|
return new ConstantScoreScorer(this, score(), disi);
|
||||||
SortedNumericDocValues docValues = DocValues.getSortedNumeric(reader, field);
|
|
||||||
|
|
||||||
TwoPhaseIterator iterator = new TwoPhaseIterator(disi) {
|
|
||||||
@Override
|
|
||||||
public boolean matches() throws IOException {
|
|
||||||
int docId = disi.docID();
|
|
||||||
if (preApproved.get(docId)) {
|
|
||||||
return true;
|
|
||||||
} else {
|
|
||||||
docValues.setDocument(docId);
|
|
||||||
int count = docValues.count();
|
|
||||||
for (int i = 0; i < count; i++) {
|
|
||||||
long encoded = docValues.valueAt(i);
|
|
||||||
int latitudeBits = (int)(encoded >> 32);
|
|
||||||
int longitudeBits = (int)(encoded & 0xFFFFFFFF);
|
|
||||||
if (grid.contains(latitudeBits, longitudeBits)) {
|
|
||||||
return true;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
return false;
|
|
||||||
}
|
|
||||||
}
|
|
||||||
|
|
||||||
@Override
|
|
||||||
public float matchCost() {
|
|
||||||
return matchCost;
|
|
||||||
}
|
|
||||||
};
|
|
||||||
return new ConstantScoreScorer(this, score(), iterator);
|
|
||||||
}
|
}
|
||||||
};
|
};
|
||||||
}
|
}
|
||||||
|
|
|
@ -0,0 +1,401 @@
|
||||||
|
/*
|
||||||
|
* Licensed to the Apache Software Foundation (ASF) under one or more
|
||||||
|
* contributor license agreements. See the NOTICE file distributed with
|
||||||
|
* this work for additional information regarding copyright ownership.
|
||||||
|
* The ASF licenses this file to You under the Apache License, Version 2.0
|
||||||
|
* (the "License"); you may not use this file except in compliance with
|
||||||
|
* the License. You may obtain a copy of the License at
|
||||||
|
*
|
||||||
|
* http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
*
|
||||||
|
* Unless required by applicable law or agreed to in writing, software
|
||||||
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
* See the License for the specific language governing permissions and
|
||||||
|
* limitations under the License.
|
||||||
|
*/
|
||||||
|
package org.apache.lucene.document;
|
||||||
|
|
||||||
|
import java.util.ArrayList;
|
||||||
|
import java.util.Arrays;
|
||||||
|
import java.util.Collections;
|
||||||
|
import java.util.List;
|
||||||
|
import java.util.Random;
|
||||||
|
|
||||||
|
import org.apache.lucene.geo.Polygon;
|
||||||
|
import org.apache.lucene.index.PointValues.Relation;
|
||||||
|
|
||||||
|
/**
|
||||||
|
* 2D polygon implementation represented as a randomized interval tree of edges.
|
||||||
|
* <p>
|
||||||
|
* contains() and crosses() are still O(n), but for most practical polygons
|
||||||
|
* are much faster than brute force.
|
||||||
|
* <p>
|
||||||
|
* Loosely based on the algorithm described in <a href="http://www-ma2.upc.es/geoc/Schirra-pointPolygon.pdf">
|
||||||
|
* http://www-ma2.upc.es/geoc/Schirra-pointPolygon.pdf</a>.
|
||||||
|
*/
|
||||||
|
// Both Polygon.contains() and Polygon.crossesSlowly() loop all edges, and first check that the edge is within a range.
|
||||||
|
// we just organize the edges to do the same computations on the same subset of edges more efficiently.
|
||||||
|
// TODO: clean this up, call it Polygon2D, and remove all the 2D methods from Polygon?
|
||||||
|
final class LatLonTree {
|
||||||
|
private final LatLonTree[] holes;
|
||||||
|
|
||||||
|
/** minimum latitude of this polygon's bounding box area */
|
||||||
|
final double minLat;
|
||||||
|
/** maximum latitude of this polygon's bounding box area */
|
||||||
|
final double maxLat;
|
||||||
|
/** minimum longitude of this polygon's bounding box area */
|
||||||
|
final double minLon;
|
||||||
|
/** maximum longitude of this polygon's bounding box area */
|
||||||
|
final double maxLon;
|
||||||
|
|
||||||
|
/** root node of our tree */
|
||||||
|
final Edge tree;
|
||||||
|
|
||||||
|
// TODO: "pack" all the gons and holes into one tree with separator.
|
||||||
|
// the algorithms support this, but we have to be careful.
|
||||||
|
LatLonTree(Polygon polygon, LatLonTree... holes) {
|
||||||
|
this.holes = holes.clone();
|
||||||
|
this.minLat = polygon.minLat;
|
||||||
|
this.maxLat = polygon.maxLat;
|
||||||
|
this.minLon = polygon.minLon;
|
||||||
|
this.maxLon = polygon.maxLon;
|
||||||
|
|
||||||
|
// create interval tree of edges
|
||||||
|
this.tree = createTree(polygon.getPolyLats(), polygon.getPolyLons());
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Returns true if the point is contained within this polygon.
|
||||||
|
* <p>
|
||||||
|
* See <a href="https://www.ecse.rpi.edu/~wrf/Research/Short_Notes/pnpoly.html">
|
||||||
|
* https://www.ecse.rpi.edu/~wrf/Research/Short_Notes/pnpoly.html</a> for more information.
|
||||||
|
*/
|
||||||
|
boolean contains(double latitude, double longitude) {
|
||||||
|
// check bounding box
|
||||||
|
if (latitude < minLat || latitude > maxLat || longitude < minLon || longitude > maxLon) {
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
|
||||||
|
if (tree.contains(latitude, longitude)) {
|
||||||
|
for (LatLonTree hole : holes) {
|
||||||
|
if (hole.contains(latitude, longitude)) {
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
|
||||||
|
/** Returns relation to the provided rectangle */
|
||||||
|
Relation relate(double minLat, double maxLat, double minLon, double maxLon) {
|
||||||
|
// if the bounding boxes are disjoint then the shape does not cross
|
||||||
|
if (maxLon < this.minLon || minLon > this.maxLon || maxLat < this.minLat || minLat > this.maxLat) {
|
||||||
|
return Relation.CELL_OUTSIDE_QUERY;
|
||||||
|
}
|
||||||
|
// if the rectangle fully encloses us, we cross.
|
||||||
|
if (minLat <= this.minLat && maxLat >= this.maxLat && minLon <= this.minLon && maxLon >= this.maxLon) {
|
||||||
|
return Relation.CELL_CROSSES_QUERY;
|
||||||
|
}
|
||||||
|
// check any holes
|
||||||
|
for (LatLonTree hole : holes) {
|
||||||
|
Relation holeRelation = hole.relate(minLat, maxLat, minLon, maxLon);
|
||||||
|
if (holeRelation == Relation.CELL_CROSSES_QUERY) {
|
||||||
|
return Relation.CELL_CROSSES_QUERY;
|
||||||
|
} else if (holeRelation == Relation.CELL_INSIDE_QUERY) {
|
||||||
|
return Relation.CELL_OUTSIDE_QUERY;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
// check each corner: if < 4 are present, its cheaper than crossesSlowly
|
||||||
|
int numCorners = numberOfCorners(minLat, maxLat, minLon, maxLon);
|
||||||
|
if (numCorners == 4) {
|
||||||
|
if (tree.crosses(minLat, maxLat, minLon, maxLon)) {
|
||||||
|
return Relation.CELL_CROSSES_QUERY;
|
||||||
|
}
|
||||||
|
return Relation.CELL_INSIDE_QUERY;
|
||||||
|
} else if (numCorners > 0) {
|
||||||
|
return Relation.CELL_CROSSES_QUERY;
|
||||||
|
}
|
||||||
|
|
||||||
|
// we cross
|
||||||
|
if (tree.crosses(minLat, maxLat, minLon, maxLon)) {
|
||||||
|
return Relation.CELL_CROSSES_QUERY;
|
||||||
|
}
|
||||||
|
|
||||||
|
return Relation.CELL_OUTSIDE_QUERY;
|
||||||
|
}
|
||||||
|
|
||||||
|
// returns 0, 4, or something in between
|
||||||
|
private int numberOfCorners(double minLat, double maxLat, double minLon, double maxLon) {
|
||||||
|
int containsCount = 0;
|
||||||
|
if (contains(minLat, minLon)) {
|
||||||
|
containsCount++;
|
||||||
|
}
|
||||||
|
if (contains(minLat, maxLon)) {
|
||||||
|
containsCount++;
|
||||||
|
}
|
||||||
|
if (containsCount == 1) {
|
||||||
|
return containsCount;
|
||||||
|
}
|
||||||
|
if (contains(maxLat, maxLon)) {
|
||||||
|
containsCount++;
|
||||||
|
}
|
||||||
|
if (containsCount == 2) {
|
||||||
|
return containsCount;
|
||||||
|
}
|
||||||
|
if (contains(maxLat, minLon)) {
|
||||||
|
containsCount++;
|
||||||
|
}
|
||||||
|
return containsCount;
|
||||||
|
}
|
||||||
|
|
||||||
|
/** Helper for multipolygon logic: returns true if any of the supplied polygons contain the point */
|
||||||
|
static boolean contains(LatLonTree[] polygons, double latitude, double longitude) {
|
||||||
|
for (LatLonTree polygon : polygons) {
|
||||||
|
if (polygon.contains(latitude, longitude)) {
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
|
||||||
|
/** Returns the multipolygon relation for the rectangle */
|
||||||
|
static Relation relate(LatLonTree[] polygons, double minLat, double maxLat, double minLon, double maxLon) {
|
||||||
|
for (LatLonTree polygon : polygons) {
|
||||||
|
Relation relation = polygon.relate(minLat, maxLat, minLon, maxLon);
|
||||||
|
if (relation != Relation.CELL_OUTSIDE_QUERY) {
|
||||||
|
// note: we optimize for non-overlapping multipolygons. so if we cross one,
|
||||||
|
// we won't keep iterating to try to find a contains.
|
||||||
|
return relation;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
return Relation.CELL_OUTSIDE_QUERY;
|
||||||
|
}
|
||||||
|
|
||||||
|
/** Builds a tree from multipolygon */
|
||||||
|
static LatLonTree[] build(Polygon... polygons) {
|
||||||
|
// TODO: use one tree with separators (carefully!)
|
||||||
|
LatLonTree trees[] = new LatLonTree[polygons.length];
|
||||||
|
for (int i = 0; i < trees.length; i++) {
|
||||||
|
Polygon gon = polygons[i];
|
||||||
|
Polygon gonHoles[] = gon.getHoles();
|
||||||
|
LatLonTree holes[] = new LatLonTree[gonHoles.length];
|
||||||
|
for (int j = 0; j < holes.length; j++) {
|
||||||
|
holes[j] = new LatLonTree(gonHoles[j]);
|
||||||
|
}
|
||||||
|
trees[i] = new LatLonTree(gon, holes);
|
||||||
|
}
|
||||||
|
return trees;
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Internal tree node: represents polygon edge from lat1,lon1 to lat2,lon2.
|
||||||
|
* The sort value is {@code low}, which is the minimum latitude of the edge.
|
||||||
|
* {@code max} stores the maximum latitude of this edge or any children.
|
||||||
|
*/
|
||||||
|
static final class Edge {
|
||||||
|
// lat-lon pair (in original order) of the two vertices
|
||||||
|
final double lat1, lat2;
|
||||||
|
final double lon1, lon2;
|
||||||
|
/** min of this edge */
|
||||||
|
final double low;
|
||||||
|
/** max latitude of this edge or any children */
|
||||||
|
double max;
|
||||||
|
|
||||||
|
/** left child edge, or null */
|
||||||
|
Edge left;
|
||||||
|
/** right child edge, or null */
|
||||||
|
Edge right;
|
||||||
|
|
||||||
|
Edge(double lat1, double lon1, double lat2, double lon2, double low, double max) {
|
||||||
|
this.lat1 = lat1;
|
||||||
|
this.lon1 = lon1;
|
||||||
|
this.lat2 = lat2;
|
||||||
|
this.lon2 = lon2;
|
||||||
|
this.low = low;
|
||||||
|
this.max = max;
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Returns true if the point crosses this edge subtree an odd number of times
|
||||||
|
* <p>
|
||||||
|
* See <a href="https://www.ecse.rpi.edu/~wrf/Research/Short_Notes/pnpoly.html">
|
||||||
|
* https://www.ecse.rpi.edu/~wrf/Research/Short_Notes/pnpoly.html</a> for more information.
|
||||||
|
*/
|
||||||
|
// ported to java from https://www.ecse.rpi.edu/~wrf/Research/Short_Notes/pnpoly.html
|
||||||
|
// original code under the BSD license (https://www.ecse.rpi.edu/~wrf/Research/Short_Notes/pnpoly.html#License%20to%20Use)
|
||||||
|
//
|
||||||
|
// Copyright (c) 1970-2003, Wm. Randolph Franklin
|
||||||
|
//
|
||||||
|
// Permission is hereby granted, free of charge, to any person obtaining a copy of this software and associated
|
||||||
|
// documentation files (the "Software"), to deal in the Software without restriction, including without limitation
|
||||||
|
// the rights to use, copy, modify, merge, publish, distribute, sublicense, and/or sell copies of the Software, and
|
||||||
|
// to permit persons to whom the Software is furnished to do so, subject to the following conditions:
|
||||||
|
//
|
||||||
|
// 1. Redistributions of source code must retain the above copyright
|
||||||
|
// notice, this list of conditions and the following disclaimers.
|
||||||
|
// 2. Redistributions in binary form must reproduce the above copyright
|
||||||
|
// notice in the documentation and/or other materials provided with
|
||||||
|
// the distribution.
|
||||||
|
// 3. The name of W. Randolph Franklin may not be used to endorse or
|
||||||
|
// promote products derived from this Software without specific
|
||||||
|
// prior written permission.
|
||||||
|
//
|
||||||
|
// THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED
|
||||||
|
// TO THE WARRANTIES OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
|
||||||
|
// THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF
|
||||||
|
// CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
|
||||||
|
// IN THE SOFTWARE.
|
||||||
|
boolean contains(double latitude, double longitude) {
|
||||||
|
// crossings algorithm is an odd-even algorithm, so we descend the tree xor'ing results along our path
|
||||||
|
boolean res = false;
|
||||||
|
if (latitude <= max) {
|
||||||
|
if (lat1 > latitude != lat2 > latitude) {
|
||||||
|
if (longitude < (lon1 - lon2) * (latitude - lat2) / (lat1 - lat2) + lon2) {
|
||||||
|
res = true;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
if (left != null) {
|
||||||
|
res ^= left.contains(latitude, longitude);
|
||||||
|
}
|
||||||
|
if (right != null && latitude >= low) {
|
||||||
|
res ^= right.contains(latitude, longitude);
|
||||||
|
}
|
||||||
|
}
|
||||||
|
return res;
|
||||||
|
}
|
||||||
|
|
||||||
|
/** Returns true if the box crosses any edge in this edge subtree */
|
||||||
|
boolean crosses(double minLat, double maxLat, double minLon, double maxLon) {
|
||||||
|
// we just have to cross one edge to answer the question, so we descend the tree and return when we do.
|
||||||
|
if (minLat <= max) {
|
||||||
|
// we compute line intersections of every polygon edge with every box line.
|
||||||
|
// if we find one, return true.
|
||||||
|
// for each box line (AB):
|
||||||
|
// for each poly line (CD):
|
||||||
|
// intersects = orient(C,D,A) * orient(C,D,B) <= 0 && orient(A,B,C) * orient(A,B,D) <= 0
|
||||||
|
double cy = lat1;
|
||||||
|
double dy = lat2;
|
||||||
|
double cx = lon1;
|
||||||
|
double dx = lon2;
|
||||||
|
|
||||||
|
// optimization: see if the rectangle is outside of the "bounding box" of the polyline at all
|
||||||
|
// if not, don't waste our time trying more complicated stuff
|
||||||
|
boolean outside = (cy < minLat && dy < minLat) ||
|
||||||
|
(cy > maxLat && dy > maxLat) ||
|
||||||
|
(cx < minLon && dx < minLon) ||
|
||||||
|
(cx > maxLon && dx > maxLon);
|
||||||
|
if (outside == false) {
|
||||||
|
// does box's top edge intersect polyline?
|
||||||
|
// ax = minLon, bx = maxLon, ay = maxLat, by = maxLat
|
||||||
|
if (orient(cx, cy, dx, dy, minLon, maxLat) * orient(cx, cy, dx, dy, maxLon, maxLat) <= 0 &&
|
||||||
|
orient(minLon, maxLat, maxLon, maxLat, cx, cy) * orient(minLon, maxLat, maxLon, maxLat, dx, dy) <= 0) {
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
|
||||||
|
// does box's right edge intersect polyline?
|
||||||
|
// ax = maxLon, bx = maxLon, ay = maxLat, by = minLat
|
||||||
|
if (orient(cx, cy, dx, dy, maxLon, maxLat) * orient(cx, cy, dx, dy, maxLon, minLat) <= 0 &&
|
||||||
|
orient(maxLon, maxLat, maxLon, minLat, cx, cy) * orient(maxLon, maxLat, maxLon, minLat, dx, dy) <= 0) {
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
|
||||||
|
// does box's bottom edge intersect polyline?
|
||||||
|
// ax = maxLon, bx = minLon, ay = minLat, by = minLat
|
||||||
|
if (orient(cx, cy, dx, dy, maxLon, minLat) * orient(cx, cy, dx, dy, minLon, minLat) <= 0 &&
|
||||||
|
orient(maxLon, minLat, minLon, minLat, cx, cy) * orient(maxLon, minLat, minLon, minLat, dx, dy) <= 0) {
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
|
||||||
|
// does box's left edge intersect polyline?
|
||||||
|
// ax = minLon, bx = minLon, ay = minLat, by = maxLat
|
||||||
|
if (orient(cx, cy, dx, dy, minLon, minLat) * orient(cx, cy, dx, dy, minLon, maxLat) <= 0 &&
|
||||||
|
orient(minLon, minLat, minLon, maxLat, cx, cy) * orient(minLon, minLat, minLon, maxLat, dx, dy) <= 0) {
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
if (left != null) {
|
||||||
|
if (left.crosses(minLat, maxLat, minLon, maxLon)) {
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
if (right != null && maxLat >= low) {
|
||||||
|
if (right.crosses(minLat, maxLat, minLon, maxLon)) {
|
||||||
|
return true;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
return false;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Creates an edge interval tree from a set of polygon vertices.
|
||||||
|
* @return root node of the tree.
|
||||||
|
*/
|
||||||
|
private static Edge createTree(double polyLats[], double polyLons[]) {
|
||||||
|
// edge order is deterministic and reproducible based on the double values.
|
||||||
|
// TODO: make a real balanced tree instead :)
|
||||||
|
List<Integer> list = new ArrayList<Integer>(polyLats.length - 1);
|
||||||
|
for (int i = 1; i < polyLats.length; i++) {
|
||||||
|
list.add(i);
|
||||||
|
}
|
||||||
|
Collections.shuffle(list, new Random(Arrays.hashCode(polyLats) ^ Arrays.hashCode(polyLons)));
|
||||||
|
Edge root = null;
|
||||||
|
for (int i : list) {
|
||||||
|
double lat1 = polyLats[i-1];
|
||||||
|
double lon1 = polyLons[i-1];
|
||||||
|
double lat2 = polyLats[i];
|
||||||
|
double lon2 = polyLons[i];
|
||||||
|
Edge newNode = new Edge(lat1, lon1, lat2, lon2, Math.min(lat1, lat2), Math.max(lat1, lat2));
|
||||||
|
if (root == null) {
|
||||||
|
// add first node
|
||||||
|
root = newNode;
|
||||||
|
} else {
|
||||||
|
// traverse tree to find home for new node, along the path updating all parent's max value along the way.
|
||||||
|
Edge node = root;
|
||||||
|
while (true) {
|
||||||
|
node.max = Math.max(node.max, newNode.max);
|
||||||
|
if (newNode.low < node.low) {
|
||||||
|
if (node.left == null) {
|
||||||
|
node.left = newNode;
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
node = node.left;
|
||||||
|
} else {
|
||||||
|
if (node.right == null) {
|
||||||
|
node.right = newNode;
|
||||||
|
break;
|
||||||
|
}
|
||||||
|
node = node.right;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
return root;
|
||||||
|
}
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Returns a positive value if points a, b, and c are arranged in counter-clockwise order,
|
||||||
|
* negative value if clockwise, zero if collinear.
|
||||||
|
*/
|
||||||
|
// see the "Orient2D" method described here:
|
||||||
|
// http://www.cs.berkeley.edu/~jrs/meshpapers/robnotes.pdf
|
||||||
|
// https://www.cs.cmu.edu/~quake/robust.html
|
||||||
|
// Note that this one does not yet have the floating point tricks to be exact!
|
||||||
|
private static int orient(double ax, double ay, double bx, double by, double cx, double cy) {
|
||||||
|
double v1 = (bx - ax) * (cy - ay);
|
||||||
|
double v2 = (cx - ax) * (by - ay);
|
||||||
|
if (v1 > v2) {
|
||||||
|
return 1;
|
||||||
|
} else if (v1 < v2) {
|
||||||
|
return -1;
|
||||||
|
} else {
|
||||||
|
return 0;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
|
@ -0,0 +1,53 @@
|
||||||
|
/*
|
||||||
|
* Licensed to the Apache Software Foundation (ASF) under one or more
|
||||||
|
* contributor license agreements. See the NOTICE file distributed with
|
||||||
|
* this work for additional information regarding copyright ownership.
|
||||||
|
* The ASF licenses this file to You under the Apache License, Version 2.0
|
||||||
|
* (the "License"); you may not use this file except in compliance with
|
||||||
|
* the License. You may obtain a copy of the License at
|
||||||
|
*
|
||||||
|
* http://www.apache.org/licenses/LICENSE-2.0
|
||||||
|
*
|
||||||
|
* Unless required by applicable law or agreed to in writing, software
|
||||||
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||||
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||||
|
* See the License for the specific language governing permissions and
|
||||||
|
* limitations under the License.
|
||||||
|
*/
|
||||||
|
package org.apache.lucene.document;
|
||||||
|
|
||||||
|
import org.apache.lucene.geo.GeoTestUtil;
|
||||||
|
import org.apache.lucene.geo.Polygon;
|
||||||
|
import org.apache.lucene.geo.Rectangle;
|
||||||
|
import org.apache.lucene.index.PointValues.Relation;
|
||||||
|
import org.apache.lucene.util.LuceneTestCase;
|
||||||
|
|
||||||
|
/** Test LatLonTree against the slower implementation for now */
|
||||||
|
public class TestLatLonTree extends LuceneTestCase {
|
||||||
|
|
||||||
|
/** test that contains() works the same as brute force */
|
||||||
|
public void testContainsRandom() {
|
||||||
|
for (int i = 0; i < 1000; i++) {
|
||||||
|
Polygon polygon = GeoTestUtil.nextPolygon();
|
||||||
|
LatLonTree tree = new LatLonTree(polygon);
|
||||||
|
for (int j = 0; j < 1000; j++) {
|
||||||
|
double point[] = GeoTestUtil.nextPointNear(polygon);
|
||||||
|
boolean expected = polygon.contains(point[0], point[1]);
|
||||||
|
assertEquals(expected, tree.contains(point[0], point[1]));
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
/** test that relate() works the same as brute force */
|
||||||
|
public void testRelateRandom() {
|
||||||
|
for (int i = 0; i < 1000; i++) {
|
||||||
|
Polygon polygon = GeoTestUtil.nextPolygon();
|
||||||
|
LatLonTree tree = new LatLonTree(polygon);
|
||||||
|
for (int j = 0; j < 1000; j++) {
|
||||||
|
Rectangle box = GeoTestUtil.nextBoxNear(polygon);
|
||||||
|
Relation expected = polygon.relate(box.minLat, box.maxLat, box.minLon, box.maxLon);
|
||||||
|
assertEquals(expected, tree.relate(box.minLat, box.maxLat, box.minLon, box.maxLon));
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
Loading…
Reference in New Issue