BenchmarkSpatialJoin.java
/*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.facebook.presto.plugin.memory.geospatial;
import com.facebook.presto.common.QualifiedObjectName;
import com.facebook.presto.metadata.Metadata;
import com.facebook.presto.plugin.memory.MemoryConnectorFactory;
import com.facebook.presto.spi.TableHandle;
import com.facebook.presto.testing.LocalQueryRunner;
import com.facebook.presto.testing.MaterializedResult;
import com.google.common.collect.ImmutableMap;
import org.openjdk.jmh.annotations.Benchmark;
import org.openjdk.jmh.annotations.BenchmarkMode;
import org.openjdk.jmh.annotations.Fork;
import org.openjdk.jmh.annotations.Level;
import org.openjdk.jmh.annotations.Measurement;
import org.openjdk.jmh.annotations.OutputTimeUnit;
import org.openjdk.jmh.annotations.Param;
import org.openjdk.jmh.annotations.Setup;
import org.openjdk.jmh.annotations.State;
import org.openjdk.jmh.annotations.TearDown;
import org.openjdk.jmh.annotations.Warmup;
import org.openjdk.jmh.runner.Runner;
import org.openjdk.jmh.runner.options.Options;
import org.openjdk.jmh.runner.options.OptionsBuilder;
import org.openjdk.jmh.runner.options.VerboseMode;
import org.testng.annotations.Test;
import java.io.IOException;
import java.nio.file.Files;
import java.nio.file.Path;
import java.nio.file.Paths;
import java.util.Optional;
import java.util.stream.Collectors;
import static com.facebook.presto.testing.TestingSession.testSessionBuilder;
import static java.lang.String.format;
import static java.util.concurrent.TimeUnit.MILLISECONDS;
import static org.openjdk.jmh.annotations.Mode.AverageTime;
import static org.openjdk.jmh.annotations.Scope.Thread;
import static org.testng.Assert.assertTrue;
@SuppressWarnings("MethodMayBeStatic")
@State(Thread)
@OutputTimeUnit(MILLISECONDS)
@BenchmarkMode(AverageTime)
@Fork(3)
@Warmup(iterations = 10)
@Measurement(iterations = 10)
public class BenchmarkSpatialJoin
{
@State(Thread)
public static class Context
{
private LocalQueryRunner queryRunner;
@Param({"10", "100", "1000", "10000"})
private int pointCount;
public LocalQueryRunner getQueryRunner()
{
return queryRunner;
}
@Setup
public void setUp()
throws IOException
{
queryRunner = new LocalQueryRunner(testSessionBuilder()
.setCatalog("memory")
.setSchema("default")
.build());
queryRunner.createCatalog("memory", new MemoryConnectorFactory(), ImmutableMap.of());
Path path = Paths.get(BenchmarkSpatialJoin.class.getClassLoader().getResource("us-states1.tsv").getPath());
String polygonValues = Files.lines(path)
.map(line -> line.split("\t"))
.map(parts -> format("('%s', '%s')", parts[0], parts[1]))
.collect(Collectors.joining(","));
queryRunner.execute(format("CREATE TABLE memory.default.polygons AS SELECT * FROM (VALUES %s) as t (name, wkt)", polygonValues));
}
@Setup(Level.Invocation)
public void createPointsTable()
{
// Generate random points within the approximate bounding box of the US polygon:
// POLYGON ((-124 27, -65 27, -65 49, -124 49, -124 27))
queryRunner.execute(format("CREATE TABLE memory.default.points AS " +
"SELECT 'p' || cast(elem AS VARCHAR) as name, xMin + (xMax - xMin) * random() as longitude, yMin + (yMax - yMin) * random() as latitude " +
"FROM (SELECT -124 AS xMin, -65 AS xMax, 27 AS yMin, 49 AS yMax) " +
"CROSS JOIN UNNEST(sequence(1, %s)) AS t(elem)", pointCount));
}
@TearDown(Level.Invocation)
public void dropPointsTable()
{
queryRunner.inTransaction(queryRunner.getDefaultSession(), transactionSession -> {
Metadata metadata = queryRunner.getMetadata();
Optional<TableHandle> tableHandle = metadata.getMetadataResolver(transactionSession).getTableHandle(QualifiedObjectName.valueOf("memory.default.points"));
assertTrue(tableHandle.isPresent(), "Table memory.default.points does not exist");
metadata.dropTable(transactionSession, tableHandle.get());
return null;
});
}
@TearDown
public void tearDown()
{
queryRunner.close();
queryRunner = null;
}
}
@Benchmark
public MaterializedResult benchmarkJoin(Context context)
{
return context.getQueryRunner()
.execute("SELECT count(*) FROM points, polygons WHERE ST_Contains(ST_GeometryFromText(wkt), ST_Point(latitude, longitude))");
}
@Benchmark
public MaterializedResult benchmarkUserOptimizedJoin(Context context)
{
return context.getQueryRunner()
.execute("SELECT count(*) FROM (SELECT ST_Point(latitude, longitude) as point FROM points) t1, (SELECT ST_GeometryFromText(wkt) as geometry FROM polygons) t2 WHERE ST_Contains(geometry, point)");
}
@Test
public void verify()
throws IOException
{
Context context = new Context();
try {
context.setUp();
context.createPointsTable();
BenchmarkSpatialJoin benchmark = new BenchmarkSpatialJoin();
benchmark.benchmarkJoin(context);
benchmark.benchmarkUserOptimizedJoin(context);
}
finally {
context.queryRunner.close();
}
}
public static void main(String[] args)
throws Exception
{
// assure the benchmarks are valid before running
new BenchmarkSpatialJoin().verify();
Options options = new OptionsBuilder()
.verbosity(VerboseMode.NORMAL)
.include(".*" + BenchmarkSpatialJoin.class.getSimpleName() + ".*")
.build();
new Runner(options).run();
}
}