TableScanOperator.java
/*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.facebook.presto.operator;
import com.facebook.presto.common.Page;
import com.facebook.presto.common.RuntimeStats;
import com.facebook.presto.execution.ScheduledSplit;
import com.facebook.presto.memory.context.LocalMemoryContext;
import com.facebook.presto.metadata.Split;
import com.facebook.presto.spi.ColumnHandle;
import com.facebook.presto.spi.ConnectorPageSource;
import com.facebook.presto.spi.TableHandle;
import com.facebook.presto.spi.UpdatablePageSource;
import com.facebook.presto.spi.plan.PlanNodeId;
import com.facebook.presto.split.EmptySplit;
import com.facebook.presto.split.EmptySplitPageSource;
import com.facebook.presto.split.PageSourceProvider;
import com.google.common.base.Suppliers;
import com.google.common.collect.ImmutableList;
import com.google.common.util.concurrent.ListenableFuture;
import com.google.common.util.concurrent.SettableFuture;
import java.io.Closeable;
import java.io.IOException;
import java.io.UncheckedIOException;
import java.util.List;
import java.util.Map;
import java.util.Optional;
import java.util.concurrent.CompletableFuture;
import java.util.function.Supplier;
import static com.facebook.airlift.concurrent.MoreFutures.toListenableFuture;
import static com.facebook.presto.common.RuntimeMetricName.STORAGE_READ_DATA_BYTES;
import static com.facebook.presto.common.RuntimeMetricName.STORAGE_READ_TIME_NANOS;
import static com.facebook.presto.common.RuntimeUnit.BYTE;
import static com.facebook.presto.common.RuntimeUnit.NANO;
import static com.google.common.base.Preconditions.checkState;
import static java.util.Objects.requireNonNull;
public class TableScanOperator
implements SourceOperator, Closeable
{
public static class TableScanOperatorFactory
implements SourceOperatorFactory
{
private final int operatorId;
private final PlanNodeId sourceId;
private final PageSourceProvider pageSourceProvider;
private final TableHandle table;
private final List<ColumnHandle> columns;
private boolean closed;
public TableScanOperatorFactory(
int operatorId,
PlanNodeId sourceId,
PageSourceProvider pageSourceProvider,
TableHandle table,
Iterable<ColumnHandle> columns)
{
this.operatorId = operatorId;
this.sourceId = requireNonNull(sourceId, "sourceId is null");
this.pageSourceProvider = requireNonNull(pageSourceProvider, "pageSourceProvider is null");
this.table = requireNonNull(table, "table is null");
this.columns = ImmutableList.copyOf(requireNonNull(columns, "columns is null"));
}
@Override
public PlanNodeId getSourceId()
{
return sourceId;
}
@Override
public SourceOperator createOperator(DriverContext driverContext)
{
checkState(!closed, "Factory is already closed");
OperatorContext operatorContext = driverContext.addOperatorContext(operatorId, sourceId, TableScanOperator.class.getSimpleName());
return new TableScanOperator(
operatorContext,
sourceId,
pageSourceProvider,
table,
columns);
}
@Override
public void noMoreOperators()
{
closed = true;
}
}
private final OperatorContext operatorContext;
private final PlanNodeId planNodeId;
private final PageSourceProvider pageSourceProvider;
private final TableHandle table;
private final List<ColumnHandle> columns;
private final LocalMemoryContext systemMemoryContext;
private final SettableFuture<?> blocked = SettableFuture.create();
private Split split;
private ConnectorPageSource source;
private boolean finished;
private long completedBytes;
private long completedPositions;
private long readTimeNanos;
public TableScanOperator(
OperatorContext operatorContext,
PlanNodeId planNodeId,
PageSourceProvider pageSourceProvider,
TableHandle table,
Iterable<ColumnHandle> columns)
{
this.operatorContext = requireNonNull(operatorContext, "operatorContext is null");
this.planNodeId = requireNonNull(planNodeId, "planNodeId is null");
this.pageSourceProvider = requireNonNull(pageSourceProvider, "pageSourceProvider is null");
this.table = requireNonNull(table, "table is null");
this.columns = ImmutableList.copyOf(requireNonNull(columns, "columns is null"));
this.systemMemoryContext = operatorContext.localSystemMemoryContext();
}
@Override
public OperatorContext getOperatorContext()
{
return operatorContext;
}
@Override
public PlanNodeId getSourceId()
{
return planNodeId;
}
@Override
public Supplier<Optional<UpdatablePageSource>> addSplit(ScheduledSplit scheduledSplit)
{
Split split = requireNonNull(scheduledSplit, "scheduledSplit is null").getSplit();
requireNonNull(split, "split is null");
checkState(this.split == null, "Table scan split already set");
if (finished) {
return Optional::empty;
}
this.split = split;
Object splitInfo = split.getInfo();
Map<String, String> infoMap = split.getInfoMap();
//Make the implicit assumption that if infoMap is populated we can use that instead of the raw object.
if (infoMap != null && !infoMap.isEmpty()) {
operatorContext.setInfoSupplier(Suppliers.ofInstance(new SplitOperatorInfo(infoMap)));
}
else if (splitInfo != null) {
operatorContext.setInfoSupplier(Suppliers.ofInstance(new SplitOperatorInfo(splitInfo)));
}
blocked.set(null);
if (split.getConnectorSplit() instanceof EmptySplit) {
source = new EmptySplitPageSource();
}
return () -> {
if (source instanceof UpdatablePageSource) {
return Optional.of((UpdatablePageSource) source);
}
return Optional.empty();
};
}
@Override
public void noMoreSplits()
{
if (split == null) {
finished = true;
}
blocked.set(null);
}
@Override
public void close()
{
finish();
}
@Override
public void finish()
{
finished = true;
blocked.set(null);
if (source != null) {
try {
source.close();
}
catch (IOException e) {
throw new UncheckedIOException(e);
}
systemMemoryContext.setBytes(source.getSystemMemoryUsage());
}
}
@Override
public boolean isFinished()
{
if (!finished) {
finished = (source != null) && source.isFinished();
if (source != null) {
systemMemoryContext.setBytes(source.getSystemMemoryUsage());
}
}
return finished;
}
@Override
public ListenableFuture<?> isBlocked()
{
if (!blocked.isDone()) {
return blocked;
}
if (source != null) {
CompletableFuture<?> pageSourceBlocked = source.isBlocked();
return pageSourceBlocked.isDone() ? NOT_BLOCKED : toListenableFuture(pageSourceBlocked);
}
return NOT_BLOCKED;
}
@Override
public boolean needsInput()
{
return false;
}
@Override
public void addInput(Page page)
{
throw new UnsupportedOperationException(getClass().getName() + " can not take input");
}
@Override
public Page getOutput()
{
if (split == null) {
return null;
}
if (source == null) {
source = pageSourceProvider.createPageSource(operatorContext.getSession(), split, table, columns, operatorContext.getRuntimeStats());
}
Page page = source.getNextPage();
if (page != null) {
// assure the page is in memory before handing to another operator
page = page.getLoadedPage();
}
// update operator stats
recordInputStats();
// updating system memory usage should happen after page is loaded.
systemMemoryContext.setBytes(source.getSystemMemoryUsage());
return page;
}
private void recordInputStats()
{
checkState(source != null, "source must not be null");
// update operator stats
long endCompletedBytes = source.getCompletedBytes();
long endCompletedPositions = source.getCompletedPositions();
long endReadTimeNanos = source.getReadTimeNanos();
long inputBytes = endCompletedBytes - completedBytes;
long inputBytesReadTime = endReadTimeNanos - readTimeNanos;
long positionCount = endCompletedPositions - completedPositions;
operatorContext.recordProcessedInput(inputBytes, positionCount);
operatorContext.recordRawInputWithTiming(inputBytes, positionCount, inputBytesReadTime);
RuntimeStats runtimeStats = source.getRuntimeStats();
if (runtimeStats != null) {
runtimeStats.addMetricValueIgnoreZero(STORAGE_READ_TIME_NANOS, NANO, inputBytesReadTime);
runtimeStats.addMetricValueIgnoreZero(STORAGE_READ_DATA_BYTES, BYTE, inputBytes);
operatorContext.updateStats(runtimeStats);
}
completedBytes = endCompletedBytes;
completedPositions = endCompletedPositions;
readTimeNanos = endReadTimeNanos;
}
}