TestDistributedQueryResource.java

/*
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package com.facebook.presto.resourcemanager;

import com.facebook.airlift.http.client.HttpClient;
import com.facebook.airlift.http.client.jetty.JettyHttpClient;
import com.facebook.presto.execution.QueryState;
import com.facebook.presto.resourceGroups.FileResourceGroupConfigurationManagerFactory;
import com.facebook.presto.server.BasicQueryInfo;
import com.facebook.presto.server.testing.TestingPrestoServer;
import com.facebook.presto.tests.DistributedQueryRunner;
import com.google.common.collect.ImmutableMap;
import org.testng.annotations.AfterMethod;
import org.testng.annotations.BeforeMethod;
import org.testng.annotations.Test;

import java.util.List;
import java.util.Optional;

import static com.facebook.airlift.testing.Closeables.closeQuietly;
import static com.facebook.presto.tests.tpch.TpchQueryRunner.createQueryRunner;
import static com.facebook.presto.utils.QueryExecutionClientUtil.getQueryInfos;
import static com.facebook.presto.utils.QueryExecutionClientUtil.runToCompletion;
import static com.facebook.presto.utils.QueryExecutionClientUtil.runToFirstResult;
import static com.facebook.presto.utils.QueryExecutionClientUtil.runToQueued;
import static com.facebook.presto.utils.ResourceUtils.getResourceFilePath;
import static com.google.common.base.Preconditions.checkState;
import static java.lang.Thread.sleep;
import static org.testng.Assert.assertEquals;
import static org.testng.Assert.fail;

@Test(singleThreaded = true)
public class TestDistributedQueryResource
{
    private HttpClient client;
    private TestingPrestoServer coordinator1;
    private TestingPrestoServer coordinator2;
    private TestingPrestoServer resourceManager;

    @BeforeMethod
    public void setup()
            throws Exception
    {
        client = new JettyHttpClient();
        DistributedQueryRunner runner = createQueryRunner(ImmutableMap.of("query.client.timeout", "20s"), 2);
        coordinator1 = runner.getCoordinator(0);
        coordinator2 = runner.getCoordinator(1);
        Optional<TestingPrestoServer> resourceManager = runner.getResourceManager();
        checkState(resourceManager.isPresent(), "resource manager not present");
        this.resourceManager = resourceManager.get();
        coordinator1.getResourceGroupManager().get().addConfigurationManagerFactory(new FileResourceGroupConfigurationManagerFactory());
        coordinator1.getResourceGroupManager().get()
                .forceSetConfigurationManager("file", ImmutableMap.of("resource-groups.config-file", getResourceFilePath("resource_groups_config_simple.json")));
        coordinator2.getResourceGroupManager().get().addConfigurationManagerFactory(new FileResourceGroupConfigurationManagerFactory());
        coordinator2.getResourceGroupManager().get()
                .forceSetConfigurationManager("file", ImmutableMap.of("resource-groups.config-file", getResourceFilePath("resource_groups_config_simple.json")));
    }

    @AfterMethod(alwaysRun = true)
    public void teardown()
    {
        closeQuietly(coordinator1);
        closeQuietly(coordinator2);
        closeQuietly(resourceManager);
        closeQuietly(client);
        coordinator1 = null;
        coordinator2 = null;
        resourceManager = null;
        client = null;
    }

    @Test(timeOut = 60_000, enabled = false)
    public void testGetQueryInfos()
            throws Exception
    {
        runToCompletion(client, coordinator1, "SELECT 1");
        runToCompletion(client, coordinator2, "SELECT 2");
        runToCompletion(client, coordinator1, "SELECT x FROM y");
        runToFirstResult(client, coordinator1, "SELECT * from tpch.sf100.orders");
        runToFirstResult(client, coordinator1, "SELECT * from tpch.sf101.orders");
        runToFirstResult(client, coordinator1, "SELECT * from tpch.sf102.orders");
        runToQueued(client, coordinator1, "SELECT 3");

        waitForGlobalViewInRM(1, 3, 1, 2);

        List<BasicQueryInfo> infos = getQueryInfos(client, coordinator1, "/v1/query");
        assertEquals(infos.size(), 7);
        assertStateCounts(infos, 2, 1, 3, 1);

        infos = getQueryInfos(client, coordinator2, "/v1/query?state=finished");
        assertEquals(infos.size(), 2);
        assertStateCounts(infos, 2, 0, 0, 0);

        infos = getQueryInfos(client, coordinator1, "/v1/query?state=failed");
        assertEquals(infos.size(), 1);
        assertStateCounts(infos, 0, 1, 0, 0);

        infos = getQueryInfos(client, coordinator2, "/v1/query?state=running");
        assertEquals(infos.size(), 3);
        assertStateCounts(infos, 0, 0, 3, 0);

        infos = getQueryInfos(client, coordinator1, "/v1/query?state=queued");
        assertEquals(infos.size(), 1);
        assertStateCounts(infos, 0, 0, 0, 1);

        waitForGlobalViewInRM(0, 0, 5, 2);

        infos = getQueryInfos(client, coordinator2, "/v1/query?state=failed");
        assertEquals(infos.size(), 5);
        assertStateCounts(infos, 0, 5, 0, 0);
    }

    private void assertStateCounts(List<BasicQueryInfo> infos, int expectedFinished, int expectedFailed, int expectedRunning, int expectedQueued)
    {
        int failed = 0;
        int finished = 0;
        int running = 0;
        int queued = 0;
        for (BasicQueryInfo info : infos) {
            switch (info.getState()) {
                case RUNNING:
                case FINISHING:
                    running++;
                    break;
                case WAITING_FOR_RESOURCES:
                case PLANNING:
                case DISPATCHING:
                case QUEUED:
                    queued++;
                    break;
                case FINISHED:
                    finished++;
                    break;
                case FAILED:
                    failed++;
                    break;
                default:
                    fail("Unexpected query state " + info.getState());
            }
        }
        assertEquals(failed, expectedFailed);
        assertEquals(finished, expectedFinished);
        assertEquals(running, expectedRunning);
        assertEquals(queued, expectedQueued);
    }

    private void waitForGlobalViewInRM(long expectedQueuedQueries, long expectedRunningQueries, long expectedFailedQueries, long expectedFinishedQueries)
            throws InterruptedException
    {
        long runningQueries = 0;
        long queuedQueries = 0;
        long failedQueries = 0;
        long finishedQueries = 0;
        while (runningQueries != expectedRunningQueries || queuedQueries != expectedQueuedQueries ||
                failedQueries != expectedFailedQueries || finishedQueries != expectedFinishedQueries) {
            sleep(100);
            List<BasicQueryInfo> queries = resourceManager.getClusterStateProvider().getClusterQueries();
            runningQueries = queries.stream().filter(queryInfo -> queryInfo.getState() == QueryState.RUNNING).count();
            queuedQueries = queries.stream().filter(queryInfo -> queryInfo.getState() == QueryState.QUEUED).count();
            failedQueries = queries.stream().filter(queryInfo -> queryInfo.getState() == QueryState.FAILED).count();
            finishedQueries = queries.stream().filter(queryInfo -> queryInfo.getState() == QueryState.FINISHED).count();
        }
    }

    // Flaky test.
    @Test(timeOut = 60_000, enabled = false)
    public void testGetAllQueryInfoForLimits()
            throws InterruptedException
    {
        runToFirstResult(client, coordinator1, "SELECT * from tpch.sf100.orders");
        runToFirstResult(client, coordinator1, "SELECT * from tpch.sf100.orders");
        runToFirstResult(client, coordinator1, "SELECT * from tpch.sf101.orders");
        runToQueued(client, coordinator1, "SELECT * from tpch.sf100.orders");
        runToQueued(client, coordinator1, "SELECT * from tpch.sf101.orders");
        runToQueued(client, coordinator1, "SELECT * from tpch.sf102.orders");

        waitForGlobalViewInRM(3, 3, 0, 0);

        List<BasicQueryInfo> infos = getQueryInfos(client, coordinator1, "/v1/query?limit=4");
        assertEquals(infos.size(), 4);
        assertEquals(infos.get(0).getState(), QueryState.RUNNING);
        assertEquals(infos.get(1).getState(), QueryState.RUNNING);
        assertEquals(infos.get(2).getState(), QueryState.RUNNING);
        assertEquals(infos.get(3).getState(), QueryState.QUEUED);
    }

    @Test(enabled = false)
    public void testGetAllQueryInfoReturnsAllQueriesWithNoLimitSpecified()
            throws InterruptedException
    {
        runToFirstResult(client, coordinator1, "SELECT * from tpch.sf100.orders");
        runToFirstResult(client, coordinator1, "SELECT * from tpch.sf100.orders");
        runToFirstResult(client, coordinator1, "SELECT * from tpch.sf101.orders");
        runToQueued(client, coordinator1, "SELECT * from tpch.sf100.orders");
        runToQueued(client, coordinator1, "SELECT * from tpch.sf101.orders");
        runToQueued(client, coordinator1, "SELECT * from tpch.sf102.orders");

        waitForGlobalViewInRM(3, 3, 0, 0);

        List<BasicQueryInfo> infos = getQueryInfos(client, coordinator1, "/v1/query");
        assertEquals(infos.size(), 6);
    }
}