Job

class Job : KotlinCustomResource

Manages a job resource within a Dataproc cluster on Google Cloud. For more information, see the official Dataproc documentation.

Note: This resource does not support update; changing any attribute will cause the resource to be recreated.

Example Usage

package generated_program;

import com.pulumi.Context;
import com.pulumi.Pulumi;
import com.pulumi.gcp.dataproc.Cluster;
import com.pulumi.gcp.dataproc.ClusterArgs;
import com.pulumi.gcp.dataproc.Job;
import com.pulumi.gcp.dataproc.JobArgs;
import com.pulumi.gcp.dataproc.inputs.JobPlacementArgs;
import com.pulumi.gcp.dataproc.inputs.JobSparkConfigArgs;
import com.pulumi.gcp.dataproc.inputs.JobSparkConfigLoggingConfigArgs;
import com.pulumi.gcp.dataproc.inputs.JobPysparkConfigArgs;
import java.util.Map;

public class App {
    public static void main(String[] args) {
        Pulumi.run(App::stack);
    }

    public static void stack(Context ctx) {
        // Cluster that both jobs below are submitted to.
        var mycluster = new Cluster("mycluster", ClusterArgs.builder()
            .region("us-central1")
            .build());

        // Submit an example Spark job to the cluster.
        var spark = new Job("spark", JobArgs.builder()
            .region(mycluster.region())
            .forceDelete(true)
            .placement(JobPlacementArgs.builder()
                .clusterName(mycluster.name())
                .build())
            .sparkConfig(JobSparkConfigArgs.builder()
                .mainClass("org.apache.spark.examples.SparkPi")
                .jarFileUris("file:///usr/lib/spark/examples/jars/spark-examples.jar")
                .args("1000")
                .properties(Map.of("spark.logConf", "true"))
                .loggingConfig(JobSparkConfigLoggingConfigArgs.builder()
                    .driverLogLevels(Map.of("root", "INFO"))
                    .build())
                .build())
            .build());

        // Submit an example PySpark job to the same cluster.
        var pyspark = new Job("pyspark", JobArgs.builder()
            .region(mycluster.region())
            .forceDelete(true)
            .placement(JobPlacementArgs.builder()
                .clusterName(mycluster.name())
                .build())
            .pysparkConfig(JobPysparkConfigArgs.builder()
                .mainPythonFileUri("gs://dataproc-examples-2f10d78d114f6aaec76462e3c310f31f/src/pyspark/hello-world/hello-world.py")
                .properties(Map.of("spark.logConf", "true"))
                .build())
            .build());

        // Export the current state of each job.
        ctx.export("sparkStatus", spark.statuses().applyValue(statuses -> statuses.get(0).state()));
        ctx.export("pysparkStatus", pyspark.statuses().applyValue(statuses -> statuses.get(0).state()));
    }
}

Import

This resource does not support import.

Properties

val driverControlsFilesUri: Output<String>

If present, the location of miscellaneous control files which may be used as part of job setup and handling. If not present, control files may be placed in the same location as driver_output_uri.

val driverOutputResourceUri: Output<String>

A URI pointing to the location of the stdout of the job's driver program.

val forceDelete: Output<Boolean>?

By default, you can only delete inactive jobs within Dataproc. Setting this to true, and calling destroy, will ensure that the job is first cancelled before issuing the delete.

val hadoopConfig: Output<JobHadoopConfig>?

The config of the Hadoop job.
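A minimal sketch of a Hadoop job, assuming it is added to the stack function in the example above (so mycluster is in scope) and that the extra import goes at the top of the file; the jar ships on Dataproc images, while the bucket paths are placeholders.

import com.pulumi.gcp.dataproc.inputs.JobHadoopConfigArgs;

var hadoop = new Job("hadoop", JobArgs.builder()
    .region(mycluster.region())
    .placement(JobPlacementArgs.builder()
        .clusterName(mycluster.name())
        .build())
    .hadoopConfig(JobHadoopConfigArgs.builder()
        // MapReduce examples jar bundled with Dataproc images.
        .mainJarFileUri("file:///usr/lib/hadoop-mapreduce/hadoop-mapreduce-examples.jar")
        .args("wordcount", "gs://my-bucket/input", "gs://my-bucket/output") // placeholder paths
        .build())
    .build());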

val hiveConfig: Output<JobHiveConfig>?

The config of the Hive job.
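A minimal sketch of a Hive job under the same assumptions as the Hadoop sketch above; the query file location is a placeholder.

import com.pulumi.gcp.dataproc.inputs.JobHiveConfigArgs;

var hive = new Job("hive", JobArgs.builder()
    .region(mycluster.region())
    .placement(JobPlacementArgs.builder()
        .clusterName(mycluster.name())
        .build())
    .hiveConfig(JobHiveConfigArgs.builder()
        .queryFileUri("gs://my-bucket/hive/queries.q") // placeholder script location
        .continueOnFailure(false) // stop at the first failed query
        .build())
    .build());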

val id: Output<String>

val labels: Output<Map<String, String>>?

The list of labels (key/value pairs) to add to the job.

val pigConfig: Output<JobPigConfig>?

The config of the Pig job.
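A minimal sketch of a Pig job under the same assumptions as the sketches above; the script location is a placeholder.

import com.pulumi.gcp.dataproc.inputs.JobPigConfigArgs;

var pig = new Job("pig", JobArgs.builder()
    .region(mycluster.region())
    .placement(JobPlacementArgs.builder()
        .clusterName(mycluster.name())
        .build())
    .pigConfig(JobPigConfigArgs.builder()
        .queryFileUri("gs://my-bucket/pig/script.pig") // placeholder script location
        .build())
    .build());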

val placement: Output<JobPlacement>

The config of the job placement.

val prestoConfig: Output<JobPrestoConfig>?

The config of the Presto job.
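A minimal sketch of a Presto job under the same assumptions; it additionally assumes the cluster was created with the Presto optional component enabled, and the query location is a placeholder.

import com.pulumi.gcp.dataproc.inputs.JobPrestoConfigArgs;

var presto = new Job("presto", JobArgs.builder()
    .region(mycluster.region())
    .placement(JobPlacementArgs.builder()
        .clusterName(mycluster.name())
        .build())
    .prestoConfig(JobPrestoConfigArgs.builder()
        .queryFileUri("gs://my-bucket/presto/query.sql") // placeholder query location
        .build())
    .build());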

val project: Output<String>

The project in which the cluster can be found and against which jobs are subsequently run. If not provided, the provider project is used.

val pulumiChildResources: Set<KotlinResource>

val pulumiResourceName: String

val pulumiResourceType: String

val pysparkConfig: Output<JobPysparkConfig>?

The config of the pySpark job.

val reference: Output<JobReference>

The reference of the job.

val region: Output<String>?

The Cloud Dataproc region. This essentially determines which clusters are available for this job to be submitted to. If not specified, defaults to global.

val scheduling: Output<JobScheduling>?

Optional. Job scheduling configuration.
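A minimal sketch of a job with scheduling attached, under the same assumptions as the sketches above; maxFailuresPerHour and maxFailuresTotal bound how often the driver may be restarted.

import com.pulumi.gcp.dataproc.inputs.JobSchedulingArgs;

var restartable = new Job("restartable", JobArgs.builder()
    .region(mycluster.region())
    .placement(JobPlacementArgs.builder()
        .clusterName(mycluster.name())
        .build())
    .scheduling(JobSchedulingArgs.builder()
        .maxFailuresPerHour(1) // driver restarts allowed per hour
        .maxFailuresTotal(5)   // driver restarts allowed over the job's lifetime
        .build())
    .sparkConfig(JobSparkConfigArgs.builder()
        .mainClass("org.apache.spark.examples.SparkPi")
        .jarFileUris("file:///usr/lib/spark/examples/jars/spark-examples.jar")
        .build())
    .build());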

val sparkConfig: Output<JobSparkConfig>?

The config of the Spark job.

val sparksqlConfig: Output<JobSparksqlConfig>?

The config of the SparkSql job.
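A minimal sketch of a SparkSql job under the same assumptions; the query location is a placeholder.

import com.pulumi.gcp.dataproc.inputs.JobSparksqlConfigArgs;

var sparksql = new Job("sparksql", JobArgs.builder()
    .region(mycluster.region())
    .placement(JobPlacementArgs.builder()
        .clusterName(mycluster.name())
        .build())
    .sparksqlConfig(JobSparksqlConfigArgs.builder()
        .queryFileUri("gs://my-bucket/sparksql/query.sql") // placeholder query location
        .build())
    .build());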

val statuses: Output<List<JobStatus>>

The status of the job.

val urn: Output<String>