gigl.src.common.utils.spark_job_manager
Attributes
Classes
Module Contents
- class gigl.src.common.utils.spark_job_manager.DataprocClusterInitData [source]
- init_script_uri: gigl.common.GcsUri | None = None [source]
- class gigl.src.common.utils.spark_job_manager.SparkJobManager(project, region, cluster_name) [source]
- Parameters:
  - project (str)
  - region (str)
  - cluster_name (str)
- create_dataproc_cluster(cluster_init_data, use_spark35=False) [source]
- Parameters:
  - cluster_init_data (DataprocClusterInitData)
  - use_spark35 (bool)
- submit_and_wait_scala_spark_job(main_jar_file_uri, max_job_duration, runtime_args=[], extra_jar_file_uris=[], use_spark35=False) [source]
- Parameters:
  - main_jar_file_uri (gigl.common.Uri)
  - max_job_duration (datetime.timedelta)
  - runtime_args (List[str])
  - extra_jar_file_uris (List[str])
  - use_spark35 (bool)