gigl.src.common.utils.spark_job_manager
Attributes
Classes
Module Contents
- class gigl.src.common.utils.spark_job_manager.DataprocClusterInitData
  - init_script_uri: gigl.common.GcsUri | None = None
 
- class gigl.src.common.utils.spark_job_manager.SparkJobManager(project, region, cluster_name)
  - Parameters:
    - project (str)
    - region (str)
    - cluster_name (str)
 
  - create_dataproc_cluster(cluster_init_data, use_spark35=False)
    - Parameters:
      - cluster_init_data (DataprocClusterInitData)
      - use_spark35 (bool)
 
 
  - submit_and_wait_scala_spark_job(main_jar_file_uri, max_job_duration, runtime_args=[], extra_jar_file_uris=[], use_spark35=False)
    - Parameters:
      - main_jar_file_uri (gigl.common.Uri)
      - max_job_duration (datetime.timedelta)
      - runtime_args (list[str])
      - extra_jar_file_uris (list[str])
      - use_spark35 (bool)
 
 
 
