Source code for pydolphinscheduler.tasks.spark

# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements.  See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership.  The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License.  You may obtain a copy of the License at
#
#   http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied.  See the License for the
# specific language governing permissions and limitations
# under the License.

"""Task Spark."""

from typing import Optional

from pydolphinscheduler.constants import TaskType
from pydolphinscheduler.core.engine import Engine, ProgramType


[docs] class DeployMode(str): """SPARK deploy mode, for now it just contain `LOCAL`, `CLIENT` and `CLUSTER`.""" LOCAL = "local" CLIENT = "client" CLUSTER = "cluster"
[docs] class Spark(Engine): """Task spark object, declare behavior for spark task to dolphinscheduler.""" _task_custom_attr = { "deploy_mode", "driver_cores", "driver_memory", "num_executors", "executor_memory", "executor_cores", "app_name", "main_args", "others", } def __init__( self, name: str, main_class: str, main_package: str, program_type: Optional[ProgramType] = ProgramType.SCALA, deploy_mode: Optional[DeployMode] = DeployMode.CLUSTER, app_name: Optional[str] = None, driver_cores: Optional[int] = 1, driver_memory: Optional[str] = "512M", num_executors: Optional[int] = 2, executor_memory: Optional[str] = "2G", executor_cores: Optional[int] = 2, main_args: Optional[str] = None, others: Optional[str] = None, *args, **kwargs ): super().__init__( name, TaskType.SPARK, main_class, main_package, program_type, *args, **kwargs ) self.deploy_mode = deploy_mode self.app_name = app_name self.driver_cores = driver_cores self.driver_memory = driver_memory self.num_executors = num_executors self.executor_memory = executor_memory self.executor_cores = executor_cores self.main_args = main_args self.others = others