Files
superset2/superset/commands/tasks/update.py

171 lines
5.9 KiB
Python

# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.
from __future__ import annotations
import logging
from datetime import datetime
from functools import partial
from typing import Any, TYPE_CHECKING
from uuid import UUID
from superset_core.tasks.types import TaskProperties
from superset import security_manager
from superset.commands.base import BaseCommand
from superset.commands.tasks.exceptions import (
TaskForbiddenError,
TaskNotFoundError,
TaskUpdateFailedError,
)
from superset.exceptions import SupersetSecurityException
from superset.tasks.locks import task_lock
from superset.tasks.utils import get_active_dedup_key
from superset.utils.decorators import on_error, transaction
if TYPE_CHECKING:
from superset.models.tasks import Task
# Module-level logger, named after this module's import path.
logger = logging.getLogger(__name__)
class UpdateTaskCommand(BaseCommand):
    """
    Update a single task identified by its UUID.

    Column fields (``status``, ``started_at``, ``ended_at``), the task output
    (``payload``) and the runtime state/config (``properties``) are accepted
    as separate, explicitly typed keyword arguments so that payload and
    properties cannot be confused with one another.

    The update itself runs while holding a distributed lock keyed on the
    task's dedup key, which prevents races with concurrent submit/cancel
    operations on the same logical task.
    """

    def __init__(
        self,
        task_uuid: UUID,
        *,
        status: str | None = None,
        started_at: datetime | None = None,
        ended_at: datetime | None = None,
        payload: dict[str, Any] | None = None,
        properties: TaskProperties | None = None,
        skip_security_check: bool = False,
    ):
        """
        Store the requested changes; nothing is read or written until ``run()``.

        :param task_uuid: UUID of the task to update
        :param status: New status value (column field)
        :param started_at: Started timestamp (column field)
        :param ended_at: Ended timestamp (column field)
        :param payload: Task output data to merge (stored in payload column)
        :param properties: Runtime state/config updates as dict. Keys must be
            valid TaskProperties field names (is_abortable, progress_percent,
            etc.)
        :param skip_security_check: If True, skip ownership validation; the
            flag is also forwarded to the DAO lookup as ``skip_base_filter``.
            Use this for internal task updates (e.g., task executor updating
            its own task's progress). Default is False for API-driven updates.
        """
        # What to update and how strictly to check access.
        self._task_uuid = task_uuid
        self._skip_security_check = skip_security_check

        # Requested changes; ``None`` means "leave this field untouched".
        self._status = status
        self._started_at = started_at
        self._ended_at = ended_at
        self._payload = payload
        self._properties = properties

        # Populated once the task has been loaded in run()/_execute_update().
        self._model: Task | None = None

    @transaction(on_error=partial(on_error, reraise=TaskUpdateFailedError))
    def run(self) -> Task:
        """
        Execute the update command with distributed locking.

        The task is looked up once up front solely to derive the lock key
        (built from the same fields as the dedup key); the actual update then
        happens under that lock in ``_execute_update()``.

        :returns: The updated task model
        :raises TaskNotFoundError: If no task matches the UUID
        :raises TaskForbiddenError: If the ownership check fails
        """
        self.validate()

        # First lookup: only needed to compute the key the lock is taken on.
        self._model = self._load_task()
        lock_key = get_active_dedup_key(
            scope=self._model.scope,
            task_type=self._model.task_type,
            task_key=self._model.task_key,
            user_id=self._model.user_id,
        )

        # Hold the lock for the whole read-modify-write cycle so that
        # submit/cancel operations cannot interleave with it.
        with task_lock(lock_key):
            return self._execute_update()

    def _load_task(self) -> Task:
        """
        Look the task up by UUID, raising if it cannot be found.

        :returns: The task model returned by the DAO
        :raises TaskNotFoundError: If the DAO lookup returns nothing
        """
        from superset.daos.tasks import TaskDAO

        found = TaskDAO.find_one_or_none(
            skip_base_filter=self._skip_security_check,
            uuid=self._task_uuid,
        )
        if not found:
            raise TaskNotFoundError()
        return found

    def _execute_update(self) -> Task:
        """
        Apply the requested changes; expected to be called under the lock.

        :returns: The updated task model
        :raises TaskNotFoundError: If the task no longer exists
        :raises TaskForbiddenError: If the ownership check fails
        """
        from superset.daos.tasks import TaskDAO

        # Load again now that the lock is held, so we work on fresh state.
        task = self._load_task()
        self._model = task

        # Users may only update their own tasks; internal callers (e.g. the
        # task executor reporting progress) opt out via skip_security_check.
        if not self._skip_security_check:
            try:
                security_manager.raise_for_ownership(task)
            except SupersetSecurityException as ex:
                raise TaskForbiddenError() from ex

        # Status goes through set_status() for proper timestamp handling;
        # explicitly supplied timestamps are applied afterwards.
        if self._status is not None:
            task.set_status(self._status)
        if self._started_at is not None:
            task.started_at = self._started_at
        if self._ended_at is not None:
            task.ended_at = self._ended_at

        # Payload is merged with the existing payload by the model.
        if self._payload is not None:
            task.set_payload(self._payload)

        # Properties dict is handed to the model as-is; an empty or missing
        # dict means there is nothing to apply.
        if self._properties:
            task.update_properties(self._properties)

        return TaskDAO.update(task)

    def validate(self) -> None:
        """
        Perform no up-front validation.

        Existence and ownership are checked in ``run()`` and
        ``_execute_update()`` instead.
        """