Source code for pyflink.datastream.checkpoint_config

################################################################################
#  Licensed to the Apache Software Foundation (ASF) under one
#  or more contributor license agreements.  See the NOTICE file
#  distributed with this work for additional information
#  regarding copyright ownership.  The ASF licenses this file
#  to you under the Apache License, Version 2.0 (the
#  "License"); you may not use this file except in compliance
#  with the License.  You may obtain a copy of the License at
#
#      http://www.apache.org/licenses/LICENSE-2.0
#
#  Unless required by applicable law or agreed to in writing, software
#  distributed under the License is distributed on an "AS IS" BASIS,
#  WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
#  See the License for the specific language governing permissions and
# limitations under the License.
################################################################################
from pyflink.datastream.checkpointing_mode import CheckpointingMode
from pyflink.java_gateway import get_gateway

__all__ = ['CheckpointConfig', 'ExternalizedCheckpointCleanup']


class CheckpointConfig(object):
    """
    Python-side view of the checkpointing settings of a job. Every accessor simply forwards to
    the wrapped Java ``CheckpointConfig`` object handed to the constructor.

    :data:`DEFAULT_MODE`:

    Checkpointing mode used by default: exactly once.

    :data:`DEFAULT_TIMEOUT`:

    Default timeout of a single checkpoint attempt: 10 minutes.

    :data:`DEFAULT_MIN_PAUSE_BETWEEN_CHECKPOINTS`:

    Default minimum pause between two checkpoints: none.

    :data:`DEFAULT_MAX_CONCURRENT_CHECKPOINTS`:

    Default limit of checkpoints happening concurrently: one.
    """

    DEFAULT_MODE = CheckpointingMode.EXACTLY_ONCE

    # 10 minutes, spelled out as minutes * seconds * milliseconds.
    DEFAULT_TIMEOUT = 10 * 60 * 1000

    DEFAULT_MIN_PAUSE_BETWEEN_CHECKPOINTS = 0

    DEFAULT_MAX_CONCURRENT_CHECKPOINTS = 1

    def __init__(self, j_checkpoint_config):
        # Java object that every method below delegates to.
        self._j_checkpoint_config = j_checkpoint_config

    def is_checkpointing_enabled(self):
        """
        Tells whether checkpointing is turned on.

        :return: True if checkpointing is enabled, false otherwise.
        """
        enabled = self._j_checkpoint_config.isCheckpointingEnabled()
        return enabled

    def get_checkpointing_mode(self):
        """
        Returns the configured checkpointing mode (exactly-once vs. at-least-once).

        .. seealso:: :func:`set_checkpointing_mode`

        :return: The :class:`CheckpointingMode`.
        """
        j_mode = self._j_checkpoint_config.getCheckpointingMode()
        return CheckpointingMode._from_j_checkpointing_mode(j_mode)

    def set_checkpointing_mode(self, checkpointing_mode):
        """
        Chooses the checkpointing mode (:data:`CheckpointingMode.EXACTLY_ONCE` vs.
        :data:`CheckpointingMode.AT_LEAST_ONCE`).

        Example:
        ::

            >>> config.set_checkpointing_mode(CheckpointingMode.AT_LEAST_ONCE)

        :param checkpointing_mode: The :class:`CheckpointingMode`.
        """
        j_mode = CheckpointingMode._to_j_checkpointing_mode(checkpointing_mode)
        self._j_checkpoint_config.setCheckpointingMode(j_mode)

    def get_checkpoint_interval(self):
        """
        Returns the base interval at which checkpoints are periodically scheduled.

        The actual triggering of a checkpoint may be delayed by the settings
        :func:`get_max_concurrent_checkpoints` and :func:`get_min_pause_between_checkpoints`.

        :return: The checkpoint interval, in milliseconds.
        """
        interval = self._j_checkpoint_config.getCheckpointInterval()
        return interval

    def set_checkpoint_interval(self, checkpoint_interval):
        """
        Defines the base interval at which checkpoints are periodically scheduled.

        The actual triggering of a checkpoint may be delayed by the settings
        :func:`set_max_concurrent_checkpoints` and :func:`set_min_pause_between_checkpoints`.

        :param checkpoint_interval: The checkpoint interval, in milliseconds.
        """
        j_config = self._j_checkpoint_config
        j_config.setCheckpointInterval(checkpoint_interval)

    def get_checkpoint_timeout(self):
        """
        Returns the maximum time a checkpoint may take before it is discarded.

        :return: The checkpoint timeout, in milliseconds.
        """
        timeout = self._j_checkpoint_config.getCheckpointTimeout()
        return timeout

    def set_checkpoint_timeout(self, checkpoint_timeout):
        """
        Defines the maximum time a checkpoint may take before it is discarded.

        :param checkpoint_timeout: The checkpoint timeout, in milliseconds.
        """
        j_config = self._j_checkpoint_config
        j_config.setCheckpointTimeout(checkpoint_timeout)

    def get_min_pause_between_checkpoints(self):
        """
        Returns the minimal pause between checkpointing attempts.

        The value determines how soon the checkpoint coordinator may trigger another checkpoint
        once doing so has become possible with respect to the maximum number of concurrent
        checkpoints (see :func:`get_max_concurrent_checkpoints`).

        :return: The minimal pause before the next checkpoint is triggered.
        """
        min_pause = self._j_checkpoint_config.getMinPauseBetweenCheckpoints()
        return min_pause

    def set_min_pause_between_checkpoints(self, min_pause_between_checkpoints):
        """
        Defines the minimal pause between checkpointing attempts.

        The value determines how soon the checkpoint coordinator may trigger another checkpoint
        once doing so has become possible with respect to the maximum number of concurrent
        checkpoints (see :func:`set_max_concurrent_checkpoints`).

        With the maximum number of concurrent checkpoints set to one, this setting effectively
        guarantees a minimum amount of time during which no checkpoint is in progress at all.

        :param min_pause_between_checkpoints: The minimal pause before the next checkpoint is
                                              triggered.
        """
        j_config = self._j_checkpoint_config
        j_config.setMinPauseBetweenCheckpoints(min_pause_between_checkpoints)

    def get_max_concurrent_checkpoints(self):
        """
        Returns the maximum number of checkpoint attempts that may be in progress at the same
        time. With a value of *n*, no checkpoint is triggered while *n* checkpoint attempts are
        in flight; one of them has to finish or expire before the next one can be triggered.

        :return: The maximum number of concurrent checkpoint attempts.
        """
        max_concurrent = self._j_checkpoint_config.getMaxConcurrentCheckpoints()
        return max_concurrent

    def set_max_concurrent_checkpoints(self, max_concurrent_checkpoints):
        """
        Defines the maximum number of checkpoint attempts that may be in progress at the same
        time. With a value of *n*, no checkpoint is triggered while *n* checkpoint attempts are
        in flight; one of them has to finish or expire before the next one can be triggered.

        :param max_concurrent_checkpoints: The maximum number of concurrent checkpoint attempts.
        """
        j_config = self._j_checkpoint_config
        j_config.setMaxConcurrentCheckpoints(max_concurrent_checkpoints)

    def is_fail_on_checkpointing_errors(self):
        """
        Reports how tasks behave when an error occurs in their local checkpointing. If this
        returns true, tasks fail as a reaction. If this returns false, tasks only decline the
        failed checkpoint.

        :return: ``True`` if failing on checkpointing errors, false otherwise.
        """
        fail_on_errors = self._j_checkpoint_config.isFailOnCheckpointingErrors()
        return fail_on_errors

    def set_fail_on_checkpointing_errors(self, fail_on_checkpointing_errors):
        """
        Defines how tasks are expected to behave when they encounter an error in their
        checkpointing procedure. When set to true, the task fails on a checkpointing error.
        When set to false, the task only declines the checkpoint and continues running.
        The default is true.

        Example:
        ::

            >>> config.set_fail_on_checkpointing_errors(False)

        :param fail_on_checkpointing_errors: ``True`` if failing on checkpointing errors,
                                             false otherwise.
        """
        j_config = self._j_checkpoint_config
        j_config.setFailOnCheckpointingErrors(fail_on_checkpointing_errors)

    def enable_externalized_checkpoints(self, cleanup_mode):
        """
        Turns on external persistence of checkpoints.

        Externalized checkpoints write their meta data out to persistent storage and are **not**
        automatically cleaned up when the owning job fails or is suspended (terminating with job
        status ``FAILED`` or ``SUSPENDED``). In this case, you have to manually clean up the
        checkpoint state, both the meta data and actual program state.

        The :class:`ExternalizedCheckpointCleanup` mode defines how an externalized checkpoint
        should be cleaned up on job cancellation. If you choose to retain externalized
        checkpoints on cancellation, you have to handle checkpoint clean up manually when you
        cancel the job as well (terminating with job status ``CANCELED``).

        The target directory for externalized checkpoints is configured via
        ``org.apache.flink.configuration.CheckpointingOptions#CHECKPOINTS_DIRECTORY``.

        Example:
        ::

            >>> config.enable_externalized_checkpoints(
            ...     ExternalizedCheckpointCleanup.RETAIN_ON_CANCELLATION)

        :param cleanup_mode: Externalized checkpoint cleanup behaviour, the mode could be
                             :data:`ExternalizedCheckpointCleanup.DELETE_ON_CANCELLATION` or
                             :data:`ExternalizedCheckpointCleanup.RETAIN_ON_CANCELLATION`
        """
        j_cleanup_mode = \
            ExternalizedCheckpointCleanup._to_j_externalized_checkpoint_cleanup(cleanup_mode)
        self._j_checkpoint_config.enableExternalizedCheckpoints(j_cleanup_mode)

    def is_externalized_checkpoints_enabled(self):
        """
        Tells whether checkpoints should be persisted externally.

        :return: ``True`` if checkpoints should be externalized, false otherwise.
        """
        externalized = self._j_checkpoint_config.isExternalizedCheckpointsEnabled()
        return externalized

    def is_prefer_checkpoint_for_recovery(self):
        """
        Tells whether a job recovery should fallback to checkpoint when there is a more recent
        savepoint.

        :return: ``True`` if a job recovery should fallback to checkpoint, false otherwise.
        """
        prefer_checkpoint = self._j_checkpoint_config.isPreferCheckpointForRecovery()
        return prefer_checkpoint

    def set_prefer_checkpoint_for_recovery(self, prefer_checkpoint_for_recovery):
        """
        Defines whether a job recovery should fallback to checkpoint when there is a more recent
        savepoint.

        :param prefer_checkpoint_for_recovery: ``True`` if a job recovery should fallback to
                                               checkpoint, false otherwise.
        """
        j_config = self._j_checkpoint_config
        j_config.setPreferCheckpointForRecovery(prefer_checkpoint_for_recovery)

    def get_externalized_checkpoint_cleanup(self):
        """
        Returns the cleanup behaviour configured for externalized checkpoints.

        :return: The cleanup behaviour for externalized checkpoints or ``None`` if none is
                 configured.
        """
        return ExternalizedCheckpointCleanup._from_j_externalized_checkpoint_cleanup(
            self._j_checkpoint_config.getExternalizedCheckpointCleanup())
class ExternalizedCheckpointCleanup(object):
    """
    Cleanup behaviour for externalized checkpoints when the job is cancelled.

    :data:`DELETE_ON_CANCELLATION`:

    Delete externalized checkpoints on job cancellation.

    All checkpoint state will be deleted when you cancel the owning
    job, both the meta data and actual program state. Therefore, you
    cannot resume from externalized checkpoints after the job has been
    cancelled.

    Note that checkpoint state is always kept if the job terminates
    with state ``FAILED``.

    :data:`RETAIN_ON_CANCELLATION`:

    Retain externalized checkpoints on job cancellation.

    All checkpoint state is kept when you cancel the owning job. You
    have to manually delete both the checkpoint meta data and actual
    program state after cancelling the job.

    Note that checkpoint state is always kept if the job terminates
    with state ``FAILED``.
    """

    DELETE_ON_CANCELLATION = 0

    RETAIN_ON_CANCELLATION = 1

    @staticmethod
    def _from_j_externalized_checkpoint_cleanup(j_cleanup_mode):
        """
        Converts a Java ``ExternalizedCheckpointCleanup`` value into the matching Python constant.

        :param j_cleanup_mode: The Java cleanup mode, or ``None`` if none is configured.
        :return: :data:`RETAIN_ON_CANCELLATION`, :data:`DELETE_ON_CANCELLATION`, or ``None`` when
                 ``j_cleanup_mode`` is ``None``.
        :raises Exception: If the Java value matches neither of the two known constants.
        """
        # Nothing to translate, so there is no need to reach into the JVM at all.
        if j_cleanup_mode is None:
            return None

        gateway = get_gateway()
        JExternalizedCheckpointCleanup = \
            gateway.jvm.org.apache.flink.streaming.api.environment.CheckpointConfig \
            .ExternalizedCheckpointCleanup
        if j_cleanup_mode == JExternalizedCheckpointCleanup.RETAIN_ON_CANCELLATION:
            return ExternalizedCheckpointCleanup.RETAIN_ON_CANCELLATION
        elif j_cleanup_mode == JExternalizedCheckpointCleanup.DELETE_ON_CANCELLATION:
            return ExternalizedCheckpointCleanup.DELETE_ON_CANCELLATION
        else:
            # One-element tuple keeps the formatting safe whatever the value's type is.
            raise Exception("Unsupported java externalized checkpoint cleanup mode: %s"
                            % (j_cleanup_mode,))

    @staticmethod
    def _to_j_externalized_checkpoint_cleanup(cleanup_mode):
        """
        Converts a Python cleanup mode constant into the matching Java
        ``ExternalizedCheckpointCleanup`` value.

        :param cleanup_mode: :data:`DELETE_ON_CANCELLATION` or :data:`RETAIN_ON_CANCELLATION`.
        :return: The corresponding Java enum constant.
        :raises TypeError: If ``cleanup_mode`` is neither of the two supported constants.
        """
        # Validate first so that an unsupported argument is rejected without touching the JVM.
        if cleanup_mode == ExternalizedCheckpointCleanup.DELETE_ON_CANCELLATION:
            j_constant_name = "DELETE_ON_CANCELLATION"
        elif cleanup_mode == ExternalizedCheckpointCleanup.RETAIN_ON_CANCELLATION:
            j_constant_name = "RETAIN_ON_CANCELLATION"
        else:
            # The one-element tuple keeps formatting correct even if cleanup_mode is a tuple;
            # the explicit space after "and" keeps the two constant names apart.
            raise TypeError("Unsupported cleanup mode: %s, supported cleanup modes are: "
                            "ExternalizedCheckpointCleanup.DELETE_ON_CANCELLATION and "
                            "ExternalizedCheckpointCleanup.RETAIN_ON_CANCELLATION."
                            % (cleanup_mode,))

        gateway = get_gateway()
        JExternalizedCheckpointCleanup = \
            gateway.jvm.org.apache.flink.streaming.api.environment.CheckpointConfig \
            .ExternalizedCheckpointCleanup
        return getattr(JExternalizedCheckpointCleanup, j_constant_name)