takahe/stator/runner.py

import datetime
import os
import signal
import time
import traceback
import uuid
from concurrent.futures import Future, ThreadPoolExecutor

from django.conf import settings
from django.db import close_old_connections
from django.utils import timezone

from core import exceptions, sentry
from core.models import Config
from stator.models import StatorModel, Stats


class LoopingTimer:
    """
    Triggers check() to be true once every `interval`.
    """

    next_run: float | None = None

    def __init__(self, interval: float, trigger_at_start=True):
        self.interval = interval
        self.trigger_at_start = trigger_at_start

    def check(self) -> bool:
        # See if it's our first time being called
        if self.next_run is None:
            # Set up the next call based on trigger_at_start
            if self.trigger_at_start:
                self.next_run = time.monotonic()
            else:
                self.next_run = time.monotonic() + self.interval
        # See if it's time to run the next call
        if time.monotonic() >= self.next_run:
            self.next_run = time.monotonic() + self.interval
            return True
        return False


class StatorRunner:
    """
    Runs tasks on models that are looking for state changes.
    Designed to run either indefinitely, or just for a few seconds.
    """

    def __init__(
        self,
        models: list[type[StatorModel]],
        concurrency: int = getattr(settings, "STATOR_CONCURRENCY", 30),
        concurrency_per_model: int = getattr(
            settings, "STATOR_CONCURRENCY_PER_MODEL", 15
        ),
        liveness_file: str | None = None,
        schedule_interval: int = 60,
        delete_interval: int = 30,
        lock_expiry: int = 300,
        run_for: int = 0,
    ):
        self.models = models
        self.runner_id = uuid.uuid4().hex
        self.concurrency = concurrency
        self.concurrency_per_model = concurrency_per_model
        self.liveness_file = liveness_file
        self.schedule_interval = schedule_interval
        self.delete_interval = delete_interval
        self.lock_expiry = lock_expiry
        self.run_for = run_for
        self.minimum_loop_delay = 0.5
        self.maximum_loop_delay = 5
        self.tasks: dict[tuple[str, str], Future] = {}
        # Set up SIGALRM handler
        signal.signal(signal.SIGALRM, self.alarm_handler)

    def run(self):
        sentry.set_takahe_app("stator")
        self.handled = {}
        self.started = time.monotonic()
        self.executor = ThreadPoolExecutor(max_workers=self.concurrency)
        self.loop_delay = self.minimum_loop_delay
        self.scheduling_timer = LoopingTimer(self.schedule_interval)
        self.deletion_timer = LoopingTimer(self.delete_interval)
        # For the first time period, launch tasks
        print("Running main task loop")
        try:
            with sentry.configure_scope() as scope:
                while True:
                    # See if we need to run cleaning
                    if self.scheduling_timer.check():
                        # Set up the watchdog timer (each time we do this the previous one is cancelled)
                        signal.alarm(self.schedule_interval * 2)
                        # Write liveness file if configured
                        if self.liveness_file:
                            with open(self.liveness_file, "w") as fh:
                                fh.write(str(int(time.time())))
                        # Refresh the config
                        self.load_config()
                        # Do scheduling (stale lock deletion and stats gathering)
                        self.run_scheduling()

                    # Clear the cleaning breadcrumbs/extra for the main part of the loop
                    sentry.scope_clear(scope)

                    self.clean_tasks()

                    # See if we need to add deletion tasks
                    if self.deletion_timer.check():
                        self.add_deletion_tasks()

                    # Fetch and run any new handlers we can fit
                    self.add_transition_tasks()

                    # Are we in limited run mode?
                    if (
                        self.run_for
                        and (time.monotonic() - self.started) > self.run_for
                    ):
                        break

                    # Prevent busylooping, but also back off delay if we have
                    # no tasks
                    if self.tasks:
                        self.loop_delay = self.minimum_loop_delay
                    else:
                        self.loop_delay = min(
                            self.loop_delay * 1.5,
                            self.maximum_loop_delay,
                        )
                    time.sleep(self.loop_delay)

                    # Clear the Sentry breadcrumbs and extra for next loop
                    sentry.scope_clear(scope)
        except KeyboardInterrupt:
            pass

        # Wait for tasks to finish
        print("Waiting for tasks to complete")
        self.executor.shutdown()

        # We're done
        print("Complete")

    def alarm_handler(self, signum, frame):
        """
        Called when SIGALRM fires, which means we missed a schedule loop.
        Just exit as we're likely deadlocked.
        """
        print("Watchdog timeout exceeded")
        os._exit(2)

    def load_config(self):
        """
        Refreshes config from the DB
        """
        Config.system = Config.load_system()

    def run_scheduling(self):
        """
        Deletes stale locks for models, and submits their stats.
        """
        with sentry.start_transaction(op="task", name="stator.run_scheduling"):
            for model in self.models:
                num = self.handled.get(model._meta.label_lower, 0)
                if num or settings.DEBUG:
                    print(f"{model._meta.label_lower}: Scheduling ({num} handled)")
                self.submit_stats(model)
                model.transition_clean_locks()

    def submit_stats(self, model: type[StatorModel]):
        """
        Pop some statistics into the database from our local info for the given model
        """
        stats_instance = Stats.get_for_model(model)
        if stats_instance.model_label in self.handled:
            stats_instance.add_handled(self.handled[stats_instance.model_label])
            del self.handled[stats_instance.model_label]
        stats_instance.set_queued(model.transition_ready_count())
        stats_instance.trim_data()
        stats_instance.save()

    def add_transition_tasks(self, call_inline=False):
        """
        Adds a transition thread for as many instances as we can, given capacity
        and batch size limits.
        """
        # Calculate space left for tasks
        space_remaining = self.concurrency - len(self.tasks)
        # Fetch new tasks
        for model in self.models:
            if space_remaining > 0:
                for instance in model.transition_get_with_lock(
                    number=min(space_remaining, self.concurrency_per_model),
                    lock_expiry=(
                        timezone.now() + datetime.timedelta(seconds=self.lock_expiry)
                    ),
                ):
                    key = (model._meta.label_lower, instance.pk)
                    # Don't run two threads for the same thing
                    if key in self.tasks:
                        continue
                    if call_inline:
                        task_transition(instance, in_thread=False)
                    else:
                        self.tasks[key] = self.executor.submit(
                            task_transition, instance
                        )
                    self.handled[model._meta.label_lower] = (
                        self.handled.get(model._meta.label_lower, 0) + 1
                    )
                    space_remaining -= 1

    def add_deletion_tasks(self, call_inline=False):
        """
        Adds a deletion thread for each model
        """
        # Yes, this potentially goes over the capacity limit - it's fine.
        for model in self.models:
            if model.state_graph.deletion_states:
                if call_inline:
                    task_deletion(model, in_thread=False)
                else:
                    self.tasks[
                        model._meta.label_lower, "__delete__"
                    ] = self.executor.submit(task_deletion, model)

    def clean_tasks(self):
        """
        Removes any tasks that are done and handles exceptions if they
        raised them.
        """
        for key, task in list(self.tasks.items()):
            if task.done():
                del self.tasks[key]
                try:
                    task.result()
                except BaseException as e:
                    exceptions.capture_exception(e)
                    traceback.print_exc()

    def run_single_cycle(self):
        """
        Testing entrypoint to advance things just one cycle, and allow errors
        to propagate out.
        """
        self.add_deletion_tasks(call_inline=True)
        self.add_transition_tasks(call_inline=True)


def task_transition(instance: StatorModel, in_thread: bool = True):
    """
    Runs one state transition/action.
    """
    task_name = f"stator.task_transition:{instance._meta.label_lower}#{{id}} from {instance.state}"
    started = time.monotonic()
    with sentry.start_transaction(op="task", name=task_name):
        sentry.set_context(
            "instance",
            {
                "model": instance._meta.label_lower,
                "pk": instance.pk,
                "state": instance.state,
                "state_age": instance.state_age,
            },
        )
        result = instance.transition_attempt()
        duration = time.monotonic() - started
        if result:
            print(
                f"{instance._meta.label_lower}: {instance.pk}: {instance.state} -> {result} ({duration:.2f}s)"
            )
        else:
            print(
                f"{instance._meta.label_lower}: {instance.pk}: {instance.state} unchanged  ({duration:.2f}s)"
            )
    if in_thread:
        close_old_connections()


def task_deletion(model: type[StatorModel], in_thread: bool = True):
    """
    Runs one model deletion set.
    """
    # Loop, running deletions every second, until there are no more to do
    while True:
        deleted = model.transition_delete_due()
        if not deleted:
            break
        print(f"{model._meta.label_lower}: Deleted {deleted} stale items")
        time.sleep(1)
    if in_thread:
        close_old_connections()
Midway point in task refactor - changing direction 2022-11-08 22:06:29 -08:00			`import datetime`
Add watchdog to prevent stator freezing Refs #424 2023-01-16 10:15:28 -08:00			`import os`
			`import signal`
Midway point in task refactor - changing direction 2022-11-08 22:06:29 -08:00			`import time`
Profile fetching now working on state machine 2022-11-09 22:48:31 -08:00			`import traceback`
Midway point in task refactor - changing direction 2022-11-08 22:06:29 -08:00			`import uuid`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`from concurrent.futures import Future, ThreadPoolExecutor`
Midway point in task refactor - changing direction 2022-11-08 22:06:29 -08:00
Allow tuning of stator concurrency 2022-12-20 00:02:35 -08:00			`from django.conf import settings`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`from django.db import close_old_connections`
Midway point in task refactor - changing direction 2022-11-08 22:06:29 -08:00			`from django.utils import timezone`

[WIP] Sentry improvements (#108) Stator clears scope during the main loop to behave more like transactions. Transaction names are set. Sentry tags: * 'takahe.version' * 'takahe.app' values 'web' or 'stator' Added settings: * TAKAHE_SENTRY_SAMPLE_RATE * TAKAHE_SENTRY_TRACES_SAMPLE_RATE 2022-12-04 17:08:23 -08:00			`from core import exceptions, sentry`
StatorRunner will refresh Config.system on each schedule_interval 2022-11-22 20:06:21 -08:00			`from core.models import Config`
Stator stats overhaul Removes the error table, adds a stats table and admin page. Fixes #166 2022-12-15 11:26:17 -08:00			`from stator.models import StatorModel, Stats`
Midway point in task refactor - changing direction 2022-11-08 22:06:29 -08:00

Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`class LoopingTimer:`
Rework stator to avoid deadlocks on slow databases Refs #424 2023-02-03 20:51:24 -08:00			`"""`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			Triggers check() to be true once every `interval`.
Rework stator to avoid deadlocks on slow databases Refs #424 2023-02-03 20:51:24 -08:00			`"""`

Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`next_run: float \| None = None`
Rework stator to avoid deadlocks on slow databases Refs #424 2023-02-03 20:51:24 -08:00
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`def __init__(self, interval: float, trigger_at_start=True):`
			`self.interval = interval`
			`self.trigger_at_start = trigger_at_start`

			`def check(self) -> bool:`
			`# See if it's our first time being called`
			`if self.next_run is None:`
			`# Set up the next call based on trigger_at_start`
			`if self.trigger_at_start:`
			`self.next_run = time.monotonic()`
Rework stator to avoid deadlocks on slow databases Refs #424 2023-02-03 20:51:24 -08:00			`else:`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`self.next_run = time.monotonic() + self.interval`
			`# See if it's time to run the next call`
			`if time.monotonic() >= self.next_run:`
			`self.next_run = time.monotonic() + self.interval`
			`return True`
			`return False`
Rework stator to avoid deadlocks on slow databases Refs #424 2023-02-03 20:51:24 -08:00

Midway point in task refactor - changing direction 2022-11-08 22:06:29 -08:00			`class StatorRunner:`
			`"""`
			`Runs tasks on models that are looking for state changes.`
Delete mechanics and refactor of post fanout 2022-11-24 16:11:04 -08:00			`Designed to run either indefinitely, or just for a few seconds.`
Midway point in task refactor - changing direction 2022-11-08 22:06:29 -08:00			`"""`

Boosting! Incoming, anyway. 2022-11-13 17:42:47 -08:00			`def __init__(`
			`self,`
Add pyupgrade with --py310-plus in pre-commit (#103) 2022-12-05 09:38:37 -08:00			`models: list[type[StatorModel]],`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`concurrency: int = getattr(settings, "STATOR_CONCURRENCY", 30),`
Allow tuning of stator concurrency 2022-12-20 00:02:35 -08:00			`concurrency_per_model: int = getattr(`
Rework stator to avoid deadlocks on slow databases Refs #424 2023-02-03 20:51:24 -08:00			`settings, "STATOR_CONCURRENCY_PER_MODEL", 15`
Allow tuning of stator concurrency 2022-12-20 00:02:35 -08:00			`),`
Add pyupgrade with --py310-plus in pre-commit (#103) 2022-12-05 09:38:37 -08:00			`liveness_file: str \| None = None,`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`schedule_interval: int = 60,`
			`delete_interval: int = 30,`
A few more tweaks for an initial deploy 2022-11-19 09:20:13 -08:00			`lock_expiry: int = 300,`
The glorious return of the in-view runner 2022-11-26 10:54:14 -08:00			`run_for: int = 0,`
Boosting! Incoming, anyway. 2022-11-13 17:42:47 -08:00			`):`
Midway point in task refactor - changing direction 2022-11-08 22:06:29 -08:00			`self.models = models`
			`self.runner_id = uuid.uuid4().hex`
Boosting! Incoming, anyway. 2022-11-13 17:42:47 -08:00			`self.concurrency = concurrency`
			`self.concurrency_per_model = concurrency_per_model`
A few more tweaks for an initial deploy 2022-11-19 09:20:13 -08:00			`self.liveness_file = liveness_file`
			`self.schedule_interval = schedule_interval`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`self.delete_interval = delete_interval`
A few more tweaks for an initial deploy 2022-11-19 09:20:13 -08:00			`self.lock_expiry = lock_expiry`
The glorious return of the in-view runner 2022-11-26 10:54:14 -08:00			`self.run_for = run_for`
Back off Stator loop delay when there's no tasks Fixes #232 2022-12-21 21:03:41 -08:00			`self.minimum_loop_delay = 0.5`
			`self.maximum_loop_delay = 5`
Prevent race condition between threads and locking 2023-07-08 23:42:56 -07:00			`self.tasks: dict[tuple[str, str], Future] = {}`
Add watchdog to prevent stator freezing Refs #424 2023-01-16 10:15:28 -08:00			`# Set up SIGALRM handler`
			`signal.signal(signal.SIGALRM, self.alarm_handler)`
Midway point in task refactor - changing direction 2022-11-08 22:06:29 -08:00
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`def run(self):`
[WIP] Sentry improvements (#108) Stator clears scope during the main loop to behave more like transactions. Transaction names are set. Sentry tags: * 'takahe.version' * 'takahe.app' values 'web' or 'stator' Added settings: * TAKAHE_SENTRY_SAMPLE_RATE * TAKAHE_SENTRY_TRACES_SAMPLE_RATE 2022-12-04 17:08:23 -08:00			`sentry.set_takahe_app("stator")`
Stator stats overhaul Removes the error table, adds a stats table and admin page. Fixes #166 2022-12-15 11:26:17 -08:00			`self.handled = {}`
The glorious return of the in-view runner 2022-11-26 10:54:14 -08:00			`self.started = time.monotonic()`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`self.executor = ThreadPoolExecutor(max_workers=self.concurrency)`
Back off Stator loop delay when there's no tasks Fixes #232 2022-12-21 21:03:41 -08:00			`self.loop_delay = self.minimum_loop_delay`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`self.scheduling_timer = LoopingTimer(self.schedule_interval)`
			`self.deletion_timer = LoopingTimer(self.delete_interval)`
Midway point in task refactor - changing direction 2022-11-08 22:06:29 -08:00			`# For the first time period, launch tasks`
Most of the way through the stator refactor 2022-11-09 21:29:33 -08:00			`print("Running main task loop")`
A few more tweaks for an initial deploy 2022-11-19 09:20:13 -08:00			`try:`
[WIP] Sentry improvements (#108) Stator clears scope during the main loop to behave more like transactions. Transaction names are set. Sentry tags: * 'takahe.version' * 'takahe.app' values 'web' or 'stator' Added settings: * TAKAHE_SENTRY_SAMPLE_RATE * TAKAHE_SENTRY_TRACES_SAMPLE_RATE 2022-12-04 17:08:23 -08:00			`with sentry.configure_scope() as scope:`
			`while True:`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`# See if we need to run cleaning`
			`if self.scheduling_timer.check():`
			`# Set up the watchdog timer (each time we do this the previous one is cancelled)`
Add watchdog to prevent stator freezing Refs #424 2023-01-16 10:15:28 -08:00			`signal.alarm(self.schedule_interval * 2)`
Actually implement the liveness file 2022-12-31 10:54:51 -08:00			`# Write liveness file if configured`
			`if self.liveness_file:`
			`with open(self.liveness_file, "w") as fh:`
			`fh.write(str(int(time.time())))`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`# Refresh the config`
			`self.load_config()`
			`# Do scheduling (stale lock deletion and stats gathering)`
			`self.run_scheduling()`
Post editing 2022-11-27 10:09:46 -08:00
[WIP] Sentry improvements (#108) Stator clears scope during the main loop to behave more like transactions. Transaction names are set. Sentry tags: * 'takahe.version' * 'takahe.app' values 'web' or 'stator' Added settings: * TAKAHE_SENTRY_SAMPLE_RATE * TAKAHE_SENTRY_TRACES_SAMPLE_RATE 2022-12-04 17:08:23 -08:00			`# Clear the cleaning breadcrumbs/extra for the main part of the loop`
			`sentry.scope_clear(scope)`
Post editing 2022-11-27 10:09:46 -08:00
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`self.clean_tasks()`

			`# See if we need to add deletion tasks`
			`if self.deletion_timer.check():`
			`self.add_deletion_tasks()`
Rework stator to avoid deadlocks on slow databases Refs #424 2023-02-03 20:51:24 -08:00
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`# Fetch and run any new handlers we can fit`
			`self.add_transition_tasks()`
[WIP] Sentry improvements (#108) Stator clears scope during the main loop to behave more like transactions. Transaction names are set. Sentry tags: * 'takahe.version' * 'takahe.app' values 'web' or 'stator' Added settings: * TAKAHE_SENTRY_SAMPLE_RATE * TAKAHE_SENTRY_TRACES_SAMPLE_RATE 2022-12-04 17:08:23 -08:00
			`# Are we in limited run mode?`
			`if (`
			`self.run_for`
			`and (time.monotonic() - self.started) > self.run_for`
			`):`
			`break`
Back off Stator loop delay when there's no tasks Fixes #232 2022-12-21 21:03:41 -08:00
			`# Prevent busylooping, but also back off delay if we have`
			`# no tasks`
			`if self.tasks:`
			`self.loop_delay = self.minimum_loop_delay`
			`else:`
			`self.loop_delay = min(`
			`self.loop_delay * 1.5,`
			`self.maximum_loop_delay,`
			`)`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`time.sleep(self.loop_delay)`
Back off Stator loop delay when there's no tasks Fixes #232 2022-12-21 21:03:41 -08:00
[WIP] Sentry improvements (#108) Stator clears scope during the main loop to behave more like transactions. Transaction names are set. Sentry tags: * 'takahe.version' * 'takahe.app' values 'web' or 'stator' Added settings: * TAKAHE_SENTRY_SAMPLE_RATE * TAKAHE_SENTRY_TRACES_SAMPLE_RATE 2022-12-04 17:08:23 -08:00			`# Clear the Sentry breadcrumbs and extra for next loop`
			`sentry.scope_clear(scope)`
The glorious return of the in-view runner 2022-11-26 10:54:14 -08:00			`except KeyboardInterrupt:`
			`pass`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00
The glorious return of the in-view runner 2022-11-26 10:54:14 -08:00			`# Wait for tasks to finish`
			`print("Waiting for tasks to complete")`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`self.executor.shutdown()`

			`# We're done`
Most of the way through the stator refactor 2022-11-09 21:29:33 -08:00			`print("Complete")`
Midway point in task refactor - changing direction 2022-11-08 22:06:29 -08:00
Add watchdog to prevent stator freezing Refs #424 2023-01-16 10:15:28 -08:00			`def alarm_handler(self, signum, frame):`
			`"""`
			`Called when SIGALRM fires, which means we missed a schedule loop.`
			`Just exit as we're likely deadlocked.`
			`"""`
			`print("Watchdog timeout exceeded")`
			`os._exit(2)`

Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`def load_config(self):`
Rework stator to avoid deadlocks on slow databases Refs #424 2023-02-03 20:51:24 -08:00			`"""`
			`Refreshes config from the DB`
			`"""`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`Config.system = Config.load_system()`
Rework stator to avoid deadlocks on slow databases Refs #424 2023-02-03 20:51:24 -08:00
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`def run_scheduling(self):`
Post editing 2022-11-27 10:09:46 -08:00			`"""`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`Deletes stale locks for models, and submits their stats.`
Post editing 2022-11-27 10:09:46 -08:00			`"""`
[WIP] Sentry improvements (#108) Stator clears scope during the main loop to behave more like transactions. Transaction names are set. Sentry tags: * 'takahe.version' * 'takahe.app' values 'web' or 'stator' Added settings: * TAKAHE_SENTRY_SAMPLE_RATE * TAKAHE_SENTRY_TRACES_SAMPLE_RATE 2022-12-04 17:08:23 -08:00			`with sentry.start_transaction(op="task", name="stator.run_scheduling"):`
			`for model in self.models:`
Do not print "Scheduling 0 handled" unless settings.DEBUG is on (#636) 2023-08-23 05:12:21 -07:00			`num = self.handled.get(model._meta.label_lower, 0)`
			`if num or settings.DEBUG:`
			`print(f"{model._meta.label_lower}: Scheduling ({num} handled)")`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`self.submit_stats(model)`
			`model.transition_clean_locks()`
Post editing 2022-11-27 10:09:46 -08:00
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`def submit_stats(self, model: type[StatorModel]):`
Stator stats overhaul Removes the error table, adds a stats table and admin page. Fixes #166 2022-12-15 11:26:17 -08:00			`"""`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`Pop some statistics into the database from our local info for the given model`
Stator stats overhaul Removes the error table, adds a stats table and admin page. Fixes #166 2022-12-15 11:26:17 -08:00			`"""`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`stats_instance = Stats.get_for_model(model)`
Stator stats overhaul Removes the error table, adds a stats table and admin page. Fixes #166 2022-12-15 11:26:17 -08:00			`if stats_instance.model_label in self.handled:`
			`stats_instance.add_handled(self.handled[stats_instance.model_label])`
			`del self.handled[stats_instance.model_label]`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`stats_instance.set_queued(model.transition_ready_count())`
Stator stats overhaul Removes the error table, adds a stats table and admin page. Fixes #166 2022-12-15 11:26:17 -08:00			`stats_instance.trim_data()`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`stats_instance.save()`
Stator stats overhaul Removes the error table, adds a stats table and admin page. Fixes #166 2022-12-15 11:26:17 -08:00
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`def add_transition_tasks(self, call_inline=False):`
			`"""`
			`Adds a transition thread for as many instances as we can, given capacity`
			`and batch size limits.`
			`"""`
Post editing 2022-11-27 10:09:46 -08:00			`# Calculate space left for tasks`
			`space_remaining = self.concurrency - len(self.tasks)`
			`# Fetch new tasks`
			`for model in self.models:`
			`if space_remaining > 0:`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`for instance in model.transition_get_with_lock(`
Post editing 2022-11-27 10:09:46 -08:00			`number=min(space_remaining, self.concurrency_per_model),`
			`lock_expiry=(`
			`timezone.now() + datetime.timedelta(seconds=self.lock_expiry)`
			`),`
			`):`
Prevent race condition between threads and locking 2023-07-08 23:42:56 -07:00			`key = (model._meta.label_lower, instance.pk)`
			`# Don't run two threads for the same thing`
			`if key in self.tasks:`
			`continue`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`if call_inline:`
			`task_transition(instance, in_thread=False)`
			`else:`
Prevent race condition between threads and locking 2023-07-08 23:42:56 -07:00			`self.tasks[key] = self.executor.submit(`
			`task_transition, instance`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`)`
Stator stats overhaul Removes the error table, adds a stats table and admin page. Fixes #166 2022-12-15 11:26:17 -08:00			`self.handled[model._meta.label_lower] = (`
			`self.handled.get(model._meta.label_lower, 0) + 1`
			`)`
Post editing 2022-11-27 10:09:46 -08:00			`space_remaining -= 1`

Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`def add_deletion_tasks(self, call_inline=False):`
Profile fetching now working on state machine 2022-11-09 22:48:31 -08:00			`"""`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`Adds a deletion thread for each model`
Profile fetching now working on state machine 2022-11-09 22:48:31 -08:00			`"""`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`# Yes, this potentially goes over the capacity limit - it's fine.`
			`for model in self.models:`
			`if model.state_graph.deletion_states:`
			`if call_inline:`
			`task_deletion(model, in_thread=False)`
			`else:`
Prevent race condition between threads and locking 2023-07-08 23:42:56 -07:00			`self.tasks[`
			`model._meta.label_lower, "__delete__"`
			`] = self.executor.submit(task_deletion, model)`
Profile fetching now working on state machine 2022-11-09 22:48:31 -08:00
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`def clean_tasks(self):`
Profile fetching now working on state machine 2022-11-09 22:48:31 -08:00			`"""`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`Removes any tasks that are done and handles exceptions if they`
			`raised them.`
Profile fetching now working on state machine 2022-11-09 22:48:31 -08:00			`"""`
Prevent race condition between threads and locking 2023-07-08 23:42:56 -07:00			`for key, task in list(self.tasks.items()):`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`if task.done():`
Prevent race condition between threads and locking 2023-07-08 23:42:56 -07:00			`del self.tasks[key]`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`try:`
			`task.result()`
			`except BaseException as e:`
			`exceptions.capture_exception(e)`
			`traceback.print_exc()`
Policy pages and signup tests. Fixes #113 2022-12-05 18:21:00 -08:00
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`def run_single_cycle(self):`
Policy pages and signup tests. Fixes #113 2022-12-05 18:21:00 -08:00			`"""`
Handle deletions of post URIs Fixes #306 2022-12-28 21:47:28 -08:00			`Testing entrypoint to advance things just one cycle, and allow errors`
			`to propagate out.`
Policy pages and signup tests. Fixes #113 2022-12-05 18:21:00 -08:00			`"""`
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`self.add_deletion_tasks(call_inline=True)`
			`self.add_transition_tasks(call_inline=True)`


			`def task_transition(instance: StatorModel, in_thread: bool = True):`
			`"""`
			`Runs one state transition/action.`
			`"""`
			`task_name = f"stator.task_transition:{instance._meta.label_lower}#{{id}} from {instance.state}"`
			`started = time.monotonic()`
			`with sentry.start_transaction(op="task", name=task_name):`
			`sentry.set_context(`
			`"instance",`
			`{`
			`"model": instance._meta.label_lower,`
			`"pk": instance.pk,`
			`"state": instance.state,`
			`"state_age": instance.state_age,`
			`},`
			`)`
			`result = instance.transition_attempt()`
			`duration = time.monotonic() - started`
			`if result:`
			`print(`
			`f"{instance._meta.label_lower}: {instance.pk}: {instance.state} -> {result} ({duration:.2f}s)"`
			`)`
			`else:`
			`print(`
			`f"{instance._meta.label_lower}: {instance.pk}: {instance.state} unchanged ({duration:.2f}s)"`
			`)`
			`if in_thread:`
			`close_old_connections()`

Policy pages and signup tests. Fixes #113 2022-12-05 18:21:00 -08:00
Rework Stator to use a next field and no async 2023-07-07 14:14:06 -07:00			`def task_deletion(model: type[StatorModel], in_thread: bool = True):`
			`"""`
			`Runs one model deletion set.`
			`"""`
			`# Loop, running deletions every second, until there are no more to do`
			`while True:`
			`deleted = model.transition_delete_due()`
			`if not deleted:`
			`break`
			`print(f"{model._meta.label_lower}: Deleted {deleted} stale items")`
			`time.sleep(1)`
			`if in_thread:`
			`close_old_connections()`