mirror of
https://github.com/Significant-Gravitas/AutoGPT.git
synced 2026-04-08 03:00:28 -04:00
There is no 100% accurate way of retrying an agent that has been terminated. And the safest way to avoid executing an agent wrong is minimizing the chance of an agent execution being terminated. A whole set of mechanism to make sure the agent is retried on failure is still in place and improved, this is used as our best-effort reliability mechanism. ### Changes 🏗️ * Cap SIGINT & SIGTERM to be raised at most once, so the executor can gracefully handle the stopping. * SIGINT & SIGTERM will stop the execution request message consumption, but not agent execution. * Executor process will only stop if all the in-flight agent executions are completed or terminated. * Avoid retrying the agent stop command on AgentExecutorBlock on timeout. ### Checklist 📋 #### For code changes: - [x] I have clearly listed my changes in the PR description - [x] I have made a test plan - [x] I have tested my changes according to the test plan: <!-- Put your test plan here: --> - [x] Run agent, send SIGTERM to the executor pod, execution should not be interrupted. - [x] Run agent, send SIGKILL to the executor pod, execution should be transferred to another pod.
57 lines
1.5 KiB
Python
57 lines
1.5 KiB
Python
import logging
|
|
from typing import TYPE_CHECKING
|
|
|
|
from dotenv import load_dotenv
|
|
|
|
load_dotenv()
|
|
|
|
if TYPE_CHECKING:
|
|
from backend.util.process import AppProcess
|
|
|
|
logger = logging.getLogger(__name__)
|
|
|
|
|
|
def run_processes(*processes: "AppProcess", **kwargs):
|
|
"""
|
|
Execute all processes in the app. The last process is run in the foreground.
|
|
Includes enhanced error handling and process lifecycle management.
|
|
"""
|
|
try:
|
|
# Run all processes except the last one in the background.
|
|
for process in processes[:-1]:
|
|
process.start(background=True, **kwargs)
|
|
|
|
# Run the last process in the foreground.
|
|
processes[-1].start(background=False, **kwargs)
|
|
finally:
|
|
for process in processes:
|
|
try:
|
|
process.stop()
|
|
except Exception as e:
|
|
logger.exception(f"[{process.service_name}] unable to stop: {e}")
|
|
|
|
|
|
def main(**kwargs):
|
|
"""
|
|
Run all the processes required for the AutoGPT-server (REST and WebSocket APIs).
|
|
"""
|
|
|
|
from backend.executor import DatabaseManager, ExecutionManager, Scheduler
|
|
from backend.notifications import NotificationManager
|
|
from backend.server.rest_api import AgentServer
|
|
from backend.server.ws_api import WebsocketServer
|
|
|
|
run_processes(
|
|
DatabaseManager().set_log_level("warning"),
|
|
Scheduler(),
|
|
NotificationManager(),
|
|
WebsocketServer(),
|
|
AgentServer(),
|
|
ExecutionManager(),
|
|
**kwargs,
|
|
)
|
|
|
|
|
|
if __name__ == "__main__":
|
|
main()
|