2026-01-24 12:55:17 +02:00

331 lines
8.8 KiB
Go

package process
import (
"bytes"
"context"
"fmt"
"os/exec"
"path/filepath"
"strings"
"text/template"
"time"
"github.com/DeBrosOfficial/network/pkg/deployments"
"go.uber.org/zap"
)
// Manager manages deployment processes via systemd
type Manager struct {
logger *zap.Logger
}
// NewManager creates a new process manager
func NewManager(logger *zap.Logger) *Manager {
return &Manager{
logger: logger,
}
}
// Start starts a deployment process
func (m *Manager) Start(ctx context.Context, deployment *deployments.Deployment, workDir string) error {
serviceName := m.getServiceName(deployment)
m.logger.Info("Starting deployment process",
zap.String("deployment", deployment.Name),
zap.String("namespace", deployment.Namespace),
zap.String("service", serviceName),
)
// Create systemd service file
if err := m.createSystemdService(deployment, workDir); err != nil {
return fmt.Errorf("failed to create systemd service: %w", err)
}
// Reload systemd
if err := m.systemdReload(); err != nil {
return fmt.Errorf("failed to reload systemd: %w", err)
}
// Enable service
if err := m.systemdEnable(serviceName); err != nil {
return fmt.Errorf("failed to enable service: %w", err)
}
// Start service
if err := m.systemdStart(serviceName); err != nil {
return fmt.Errorf("failed to start service: %w", err)
}
m.logger.Info("Deployment process started",
zap.String("deployment", deployment.Name),
zap.String("service", serviceName),
)
return nil
}
// Stop stops a deployment process
func (m *Manager) Stop(ctx context.Context, deployment *deployments.Deployment) error {
serviceName := m.getServiceName(deployment)
m.logger.Info("Stopping deployment process",
zap.String("deployment", deployment.Name),
zap.String("service", serviceName),
)
// Stop service
if err := m.systemdStop(serviceName); err != nil {
m.logger.Warn("Failed to stop service", zap.Error(err))
}
// Disable service
if err := m.systemdDisable(serviceName); err != nil {
m.logger.Warn("Failed to disable service", zap.Error(err))
}
// Remove service file using sudo
serviceFile := filepath.Join("/etc/systemd/system", serviceName+".service")
cmd := exec.Command("sudo", "rm", "-f", serviceFile)
if err := cmd.Run(); err != nil {
m.logger.Warn("Failed to remove service file", zap.Error(err))
}
// Reload systemd
m.systemdReload()
return nil
}
// Restart restarts a deployment process
func (m *Manager) Restart(ctx context.Context, deployment *deployments.Deployment) error {
serviceName := m.getServiceName(deployment)
m.logger.Info("Restarting deployment process",
zap.String("deployment", deployment.Name),
zap.String("service", serviceName),
)
return m.systemdRestart(serviceName)
}
// Status gets the status of a deployment process
func (m *Manager) Status(ctx context.Context, deployment *deployments.Deployment) (string, error) {
serviceName := m.getServiceName(deployment)
cmd := exec.CommandContext(ctx, "systemctl", "is-active", serviceName)
output, err := cmd.Output()
if err != nil {
return "unknown", err
}
return strings.TrimSpace(string(output)), nil
}
// GetLogs retrieves logs for a deployment
func (m *Manager) GetLogs(ctx context.Context, deployment *deployments.Deployment, lines int, follow bool) ([]byte, error) {
serviceName := m.getServiceName(deployment)
args := []string{"-u", serviceName, "--no-pager"}
if lines > 0 {
args = append(args, "-n", fmt.Sprintf("%d", lines))
}
if follow {
args = append(args, "-f")
}
cmd := exec.CommandContext(ctx, "journalctl", args...)
return cmd.Output()
}
// createSystemdService creates a systemd service file
func (m *Manager) createSystemdService(deployment *deployments.Deployment, workDir string) error {
serviceName := m.getServiceName(deployment)
serviceFile := filepath.Join("/etc/systemd/system", serviceName+".service")
// Determine the start command based on deployment type
startCmd := m.getStartCommand(deployment, workDir)
// Build environment variables
envVars := make([]string, 0)
envVars = append(envVars, fmt.Sprintf("PORT=%d", deployment.Port))
for key, value := range deployment.Environment {
envVars = append(envVars, fmt.Sprintf("%s=%s", key, value))
}
// Create service from template
tmpl := `[Unit]
Description=Orama Deployment - {{.Namespace}}/{{.Name}}
After=network.target
[Service]
Type=simple
User=debros
Group=debros
WorkingDirectory={{.WorkDir}}
{{range .Env}}Environment="{{.}}"
{{end}}
ExecStart={{.StartCmd}}
Restart={{.RestartPolicy}}
RestartSec=5s
# Resource limits
MemoryLimit={{.MemoryLimitMB}}M
CPUQuota={{.CPULimitPercent}}%
# Security - minimal restrictions for deployments in home directory
PrivateTmp=true
ProtectSystem=full
ProtectHome=read-only
ReadWritePaths={{.WorkDir}}
StandardOutput=journal
StandardError=journal
SyslogIdentifier={{.ServiceName}}
[Install]
WantedBy=multi-user.target
`
t, err := template.New("service").Parse(tmpl)
if err != nil {
return err
}
data := struct {
Namespace string
Name string
ServiceName string
WorkDir string
StartCmd string
Env []string
RestartPolicy string
MemoryLimitMB int
CPULimitPercent int
}{
Namespace: deployment.Namespace,
Name: deployment.Name,
ServiceName: serviceName,
WorkDir: workDir,
StartCmd: startCmd,
Env: envVars,
RestartPolicy: m.mapRestartPolicy(deployment.RestartPolicy),
MemoryLimitMB: deployment.MemoryLimitMB,
CPULimitPercent: deployment.CPULimitPercent,
}
// Execute template to buffer
var buf bytes.Buffer
if err := t.Execute(&buf, data); err != nil {
return err
}
// Use sudo tee to write to systemd directory (debros user needs sudo access)
cmd := exec.Command("sudo", "tee", serviceFile)
cmd.Stdin = &buf
output, err := cmd.CombinedOutput()
if err != nil {
return fmt.Errorf("failed to write service file: %s: %w", string(output), err)
}
return nil
}
// getStartCommand determines the start command for a deployment
func (m *Manager) getStartCommand(deployment *deployments.Deployment, workDir string) string {
switch deployment.Type {
case deployments.DeploymentTypeNextJS:
// Next.js standalone output places server at .next/standalone/server.js
return "/usr/bin/node .next/standalone/server.js"
case deployments.DeploymentTypeNodeJSBackend:
// Check if ENTRY_POINT is set in environment
if entryPoint, ok := deployment.Environment["ENTRY_POINT"]; ok {
if entryPoint == "npm:start" {
return "/usr/bin/npm start"
}
return "/usr/bin/node " + entryPoint
}
return "/usr/bin/node index.js"
case deployments.DeploymentTypeGoBackend:
return filepath.Join(workDir, "app")
default:
return "echo 'Unknown deployment type'"
}
}
// mapRestartPolicy maps deployment restart policy to systemd restart policy
func (m *Manager) mapRestartPolicy(policy deployments.RestartPolicy) string {
switch policy {
case deployments.RestartPolicyAlways:
return "always"
case deployments.RestartPolicyOnFailure:
return "on-failure"
case deployments.RestartPolicyNever:
return "no"
default:
return "on-failure"
}
}
// getServiceName generates a systemd service name
func (m *Manager) getServiceName(deployment *deployments.Deployment) string {
// Sanitize namespace and name for service name
namespace := strings.ReplaceAll(deployment.Namespace, ".", "-")
name := strings.ReplaceAll(deployment.Name, ".", "-")
return fmt.Sprintf("orama-deploy-%s-%s", namespace, name)
}
// systemd helper methods (use sudo for non-root execution)
func (m *Manager) systemdReload() error {
cmd := exec.Command("sudo", "systemctl", "daemon-reload")
return cmd.Run()
}
func (m *Manager) systemdEnable(serviceName string) error {
cmd := exec.Command("sudo", "systemctl", "enable", serviceName)
return cmd.Run()
}
func (m *Manager) systemdDisable(serviceName string) error {
cmd := exec.Command("sudo", "systemctl", "disable", serviceName)
return cmd.Run()
}
func (m *Manager) systemdStart(serviceName string) error {
cmd := exec.Command("sudo", "systemctl", "start", serviceName)
return cmd.Run()
}
func (m *Manager) systemdStop(serviceName string) error {
cmd := exec.Command("sudo", "systemctl", "stop", serviceName)
return cmd.Run()
}
func (m *Manager) systemdRestart(serviceName string) error {
cmd := exec.Command("sudo", "systemctl", "restart", serviceName)
return cmd.Run()
}
// WaitForHealthy waits for a deployment to become healthy
func (m *Manager) WaitForHealthy(ctx context.Context, deployment *deployments.Deployment, timeout time.Duration) error {
deadline := time.Now().Add(timeout)
for time.Now().Before(deadline) {
status, err := m.Status(ctx, deployment)
if err == nil && status == "active" {
return nil
}
select {
case <-ctx.Done():
return ctx.Err()
case <-time.After(2 * time.Second):
// Continue checking
}
}
return fmt.Errorf("deployment did not become healthy within %v", timeout)
}