Implement Docker command handling for Llama, MLX, and vLLM backends

2025-11-06 09:04:27 +00:00 · 2025-09-24 21:31:58 +02:00
parent 72d2a601c8
commit 76ac93bedc
4 changed files with 222 additions and 16 deletions
--- a/pkg/backends/vllm/vllm.go
+++ b/pkg/backends/vllm/vllm.go
@@ -1,6 +1,12 @@
 package vllm

 import (
+	"context"
+	"fmt"
+	"llamactl/pkg/config"
+	"os/exec"
+	"strings"
+
 	"llamactl/pkg/backends"
 )

@@ -160,6 +166,75 @@ func (o *VllmServerOptions) BuildCommandArgs() []string {
 	return args
 }

+// BuildCommandArgsWithDocker converts VllmServerOptions to command line arguments,
+// handling Docker transformations if needed
+func (o *VllmServerOptions) BuildCommandArgsWithDocker(dockerImage string) []string {
+	args := o.BuildCommandArgs()
+
+	// Handle vLLM Docker image quirk
+	if isVLLMDocker(dockerImage) {
+		args = transformVLLMArgs(args)
+	}
+
+	return args
+}
+
+// isVLLMDocker checks if the Docker image is a vLLM image
+func isVLLMDocker(image string) bool {
+	return strings.Contains(strings.ToLower(image), "vllm")
+}
+
+// transformVLLMArgs converts vLLM arguments for Docker execution
+// Convert: ["serve", "microsoft/DialoGPT-medium", "--flag", "value"]
+// To: ["--model", "microsoft/DialoGPT-medium", "--flag", "value"]
+func transformVLLMArgs(args []string) []string {
+	if len(args) >= 2 && args[0] == "serve" {
+		return append([]string{"--model", args[1]}, args[2:]...)
+	}
+	return args
+}
+
+// BuildCommand creates the complete command for execution, handling Docker vs native execution
+func (o *VllmServerOptions) BuildCommand(ctx context.Context, backendConfig *config.BackendSettings) (*exec.Cmd, error) {
+	// Build instance-specific arguments using backend functions
+	var instanceArgs []string
+	if backendConfig.Docker != nil && backendConfig.Docker.Enabled {
+		// Use Docker-aware argument building
+		instanceArgs = o.BuildCommandArgsWithDocker(backendConfig.Docker.Image)
+	} else {
+		// Use regular argument building for native execution
+		instanceArgs = o.BuildCommandArgs()
+	}
+
+	// Combine backend args with instance args
+	finalArgs := append(backendConfig.Args, instanceArgs...)
+
+	// Choose Docker vs Native execution
+	if backendConfig.Docker != nil && backendConfig.Docker.Enabled {
+		return buildDockerCommand(ctx, backendConfig, finalArgs)
+	} else {
+		return exec.CommandContext(ctx, backendConfig.Command, finalArgs...), nil
+	}
+}
+
+// buildDockerCommand builds a Docker command with the specified configuration and arguments
+func buildDockerCommand(ctx context.Context, backendConfig *config.BackendSettings, args []string) (*exec.Cmd, error) {
+	// Start with configured Docker arguments (should include "run", "--rm", etc.)
+	dockerArgs := make([]string, len(backendConfig.Docker.Args))
+	copy(dockerArgs, backendConfig.Docker.Args)
+
+	// Add environment variables
+	for key, value := range backendConfig.Docker.Environment {
+		dockerArgs = append(dockerArgs, "-e", fmt.Sprintf("%s=%s", key, value))
+	}
+
+	// Add image and container arguments
+	dockerArgs = append(dockerArgs, backendConfig.Docker.Image)
+	dockerArgs = append(dockerArgs, args...)
+
+	return exec.CommandContext(ctx, "docker", dockerArgs...), nil
+}
+
 // ParseVllmCommand parses a vLLM serve command string into VllmServerOptions
 // Supports multiple formats:
 // 1. Full command: "vllm serve --model MODEL_NAME --other-args"