mirror of
https://github.com/lordmathis/llamactl.git
synced 2025-11-06 09:04:27 +00:00
Compare commits
9 Commits
| Author | SHA1 | Date | |
|---|---|---|---|
| eb5abae173 | |||
| 696a2cb18b | |||
| e7402f0029 | |||
| 5c9a397746 | |||
| e97ca727d1 | |||
| 9f3c01384b | |||
| c5097e59be | |||
| cf20f304b3 | |||
| 72eba48b80 |
2
.gitignore
vendored
2
.gitignore
vendored
@@ -35,3 +35,5 @@ node_modules/
|
|||||||
dist/
|
dist/
|
||||||
|
|
||||||
__pycache__/
|
__pycache__/
|
||||||
|
|
||||||
|
site/
|
||||||
@@ -58,7 +58,7 @@ func main() {
|
|||||||
}
|
}
|
||||||
|
|
||||||
// Initialize the instance manager
|
// Initialize the instance manager
|
||||||
instanceManager := manager.NewInstanceManager(cfg.Backends, cfg.Instances, cfg.Nodes)
|
instanceManager := manager.NewInstanceManager(cfg.Backends, cfg.Instances, cfg.Nodes, cfg.LocalNode)
|
||||||
|
|
||||||
// Create a new handler with the instance manager
|
// Create a new handler with the instance manager
|
||||||
handler := server.NewHandler(instanceManager, cfg)
|
handler := server.NewHandler(instanceManager, cfg)
|
||||||
|
|||||||
60
docs/fix_line_endings.py
Normal file
60
docs/fix_line_endings.py
Normal file
@@ -0,0 +1,60 @@
|
|||||||
|
"""
|
||||||
|
MkDocs hook to fix line endings for proper rendering.
|
||||||
|
Automatically adds two spaces at the end of lines that need line breaks.
|
||||||
|
"""
|
||||||
|
import re
|
||||||
|
|
||||||
|
|
||||||
|
def on_page_markdown(markdown, page, config, **kwargs):
|
||||||
|
"""
|
||||||
|
Fix line endings in markdown content for proper MkDocs rendering.
|
||||||
|
Adds two spaces at the end of lines that need line breaks.
|
||||||
|
"""
|
||||||
|
lines = markdown.split('\n')
|
||||||
|
processed_lines = []
|
||||||
|
in_code_block = False
|
||||||
|
|
||||||
|
for i, line in enumerate(lines):
|
||||||
|
stripped = line.strip()
|
||||||
|
|
||||||
|
# Track code blocks
|
||||||
|
if stripped.startswith('```'):
|
||||||
|
in_code_block = not in_code_block
|
||||||
|
processed_lines.append(line)
|
||||||
|
continue
|
||||||
|
|
||||||
|
# Skip processing inside code blocks
|
||||||
|
if in_code_block:
|
||||||
|
processed_lines.append(line)
|
||||||
|
continue
|
||||||
|
|
||||||
|
# Skip empty lines
|
||||||
|
if not stripped:
|
||||||
|
processed_lines.append(line)
|
||||||
|
continue
|
||||||
|
|
||||||
|
# Skip lines that shouldn't have line breaks:
|
||||||
|
# - Headers (# ## ###)
|
||||||
|
# - Blockquotes (>)
|
||||||
|
# - Table rows (|)
|
||||||
|
# - Lines already ending with two spaces
|
||||||
|
# - YAML front matter and HTML tags
|
||||||
|
# - Standalone punctuation lines
|
||||||
|
if (stripped.startswith('#') or
|
||||||
|
stripped.startswith('>') or
|
||||||
|
'|' in stripped or
|
||||||
|
line.endswith(' ') or
|
||||||
|
stripped.startswith('---') or
|
||||||
|
stripped.startswith('<') or
|
||||||
|
stripped.endswith('>') or
|
||||||
|
stripped in ('.', '!', '?', ':', ';', '```', '---', ',')):
|
||||||
|
processed_lines.append(line)
|
||||||
|
continue
|
||||||
|
|
||||||
|
# Add two spaces to lines that end with regular text or most punctuation
|
||||||
|
if stripped and not in_code_block:
|
||||||
|
processed_lines.append(line.rstrip() + ' ')
|
||||||
|
else:
|
||||||
|
processed_lines.append(line)
|
||||||
|
|
||||||
|
return '\n'.join(processed_lines)
|
||||||
@@ -261,7 +261,7 @@ nodes: # Node configuration map
|
|||||||
```
|
```
|
||||||
|
|
||||||
**Node Configuration Fields:**
|
**Node Configuration Fields:**
|
||||||
- `local_node`: Specifies which node in the `nodes` map represents the local node
|
- `local_node`: Specifies which node in the `nodes` map represents the local node. Must match exactly what other nodes call this node.
|
||||||
- `nodes`: Map of node configurations
|
- `nodes`: Map of node configurations
|
||||||
- `address`: HTTP/HTTPS URL of the remote node (empty for local node)
|
- `address`: HTTP/HTTPS URL of the remote node (empty for local node)
|
||||||
- `api_key`: Management API key for authenticating with the remote node
|
- `api_key`: Management API key for authenticating with the remote node
|
||||||
|
|||||||
@@ -162,6 +162,7 @@ go build -o llamactl ./cmd/server
|
|||||||
For deployments with remote nodes:
|
For deployments with remote nodes:
|
||||||
- Install llamactl on each node using any of the methods above
|
- Install llamactl on each node using any of the methods above
|
||||||
- Configure API keys for authentication between nodes
|
- Configure API keys for authentication between nodes
|
||||||
|
- Ensure node names are consistent across all configurations
|
||||||
|
|
||||||
## Verification
|
## Verification
|
||||||
|
|
||||||
|
|||||||
@@ -143,7 +143,11 @@ This helps determine if the issue is with llamactl or with the underlying llama.
|
|||||||
api_key: "secure-key" # Must match worker1's management key
|
api_key: "secure-key" # Must match worker1's management key
|
||||||
```
|
```
|
||||||
|
|
||||||
2. **Test remote node connectivity:**
|
2. **Check node name consistency:**
|
||||||
|
- `local_node` on each node must match what other nodes call it
|
||||||
|
- Node names are case-sensitive
|
||||||
|
|
||||||
|
3. **Test remote node connectivity:**
|
||||||
```bash
|
```bash
|
||||||
curl -H "Authorization: Bearer remote-node-key" \
|
curl -H "Authorization: Bearer remote-node-key" \
|
||||||
http://remote-node:8080/api/v1/instances
|
http://remote-node:8080/api/v1/instances
|
||||||
|
|||||||
@@ -69,6 +69,7 @@ plugins:
|
|||||||
|
|
||||||
hooks:
|
hooks:
|
||||||
- docs/readme_sync.py
|
- docs/readme_sync.py
|
||||||
|
- docs/fix_line_endings.py
|
||||||
|
|
||||||
extra:
|
extra:
|
||||||
version:
|
version:
|
||||||
|
|||||||
@@ -35,6 +35,7 @@ type Process struct {
|
|||||||
options *CreateInstanceOptions `json:"-"`
|
options *CreateInstanceOptions `json:"-"`
|
||||||
globalInstanceSettings *config.InstancesConfig
|
globalInstanceSettings *config.InstancesConfig
|
||||||
globalBackendSettings *config.BackendConfig
|
globalBackendSettings *config.BackendConfig
|
||||||
|
localNodeName string `json:"-"` // Name of the local node for remote detection
|
||||||
|
|
||||||
// Status
|
// Status
|
||||||
Status InstanceStatus `json:"status"`
|
Status InstanceStatus `json:"status"`
|
||||||
@@ -66,7 +67,7 @@ type Process struct {
|
|||||||
}
|
}
|
||||||
|
|
||||||
// NewInstance creates a new instance with the given name, log path, and options
|
// NewInstance creates a new instance with the given name, log path, and options
|
||||||
func NewInstance(name string, globalBackendSettings *config.BackendConfig, globalInstanceSettings *config.InstancesConfig, options *CreateInstanceOptions, onStatusChange func(oldStatus, newStatus InstanceStatus)) *Process {
|
func NewInstance(name string, globalBackendSettings *config.BackendConfig, globalInstanceSettings *config.InstancesConfig, options *CreateInstanceOptions, localNodeName string, onStatusChange func(oldStatus, newStatus InstanceStatus)) *Process {
|
||||||
// Validate and copy options
|
// Validate and copy options
|
||||||
options.ValidateAndApplyDefaults(name, globalInstanceSettings)
|
options.ValidateAndApplyDefaults(name, globalInstanceSettings)
|
||||||
|
|
||||||
@@ -78,6 +79,7 @@ func NewInstance(name string, globalBackendSettings *config.BackendConfig, globa
|
|||||||
options: options,
|
options: options,
|
||||||
globalInstanceSettings: globalInstanceSettings,
|
globalInstanceSettings: globalInstanceSettings,
|
||||||
globalBackendSettings: globalBackendSettings,
|
globalBackendSettings: globalBackendSettings,
|
||||||
|
localNodeName: localNodeName,
|
||||||
logger: logger,
|
logger: logger,
|
||||||
timeProvider: realTimeProvider{},
|
timeProvider: realTimeProvider{},
|
||||||
Created: time.Now().Unix(),
|
Created: time.Now().Unix(),
|
||||||
@@ -145,6 +147,11 @@ func (i *Process) SetOptions(options *CreateInstanceOptions) {
|
|||||||
return
|
return
|
||||||
}
|
}
|
||||||
|
|
||||||
|
// Preserve the original nodes to prevent changing instance location
|
||||||
|
if i.options != nil && i.options.Nodes != nil {
|
||||||
|
options.Nodes = i.options.Nodes
|
||||||
|
}
|
||||||
|
|
||||||
// Validate and copy options
|
// Validate and copy options
|
||||||
options.ValidateAndApplyDefaults(i.Name, i.globalInstanceSettings)
|
options.ValidateAndApplyDefaults(i.Name, i.globalInstanceSettings)
|
||||||
|
|
||||||
@@ -172,7 +179,7 @@ func (i *Process) GetProxy() (*httputil.ReverseProxy, error) {
|
|||||||
}
|
}
|
||||||
|
|
||||||
// Remote instances should not use local proxy - they are handled by RemoteInstanceProxy
|
// Remote instances should not use local proxy - they are handled by RemoteInstanceProxy
|
||||||
if len(i.options.Nodes) > 0 {
|
if len(i.options.Nodes) > 0 && i.options.Nodes[0] != i.localNodeName {
|
||||||
return nil, fmt.Errorf("instance %s is a remote instance and should not use local proxy", i.Name)
|
return nil, fmt.Errorf("instance %s is a remote instance and should not use local proxy", i.Name)
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -309,5 +316,16 @@ func (i *Process) IsRemote() bool {
|
|||||||
return false
|
return false
|
||||||
}
|
}
|
||||||
|
|
||||||
return len(i.options.Nodes) > 0
|
// If no nodes specified, it's a local instance
|
||||||
|
if len(i.options.Nodes) == 0 {
|
||||||
|
return false
|
||||||
|
}
|
||||||
|
|
||||||
|
// If the first node is the local node, treat it as a local instance
|
||||||
|
if i.options.Nodes[0] == i.localNodeName {
|
||||||
|
return false
|
||||||
|
}
|
||||||
|
|
||||||
|
// Otherwise, it's a remote instance
|
||||||
|
return true
|
||||||
}
|
}
|
||||||
|
|||||||
@@ -44,7 +44,7 @@ func TestNewInstance(t *testing.T) {
|
|||||||
// Mock onStatusChange function
|
// Mock onStatusChange function
|
||||||
mockOnStatusChange := func(oldStatus, newStatus instance.InstanceStatus) {}
|
mockOnStatusChange := func(oldStatus, newStatus instance.InstanceStatus) {}
|
||||||
|
|
||||||
inst := instance.NewInstance("test-instance", backendConfig, globalSettings, options, mockOnStatusChange)
|
inst := instance.NewInstance("test-instance", backendConfig, globalSettings, options, "main", mockOnStatusChange)
|
||||||
|
|
||||||
if inst.Name != "test-instance" {
|
if inst.Name != "test-instance" {
|
||||||
t.Errorf("Expected name 'test-instance', got %q", inst.Name)
|
t.Errorf("Expected name 'test-instance', got %q", inst.Name)
|
||||||
@@ -115,7 +115,7 @@ func TestNewInstance_WithRestartOptions(t *testing.T) {
|
|||||||
// Mock onStatusChange function
|
// Mock onStatusChange function
|
||||||
mockOnStatusChange := func(oldStatus, newStatus instance.InstanceStatus) {}
|
mockOnStatusChange := func(oldStatus, newStatus instance.InstanceStatus) {}
|
||||||
|
|
||||||
instance := instance.NewInstance("test-instance", backendConfig, globalSettings, options, mockOnStatusChange)
|
instance := instance.NewInstance("test-instance", backendConfig, globalSettings, options, "main", mockOnStatusChange)
|
||||||
opts := instance.GetOptions()
|
opts := instance.GetOptions()
|
||||||
|
|
||||||
// Check that explicit values override defaults
|
// Check that explicit values override defaults
|
||||||
@@ -164,7 +164,7 @@ func TestSetOptions(t *testing.T) {
|
|||||||
// Mock onStatusChange function
|
// Mock onStatusChange function
|
||||||
mockOnStatusChange := func(oldStatus, newStatus instance.InstanceStatus) {}
|
mockOnStatusChange := func(oldStatus, newStatus instance.InstanceStatus) {}
|
||||||
|
|
||||||
inst := instance.NewInstance("test-instance", backendConfig, globalSettings, initialOptions, mockOnStatusChange)
|
inst := instance.NewInstance("test-instance", backendConfig, globalSettings, initialOptions, "main", mockOnStatusChange)
|
||||||
|
|
||||||
// Update options
|
// Update options
|
||||||
newOptions := &instance.CreateInstanceOptions{
|
newOptions := &instance.CreateInstanceOptions{
|
||||||
@@ -191,6 +191,58 @@ func TestSetOptions(t *testing.T) {
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
func TestSetOptions_PreservesNodes(t *testing.T) {
|
||||||
|
backendConfig := &config.BackendConfig{
|
||||||
|
LlamaCpp: config.BackendSettings{
|
||||||
|
Command: "llama-server",
|
||||||
|
Args: []string{},
|
||||||
|
},
|
||||||
|
}
|
||||||
|
|
||||||
|
globalSettings := &config.InstancesConfig{
|
||||||
|
LogsDir: "/tmp/test",
|
||||||
|
DefaultAutoRestart: true,
|
||||||
|
DefaultMaxRestarts: 3,
|
||||||
|
DefaultRestartDelay: 5,
|
||||||
|
}
|
||||||
|
|
||||||
|
// Create instance with initial nodes
|
||||||
|
initialOptions := &instance.CreateInstanceOptions{
|
||||||
|
BackendType: backends.BackendTypeLlamaCpp,
|
||||||
|
Nodes: []string{"worker1"},
|
||||||
|
LlamaServerOptions: &llamacpp.LlamaServerOptions{
|
||||||
|
Model: "/path/to/model.gguf",
|
||||||
|
Port: 8080,
|
||||||
|
},
|
||||||
|
}
|
||||||
|
|
||||||
|
mockOnStatusChange := func(oldStatus, newStatus instance.InstanceStatus) {}
|
||||||
|
inst := instance.NewInstance("test-instance", backendConfig, globalSettings, initialOptions, "main", mockOnStatusChange)
|
||||||
|
|
||||||
|
// Try to update with different nodes
|
||||||
|
updatedOptions := &instance.CreateInstanceOptions{
|
||||||
|
BackendType: backends.BackendTypeLlamaCpp,
|
||||||
|
Nodes: []string{"worker2"}, // Attempt to change node
|
||||||
|
LlamaServerOptions: &llamacpp.LlamaServerOptions{
|
||||||
|
Model: "/path/to/new-model.gguf",
|
||||||
|
Port: 8081,
|
||||||
|
},
|
||||||
|
}
|
||||||
|
|
||||||
|
inst.SetOptions(updatedOptions)
|
||||||
|
opts := inst.GetOptions()
|
||||||
|
|
||||||
|
// Nodes should remain unchanged
|
||||||
|
if len(opts.Nodes) != 1 || opts.Nodes[0] != "worker1" {
|
||||||
|
t.Errorf("Expected nodes to remain ['worker1'], got %v", opts.Nodes)
|
||||||
|
}
|
||||||
|
|
||||||
|
// Other options should be updated
|
||||||
|
if opts.LlamaServerOptions.Model != "/path/to/new-model.gguf" {
|
||||||
|
t.Errorf("Expected updated model '/path/to/new-model.gguf', got %q", opts.LlamaServerOptions.Model)
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
func TestGetProxy(t *testing.T) {
|
func TestGetProxy(t *testing.T) {
|
||||||
backendConfig := &config.BackendConfig{
|
backendConfig := &config.BackendConfig{
|
||||||
LlamaCpp: config.BackendSettings{
|
LlamaCpp: config.BackendSettings{
|
||||||
@@ -222,7 +274,7 @@ func TestGetProxy(t *testing.T) {
|
|||||||
// Mock onStatusChange function
|
// Mock onStatusChange function
|
||||||
mockOnStatusChange := func(oldStatus, newStatus instance.InstanceStatus) {}
|
mockOnStatusChange := func(oldStatus, newStatus instance.InstanceStatus) {}
|
||||||
|
|
||||||
inst := instance.NewInstance("test-instance", backendConfig, globalSettings, options, mockOnStatusChange)
|
inst := instance.NewInstance("test-instance", backendConfig, globalSettings, options, "main", mockOnStatusChange)
|
||||||
|
|
||||||
// Get proxy for the first time
|
// Get proxy for the first time
|
||||||
proxy1, err := inst.GetProxy()
|
proxy1, err := inst.GetProxy()
|
||||||
@@ -277,7 +329,7 @@ func TestMarshalJSON(t *testing.T) {
|
|||||||
// Mock onStatusChange function
|
// Mock onStatusChange function
|
||||||
mockOnStatusChange := func(oldStatus, newStatus instance.InstanceStatus) {}
|
mockOnStatusChange := func(oldStatus, newStatus instance.InstanceStatus) {}
|
||||||
|
|
||||||
instance := instance.NewInstance("test-instance", backendConfig, globalSettings, options, mockOnStatusChange)
|
instance := instance.NewInstance("test-instance", backendConfig, globalSettings, options, "main", mockOnStatusChange)
|
||||||
|
|
||||||
data, err := json.Marshal(instance)
|
data, err := json.Marshal(instance)
|
||||||
if err != nil {
|
if err != nil {
|
||||||
@@ -446,7 +498,7 @@ func TestCreateInstanceOptionsValidation(t *testing.T) {
|
|||||||
// Mock onStatusChange function
|
// Mock onStatusChange function
|
||||||
mockOnStatusChange := func(oldStatus, newStatus instance.InstanceStatus) {}
|
mockOnStatusChange := func(oldStatus, newStatus instance.InstanceStatus) {}
|
||||||
|
|
||||||
instance := instance.NewInstance("test", backendConfig, globalSettings, options, mockOnStatusChange)
|
instance := instance.NewInstance("test", backendConfig, globalSettings, options, "main", mockOnStatusChange)
|
||||||
opts := instance.GetOptions()
|
opts := instance.GetOptions()
|
||||||
|
|
||||||
if opts.MaxRestarts == nil {
|
if opts.MaxRestarts == nil {
|
||||||
|
|||||||
@@ -56,7 +56,7 @@ func TestUpdateLastRequestTime(t *testing.T) {
|
|||||||
// Mock onStatusChange function
|
// Mock onStatusChange function
|
||||||
mockOnStatusChange := func(oldStatus, newStatus instance.InstanceStatus) {}
|
mockOnStatusChange := func(oldStatus, newStatus instance.InstanceStatus) {}
|
||||||
|
|
||||||
inst := instance.NewInstance("test-instance", backendConfig, globalSettings, options, mockOnStatusChange)
|
inst := instance.NewInstance("test-instance", backendConfig, globalSettings, options, "main", mockOnStatusChange)
|
||||||
|
|
||||||
// Test that UpdateLastRequestTime doesn't panic
|
// Test that UpdateLastRequestTime doesn't panic
|
||||||
inst.UpdateLastRequestTime()
|
inst.UpdateLastRequestTime()
|
||||||
@@ -88,7 +88,7 @@ func TestShouldTimeout_NotRunning(t *testing.T) {
|
|||||||
// Mock onStatusChange function
|
// Mock onStatusChange function
|
||||||
mockOnStatusChange := func(oldStatus, newStatus instance.InstanceStatus) {}
|
mockOnStatusChange := func(oldStatus, newStatus instance.InstanceStatus) {}
|
||||||
|
|
||||||
inst := instance.NewInstance("test-instance", backendConfig, globalSettings, options, mockOnStatusChange)
|
inst := instance.NewInstance("test-instance", backendConfig, globalSettings, options, "main", mockOnStatusChange)
|
||||||
|
|
||||||
// Instance is not running, should not timeout regardless of configuration
|
// Instance is not running, should not timeout regardless of configuration
|
||||||
if inst.ShouldTimeout() {
|
if inst.ShouldTimeout() {
|
||||||
@@ -132,7 +132,7 @@ func TestShouldTimeout_NoTimeoutConfigured(t *testing.T) {
|
|||||||
},
|
},
|
||||||
}
|
}
|
||||||
|
|
||||||
inst := instance.NewInstance("test-instance", backendConfig, globalSettings, options, mockOnStatusChange)
|
inst := instance.NewInstance("test-instance", backendConfig, globalSettings, options, "main", mockOnStatusChange)
|
||||||
// Simulate running state
|
// Simulate running state
|
||||||
inst.SetStatus(instance.Running)
|
inst.SetStatus(instance.Running)
|
||||||
|
|
||||||
@@ -169,7 +169,7 @@ func TestShouldTimeout_WithinTimeLimit(t *testing.T) {
|
|||||||
// Mock onStatusChange function
|
// Mock onStatusChange function
|
||||||
mockOnStatusChange := func(oldStatus, newStatus instance.InstanceStatus) {}
|
mockOnStatusChange := func(oldStatus, newStatus instance.InstanceStatus) {}
|
||||||
|
|
||||||
inst := instance.NewInstance("test-instance", backendConfig, globalSettings, options, mockOnStatusChange)
|
inst := instance.NewInstance("test-instance", backendConfig, globalSettings, options, "main", mockOnStatusChange)
|
||||||
inst.SetStatus(instance.Running)
|
inst.SetStatus(instance.Running)
|
||||||
|
|
||||||
// Update last request time to now
|
// Update last request time to now
|
||||||
@@ -207,7 +207,7 @@ func TestShouldTimeout_ExceedsTimeLimit(t *testing.T) {
|
|||||||
// Mock onStatusChange function
|
// Mock onStatusChange function
|
||||||
mockOnStatusChange := func(oldStatus, newStatus instance.InstanceStatus) {}
|
mockOnStatusChange := func(oldStatus, newStatus instance.InstanceStatus) {}
|
||||||
|
|
||||||
inst := instance.NewInstance("test-instance", backendConfig, globalSettings, options, mockOnStatusChange)
|
inst := instance.NewInstance("test-instance", backendConfig, globalSettings, options, "main", mockOnStatusChange)
|
||||||
inst.SetStatus(instance.Running)
|
inst.SetStatus(instance.Running)
|
||||||
|
|
||||||
// Use MockTimeProvider to simulate old last request time
|
// Use MockTimeProvider to simulate old last request time
|
||||||
@@ -263,7 +263,7 @@ func TestTimeoutConfiguration_Validation(t *testing.T) {
|
|||||||
// Mock onStatusChange function
|
// Mock onStatusChange function
|
||||||
mockOnStatusChange := func(oldStatus, newStatus instance.InstanceStatus) {}
|
mockOnStatusChange := func(oldStatus, newStatus instance.InstanceStatus) {}
|
||||||
|
|
||||||
inst := instance.NewInstance("test-instance", backendConfig, globalSettings, options, mockOnStatusChange)
|
inst := instance.NewInstance("test-instance", backendConfig, globalSettings, options, "main", mockOnStatusChange)
|
||||||
opts := inst.GetOptions()
|
opts := inst.GetOptions()
|
||||||
|
|
||||||
if opts.IdleTimeout == nil || *opts.IdleTimeout != tt.expectedTimeout {
|
if opts.IdleTimeout == nil || *opts.IdleTimeout != tt.expectedTimeout {
|
||||||
|
|||||||
@@ -49,6 +49,7 @@ type instanceManager struct {
|
|||||||
ports map[int]bool
|
ports map[int]bool
|
||||||
instancesConfig config.InstancesConfig
|
instancesConfig config.InstancesConfig
|
||||||
backendsConfig config.BackendConfig
|
backendsConfig config.BackendConfig
|
||||||
|
localNodeName string // Name of the local node
|
||||||
|
|
||||||
// Timeout checker
|
// Timeout checker
|
||||||
timeoutChecker *time.Ticker
|
timeoutChecker *time.Ticker
|
||||||
@@ -63,7 +64,7 @@ type instanceManager struct {
|
|||||||
}
|
}
|
||||||
|
|
||||||
// NewInstanceManager creates a new instance of InstanceManager.
|
// NewInstanceManager creates a new instance of InstanceManager.
|
||||||
func NewInstanceManager(backendsConfig config.BackendConfig, instancesConfig config.InstancesConfig, nodesConfig map[string]config.NodeConfig) InstanceManager {
|
func NewInstanceManager(backendsConfig config.BackendConfig, instancesConfig config.InstancesConfig, nodesConfig map[string]config.NodeConfig, localNodeName string) InstanceManager {
|
||||||
if instancesConfig.TimeoutCheckInterval <= 0 {
|
if instancesConfig.TimeoutCheckInterval <= 0 {
|
||||||
instancesConfig.TimeoutCheckInterval = 5 // Default to 5 minutes if not set
|
instancesConfig.TimeoutCheckInterval = 5 // Default to 5 minutes if not set
|
||||||
}
|
}
|
||||||
@@ -81,6 +82,7 @@ func NewInstanceManager(backendsConfig config.BackendConfig, instancesConfig con
|
|||||||
ports: make(map[int]bool),
|
ports: make(map[int]bool),
|
||||||
instancesConfig: instancesConfig,
|
instancesConfig: instancesConfig,
|
||||||
backendsConfig: backendsConfig,
|
backendsConfig: backendsConfig,
|
||||||
|
localNodeName: localNodeName,
|
||||||
|
|
||||||
timeoutChecker: time.NewTicker(time.Duration(instancesConfig.TimeoutCheckInterval) * time.Minute),
|
timeoutChecker: time.NewTicker(time.Duration(instancesConfig.TimeoutCheckInterval) * time.Minute),
|
||||||
shutdownChan: make(chan struct{}),
|
shutdownChan: make(chan struct{}),
|
||||||
@@ -274,7 +276,8 @@ func (im *instanceManager) loadInstance(name, path string) error {
|
|||||||
options := persistedInstance.GetOptions()
|
options := persistedInstance.GetOptions()
|
||||||
|
|
||||||
// Check if this is a remote instance
|
// Check if this is a remote instance
|
||||||
isRemote := options != nil && len(options.Nodes) > 0
|
// An instance is remote if Nodes is specified AND the first node is not the local node
|
||||||
|
isRemote := options != nil && len(options.Nodes) > 0 && options.Nodes[0] != im.localNodeName
|
||||||
|
|
||||||
var statusCallback func(oldStatus, newStatus instance.InstanceStatus)
|
var statusCallback func(oldStatus, newStatus instance.InstanceStatus)
|
||||||
if !isRemote {
|
if !isRemote {
|
||||||
@@ -285,7 +288,7 @@ func (im *instanceManager) loadInstance(name, path string) error {
|
|||||||
}
|
}
|
||||||
|
|
||||||
// Create new inst using NewInstance (handles validation, defaults, setup)
|
// Create new inst using NewInstance (handles validation, defaults, setup)
|
||||||
inst := instance.NewInstance(name, &im.backendsConfig, &im.instancesConfig, options, statusCallback)
|
inst := instance.NewInstance(name, &im.backendsConfig, &im.instancesConfig, options, im.localNodeName, statusCallback)
|
||||||
|
|
||||||
// Restore persisted fields that NewInstance doesn't set
|
// Restore persisted fields that NewInstance doesn't set
|
||||||
inst.Created = persistedInstance.Created
|
inst.Created = persistedInstance.Created
|
||||||
|
|||||||
@@ -34,7 +34,7 @@ func TestNewInstanceManager(t *testing.T) {
|
|||||||
TimeoutCheckInterval: 5,
|
TimeoutCheckInterval: 5,
|
||||||
}
|
}
|
||||||
|
|
||||||
mgr := manager.NewInstanceManager(backendConfig, cfg, map[string]config.NodeConfig{})
|
mgr := manager.NewInstanceManager(backendConfig, cfg, map[string]config.NodeConfig{}, "main")
|
||||||
if mgr == nil {
|
if mgr == nil {
|
||||||
t.Fatal("NewInstanceManager returned nil")
|
t.Fatal("NewInstanceManager returned nil")
|
||||||
}
|
}
|
||||||
@@ -69,7 +69,7 @@ func TestPersistence(t *testing.T) {
|
|||||||
}
|
}
|
||||||
|
|
||||||
// Test instance persistence on creation
|
// Test instance persistence on creation
|
||||||
manager1 := manager.NewInstanceManager(backendConfig, cfg, map[string]config.NodeConfig{})
|
manager1 := manager.NewInstanceManager(backendConfig, cfg, map[string]config.NodeConfig{}, "main")
|
||||||
options := &instance.CreateInstanceOptions{
|
options := &instance.CreateInstanceOptions{
|
||||||
BackendType: backends.BackendTypeLlamaCpp,
|
BackendType: backends.BackendTypeLlamaCpp,
|
||||||
LlamaServerOptions: &llamacpp.LlamaServerOptions{
|
LlamaServerOptions: &llamacpp.LlamaServerOptions{
|
||||||
@@ -90,7 +90,7 @@ func TestPersistence(t *testing.T) {
|
|||||||
}
|
}
|
||||||
|
|
||||||
// Test loading instances from disk
|
// Test loading instances from disk
|
||||||
manager2 := manager.NewInstanceManager(backendConfig, cfg, map[string]config.NodeConfig{})
|
manager2 := manager.NewInstanceManager(backendConfig, cfg, map[string]config.NodeConfig{}, "main")
|
||||||
instances, err := manager2.ListInstances()
|
instances, err := manager2.ListInstances()
|
||||||
if err != nil {
|
if err != nil {
|
||||||
t.Fatalf("ListInstances failed: %v", err)
|
t.Fatalf("ListInstances failed: %v", err)
|
||||||
@@ -207,7 +207,7 @@ func createTestManager() manager.InstanceManager {
|
|||||||
DefaultRestartDelay: 5,
|
DefaultRestartDelay: 5,
|
||||||
TimeoutCheckInterval: 5,
|
TimeoutCheckInterval: 5,
|
||||||
}
|
}
|
||||||
return manager.NewInstanceManager(backendConfig, cfg, map[string]config.NodeConfig{})
|
return manager.NewInstanceManager(backendConfig, cfg, map[string]config.NodeConfig{}, "main")
|
||||||
}
|
}
|
||||||
|
|
||||||
func TestAutoRestartDisabledInstanceStatus(t *testing.T) {
|
func TestAutoRestartDisabledInstanceStatus(t *testing.T) {
|
||||||
@@ -227,7 +227,7 @@ func TestAutoRestartDisabledInstanceStatus(t *testing.T) {
|
|||||||
}
|
}
|
||||||
|
|
||||||
// Create first manager and instance with auto-restart disabled
|
// Create first manager and instance with auto-restart disabled
|
||||||
manager1 := manager.NewInstanceManager(backendConfig, cfg, map[string]config.NodeConfig{})
|
manager1 := manager.NewInstanceManager(backendConfig, cfg, map[string]config.NodeConfig{}, "main")
|
||||||
|
|
||||||
autoRestart := false
|
autoRestart := false
|
||||||
options := &instance.CreateInstanceOptions{
|
options := &instance.CreateInstanceOptions{
|
||||||
@@ -252,7 +252,7 @@ func TestAutoRestartDisabledInstanceStatus(t *testing.T) {
|
|||||||
manager1.Shutdown()
|
manager1.Shutdown()
|
||||||
|
|
||||||
// Create second manager (simulating restart of llamactl)
|
// Create second manager (simulating restart of llamactl)
|
||||||
manager2 := manager.NewInstanceManager(backendConfig, cfg, map[string]config.NodeConfig{})
|
manager2 := manager.NewInstanceManager(backendConfig, cfg, map[string]config.NodeConfig{}, "main")
|
||||||
|
|
||||||
// Get the loaded instance
|
// Get the loaded instance
|
||||||
loadedInst, err := manager2.GetInstance("test-instance")
|
loadedInst, err := manager2.GetInstance("test-instance")
|
||||||
|
|||||||
@@ -99,7 +99,8 @@ func (im *instanceManager) CreateInstance(name string, options *instance.CreateI
|
|||||||
}
|
}
|
||||||
|
|
||||||
// Check if this is a remote instance
|
// Check if this is a remote instance
|
||||||
isRemote := len(options.Nodes) > 0
|
// An instance is remote if Nodes is specified AND the first node is not the local node
|
||||||
|
isRemote := len(options.Nodes) > 0 && options.Nodes[0] != im.localNodeName
|
||||||
var nodeConfig *config.NodeConfig
|
var nodeConfig *config.NodeConfig
|
||||||
|
|
||||||
if isRemote {
|
if isRemote {
|
||||||
@@ -119,7 +120,7 @@ func (im *instanceManager) CreateInstance(name string, options *instance.CreateI
|
|||||||
|
|
||||||
// Create a local stub that preserves the Nodes field for tracking
|
// Create a local stub that preserves the Nodes field for tracking
|
||||||
// We keep the original options (with Nodes) so IsRemote() works correctly
|
// We keep the original options (with Nodes) so IsRemote() works correctly
|
||||||
inst := instance.NewInstance(name, &im.backendsConfig, &im.instancesConfig, options, nil)
|
inst := instance.NewInstance(name, &im.backendsConfig, &im.instancesConfig, options, im.localNodeName, nil)
|
||||||
|
|
||||||
// Update the local stub with all remote data (preserving Nodes)
|
// Update the local stub with all remote data (preserving Nodes)
|
||||||
im.updateLocalInstanceFromRemote(inst, remoteInst)
|
im.updateLocalInstanceFromRemote(inst, remoteInst)
|
||||||
@@ -152,7 +153,7 @@ func (im *instanceManager) CreateInstance(name string, options *instance.CreateI
|
|||||||
im.onStatusChange(name, oldStatus, newStatus)
|
im.onStatusChange(name, oldStatus, newStatus)
|
||||||
}
|
}
|
||||||
|
|
||||||
inst := instance.NewInstance(name, &im.backendsConfig, &im.instancesConfig, options, statusCallback)
|
inst := instance.NewInstance(name, &im.backendsConfig, &im.instancesConfig, options, im.localNodeName, statusCallback)
|
||||||
im.instances[inst.Name] = inst
|
im.instances[inst.Name] = inst
|
||||||
|
|
||||||
if err := im.persistInstance(inst); err != nil {
|
if err := im.persistInstance(inst); err != nil {
|
||||||
|
|||||||
@@ -75,7 +75,7 @@ func TestCreateInstance_ValidationAndLimits(t *testing.T) {
|
|||||||
MaxInstances: 1, // Very low limit for testing
|
MaxInstances: 1, // Very low limit for testing
|
||||||
TimeoutCheckInterval: 5,
|
TimeoutCheckInterval: 5,
|
||||||
}
|
}
|
||||||
limitedManager := manager.NewInstanceManager(backendConfig, cfg, map[string]config.NodeConfig{})
|
limitedManager := manager.NewInstanceManager(backendConfig, cfg, map[string]config.NodeConfig{}, "main")
|
||||||
|
|
||||||
_, err = limitedManager.CreateInstance("instance1", options)
|
_, err = limitedManager.CreateInstance("instance1", options)
|
||||||
if err != nil {
|
if err != nil {
|
||||||
|
|||||||
@@ -10,31 +10,10 @@ import (
|
|||||||
"net/http"
|
"net/http"
|
||||||
)
|
)
|
||||||
|
|
||||||
// stripNodesFromOptions creates a copy of the instance options without the Nodes field
|
|
||||||
// to prevent routing loops when sending requests to remote nodes
|
|
||||||
func (im *instanceManager) stripNodesFromOptions(options *instance.CreateInstanceOptions) *instance.CreateInstanceOptions {
|
|
||||||
if options == nil {
|
|
||||||
return nil
|
|
||||||
}
|
|
||||||
|
|
||||||
// Create a copy of the options struct
|
|
||||||
optionsCopy := *options
|
|
||||||
|
|
||||||
// Clear the Nodes field to prevent the remote node from trying to route further
|
|
||||||
optionsCopy.Nodes = nil
|
|
||||||
|
|
||||||
return &optionsCopy
|
|
||||||
}
|
|
||||||
|
|
||||||
// makeRemoteRequest is a helper function to make HTTP requests to a remote node
|
// makeRemoteRequest is a helper function to make HTTP requests to a remote node
|
||||||
func (im *instanceManager) makeRemoteRequest(nodeConfig *config.NodeConfig, method, path string, body any) (*http.Response, error) {
|
func (im *instanceManager) makeRemoteRequest(nodeConfig *config.NodeConfig, method, path string, body any) (*http.Response, error) {
|
||||||
var reqBody io.Reader
|
var reqBody io.Reader
|
||||||
if body != nil {
|
if body != nil {
|
||||||
// Strip nodes from CreateInstanceOptions to prevent routing loops
|
|
||||||
if options, ok := body.(*instance.CreateInstanceOptions); ok {
|
|
||||||
body = im.stripNodesFromOptions(options)
|
|
||||||
}
|
|
||||||
|
|
||||||
jsonData, err := json.Marshal(body)
|
jsonData, err := json.Marshal(body)
|
||||||
if err != nil {
|
if err != nil {
|
||||||
return nil, fmt.Errorf("failed to marshal request body: %w", err)
|
return nil, fmt.Errorf("failed to marshal request body: %w", err)
|
||||||
|
|||||||
@@ -1,39 +0,0 @@
|
|||||||
package manager
|
|
||||||
|
|
||||||
import (
|
|
||||||
"llamactl/pkg/backends"
|
|
||||||
"llamactl/pkg/instance"
|
|
||||||
"testing"
|
|
||||||
)
|
|
||||||
|
|
||||||
func TestStripNodesFromOptions(t *testing.T) {
|
|
||||||
im := &instanceManager{}
|
|
||||||
|
|
||||||
// Test nil case
|
|
||||||
if result := im.stripNodesFromOptions(nil); result != nil {
|
|
||||||
t.Errorf("Expected nil, got %+v", result)
|
|
||||||
}
|
|
||||||
|
|
||||||
// Test main case: nodes should be stripped, other fields preserved
|
|
||||||
options := &instance.CreateInstanceOptions{
|
|
||||||
BackendType: backends.BackendTypeLlamaCpp,
|
|
||||||
Nodes: []string{"node1", "node2"},
|
|
||||||
Environment: map[string]string{"TEST": "value"},
|
|
||||||
}
|
|
||||||
|
|
||||||
result := im.stripNodesFromOptions(options)
|
|
||||||
|
|
||||||
if result.Nodes != nil {
|
|
||||||
t.Errorf("Expected Nodes to be nil, got %+v", result.Nodes)
|
|
||||||
}
|
|
||||||
if result.BackendType != backends.BackendTypeLlamaCpp {
|
|
||||||
t.Errorf("Expected BackendType preserved")
|
|
||||||
}
|
|
||||||
if result.Environment["TEST"] != "value" {
|
|
||||||
t.Errorf("Expected Environment preserved")
|
|
||||||
}
|
|
||||||
// Original should not be modified
|
|
||||||
if len(options.Nodes) != 2 {
|
|
||||||
t.Errorf("Original options should not be modified")
|
|
||||||
}
|
|
||||||
}
|
|
||||||
@@ -23,7 +23,7 @@ func TestTimeoutFunctionality(t *testing.T) {
|
|||||||
MaxInstances: 5,
|
MaxInstances: 5,
|
||||||
}
|
}
|
||||||
|
|
||||||
manager := manager.NewInstanceManager(backendConfig, cfg, map[string]config.NodeConfig{})
|
manager := manager.NewInstanceManager(backendConfig, cfg, map[string]config.NodeConfig{}, "main")
|
||||||
if manager == nil {
|
if manager == nil {
|
||||||
t.Fatal("Manager should be initialized with timeout checker")
|
t.Fatal("Manager should be initialized with timeout checker")
|
||||||
}
|
}
|
||||||
|
|||||||
@@ -100,7 +100,8 @@ const InstanceSettingsCard: React.FC<InstanceSettingsCardProps> = ({
|
|||||||
value={selectedNode}
|
value={selectedNode}
|
||||||
onChange={handleNodeChange}
|
onChange={handleNodeChange}
|
||||||
options={nodeOptions}
|
options={nodeOptions}
|
||||||
description="Select the node where the instance will run (default: main node)"
|
description={isEditing ? "Node cannot be changed after instance creation" : "Select the node where the instance will run"}
|
||||||
|
disabled={isEditing}
|
||||||
/>
|
/>
|
||||||
)}
|
)}
|
||||||
|
|
||||||
|
|||||||
Reference in New Issue
Block a user