mirror of
https://github.com/lordmathis/llamactl.git
synced 2025-12-23 17:44:24 +00:00
Deployed 9cea295 to dev with MkDocs 1.6.1 and mike 2.1.3
This commit is contained in:
Binary file not shown.
Binary file not shown.
@@ -852,39 +852,6 @@
|
|||||||
</ul>
|
</ul>
|
||||||
</nav>
|
</nav>
|
||||||
|
|
||||||
</li>
|
|
||||||
|
|
||||||
<li class="md-nav__item">
|
|
||||||
<a href="#nodes" class="md-nav__link">
|
|
||||||
<span class="md-ellipsis">
|
|
||||||
Nodes
|
|
||||||
</span>
|
|
||||||
</a>
|
|
||||||
|
|
||||||
<nav class="md-nav" aria-label="Nodes">
|
|
||||||
<ul class="md-nav__list">
|
|
||||||
|
|
||||||
<li class="md-nav__item">
|
|
||||||
<a href="#get-apiv1nodes" class="md-nav__link">
|
|
||||||
<span class="md-ellipsis">
|
|
||||||
GET /api/v1/nodes
|
|
||||||
</span>
|
|
||||||
</a>
|
|
||||||
|
|
||||||
</li>
|
|
||||||
|
|
||||||
<li class="md-nav__item">
|
|
||||||
<a href="#get-apiv1nodesname" class="md-nav__link">
|
|
||||||
<span class="md-ellipsis">
|
|
||||||
GET /api/v1/nodes/{name}
|
|
||||||
</span>
|
|
||||||
</a>
|
|
||||||
|
|
||||||
</li>
|
|
||||||
|
|
||||||
</ul>
|
|
||||||
</nav>
|
|
||||||
|
|
||||||
</li>
|
</li>
|
||||||
|
|
||||||
<li class="md-nav__item">
|
<li class="md-nav__item">
|
||||||
@@ -897,6 +864,33 @@
|
|||||||
<nav class="md-nav" aria-label="Llama.cpp">
|
<nav class="md-nav" aria-label="Llama.cpp">
|
||||||
<ul class="md-nav__list">
|
<ul class="md-nav__list">
|
||||||
|
|
||||||
|
<li class="md-nav__item">
|
||||||
|
<a href="#get-apiv1llama-cppnamemodels" class="md-nav__link">
|
||||||
|
<span class="md-ellipsis">
|
||||||
|
GET /api/v1/llama-cpp/{name}/models
|
||||||
|
</span>
|
||||||
|
</a>
|
||||||
|
|
||||||
|
</li>
|
||||||
|
|
||||||
|
<li class="md-nav__item">
|
||||||
|
<a href="#post-apiv1llama-cppnamemodelsmodelload" class="md-nav__link">
|
||||||
|
<span class="md-ellipsis">
|
||||||
|
POST /api/v1/llama-cpp/{name}/models/{model}/load
|
||||||
|
</span>
|
||||||
|
</a>
|
||||||
|
|
||||||
|
</li>
|
||||||
|
|
||||||
|
<li class="md-nav__item">
|
||||||
|
<a href="#post-apiv1llama-cppnamemodelsmodelunload" class="md-nav__link">
|
||||||
|
<span class="md-ellipsis">
|
||||||
|
POST /api/v1/llama-cpp/{name}/models/{model}/unload
|
||||||
|
</span>
|
||||||
|
</a>
|
||||||
|
|
||||||
|
</li>
|
||||||
|
|
||||||
<li class="md-nav__item">
|
<li class="md-nav__item">
|
||||||
<a href="#get-llama-cppname" class="md-nav__link">
|
<a href="#get-llama-cppname" class="md-nav__link">
|
||||||
<span class="md-ellipsis">
|
<span class="md-ellipsis">
|
||||||
@@ -1008,6 +1002,39 @@
|
|||||||
</ul>
|
</ul>
|
||||||
</nav>
|
</nav>
|
||||||
|
|
||||||
|
</li>
|
||||||
|
|
||||||
|
<li class="md-nav__item">
|
||||||
|
<a href="#nodes" class="md-nav__link">
|
||||||
|
<span class="md-ellipsis">
|
||||||
|
Nodes
|
||||||
|
</span>
|
||||||
|
</a>
|
||||||
|
|
||||||
|
<nav class="md-nav" aria-label="Nodes">
|
||||||
|
<ul class="md-nav__list">
|
||||||
|
|
||||||
|
<li class="md-nav__item">
|
||||||
|
<a href="#get-apiv1nodes" class="md-nav__link">
|
||||||
|
<span class="md-ellipsis">
|
||||||
|
GET /api/v1/nodes
|
||||||
|
</span>
|
||||||
|
</a>
|
||||||
|
|
||||||
|
</li>
|
||||||
|
|
||||||
|
<li class="md-nav__item">
|
||||||
|
<a href="#get-apiv1nodesname" class="md-nav__link">
|
||||||
|
<span class="md-ellipsis">
|
||||||
|
GET /api/v1/nodes/{name}
|
||||||
|
</span>
|
||||||
|
</a>
|
||||||
|
|
||||||
|
</li>
|
||||||
|
|
||||||
|
</ul>
|
||||||
|
</nav>
|
||||||
|
|
||||||
</li>
|
</li>
|
||||||
|
|
||||||
<li class="md-nav__item">
|
<li class="md-nav__item">
|
||||||
@@ -2308,55 +2335,14 @@ port </p>
|
|||||||
<strong>Response <span class="response-code code-500">500</span> <span class="status-phrase">Internal Server Error</span></strong>
|
<strong>Response <span class="response-code code-500">500</span> <span class="status-phrase">Internal Server Error</span></strong>
|
||||||
</p>
|
</p>
|
||||||
|
|
||||||
<h2 id="nodes"><span class="api-tag">Nodes</span><a class="headerlink" href="#nodes" title="Permanent link">¶</a></h2>
|
<h2 id="llamacpp"><span class="api-tag">Llama.cpp</span><a class="headerlink" href="#llamacpp" title="Permanent link">¶</a></h2>
|
||||||
<hr class="operation-separator" />
|
<hr class="operation-separator" />
|
||||||
|
|
||||||
<h3 id="get-apiv1nodes"><span class="http-get">GET</span> /api/v1/nodes<a class="headerlink" href="#get-apiv1nodes" title="Permanent link">¶</a></h3>
|
<h3 id="get-apiv1llama-cppnamemodels"><span class="http-get">GET</span> /api/v1/llama-cpp/<span class="route-param">{name}</span>/models<a class="headerlink" href="#get-apiv1llama-cppnamemodels" title="Permanent link">¶</a></h3>
|
||||||
<p>List all configured nodes </p>
|
<p>List models in a llama.cpp instance </p>
|
||||||
<details class="note">
|
<details class="note">
|
||||||
<summary>Description</summary>
|
<summary>Description</summary>
|
||||||
<p>Returns a map of all nodes configured in the server (node name -> node<br />
|
<p>Returns a list of models available in the specified llama.cpp instance </p>
|
||||||
config) </p>
|
|
||||||
</details>
|
|
||||||
<p><strong>Input parameters</strong> </p>
|
|
||||||
<table>
|
|
||||||
<thead>
|
|
||||||
<tr>
|
|
||||||
<th>Parameter</th>
|
|
||||||
<th>In</th>
|
|
||||||
<th>Type</th>
|
|
||||||
<th>Default</th>
|
|
||||||
<th>Nullable</th>
|
|
||||||
<th>Description</th>
|
|
||||||
</tr>
|
|
||||||
</thead>
|
|
||||||
<tbody>
|
|
||||||
<tr>
|
|
||||||
<td class="parameter-name"><code>ApiKeyAuth</code></td>
|
|
||||||
<td>header</td>
|
|
||||||
<td>string</td>
|
|
||||||
<td>N/A</td>
|
|
||||||
<td>No</td>
|
|
||||||
<td></td>
|
|
||||||
</tr>
|
|
||||||
</tbody>
|
|
||||||
</table>
|
|
||||||
|
|
||||||
<p class="response-title">
|
|
||||||
<strong>Response <span class="response-code code-200">200</span> <span class="status-phrase">OK</span></strong>
|
|
||||||
</p>
|
|
||||||
|
|
||||||
<p class="response-title">
|
|
||||||
<strong>Response <span class="response-code code-500">500</span> <span class="status-phrase">Internal Server Error</span></strong>
|
|
||||||
</p>
|
|
||||||
|
|
||||||
<hr class="operation-separator" />
|
|
||||||
|
|
||||||
<h3 id="get-apiv1nodesname"><span class="http-get">GET</span> /api/v1/nodes/<span class="route-param">{name}</span><a class="headerlink" href="#get-apiv1nodesname" title="Permanent link">¶</a></h3>
|
|
||||||
<p>Get details of a specific node </p>
|
|
||||||
<details class="note">
|
|
||||||
<summary>Description</summary>
|
|
||||||
<p>Returns the details of a specific node by name </p>
|
|
||||||
</details>
|
</details>
|
||||||
<p><strong>Input parameters</strong> </p>
|
<p><strong>Input parameters</strong> </p>
|
||||||
<table>
|
<table>
|
||||||
@@ -2385,7 +2371,7 @@ config) </p>
|
|||||||
<td>None</td>
|
<td>None</td>
|
||||||
<td></td>
|
<td></td>
|
||||||
<td>No</td>
|
<td>No</td>
|
||||||
<td>Node Name</td>
|
<td>Instance Name</td>
|
||||||
</tr>
|
</tr>
|
||||||
</tbody>
|
</tbody>
|
||||||
</table>
|
</table>
|
||||||
@@ -2399,14 +2385,129 @@ config) </p>
|
|||||||
</p>
|
</p>
|
||||||
|
|
||||||
<p class="response-title">
|
<p class="response-title">
|
||||||
<strong>Response <span class="response-code code-404">404</span> <span class="status-phrase">Not Found</span></strong>
|
<strong>Response <span class="response-code code-500">500</span> <span class="status-phrase">Internal Server Error</span></strong>
|
||||||
|
</p>
|
||||||
|
|
||||||
|
<hr class="operation-separator" />
|
||||||
|
|
||||||
|
<h3 id="post-apiv1llama-cppnamemodelsmodelload"><span class="http-post">POST</span> /api/v1/llama-cpp/<span class="route-param">{name}</span>/models/<span class="route-param">{model}</span>/load<a class="headerlink" href="#post-apiv1llama-cppnamemodelsmodelload" title="Permanent link">¶</a></h3>
|
||||||
|
<p>Load a model in a llama.cpp instance </p>
|
||||||
|
<details class="note">
|
||||||
|
<summary>Description</summary>
|
||||||
|
<p>Loads the specified model in the given llama.cpp instance </p>
|
||||||
|
</details>
|
||||||
|
<p><strong>Input parameters</strong> </p>
|
||||||
|
<table>
|
||||||
|
<thead>
|
||||||
|
<tr>
|
||||||
|
<th>Parameter</th>
|
||||||
|
<th>In</th>
|
||||||
|
<th>Type</th>
|
||||||
|
<th>Default</th>
|
||||||
|
<th>Nullable</th>
|
||||||
|
<th>Description</th>
|
||||||
|
</tr>
|
||||||
|
</thead>
|
||||||
|
<tbody>
|
||||||
|
<tr>
|
||||||
|
<td class="parameter-name"><code>ApiKeyAuth</code></td>
|
||||||
|
<td>header</td>
|
||||||
|
<td>string</td>
|
||||||
|
<td>N/A</td>
|
||||||
|
<td>No</td>
|
||||||
|
<td></td>
|
||||||
|
</tr>
|
||||||
|
<tr>
|
||||||
|
<td class="parameter-name"><code>model</code></td>
|
||||||
|
<td>path</td>
|
||||||
|
<td>None</td>
|
||||||
|
<td></td>
|
||||||
|
<td>No</td>
|
||||||
|
<td>Model Name</td>
|
||||||
|
</tr>
|
||||||
|
<tr>
|
||||||
|
<td class="parameter-name"><code>name</code></td>
|
||||||
|
<td>path</td>
|
||||||
|
<td>None</td>
|
||||||
|
<td></td>
|
||||||
|
<td>No</td>
|
||||||
|
<td>Instance Name</td>
|
||||||
|
</tr>
|
||||||
|
</tbody>
|
||||||
|
</table>
|
||||||
|
|
||||||
|
<p class="response-title">
|
||||||
|
<strong>Response <span class="response-code code-200">200</span> <span class="status-phrase">OK</span></strong>
|
||||||
|
</p>
|
||||||
|
|
||||||
|
<p class="response-title">
|
||||||
|
<strong>Response <span class="response-code code-400">400</span> <span class="status-phrase">Bad Request</span></strong>
|
||||||
|
</p>
|
||||||
|
|
||||||
|
<p class="response-title">
|
||||||
|
<strong>Response <span class="response-code code-500">500</span> <span class="status-phrase">Internal Server Error</span></strong>
|
||||||
|
</p>
|
||||||
|
|
||||||
|
<hr class="operation-separator" />
|
||||||
|
|
||||||
|
<h3 id="post-apiv1llama-cppnamemodelsmodelunload"><span class="http-post">POST</span> /api/v1/llama-cpp/<span class="route-param">{name}</span>/models/<span class="route-param">{model}</span>/unload<a class="headerlink" href="#post-apiv1llama-cppnamemodelsmodelunload" title="Permanent link">¶</a></h3>
|
||||||
|
<p>Unload a model in a llama.cpp instance </p>
|
||||||
|
<details class="note">
|
||||||
|
<summary>Description</summary>
|
||||||
|
<p>Unloads the specified model in the given llama.cpp instance </p>
|
||||||
|
</details>
|
||||||
|
<p><strong>Input parameters</strong> </p>
|
||||||
|
<table>
|
||||||
|
<thead>
|
||||||
|
<tr>
|
||||||
|
<th>Parameter</th>
|
||||||
|
<th>In</th>
|
||||||
|
<th>Type</th>
|
||||||
|
<th>Default</th>
|
||||||
|
<th>Nullable</th>
|
||||||
|
<th>Description</th>
|
||||||
|
</tr>
|
||||||
|
</thead>
|
||||||
|
<tbody>
|
||||||
|
<tr>
|
||||||
|
<td class="parameter-name"><code>ApiKeyAuth</code></td>
|
||||||
|
<td>header</td>
|
||||||
|
<td>string</td>
|
||||||
|
<td>N/A</td>
|
||||||
|
<td>No</td>
|
||||||
|
<td></td>
|
||||||
|
</tr>
|
||||||
|
<tr>
|
||||||
|
<td class="parameter-name"><code>model</code></td>
|
||||||
|
<td>path</td>
|
||||||
|
<td>None</td>
|
||||||
|
<td></td>
|
||||||
|
<td>No</td>
|
||||||
|
<td>Model Name</td>
|
||||||
|
</tr>
|
||||||
|
<tr>
|
||||||
|
<td class="parameter-name"><code>name</code></td>
|
||||||
|
<td>path</td>
|
||||||
|
<td>None</td>
|
||||||
|
<td></td>
|
||||||
|
<td>No</td>
|
||||||
|
<td>Instance Name</td>
|
||||||
|
</tr>
|
||||||
|
</tbody>
|
||||||
|
</table>
|
||||||
|
|
||||||
|
<p class="response-title">
|
||||||
|
<strong>Response <span class="response-code code-200">200</span> <span class="status-phrase">OK</span></strong>
|
||||||
|
</p>
|
||||||
|
|
||||||
|
<p class="response-title">
|
||||||
|
<strong>Response <span class="response-code code-400">400</span> <span class="status-phrase">Bad Request</span></strong>
|
||||||
</p>
|
</p>
|
||||||
|
|
||||||
<p class="response-title">
|
<p class="response-title">
|
||||||
<strong>Response <span class="response-code code-500">500</span> <span class="status-phrase">Internal Server Error</span></strong>
|
<strong>Response <span class="response-code code-500">500</span> <span class="status-phrase">Internal Server Error</span></strong>
|
||||||
</p>
|
</p>
|
||||||
|
|
||||||
<h2 id="llamacpp"><span class="api-tag">Llama.cpp</span><a class="headerlink" href="#llamacpp" title="Permanent link">¶</a></h2>
|
|
||||||
<hr class="operation-separator" />
|
<hr class="operation-separator" />
|
||||||
|
|
||||||
<h3 id="get-llama-cppname"><span class="http-get">GET</span> /llama-cpp/<span class="route-param">{name}</span>/<a class="headerlink" href="#get-llama-cppname" title="Permanent link">¶</a></h3>
|
<h3 id="get-llama-cppname"><span class="http-get">GET</span> /llama-cpp/<span class="route-param">{name}</span>/<a class="headerlink" href="#get-llama-cppname" title="Permanent link">¶</a></h3>
|
||||||
@@ -3042,6 +3143,104 @@ demand if configured </p>
|
|||||||
<strong>Response <span class="response-code code-500">500</span> <span class="status-phrase">Internal Server Error</span></strong>
|
<strong>Response <span class="response-code code-500">500</span> <span class="status-phrase">Internal Server Error</span></strong>
|
||||||
</p>
|
</p>
|
||||||
|
|
||||||
|
<h2 id="nodes"><span class="api-tag">Nodes</span><a class="headerlink" href="#nodes" title="Permanent link">¶</a></h2>
|
||||||
|
<hr class="operation-separator" />
|
||||||
|
|
||||||
|
<h3 id="get-apiv1nodes"><span class="http-get">GET</span> /api/v1/nodes<a class="headerlink" href="#get-apiv1nodes" title="Permanent link">¶</a></h3>
|
||||||
|
<p>List all configured nodes </p>
|
||||||
|
<details class="note">
|
||||||
|
<summary>Description</summary>
|
||||||
|
<p>Returns a map of all nodes configured in the server (node name -> node<br />
|
||||||
|
config) </p>
|
||||||
|
</details>
|
||||||
|
<p><strong>Input parameters</strong> </p>
|
||||||
|
<table>
|
||||||
|
<thead>
|
||||||
|
<tr>
|
||||||
|
<th>Parameter</th>
|
||||||
|
<th>In</th>
|
||||||
|
<th>Type</th>
|
||||||
|
<th>Default</th>
|
||||||
|
<th>Nullable</th>
|
||||||
|
<th>Description</th>
|
||||||
|
</tr>
|
||||||
|
</thead>
|
||||||
|
<tbody>
|
||||||
|
<tr>
|
||||||
|
<td class="parameter-name"><code>ApiKeyAuth</code></td>
|
||||||
|
<td>header</td>
|
||||||
|
<td>string</td>
|
||||||
|
<td>N/A</td>
|
||||||
|
<td>No</td>
|
||||||
|
<td></td>
|
||||||
|
</tr>
|
||||||
|
</tbody>
|
||||||
|
</table>
|
||||||
|
|
||||||
|
<p class="response-title">
|
||||||
|
<strong>Response <span class="response-code code-200">200</span> <span class="status-phrase">OK</span></strong>
|
||||||
|
</p>
|
||||||
|
|
||||||
|
<p class="response-title">
|
||||||
|
<strong>Response <span class="response-code code-500">500</span> <span class="status-phrase">Internal Server Error</span></strong>
|
||||||
|
</p>
|
||||||
|
|
||||||
|
<hr class="operation-separator" />
|
||||||
|
|
||||||
|
<h3 id="get-apiv1nodesname"><span class="http-get">GET</span> /api/v1/nodes/<span class="route-param">{name}</span><a class="headerlink" href="#get-apiv1nodesname" title="Permanent link">¶</a></h3>
|
||||||
|
<p>Get details of a specific node </p>
|
||||||
|
<details class="note">
|
||||||
|
<summary>Description</summary>
|
||||||
|
<p>Returns the details of a specific node by name </p>
|
||||||
|
</details>
|
||||||
|
<p><strong>Input parameters</strong> </p>
|
||||||
|
<table>
|
||||||
|
<thead>
|
||||||
|
<tr>
|
||||||
|
<th>Parameter</th>
|
||||||
|
<th>In</th>
|
||||||
|
<th>Type</th>
|
||||||
|
<th>Default</th>
|
||||||
|
<th>Nullable</th>
|
||||||
|
<th>Description</th>
|
||||||
|
</tr>
|
||||||
|
</thead>
|
||||||
|
<tbody>
|
||||||
|
<tr>
|
||||||
|
<td class="parameter-name"><code>ApiKeyAuth</code></td>
|
||||||
|
<td>header</td>
|
||||||
|
<td>string</td>
|
||||||
|
<td>N/A</td>
|
||||||
|
<td>No</td>
|
||||||
|
<td></td>
|
||||||
|
</tr>
|
||||||
|
<tr>
|
||||||
|
<td class="parameter-name"><code>name</code></td>
|
||||||
|
<td>path</td>
|
||||||
|
<td>None</td>
|
||||||
|
<td></td>
|
||||||
|
<td>No</td>
|
||||||
|
<td>Node Name</td>
|
||||||
|
</tr>
|
||||||
|
</tbody>
|
||||||
|
</table>
|
||||||
|
|
||||||
|
<p class="response-title">
|
||||||
|
<strong>Response <span class="response-code code-200">200</span> <span class="status-phrase">OK</span></strong>
|
||||||
|
</p>
|
||||||
|
|
||||||
|
<p class="response-title">
|
||||||
|
<strong>Response <span class="response-code code-400">400</span> <span class="status-phrase">Bad Request</span></strong>
|
||||||
|
</p>
|
||||||
|
|
||||||
|
<p class="response-title">
|
||||||
|
<strong>Response <span class="response-code code-404">404</span> <span class="status-phrase">Not Found</span></strong>
|
||||||
|
</p>
|
||||||
|
|
||||||
|
<p class="response-title">
|
||||||
|
<strong>Response <span class="response-code code-500">500</span> <span class="status-phrase">Internal Server Error</span></strong>
|
||||||
|
</p>
|
||||||
|
|
||||||
<h2 id="openai"><span class="api-tag">OpenAI</span><a class="headerlink" href="#openai" title="Permanent link">¶</a></h2>
|
<h2 id="openai"><span class="api-tag">OpenAI</span><a class="headerlink" href="#openai" title="Permanent link">¶</a></h2>
|
||||||
<hr class="operation-separator" />
|
<hr class="operation-separator" />
|
||||||
|
|
||||||
|
|||||||
176
dev/docs.go
176
dev/docs.go
@@ -999,6 +999,156 @@ const docTemplate = `{
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
},
|
},
|
||||||
|
"/api/v1/llama-cpp/{name}/models": {
|
||||||
|
"get": {
|
||||||
|
"security": [
|
||||||
|
{
|
||||||
|
"ApiKeyAuth": []
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"description": "Returns a list of models available in the specified llama.cpp instance",
|
||||||
|
"tags": [
|
||||||
|
"Llama.cpp"
|
||||||
|
],
|
||||||
|
"summary": "List models in a llama.cpp instance",
|
||||||
|
"parameters": [
|
||||||
|
{
|
||||||
|
"type": "string",
|
||||||
|
"description": "Instance Name",
|
||||||
|
"name": "name",
|
||||||
|
"in": "path",
|
||||||
|
"required": true
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"responses": {
|
||||||
|
"200": {
|
||||||
|
"description": "Models list response",
|
||||||
|
"schema": {
|
||||||
|
"type": "object",
|
||||||
|
"additionalProperties": true
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"400": {
|
||||||
|
"description": "Invalid instance",
|
||||||
|
"schema": {
|
||||||
|
"type": "string"
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"500": {
|
||||||
|
"description": "Internal Server Error",
|
||||||
|
"schema": {
|
||||||
|
"type": "string"
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"/api/v1/llama-cpp/{name}/models/{model}/load": {
|
||||||
|
"post": {
|
||||||
|
"security": [
|
||||||
|
{
|
||||||
|
"ApiKeyAuth": []
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"description": "Loads the specified model in the given llama.cpp instance",
|
||||||
|
"tags": [
|
||||||
|
"Llama.cpp"
|
||||||
|
],
|
||||||
|
"summary": "Load a model in a llama.cpp instance",
|
||||||
|
"parameters": [
|
||||||
|
{
|
||||||
|
"type": "string",
|
||||||
|
"description": "Instance Name",
|
||||||
|
"name": "name",
|
||||||
|
"in": "path",
|
||||||
|
"required": true
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"type": "string",
|
||||||
|
"description": "Model Name",
|
||||||
|
"name": "model",
|
||||||
|
"in": "path",
|
||||||
|
"required": true
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"responses": {
|
||||||
|
"200": {
|
||||||
|
"description": "Success message",
|
||||||
|
"schema": {
|
||||||
|
"type": "object",
|
||||||
|
"additionalProperties": {
|
||||||
|
"type": "string"
|
||||||
|
}
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"400": {
|
||||||
|
"description": "Invalid request",
|
||||||
|
"schema": {
|
||||||
|
"type": "string"
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"500": {
|
||||||
|
"description": "Internal Server Error",
|
||||||
|
"schema": {
|
||||||
|
"type": "string"
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"/api/v1/llama-cpp/{name}/models/{model}/unload": {
|
||||||
|
"post": {
|
||||||
|
"security": [
|
||||||
|
{
|
||||||
|
"ApiKeyAuth": []
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"description": "Unloads the specified model in the given llama.cpp instance",
|
||||||
|
"tags": [
|
||||||
|
"Llama.cpp"
|
||||||
|
],
|
||||||
|
"summary": "Unload a model in a llama.cpp instance",
|
||||||
|
"parameters": [
|
||||||
|
{
|
||||||
|
"type": "string",
|
||||||
|
"description": "Instance Name",
|
||||||
|
"name": "name",
|
||||||
|
"in": "path",
|
||||||
|
"required": true
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"type": "string",
|
||||||
|
"description": "Model Name",
|
||||||
|
"name": "model",
|
||||||
|
"in": "path",
|
||||||
|
"required": true
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"responses": {
|
||||||
|
"200": {
|
||||||
|
"description": "Success message",
|
||||||
|
"schema": {
|
||||||
|
"type": "object",
|
||||||
|
"additionalProperties": {
|
||||||
|
"type": "string"
|
||||||
|
}
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"400": {
|
||||||
|
"description": "Invalid request",
|
||||||
|
"schema": {
|
||||||
|
"type": "string"
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"500": {
|
||||||
|
"description": "Internal Server Error",
|
||||||
|
"schema": {
|
||||||
|
"type": "string"
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
},
|
||||||
"/api/v1/nodes": {
|
"/api/v1/nodes": {
|
||||||
"get": {
|
"get": {
|
||||||
"security": [
|
"security": [
|
||||||
@@ -1788,13 +1938,6 @@ const docTemplate = `{
|
|||||||
"config.AuthConfig": {
|
"config.AuthConfig": {
|
||||||
"type": "object",
|
"type": "object",
|
||||||
"properties": {
|
"properties": {
|
||||||
"inference_keys": {
|
|
||||||
"description": "List of keys for OpenAI compatible inference endpoints",
|
|
||||||
"type": "array",
|
|
||||||
"items": {
|
|
||||||
"type": "string"
|
|
||||||
}
|
|
||||||
},
|
|
||||||
"management_keys": {
|
"management_keys": {
|
||||||
"description": "List of keys for management endpoints",
|
"description": "List of keys for management endpoints",
|
||||||
"type": "array",
|
"type": "array",
|
||||||
@@ -1905,10 +2048,6 @@ const docTemplate = `{
|
|||||||
"description": "Automatically create the data directory if it doesn't exist",
|
"description": "Automatically create the data directory if it doesn't exist",
|
||||||
"type": "boolean"
|
"type": "boolean"
|
||||||
},
|
},
|
||||||
"configs_dir": {
|
|
||||||
"description": "Instance config directory override (relative to data_dir if not absolute)",
|
|
||||||
"type": "string"
|
|
||||||
},
|
|
||||||
"default_auto_restart": {
|
"default_auto_restart": {
|
||||||
"description": "Default auto-restart setting for new instances",
|
"description": "Default auto-restart setting for new instances",
|
||||||
"type": "boolean"
|
"type": "boolean"
|
||||||
@@ -1929,6 +2068,21 @@ const docTemplate = `{
|
|||||||
"description": "Enable LRU eviction for instance logs",
|
"description": "Enable LRU eviction for instance logs",
|
||||||
"type": "boolean"
|
"type": "boolean"
|
||||||
},
|
},
|
||||||
|
"logRotationCompress": {
|
||||||
|
"description": "Whether to compress rotated log files",
|
||||||
|
"type": "boolean",
|
||||||
|
"default": false
|
||||||
|
},
|
||||||
|
"logRotationEnabled": {
|
||||||
|
"description": "Log rotation enabled",
|
||||||
|
"type": "boolean",
|
||||||
|
"default": true
|
||||||
|
},
|
||||||
|
"logRotationMaxSize": {
|
||||||
|
"description": "Maximum log file size in MB before rotation",
|
||||||
|
"type": "integer",
|
||||||
|
"default": 100
|
||||||
|
},
|
||||||
"logs_dir": {
|
"logs_dir": {
|
||||||
"description": "Logs directory override (relative to data_dir if not absolute)",
|
"description": "Logs directory override (relative to data_dir if not absolute)",
|
||||||
"type": "string"
|
"type": "string"
|
||||||
|
|||||||
File diff suppressed because one or more lines are too long
176
dev/swagger.json
176
dev/swagger.json
@@ -992,6 +992,156 @@
|
|||||||
}
|
}
|
||||||
}
|
}
|
||||||
},
|
},
|
||||||
|
"/api/v1/llama-cpp/{name}/models": {
|
||||||
|
"get": {
|
||||||
|
"security": [
|
||||||
|
{
|
||||||
|
"ApiKeyAuth": []
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"description": "Returns a list of models available in the specified llama.cpp instance",
|
||||||
|
"tags": [
|
||||||
|
"Llama.cpp"
|
||||||
|
],
|
||||||
|
"summary": "List models in a llama.cpp instance",
|
||||||
|
"parameters": [
|
||||||
|
{
|
||||||
|
"type": "string",
|
||||||
|
"description": "Instance Name",
|
||||||
|
"name": "name",
|
||||||
|
"in": "path",
|
||||||
|
"required": true
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"responses": {
|
||||||
|
"200": {
|
||||||
|
"description": "Models list response",
|
||||||
|
"schema": {
|
||||||
|
"type": "object",
|
||||||
|
"additionalProperties": true
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"400": {
|
||||||
|
"description": "Invalid instance",
|
||||||
|
"schema": {
|
||||||
|
"type": "string"
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"500": {
|
||||||
|
"description": "Internal Server Error",
|
||||||
|
"schema": {
|
||||||
|
"type": "string"
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"/api/v1/llama-cpp/{name}/models/{model}/load": {
|
||||||
|
"post": {
|
||||||
|
"security": [
|
||||||
|
{
|
||||||
|
"ApiKeyAuth": []
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"description": "Loads the specified model in the given llama.cpp instance",
|
||||||
|
"tags": [
|
||||||
|
"Llama.cpp"
|
||||||
|
],
|
||||||
|
"summary": "Load a model in a llama.cpp instance",
|
||||||
|
"parameters": [
|
||||||
|
{
|
||||||
|
"type": "string",
|
||||||
|
"description": "Instance Name",
|
||||||
|
"name": "name",
|
||||||
|
"in": "path",
|
||||||
|
"required": true
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"type": "string",
|
||||||
|
"description": "Model Name",
|
||||||
|
"name": "model",
|
||||||
|
"in": "path",
|
||||||
|
"required": true
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"responses": {
|
||||||
|
"200": {
|
||||||
|
"description": "Success message",
|
||||||
|
"schema": {
|
||||||
|
"type": "object",
|
||||||
|
"additionalProperties": {
|
||||||
|
"type": "string"
|
||||||
|
}
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"400": {
|
||||||
|
"description": "Invalid request",
|
||||||
|
"schema": {
|
||||||
|
"type": "string"
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"500": {
|
||||||
|
"description": "Internal Server Error",
|
||||||
|
"schema": {
|
||||||
|
"type": "string"
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"/api/v1/llama-cpp/{name}/models/{model}/unload": {
|
||||||
|
"post": {
|
||||||
|
"security": [
|
||||||
|
{
|
||||||
|
"ApiKeyAuth": []
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"description": "Unloads the specified model in the given llama.cpp instance",
|
||||||
|
"tags": [
|
||||||
|
"Llama.cpp"
|
||||||
|
],
|
||||||
|
"summary": "Unload a model in a llama.cpp instance",
|
||||||
|
"parameters": [
|
||||||
|
{
|
||||||
|
"type": "string",
|
||||||
|
"description": "Instance Name",
|
||||||
|
"name": "name",
|
||||||
|
"in": "path",
|
||||||
|
"required": true
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"type": "string",
|
||||||
|
"description": "Model Name",
|
||||||
|
"name": "model",
|
||||||
|
"in": "path",
|
||||||
|
"required": true
|
||||||
|
}
|
||||||
|
],
|
||||||
|
"responses": {
|
||||||
|
"200": {
|
||||||
|
"description": "Success message",
|
||||||
|
"schema": {
|
||||||
|
"type": "object",
|
||||||
|
"additionalProperties": {
|
||||||
|
"type": "string"
|
||||||
|
}
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"400": {
|
||||||
|
"description": "Invalid request",
|
||||||
|
"schema": {
|
||||||
|
"type": "string"
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"500": {
|
||||||
|
"description": "Internal Server Error",
|
||||||
|
"schema": {
|
||||||
|
"type": "string"
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
}
|
||||||
|
},
|
||||||
"/api/v1/nodes": {
|
"/api/v1/nodes": {
|
||||||
"get": {
|
"get": {
|
||||||
"security": [
|
"security": [
|
||||||
@@ -1781,13 +1931,6 @@
|
|||||||
"config.AuthConfig": {
|
"config.AuthConfig": {
|
||||||
"type": "object",
|
"type": "object",
|
||||||
"properties": {
|
"properties": {
|
||||||
"inference_keys": {
|
|
||||||
"description": "List of keys for OpenAI compatible inference endpoints",
|
|
||||||
"type": "array",
|
|
||||||
"items": {
|
|
||||||
"type": "string"
|
|
||||||
}
|
|
||||||
},
|
|
||||||
"management_keys": {
|
"management_keys": {
|
||||||
"description": "List of keys for management endpoints",
|
"description": "List of keys for management endpoints",
|
||||||
"type": "array",
|
"type": "array",
|
||||||
@@ -1898,10 +2041,6 @@
|
|||||||
"description": "Automatically create the data directory if it doesn't exist",
|
"description": "Automatically create the data directory if it doesn't exist",
|
||||||
"type": "boolean"
|
"type": "boolean"
|
||||||
},
|
},
|
||||||
"configs_dir": {
|
|
||||||
"description": "Instance config directory override (relative to data_dir if not absolute)",
|
|
||||||
"type": "string"
|
|
||||||
},
|
|
||||||
"default_auto_restart": {
|
"default_auto_restart": {
|
||||||
"description": "Default auto-restart setting for new instances",
|
"description": "Default auto-restart setting for new instances",
|
||||||
"type": "boolean"
|
"type": "boolean"
|
||||||
@@ -1922,6 +2061,21 @@
|
|||||||
"description": "Enable LRU eviction for instance logs",
|
"description": "Enable LRU eviction for instance logs",
|
||||||
"type": "boolean"
|
"type": "boolean"
|
||||||
},
|
},
|
||||||
|
"logRotationCompress": {
|
||||||
|
"description": "Whether to compress rotated log files",
|
||||||
|
"type": "boolean",
|
||||||
|
"default": false
|
||||||
|
},
|
||||||
|
"logRotationEnabled": {
|
||||||
|
"description": "Log rotation enabled",
|
||||||
|
"type": "boolean",
|
||||||
|
"default": true
|
||||||
|
},
|
||||||
|
"logRotationMaxSize": {
|
||||||
|
"description": "Maximum log file size in MB before rotation",
|
||||||
|
"type": "integer",
|
||||||
|
"default": 100
|
||||||
|
},
|
||||||
"logs_dir": {
|
"logs_dir": {
|
||||||
"description": "Logs directory override (relative to data_dir if not absolute)",
|
"description": "Logs directory override (relative to data_dir if not absolute)",
|
||||||
"type": "string"
|
"type": "string"
|
||||||
|
|||||||
117
dev/swagger.yaml
117
dev/swagger.yaml
@@ -39,11 +39,6 @@ definitions:
|
|||||||
type: object
|
type: object
|
||||||
config.AuthConfig:
|
config.AuthConfig:
|
||||||
properties:
|
properties:
|
||||||
inference_keys:
|
|
||||||
description: List of keys for OpenAI compatible inference endpoints
|
|
||||||
items:
|
|
||||||
type: string
|
|
||||||
type: array
|
|
||||||
management_keys:
|
management_keys:
|
||||||
description: List of keys for management endpoints
|
description: List of keys for management endpoints
|
||||||
items:
|
items:
|
||||||
@@ -118,10 +113,6 @@ definitions:
|
|||||||
auto_create_dirs:
|
auto_create_dirs:
|
||||||
description: Automatically create the data directory if it doesn't exist
|
description: Automatically create the data directory if it doesn't exist
|
||||||
type: boolean
|
type: boolean
|
||||||
configs_dir:
|
|
||||||
description: Instance config directory override (relative to data_dir if not
|
|
||||||
absolute)
|
|
||||||
type: string
|
|
||||||
default_auto_restart:
|
default_auto_restart:
|
||||||
description: Default auto-restart setting for new instances
|
description: Default auto-restart setting for new instances
|
||||||
type: boolean
|
type: boolean
|
||||||
@@ -137,6 +128,18 @@ definitions:
|
|||||||
enable_lru_eviction:
|
enable_lru_eviction:
|
||||||
description: Enable LRU eviction for instance logs
|
description: Enable LRU eviction for instance logs
|
||||||
type: boolean
|
type: boolean
|
||||||
|
logRotationCompress:
|
||||||
|
default: false
|
||||||
|
description: Whether to compress rotated log files
|
||||||
|
type: boolean
|
||||||
|
logRotationEnabled:
|
||||||
|
default: true
|
||||||
|
description: Log rotation enabled
|
||||||
|
type: boolean
|
||||||
|
logRotationMaxSize:
|
||||||
|
default: 100
|
||||||
|
description: Maximum log file size in MB before rotation
|
||||||
|
type: integer
|
||||||
logs_dir:
|
logs_dir:
|
||||||
description: Logs directory override (relative to data_dir if not absolute)
|
description: Logs directory override (relative to data_dir if not absolute)
|
||||||
type: string
|
type: string
|
||||||
@@ -955,6 +958,102 @@ paths:
|
|||||||
summary: Stop a running instance
|
summary: Stop a running instance
|
||||||
tags:
|
tags:
|
||||||
- Instances
|
- Instances
|
||||||
|
/api/v1/llama-cpp/{name}/models:
|
||||||
|
get:
|
||||||
|
description: Returns a list of models available in the specified llama.cpp instance
|
||||||
|
parameters:
|
||||||
|
- description: Instance Name
|
||||||
|
in: path
|
||||||
|
name: name
|
||||||
|
required: true
|
||||||
|
type: string
|
||||||
|
responses:
|
||||||
|
"200":
|
||||||
|
description: Models list response
|
||||||
|
schema:
|
||||||
|
additionalProperties: true
|
||||||
|
type: object
|
||||||
|
"400":
|
||||||
|
description: Invalid instance
|
||||||
|
schema:
|
||||||
|
type: string
|
||||||
|
"500":
|
||||||
|
description: Internal Server Error
|
||||||
|
schema:
|
||||||
|
type: string
|
||||||
|
security:
|
||||||
|
- ApiKeyAuth: []
|
||||||
|
summary: List models in a llama.cpp instance
|
||||||
|
tags:
|
||||||
|
- Llama.cpp
|
||||||
|
/api/v1/llama-cpp/{name}/models/{model}/load:
|
||||||
|
post:
|
||||||
|
description: Loads the specified model in the given llama.cpp instance
|
||||||
|
parameters:
|
||||||
|
- description: Instance Name
|
||||||
|
in: path
|
||||||
|
name: name
|
||||||
|
required: true
|
||||||
|
type: string
|
||||||
|
- description: Model Name
|
||||||
|
in: path
|
||||||
|
name: model
|
||||||
|
required: true
|
||||||
|
type: string
|
||||||
|
responses:
|
||||||
|
"200":
|
||||||
|
description: Success message
|
||||||
|
schema:
|
||||||
|
additionalProperties:
|
||||||
|
type: string
|
||||||
|
type: object
|
||||||
|
"400":
|
||||||
|
description: Invalid request
|
||||||
|
schema:
|
||||||
|
type: string
|
||||||
|
"500":
|
||||||
|
description: Internal Server Error
|
||||||
|
schema:
|
||||||
|
type: string
|
||||||
|
security:
|
||||||
|
- ApiKeyAuth: []
|
||||||
|
summary: Load a model in a llama.cpp instance
|
||||||
|
tags:
|
||||||
|
- Llama.cpp
|
||||||
|
/api/v1/llama-cpp/{name}/models/{model}/unload:
|
||||||
|
post:
|
||||||
|
description: Unloads the specified model in the given llama.cpp instance
|
||||||
|
parameters:
|
||||||
|
- description: Instance Name
|
||||||
|
in: path
|
||||||
|
name: name
|
||||||
|
required: true
|
||||||
|
type: string
|
||||||
|
- description: Model Name
|
||||||
|
in: path
|
||||||
|
name: model
|
||||||
|
required: true
|
||||||
|
type: string
|
||||||
|
responses:
|
||||||
|
"200":
|
||||||
|
description: Success message
|
||||||
|
schema:
|
||||||
|
additionalProperties:
|
||||||
|
type: string
|
||||||
|
type: object
|
||||||
|
"400":
|
||||||
|
description: Invalid request
|
||||||
|
schema:
|
||||||
|
type: string
|
||||||
|
"500":
|
||||||
|
description: Internal Server Error
|
||||||
|
schema:
|
||||||
|
type: string
|
||||||
|
security:
|
||||||
|
- ApiKeyAuth: []
|
||||||
|
summary: Unload a model in a llama.cpp instance
|
||||||
|
tags:
|
||||||
|
- Llama.cpp
|
||||||
/api/v1/nodes:
|
/api/v1/nodes:
|
||||||
get:
|
get:
|
||||||
description: Returns a map of all nodes configured in the server (node name
|
description: Returns a map of all nodes configured in the server (node name
|
||||||
|
|||||||
Reference in New Issue
Block a user