Skip to content

Commit

Permalink
Deployed bd77a0a with MkDocs version: 1.4.3
Browse files Browse the repository at this point in the history
  • Loading branch information
Unknown committed Nov 19, 2024
1 parent 682edb4 commit dfb9b86
Show file tree
Hide file tree
Showing 3 changed files with 35 additions and 20 deletions.
53 changes: 34 additions & 19 deletions api/python_client/index.html
Original file line number Diff line number Diff line change
Expand Up @@ -2868,25 +2868,26 @@ <h3 id="llmengine.Model.create" class="doc doc-heading">
<a id="__codelineno-0-7" name="__codelineno-0-7" href="#__codelineno-0-7"></a> num_shards: <span style="color: #008000">int</span> <span style="color: #666666">=</span> <span style="color: #666666">1</span>,
<a id="__codelineno-0-8" name="__codelineno-0-8" href="#__codelineno-0-8"></a> quantize: Optional[Quantization] <span style="color: #666666">=</span> <span style="color: #008000; font-weight: bold">None</span>,
<a id="__codelineno-0-9" name="__codelineno-0-9" href="#__codelineno-0-9"></a> checkpoint_path: Optional[<span style="color: #008000">str</span>] <span style="color: #666666">=</span> <span style="color: #008000; font-weight: bold">None</span>,
<a id="__codelineno-0-10" name="__codelineno-0-10" href="#__codelineno-0-10"></a> cpus: Optional[<span style="color: #008000">int</span>] <span style="color: #666666">=</span> <span style="color: #008000; font-weight: bold">None</span>,
<a id="__codelineno-0-11" name="__codelineno-0-11" href="#__codelineno-0-11"></a> memory: Optional[<span style="color: #008000">str</span>] <span style="color: #666666">=</span> <span style="color: #008000; font-weight: bold">None</span>,
<a id="__codelineno-0-12" name="__codelineno-0-12" href="#__codelineno-0-12"></a> storage: Optional[<span style="color: #008000">str</span>] <span style="color: #666666">=</span> <span style="color: #008000; font-weight: bold">None</span>,
<a id="__codelineno-0-13" name="__codelineno-0-13" href="#__codelineno-0-13"></a> gpus: Optional[<span style="color: #008000">int</span>] <span style="color: #666666">=</span> <span style="color: #008000; font-weight: bold">None</span>,
<a id="__codelineno-0-14" name="__codelineno-0-14" href="#__codelineno-0-14"></a> nodes_per_worker: <span style="color: #008000">int</span> <span style="color: #666666">=</span> <span style="color: #666666">1</span>,
<a id="__codelineno-0-15" name="__codelineno-0-15" href="#__codelineno-0-15"></a> min_workers: <span style="color: #008000">int</span> <span style="color: #666666">=</span> <span style="color: #666666">0</span>,
<a id="__codelineno-0-16" name="__codelineno-0-16" href="#__codelineno-0-16"></a> max_workers: <span style="color: #008000">int</span> <span style="color: #666666">=</span> <span style="color: #666666">1</span>,
<a id="__codelineno-0-17" name="__codelineno-0-17" href="#__codelineno-0-17"></a> per_worker: <span style="color: #008000">int</span> <span style="color: #666666">=</span> <span style="color: #666666">2</span>,
<a id="__codelineno-0-18" name="__codelineno-0-18" href="#__codelineno-0-18"></a> endpoint_type: ModelEndpointType <span style="color: #666666">=</span> ModelEndpointType<span style="color: #666666">.</span>STREAMING,
<a id="__codelineno-0-19" name="__codelineno-0-19" href="#__codelineno-0-19"></a> gpu_type: Optional[<span style="color: #008000">str</span>] <span style="color: #666666">=</span> <span style="color: #008000; font-weight: bold">None</span>,
<a id="__codelineno-0-20" name="__codelineno-0-20" href="#__codelineno-0-20"></a> high_priority: Optional[<span style="color: #008000">bool</span>] <span style="color: #666666">=</span> <span style="color: #008000; font-weight: bold">False</span>,
<a id="__codelineno-0-21" name="__codelineno-0-21" href="#__codelineno-0-21"></a> post_inference_hooks: Optional[
<a id="__codelineno-0-22" name="__codelineno-0-22" href="#__codelineno-0-22"></a> List[PostInferenceHooks]
<a id="__codelineno-0-23" name="__codelineno-0-23" href="#__codelineno-0-23"></a> ] <span style="color: #666666">=</span> <span style="color: #008000; font-weight: bold">None</span>,
<a id="__codelineno-0-24" name="__codelineno-0-24" href="#__codelineno-0-24"></a> default_callback_url: Optional[<span style="color: #008000">str</span>] <span style="color: #666666">=</span> <span style="color: #008000; font-weight: bold">None</span>,
<a id="__codelineno-0-25" name="__codelineno-0-25" href="#__codelineno-0-25"></a> public_inference: Optional[<span style="color: #008000">bool</span>] <span style="color: #666666">=</span> <span style="color: #008000; font-weight: bold">True</span>,
<a id="__codelineno-0-26" name="__codelineno-0-26" href="#__codelineno-0-26"></a> labels: Optional[Dict[<span style="color: #008000">str</span>, <span style="color: #008000">str</span>]] <span style="color: #666666">=</span> <span style="color: #008000; font-weight: bold">None</span>,
<a id="__codelineno-0-27" name="__codelineno-0-27" href="#__codelineno-0-27"></a> request_headers: Optional[Dict[<span style="color: #008000">str</span>, <span style="color: #008000">str</span>]] <span style="color: #666666">=</span> <span style="color: #008000; font-weight: bold">None</span>,
<a id="__codelineno-0-28" name="__codelineno-0-28" href="#__codelineno-0-28"></a>) <span style="color: #666666">-&gt;</span> CreateLLMEndpointResponse
<a id="__codelineno-0-10" name="__codelineno-0-10" href="#__codelineno-0-10"></a> max_model_len: Optional[<span style="color: #008000">int</span>] <span style="color: #666666">=</span> <span style="color: #008000; font-weight: bold">None</span>,
<a id="__codelineno-0-11" name="__codelineno-0-11" href="#__codelineno-0-11"></a> cpus: Optional[<span style="color: #008000">int</span>] <span style="color: #666666">=</span> <span style="color: #008000; font-weight: bold">None</span>,
<a id="__codelineno-0-12" name="__codelineno-0-12" href="#__codelineno-0-12"></a> memory: Optional[<span style="color: #008000">str</span>] <span style="color: #666666">=</span> <span style="color: #008000; font-weight: bold">None</span>,
<a id="__codelineno-0-13" name="__codelineno-0-13" href="#__codelineno-0-13"></a> storage: Optional[<span style="color: #008000">str</span>] <span style="color: #666666">=</span> <span style="color: #008000; font-weight: bold">None</span>,
<a id="__codelineno-0-14" name="__codelineno-0-14" href="#__codelineno-0-14"></a> gpus: Optional[<span style="color: #008000">int</span>] <span style="color: #666666">=</span> <span style="color: #008000; font-weight: bold">None</span>,
<a id="__codelineno-0-15" name="__codelineno-0-15" href="#__codelineno-0-15"></a> nodes_per_worker: <span style="color: #008000">int</span> <span style="color: #666666">=</span> <span style="color: #666666">1</span>,
<a id="__codelineno-0-16" name="__codelineno-0-16" href="#__codelineno-0-16"></a> min_workers: <span style="color: #008000">int</span> <span style="color: #666666">=</span> <span style="color: #666666">0</span>,
<a id="__codelineno-0-17" name="__codelineno-0-17" href="#__codelineno-0-17"></a> max_workers: <span style="color: #008000">int</span> <span style="color: #666666">=</span> <span style="color: #666666">1</span>,
<a id="__codelineno-0-18" name="__codelineno-0-18" href="#__codelineno-0-18"></a> per_worker: <span style="color: #008000">int</span> <span style="color: #666666">=</span> <span style="color: #666666">2</span>,
<a id="__codelineno-0-19" name="__codelineno-0-19" href="#__codelineno-0-19"></a> endpoint_type: ModelEndpointType <span style="color: #666666">=</span> ModelEndpointType<span style="color: #666666">.</span>STREAMING,
<a id="__codelineno-0-20" name="__codelineno-0-20" href="#__codelineno-0-20"></a> gpu_type: Optional[<span style="color: #008000">str</span>] <span style="color: #666666">=</span> <span style="color: #008000; font-weight: bold">None</span>,
<a id="__codelineno-0-21" name="__codelineno-0-21" href="#__codelineno-0-21"></a> high_priority: Optional[<span style="color: #008000">bool</span>] <span style="color: #666666">=</span> <span style="color: #008000; font-weight: bold">False</span>,
<a id="__codelineno-0-22" name="__codelineno-0-22" href="#__codelineno-0-22"></a> post_inference_hooks: Optional[
<a id="__codelineno-0-23" name="__codelineno-0-23" href="#__codelineno-0-23"></a> List[PostInferenceHooks]
<a id="__codelineno-0-24" name="__codelineno-0-24" href="#__codelineno-0-24"></a> ] <span style="color: #666666">=</span> <span style="color: #008000; font-weight: bold">None</span>,
<a id="__codelineno-0-25" name="__codelineno-0-25" href="#__codelineno-0-25"></a> default_callback_url: Optional[<span style="color: #008000">str</span>] <span style="color: #666666">=</span> <span style="color: #008000; font-weight: bold">None</span>,
<a id="__codelineno-0-26" name="__codelineno-0-26" href="#__codelineno-0-26"></a> public_inference: Optional[<span style="color: #008000">bool</span>] <span style="color: #666666">=</span> <span style="color: #008000; font-weight: bold">True</span>,
<a id="__codelineno-0-27" name="__codelineno-0-27" href="#__codelineno-0-27"></a> labels: Optional[Dict[<span style="color: #008000">str</span>, <span style="color: #008000">str</span>]] <span style="color: #666666">=</span> <span style="color: #008000; font-weight: bold">None</span>,
<a id="__codelineno-0-28" name="__codelineno-0-28" href="#__codelineno-0-28"></a> request_headers: Optional[Dict[<span style="color: #008000">str</span>, <span style="color: #008000">str</span>]] <span style="color: #666666">=</span> <span style="color: #008000; font-weight: bold">None</span>,
<a id="__codelineno-0-29" name="__codelineno-0-29" href="#__codelineno-0-29"></a>) <span style="color: #666666">-&gt;</span> CreateLLMEndpointResponse
</code></pre></div>

<div class="doc doc-contents ">
Expand Down Expand Up @@ -3023,6 +3024,20 @@ <h3 id="llmengine.Model.create" class="doc doc-heading">
<code>None</code>
</td>
</tr>
<tr class="doc-section-item">
<td><code>max_model_len</code></td>
<td>
<code>Optional[int]</code>
</td>
<td>
<div class="doc-md-description">
<p>Model context length. If unspecified, will be automatically derived from the model config.</p>
</div>
</td>
<td>
<code>None</code>
</td>
</tr>
<tr class="doc-section-item">
<td><code>cpus</code></td>
<td>
Expand Down
2 changes: 1 addition & 1 deletion search/search_index.json

Large diffs are not rendered by default.

Binary file modified sitemap.xml.gz
Binary file not shown.

0 comments on commit dfb9b86

Please sign in to comment.