Merge pull request #201 from notV3NOM/main
Fix: simulstreaming preload model count argument in cli
This commit is contained in:
commit
84890b8e61
2 changed files with 3 additions and 3 deletions
|
|
@@ -177,7 +177,7 @@ The rest I don't recommend. But below are your options.
|
|||
| `--static-init-prompt` | Static prompt that doesn't scroll | `None` |
|
||||
| `--max-context-tokens` | Maximum context tokens | `None` |
|
||||
| `--model-path` | Direct path to .pt model file. Download it if not found | `./base.pt` |
|
||||
| `--preloaded-model-count` | Optional. Number of models to preload in memory to speed up loading (set up to the expected number of concurrent users) | `1` |
|
||||
| `--preload-model-count` | Optional. Number of models to preload in memory to speed up loading (set up to the expected number of concurrent users) | `1` |
|
||||
|
||||
|
||||
| WhisperStreaming backend options | Description | Default |
|
||||
|
|
|
|||
|
|
@@ -269,10 +269,10 @@ def parse_args():
|
|||
)
|
||||
|
||||
simulstreaming_group.add_argument(
|
||||
"--preloaded_model_count",
|
||||
"--preload-model-count",
|
||||
type=int,
|
||||
default=1,
|
||||
dest="preloaded_model_count",
|
||||
dest="preload_model_count",
|
||||
help="Optional. Number of models to preload in memory to speed up loading (set up to the expected number of concurrent instances).",
|
||||
)
|
||||
|
||||
|
|
|
|||
Loading…
Reference in a new issue