diff --git a/src/converters/utils.js b/src/converters/utils.js index a7501c4..7797a5e 100644 --- a/src/converters/utils.js +++ b/src/converters/utils.js @@ -17,16 +17,16 @@ export const DEFAULT_TOP_P = 0.95; // ============================================================================= // OpenAI 相关常量 // ============================================================================= -export const OPENAI_DEFAULT_MAX_TOKENS = 64000; +export const OPENAI_DEFAULT_MAX_TOKENS = 128000; export const OPENAI_DEFAULT_TEMPERATURE = 1; export const OPENAI_DEFAULT_TOP_P = 0.95; export const OPENAI_DEFAULT_INPUT_TOKEN_LIMIT = 32768; -export const OPENAI_DEFAULT_OUTPUT_TOKEN_LIMIT = 64000; +export const OPENAI_DEFAULT_OUTPUT_TOKEN_LIMIT = 128000; // ============================================================================= // Claude 相关常量 // ============================================================================= -export const CLAUDE_DEFAULT_MAX_TOKENS = 64000; +export const CLAUDE_DEFAULT_MAX_TOKENS = 200000; export const CLAUDE_DEFAULT_TEMPERATURE = 1; export const CLAUDE_DEFAULT_TOP_P = 0.95; @@ -37,89 +37,89 @@ export const GEMINI_DEFAULT_MAX_TOKENS = 65534; export const GEMINI_DEFAULT_TEMPERATURE = 1; export const GEMINI_DEFAULT_TOP_P = 0.95; export const GEMINI_DEFAULT_INPUT_TOKEN_LIMIT = 32768; -export const GEMINI_DEFAULT_OUTPUT_TOKEN_LIMIT = 64000; +export const GEMINI_DEFAULT_OUTPUT_TOKEN_LIMIT = 65534; // ============================================================================= // OpenAI Responses 相关常量 // ============================================================================= -export const OPENAI_RESPONSES_DEFAULT_MAX_TOKENS = 4096; +export const OPENAI_RESPONSES_DEFAULT_MAX_TOKENS = 128000; export const OPENAI_RESPONSES_DEFAULT_TEMPERATURE = 1; export const OPENAI_RESPONSES_DEFAULT_TOP_P = 0.95; export const OPENAI_RESPONSES_DEFAULT_INPUT_TOKEN_LIMIT = 32768; -export const OPENAI_RESPONSES_DEFAULT_OUTPUT_TOKEN_LIMIT = 64000; +export const OPENAI_RESPONSES_DEFAULT_OUTPUT_TOKEN_LIMIT = 128000; // ============================================================================= // Ollama 相关常量 // ============================================================================= -export const OLLAMA_DEFAULT_CONTEXT_LENGTH = 64000; -export const OLLAMA_DEFAULT_MAX_OUTPUT_TOKENS = 4096; +export const OLLAMA_DEFAULT_CONTEXT_LENGTH = 65534; +export const OLLAMA_DEFAULT_MAX_OUTPUT_TOKENS = 8192; // Claude 模型上下文长度 export const OLLAMA_CLAUDE_DEFAULT_CONTEXT_LENGTH = 200000; export const OLLAMA_CLAUDE_SONNET_45_CONTEXT_LENGTH = 200000; -export const OLLAMA_CLAUDE_SONNET_45_MAX_OUTPUT_TOKENS = 64000; +export const OLLAMA_CLAUDE_SONNET_45_MAX_OUTPUT_TOKENS = 200000; export const OLLAMA_CLAUDE_HAIKU_45_CONTEXT_LENGTH = 200000; -export const OLLAMA_CLAUDE_HAIKU_45_MAX_OUTPUT_TOKENS = 64000; +export const OLLAMA_CLAUDE_HAIKU_45_MAX_OUTPUT_TOKENS = 200000; export const OLLAMA_CLAUDE_OPUS_41_CONTEXT_LENGTH = 200000; export const OLLAMA_CLAUDE_OPUS_41_MAX_OUTPUT_TOKENS = 32000; export const OLLAMA_CLAUDE_SONNET_40_CONTEXT_LENGTH = 200000; -export const OLLAMA_CLAUDE_SONNET_40_MAX_OUTPUT_TOKENS = 64000; +export const OLLAMA_CLAUDE_SONNET_40_MAX_OUTPUT_TOKENS = 200000; export const OLLAMA_CLAUDE_SONNET_37_CONTEXT_LENGTH = 200000; -export const OLLAMA_CLAUDE_SONNET_37_MAX_OUTPUT_TOKENS = 64000; +export const OLLAMA_CLAUDE_SONNET_37_MAX_OUTPUT_TOKENS = 200000; export const OLLAMA_CLAUDE_OPUS_40_CONTEXT_LENGTH = 200000; export const OLLAMA_CLAUDE_OPUS_40_MAX_OUTPUT_TOKENS = 32000; export const OLLAMA_CLAUDE_HAIKU_35_CONTEXT_LENGTH = 200000; -export const OLLAMA_CLAUDE_HAIKU_35_MAX_OUTPUT_TOKENS = 64000; +export const OLLAMA_CLAUDE_HAIKU_35_MAX_OUTPUT_TOKENS = 200000; export const OLLAMA_CLAUDE_HAIKU_30_CONTEXT_LENGTH = 200000; -export const OLLAMA_CLAUDE_HAIKU_30_MAX_OUTPUT_TOKENS = 4096; +export const OLLAMA_CLAUDE_HAIKU_30_MAX_OUTPUT_TOKENS = 8192; export const OLLAMA_CLAUDE_SONNET_35_CONTEXT_LENGTH = 200000; -export const OLLAMA_CLAUDE_SONNET_35_MAX_OUTPUT_TOKENS = 64000; +export const OLLAMA_CLAUDE_SONNET_35_MAX_OUTPUT_TOKENS = 200000; export const OLLAMA_CLAUDE_OPUS_30_CONTEXT_LENGTH = 200000; -export const OLLAMA_CLAUDE_OPUS_30_MAX_OUTPUT_TOKENS = 4096; +export const OLLAMA_CLAUDE_OPUS_30_MAX_OUTPUT_TOKENS = 8192; // Gemini 模型上下文长度 export const OLLAMA_GEMINI_25_PRO_CONTEXT_LENGTH = 1048576; -export const OLLAMA_GEMINI_25_PRO_MAX_OUTPUT_TOKENS = 65536; +export const OLLAMA_GEMINI_25_PRO_MAX_OUTPUT_TOKENS = 65534; export const OLLAMA_GEMINI_25_FLASH_CONTEXT_LENGTH = 1048576; -export const OLLAMA_GEMINI_25_FLASH_MAX_OUTPUT_TOKENS = 65536; -export const OLLAMA_GEMINI_25_IMAGE_CONTEXT_LENGTH = 65536; +export const OLLAMA_GEMINI_25_FLASH_MAX_OUTPUT_TOKENS = 65534; +export const OLLAMA_GEMINI_25_IMAGE_CONTEXT_LENGTH = 65534; export const OLLAMA_GEMINI_25_IMAGE_MAX_OUTPUT_TOKENS = 32768; export const OLLAMA_GEMINI_25_LIVE_CONTEXT_LENGTH = 131072; -export const OLLAMA_GEMINI_25_LIVE_MAX_OUTPUT_TOKENS = 64000; -export const OLLAMA_GEMINI_25_TTS_CONTEXT_LENGTH = 64000; +export const OLLAMA_GEMINI_25_LIVE_MAX_OUTPUT_TOKENS = 65534; +export const OLLAMA_GEMINI_25_TTS_CONTEXT_LENGTH = 65534; export const OLLAMA_GEMINI_25_TTS_MAX_OUTPUT_TOKENS = 16384; export const OLLAMA_GEMINI_20_FLASH_CONTEXT_LENGTH = 1048576; -export const OLLAMA_GEMINI_20_FLASH_MAX_OUTPUT_TOKENS = 64000; +export const OLLAMA_GEMINI_20_FLASH_MAX_OUTPUT_TOKENS = 65534; export const OLLAMA_GEMINI_20_IMAGE_CONTEXT_LENGTH = 32768; -export const OLLAMA_GEMINI_20_IMAGE_MAX_OUTPUT_TOKENS = 64000; +export const OLLAMA_GEMINI_20_IMAGE_MAX_OUTPUT_TOKENS = 65534; export const OLLAMA_GEMINI_15_PRO_CONTEXT_LENGTH = 2097152; -export const OLLAMA_GEMINI_15_PRO_MAX_OUTPUT_TOKENS = 64000; +export const OLLAMA_GEMINI_15_PRO_MAX_OUTPUT_TOKENS = 65534; export const OLLAMA_GEMINI_15_FLASH_CONTEXT_LENGTH = 1048576; -export const OLLAMA_GEMINI_15_FLASH_MAX_OUTPUT_TOKENS = 64000; +export const OLLAMA_GEMINI_15_FLASH_MAX_OUTPUT_TOKENS = 65534; export const OLLAMA_GEMINI_DEFAULT_CONTEXT_LENGTH = 1048576; -export const OLLAMA_GEMINI_DEFAULT_MAX_OUTPUT_TOKENS = 64000; +export const OLLAMA_GEMINI_DEFAULT_MAX_OUTPUT_TOKENS = 65534; // GPT 模型上下文长度 export const OLLAMA_GPT4_TURBO_CONTEXT_LENGTH = 128000; -export const OLLAMA_GPT4_TURBO_MAX_OUTPUT_TOKENS = 4096; +export const OLLAMA_GPT4_TURBO_MAX_OUTPUT_TOKENS = 8192; export const OLLAMA_GPT4_32K_CONTEXT_LENGTH = 32768; -export const OLLAMA_GPT4_32K_MAX_OUTPUT_TOKENS = 4096; -export const OLLAMA_GPT4_BASE_CONTEXT_LENGTH = 64000; -export const OLLAMA_GPT4_BASE_MAX_OUTPUT_TOKENS = 4096; +export const OLLAMA_GPT4_32K_MAX_OUTPUT_TOKENS = 8192; +export const OLLAMA_GPT4_BASE_CONTEXT_LENGTH = 200000; +export const OLLAMA_GPT4_BASE_MAX_OUTPUT_TOKENS = 8192; export const OLLAMA_GPT35_16K_CONTEXT_LENGTH = 16385; -export const OLLAMA_GPT35_16K_MAX_OUTPUT_TOKENS = 4096; -export const OLLAMA_GPT35_BASE_CONTEXT_LENGTH = 4096; -export const OLLAMA_GPT35_BASE_MAX_OUTPUT_TOKENS = 4096; +export const OLLAMA_GPT35_16K_MAX_OUTPUT_TOKENS = 8192; +export const OLLAMA_GPT35_BASE_CONTEXT_LENGTH = 8192; +export const OLLAMA_GPT35_BASE_MAX_OUTPUT_TOKENS = 8192; // Qwen 模型上下文长度 export const OLLAMA_QWEN_CODER_PLUS_CONTEXT_LENGTH = 128000; -export const OLLAMA_QWEN_CODER_PLUS_MAX_OUTPUT_TOKENS = 65536; +export const OLLAMA_QWEN_CODER_PLUS_MAX_OUTPUT_TOKENS = 65534; export const OLLAMA_QWEN_VL_PLUS_CONTEXT_LENGTH = 262144; export const OLLAMA_QWEN_VL_PLUS_MAX_OUTPUT_TOKENS = 32768; export const OLLAMA_QWEN_CODER_FLASH_CONTEXT_LENGTH = 128000; -export const OLLAMA_QWEN_CODER_FLASH_MAX_OUTPUT_TOKENS = 65536; +export const OLLAMA_QWEN_CODER_FLASH_MAX_OUTPUT_TOKENS = 65534; export const OLLAMA_QWEN_DEFAULT_CONTEXT_LENGTH = 32768; -export const OLLAMA_QWEN_DEFAULT_MAX_OUTPUT_TOKENS = 64000; +export const OLLAMA_QWEN_DEFAULT_MAX_OUTPUT_TOKENS = 200000; export const OLLAMA_DEFAULT_FILE_TYPE = 2; export const OLLAMA_DEFAULT_QUANTIZATION_VERSION = 2;