# Mirror of https://github.com/CherryHQ/cherry-studio.git
# Synced 2026-01-02 10:29:02 +08:00
# Original listing: 40 lines, 1.3 KiB, YAML
# Model catalog entry for microsoft/phi-3-medium-128k-instruct.
# NOTE(review): this copy was recovered from a flattened listing; the nesting
# under `architecture`, `pricing` and `supported_parameters` was reconstructed
# from key order -- verify against the consumer's schema.
id: microsoft/phi-3-medium-128k-instruct
canonical_slug: microsoft/phi-3-medium-128k-instruct
hugging_face_id: microsoft/Phi-3-medium-128k-instruct
name: 'Microsoft: Phi-3 Medium 128K Instruct'
type: chat
# Presumably Unix epoch seconds (would be 2024-05-24 UTC) -- TODO confirm.
created: 1716508800
# Literal block with stripped trailing newline; paragraph breaks are preserved.
description: |-
  Phi-3 128K Medium is a powerful 14-billion parameter model designed for advanced language understanding, reasoning, and instruction following. Optimized through supervised fine-tuning and preference adjustments, it excels in tasks involving common sense, mathematics, logical reasoning, and code processing.

  At time of release, Phi-3 Medium demonstrated state-of-the-art performance among lightweight models. In the MMLU-Pro eval, the model even comes close to a Llama3 70B level of performance.

  For 4k context length, try [Phi-3 Medium 4K](/models/microsoft/phi-3-medium-4k-instruct).
context_length: 128000
architecture:
  modality: text->text
  input_modalities:
    - text
  output_modalities:
    - text
  tokenizer: Other
  instruct_type: phi3
# Prices are kept as quoted strings so parsers do not retype them as floats.
# Empty strings are preserved as-is; presumably "not applicable" -- confirm.
pricing:
  prompt: '0.000001'
  completion: '0.000001'
  input_cache_read: ''
  input_cache_write: ''
  request: '0'
  image: '0'
  web_search: '0'
  internal_reasoning: '0'
  # NOTE(review): `unit`/`currency` assumed to belong to `pricing` -- confirm.
  unit: 1
  currency: USD
supported_parameters:
  - tools
  - tool_choice
  - max_tokens
  - temperature
  - top_p
model_provider: microsoft