Skip to content

Commit

Permalink
feat:nvidia add nemotron4-340b and microsoft/phi-3 (#6973)
Browse files Browse the repository at this point in the history
  • Loading branch information
sulgweb authored Aug 6, 2024
1 parent 312d905 commit 23ed15d
Show file tree
Hide file tree
Showing 5 changed files with 115 additions and 2 deletions.
Original file line number Diff line number Diff line change
Expand Up @@ -10,5 +10,8 @@
- mistralai/mistral-large
- mistralai/mixtral-8x7b-instruct-v0.1
- mistralai/mixtral-8x22b-instruct-v0.1
- nvidia/nemotron-4-340b-instruct
- microsoft/phi-3-medium-128k-instruct
- microsoft/phi-3-mini-128k-instruct
- fuyu-8b
- snowflake/arctic
6 changes: 4 additions & 2 deletions api/core/model_runtime/model_providers/nvidia/llm/llm.py
Original file line number Diff line number Diff line change
Expand Up @@ -34,8 +34,10 @@ class NVIDIALargeLanguageModel(OAIAPICompatLargeLanguageModel):
'meta/llama-3.1-8b-instruct': '',
'meta/llama-3.1-70b-instruct': '',
'meta/llama-3.1-405b-instruct': '',
'google/recurrentgemma-2b': ''

'google/recurrentgemma-2b': '',
'nvidia/nemotron-4-340b-instruct': '',
'microsoft/phi-3-medium-128k-instruct':'',
'microsoft/phi-3-mini-128k-instruct':''
}

def _invoke(self, model: str, credentials: dict,
Expand Down
Original file line number Diff line number Diff line change
@@ -0,0 +1,36 @@
# Model configuration for nvidia/nemotron-4-340b-instruct.
model: nvidia/nemotron-4-340b-instruct
label:
  zh_Hans: nvidia/nemotron-4-340b-instruct
  en_US: nvidia/nemotron-4-340b-instruct
model_type: llm
features:
  - agent-thought
model_properties:
  mode: chat
  # Nemotron-4-340B-Instruct has a 4,096-token context window per NVIDIA's
  # model card; the previous value (131072) matched the "128k" phi-3 models
  # and overstated what this model can accept.
  context_size: 4096
parameter_rules:
  - name: temperature
    use_template: temperature
    min: 0
    max: 1
    default: 0.5
  - name: top_p
    use_template: top_p
    min: 0
    max: 1
    default: 1
  # NOTE(review): the upper bound equals the full context window, so a
  # request at the maximum leaves no room for the prompt — confirm the
  # limit the NVIDIA endpoint actually enforces.
  - name: max_tokens
    use_template: max_tokens
    min: 1
    max: 4096
    default: 1024
  - name: frequency_penalty
    use_template: frequency_penalty
    min: -2
    max: 2
    default: 0
  - name: presence_penalty
    use_template: presence_penalty
    min: -2
    max: 2
    default: 0
Original file line number Diff line number Diff line change
@@ -0,0 +1,36 @@
# Model configuration for microsoft/phi-3-medium-128k-instruct.
model: microsoft/phi-3-medium-128k-instruct
label:
  zh_Hans: microsoft/phi-3-medium-128k-instruct
  en_US: microsoft/phi-3-medium-128k-instruct
model_type: llm
features:
  - agent-thought
model_properties:
  mode: chat
  # 128 * 1024 tokens, matching the "128k" in the model name.
  context_size: 131072
parameter_rules:
  - name: temperature
    use_template: temperature
    min: 0
    max: 1
    default: 0.5
  - name: top_p
    use_template: top_p
    min: 0
    max: 1
    default: 1
  - name: max_tokens
    use_template: max_tokens
    min: 1
    max: 4096
    default: 1024
  - name: frequency_penalty
    use_template: frequency_penalty
    min: -2
    max: 2
    default: 0
  - name: presence_penalty
    use_template: presence_penalty
    min: -2
    max: 2
    default: 0
Original file line number Diff line number Diff line change
@@ -0,0 +1,36 @@
# Model configuration for microsoft/phi-3-mini-128k-instruct.
model: microsoft/phi-3-mini-128k-instruct
label:
  zh_Hans: microsoft/phi-3-mini-128k-instruct
  en_US: microsoft/phi-3-mini-128k-instruct
model_type: llm
features:
  - agent-thought
model_properties:
  mode: chat
  # 128 * 1024 tokens, matching the "128k" in the model name.
  context_size: 131072
parameter_rules:
  - name: temperature
    use_template: temperature
    min: 0
    max: 1
    default: 0.5
  - name: top_p
    use_template: top_p
    min: 0
    max: 1
    default: 1
  - name: max_tokens
    use_template: max_tokens
    min: 1
    max: 4096
    default: 1024
  - name: frequency_penalty
    use_template: frequency_penalty
    min: -2
    max: 2
    default: 0
  - name: presence_penalty
    use_template: presence_penalty
    min: -2
    max: 2
    default: 0

0 comments on commit 23ed15d

Please sign in to comment.