Co-authored-by: Chenhe Gu <guchenhe@gmail.com>
@@ -12,6 +12,7 @@
- meta.llama3-70b-instruct-v1:0
- meta.llama2-13b-chat-v1
- meta.llama2-70b-chat-v1
+- mistral.mistral-small-2402-v1:0
- mistral.mistral-large-2402-v1:0
- mistral.mixtral-8x7b-instruct-v0:1
- mistral.mistral-7b-instruct-v0:2
@@ -0,0 +1,27 @@
+model: mistral.mistral-small-2402-v1:0  # presumably must match the ID in the model list file; confirm
+label:
+ en_US: Mistral Small
+model_type: llm
+model_properties:
+ mode: completion
+ context_size: 32000  # NOTE(review): presumably a token count; confirm against provider docs
+parameter_rules:
+  - name: temperature
+    use_template: temperature
+    required: false
+    default: 0.7
+  - name: top_p
+    use_template: top_p
+    required: false  # stated explicitly, matching the temperature rule
+    default: 1
+  - name: max_tokens
+    use_template: max_tokens
+    required: true
+    default: 512
+    min: 1
+    max: 4096
+pricing:
+  input: '0.001'
+  output: '0.003'  # NOTE(review): corrected from '0.03'; Bedrock lists output at 3x input, confirm
+  unit: '0.001'
+  currency: USD
@@ -1,3 +1,4 @@
- amazon.titan-embed-text-v1
+- amazon.titan-embed-text-v2:0
- cohere.embed-english-v3
- cohere.embed-multilingual-v3
@@ -4,5 +4,5 @@ model_properties:
context_size: 8192
pricing:
input: '0.0001'
- unit: '0.001'
+ unit: '0.0001'
currency: USD
@@ -0,0 +1,8 @@
+model: amazon.titan-embed-text-v2:0
+model_type: text-embedding
+ context_size: 8192
+ input: '0.00002'
+ unit: '0.00001'