chatlawv1 / trlx /examples /hh /triton_config.pbtxt
teachyourselfcoding's picture
Upload 245 files
fa6856c
raw
history blame
624 Bytes
# Triton Inference Server model configuration for a traced PyTorch model
# that takes token ids and returns a "rewards" tensor.
#
# NOTE(review): the model-name placeholder below appears twice and is
# presumably filled in by a deployment script before this file is used;
# keep the placeholder syntax intact and avoid adding placeholder-like
# text to comments.

# --- Model identity and backend -------------------------------------------
name: "${model_name}"
backend: "pytorch"
default_model_filename: "traced-model.pt"

# Serve only version 1 of the model.
version_policy {
  specific {
    versions: [ 1 ]
  }
}

# Upper bound on the batch size Triton will send to the model. Because
# batching is enabled, the dims below do not include the batch dimension.
max_batch_size: 25

# --- Placement --------------------------------------------------------------
# A single model instance on GPU 0.
instance_group [
  {
    count: 1
    kind: KIND_GPU
    gpus: [ 0 ]
  }
]

# --- Tensors ----------------------------------------------------------------
# One variable-length (-1) INT32 input per request.
input [
  {
    name: "input_ids"
    data_type: TYPE_INT32
    dims: [ -1 ]
  }
]

# One variable-length (-1) FP16 output per request.
output [
  {
    name: "rewards"
    data_type: TYPE_FP16
    dims: [ -1 ]
  }
]

# --- Parameters (string-valued map entries) ---------------------------------
# Model name repeated as a parameter.
# NOTE(review): consumer of this key is not visible here - confirm.
parameters {
  key: "model_name"
  value { string_value: "${model_name}" }
}

# Precision label matching the FP16 output above.
# NOTE(review): consumer of this key is not visible here - confirm.
parameters {
  key: "data_type"
  value { string_value: "fp16" }
}

# PyTorch backend option: run the model in inference mode.
parameters {
  key: "INFERENCE_MODE"
  value { string_value: "true" }
}