OLive/examples/falcon/config.json

43 строки
1.5 KiB
JSON

{
  "input_model": {
    "type": "HfModel",
    "model_path": "tiiuae/falcon-7b",
    "task": "text-generation"
  },
  "systems": {
    "local_system": {
      "type": "LocalSystem",
      "accelerators": [
        {
          "device": "gpu",
          "execution_providers": [
            "CUDAExecutionProvider"
          ]
        }
      ]
    }
  },
  "data_configs": [
    {
      "name": "openassistant_train",
      "type": "HuggingfaceContainer",
      "load_dataset_config": {
        "data_name": "timdettmers/openassistant-guanaco",
        "split": "train"
      },
      "pre_process_data_config": {
        "max_seq_len": 512,
        "max_samples": 1
      }
    }
  ],
  "evaluators": {
    "common_evaluator": {
      "metrics": [
        {
          "name": "latency",
          "type": "latency",
          "data_config": "openassistant_train",
          "sub_types": [
            {
              "name": "avg",
              "priority": 1,
              "goal": {
                "type": "percent-min-improvement",
                "value": 5
              }
            },
            {
              "name": "max"
            },
            {
              "name": "min"
            }
          ]
        }
      ]
    }
  },
  "passes": {
    "conversion": {
      "type": "OnnxConversion",
      "target_opset": 13
    },
    "transformers_optimization": {
      "type": "OrtTransformersOptimization",
      "float16": true
    }
  },
  "evaluator": "common_evaluator",
  "host": "local_system",
  "target": "local_system",
  "cache_dir": "cache",
  "output_dir": "models/falcon"
}