-
Notifications
You must be signed in to change notification settings - Fork 48
Expand file tree
/
Copy pathconfig.json
More file actions
51 lines (51 loc) · 1.83 KB
/
config.json
File metadata and controls
51 lines (51 loc) · 1.83 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
{
  "input_model": {
    "type": "HfModel",
    "model_path": "Alibaba-NLP/gte-large-en-v1.5",
    "load_kwargs": {
      "trust_remote_code": true
    },
    "task": "feature-extraction",
    "io_config": {
      "input_names": ["input_ids", "token_type_ids", "attention_mask"],
      "input_shapes": [[1, 128], [1, 128], [1, 128]],
      "input_types": ["int64", "int64", "int64"],
      "output_names": ["last_hidden_state"],
      "dynamic_axes": {
        "input_ids": {
          "0": "batch_size",
          "1": "seq_len"
        },
        "token_type_ids": {
          "0": "batch_size",
          "1": "seq_len"
        },
        "attention_mask": {
          "0": "batch_size",
          "1": "seq_len"
        },
        "last_hidden_state": {
          "0": "batch_size",
          "1": "seq_len"
        }
      }
    }
  },
  "data_configs": [
    {
      "name": "c4",
      "type": "HuggingfaceContainer",
      "user_script": "user_script.py",
      "load_dataset_config": {
        "data_name": "allenai/c4",
        "subset": "en",
        "split": "validation",
        "streaming": true
      },
      "pre_process_data_config": {
        "type": "dataset_pre_process",
        "max_samples": 128,
        "model_name": "Alibaba-NLP/gte-large-en-v1.5"
      }
    }
  ],
  "evaluators": {
    "evaluator": {
      "metrics": [
        {
          "name": "latency",
          "type": "latency",
          "sub_types": [
            {
              "name": "avg"
            }
          ],
          "data_config": "c4"
        }
      ]
    }
  },
  "passes": {
    "conversion": {
      "type": "OnnxConversion"
    },
    "OnnxQuantization": {
      "type": "OnnxStaticQuantization",
      "quant_preprocess": true,
      "data_config": "c4"
    }
  },
  "evaluator": "evaluator",
  "output_dir": "models/gte-large-en-v1.5"
}