|
1 | 1 | {
|
2 | 2 | "bert_mini_mrpc": {
|
3 |
| - "working_dir": "deployment/neural_engine/mrpc/bert_mini", |
| 3 | + "working_dir": "huggingface/pytorch/text-classification/deployment/mrpc/bert_mini", |
4 | 4 | "data_dir": "/tf_dataset2/datasets/mrpc_data",
|
5 | 5 | "hf_model_name": "M-FAC/bert-mini-finetuned-mrpc",
|
6 | 6 | "benchmark": {
|
|
18 | 18 | }
|
19 | 19 | },
|
20 | 20 | "launcher": {
|
21 |
| - "cmd": "deployment/neural_engine/launcher.py", |
| 21 | + "cmd": "huggingface/pytorch/text-classification/deployment/launcher.py", |
22 | 22 | "params": {
|
23 | 23 | "max_throughput": {
|
24 | 24 | "mode": "max_throughput",
|
|
32 | 32 | }
|
33 | 33 | },
|
34 | 34 | "bert_mini_sst2": {
|
35 |
| - "working_dir": "deployment/neural_engine/sst2/bert_mini", |
| 35 | + "working_dir": "huggingface/pytorch/text-classification/deployment/sst2/bert_mini", |
36 | 36 | "data_dir": "/tf_dataset2/datasets/sst2_data",
|
37 | 37 | "hf_model_name": "moshew/bert-mini-sst2-distilled",
|
38 | 38 | "benchmark": {
|
|
50 | 50 | }
|
51 | 51 | },
|
52 | 52 | "launcher": {
|
53 |
| - "cmd": "deployment/neural_engine/launcher.py", |
| 53 | + "cmd": "huggingface/pytorch/text-classification/deployment/launcher.py", |
54 | 54 | "params": {
|
55 | 55 | "max_throughput": {
|
56 | 56 | "mode": "max_throughput",
|
|
64 | 64 | }
|
65 | 65 | },
|
66 | 66 | "bert_base_mrpc": {
|
67 |
| - "working_dir": "deployment/neural_engine/mrpc/bert_base", |
| 67 | + "working_dir": "huggingface/pytorch/text-classification/deployment/mrpc/bert_base", |
68 | 68 | "data_dir": "/tf_dataset2/datasets/mrpc_data",
|
69 | 69 | "hf_model_name": "textattack/bert-base-uncased-MRPC",
|
70 | 70 | "benchmark": {
|
|
82 | 82 | }
|
83 | 83 | },
|
84 | 84 | "launcher": {
|
85 |
| - "cmd": "deployment/neural_engine/launcher.py", |
| 85 | + "cmd": "huggingface/pytorch/text-classification/deployment/launcher.py", |
86 | 86 | "params": {
|
87 | 87 | "max_throughput": {
|
88 | 88 | "mode": "max_throughput",
|
|
96 | 96 | }
|
97 | 97 | },
|
98 | 98 | "distilbert_base_uncased_emotion": {
|
99 |
| - "working_dir": "deployment/neural_engine/emotion/distilbert_base_uncased", |
| 99 | + "working_dir": "huggingface/pytorch/text-classification/deployment/emotion/distilbert_base_uncased", |
100 | 100 | "tokenizer_dir": "/tf_dataset2/models/deep-engine/distilbert_base_uncased/test_tokenizer",
|
101 | 101 | "data_dir": "/tf_dataset2/datasets/emotion_data",
|
102 | 102 | "hf_model_name": "bhadresh-savani/distilbert-base-uncased-emotion",
|
|
114 | 114 | }
|
115 | 115 | },
|
116 | 116 | "launcher": {
|
117 |
| - "cmd": "deployment/neural_engine/launcher.py", |
| 117 | + "cmd": "huggingface/pytorch/text-classification/deployment/launcher.py", |
118 | 118 | "params": {
|
119 | 119 | "max_throughput": {
|
120 | 120 | "mode": "max_throughput",
|
|
128 | 128 | }
|
129 | 129 | },
|
130 | 130 | "bert_large_squad": {
|
131 |
| - "working_dir": "deployment/neural_engine/squad/bert_large", |
| 131 | + "working_dir": "huggingface/pytorch/question-answering/deployment/squad/bert_large", |
132 | 132 | "data_dir": "/tf_dataset2/models/deep-engine/bert_large",
|
133 | 133 | "hf_model_name": "bert-large-uncased-whole-word-masking-finetuned-squad",
|
134 | 134 | "benchmark": {
|
|
146 | 146 | }
|
147 | 147 | },
|
148 | 148 | "launcher": {
|
149 |
| - "cmd": "deployment/neural_engine/launcher.py", |
| 149 | + "cmd": "huggingface/pytorch/text-classification/deployment/launcher.py", |
150 | 150 | "params": {
|
151 | 151 | "max_throughput": {
|
152 | 152 | "mode": "max_throughput",
|
|
160 | 160 | }
|
161 | 161 | },
|
162 | 162 | "distilbert_base_uncased_sst2": {
|
163 |
| - "working_dir": "deployment/neural_engine/sst2/distilbert_base_uncased", |
| 163 | + "working_dir": "huggingface/pytorch/text-classification/deployment/sst2/distilbert_base_uncased", |
164 | 164 | "data_dir": "/tf_dataset2/datasets/sst2_data",
|
165 | 165 | "hf_model_name": "distilbert-base-uncased-finetuned-sst-2-english",
|
166 | 166 | "benchmark": {
|
|
178 | 178 | }
|
179 | 179 | },
|
180 | 180 | "launcher": {
|
181 |
| - "cmd": "deployment/neural_engine/launcher.py", |
| 181 | + "cmd": "huggingface/pytorch/text-classification/deployment/launcher.py", |
182 | 182 | "params": {
|
183 | 183 | "max_throughput": {
|
184 | 184 | "mode": "max_throughput",
|
|
192 | 192 | }
|
193 | 193 | },
|
194 | 194 | "distilbert_base_uncased_mrpc": {
|
195 |
| - "working_dir": "deployment/neural_engine/mrpc/distilbert_base_uncased", |
| 195 | + "working_dir": "huggingface/pytorch/text-classification/deployment/mrpc/distilbert_base_uncased", |
196 | 196 | "data_dir": "/tf_dataset2/datasets/mrpc_data",
|
197 | 197 | "hf_model_name": "textattack/distilbert-base-uncased-MRPC",
|
198 | 198 | "benchmark": {
|
|
210 | 210 | }
|
211 | 211 | },
|
212 | 212 | "launcher": {
|
213 |
| - "cmd": "deployment/neural_engine/launcher.py", |
| 213 | + "cmd": "huggingface/pytorch/text-classification/deployment/launcher.py", |
214 | 214 | "params": {
|
215 | 215 | "max_throughput": {
|
216 | 216 | "mode": "max_throughput",
|
|
224 | 224 | }
|
225 | 225 | },
|
226 | 226 | "minilm_l6_h384_uncased_sst2": {
|
227 |
| - "working_dir": "deployment/neural_engine/sst2/minilm_l6_h384_uncased", |
| 227 | + "working_dir": "huggingface/pytorch/text-classification/deployment/sst2/minilm_l6_h384_uncased", |
228 | 228 | "data_dir": "/tf_dataset2/datasets/sst2_data",
|
229 | 229 | "hf_model_name": "philschmid/MiniLM-L6-H384-uncased-sst2",
|
230 | 230 | "benchmark": {
|
|
242 | 242 | }
|
243 | 243 | },
|
244 | 244 | "launcher": {
|
245 |
| - "cmd": "deployment/neural_engine/launcher.py", |
| 245 | + "cmd": "huggingface/pytorch/text-classification/deployment/launcher.py", |
246 | 246 | "params": {
|
247 | 247 | "max_throughput": {
|
248 | 248 | "mode": "max_throughput",
|
|
256 | 256 | }
|
257 | 257 | },
|
258 | 258 | "bert_base_cased_mrpc": {
|
259 |
| - "working_dir": "deployment/neural_engine/mrpc/bert_base_cased", |
| 259 | + "working_dir": "huggingface/pytorch/text-classification/deployment/mrpc/bert_base_cased", |
260 | 260 | "data_dir": "/tf_dataset2/models/deep-engine/bert_base_cased_mrpc/mrpc_data",
|
261 | 261 | "hf_model_name": "bert-base-cased-finetuned-mrpc",
|
262 | 262 | "benchmark": {
|
|
274 | 274 | }
|
275 | 275 | },
|
276 | 276 | "launcher": {
|
277 |
| - "cmd": "deployment/neural_engine/launcher.py", |
| 277 | + "cmd": "huggingface/pytorch/text-classification/deployment/launcher.py", |
278 | 278 | "params": {
|
279 | 279 | "max_throughput": {
|
280 | 280 | "mode": "max_throughput",
|
|
288 | 288 | }
|
289 | 289 | },
|
290 | 290 | "roberta_base_mrpc": {
|
291 |
| - "working_dir": "deployment/neural_engine/mrpc/roberta_base", |
| 291 | + "working_dir": "huggingface/pytorch/text-classification/deployment/mrpc/roberta_base", |
292 | 292 | "data_dir": "/tf_dataset2/models/deep-engine/roberta_base_mrpc/data",
|
293 | 293 | "hf_model_name": "textattack/roberta-base-MRPC",
|
294 | 294 | "benchmark": {
|
|
306 | 306 | }
|
307 | 307 | },
|
308 | 308 | "launcher": {
|
309 |
| - "cmd": "deployment/neural_engine/launcher.py", |
| 309 | + "cmd": "huggingface/pytorch/text-classification/deployment/launcher.py", |
310 | 310 | "params": {
|
311 | 311 | "max_throughput": {
|
312 | 312 | "mode": "max_throughput",
|
|
320 | 320 | }
|
321 | 321 | },
|
322 | 322 | "bert_mini_sparse": {
|
323 |
| - "working_dir": "deployment/neural_engine/sparse/bert_mini", |
| 323 | + "working_dir": "huggingface/pytorch/text-classification/deployment/sst2/bert_mini", |
324 | 324 | "data_dir": "/tf_dataset2/datasets/sst2_data",
|
325 | 325 | "hf_model_name": "Intel/bert-mini-sst2-distilled-sparse-90-1X4-block",
|
326 | 326 | "benchmark": {
|
|
338 | 338 | }
|
339 | 339 | },
|
340 | 340 | "launcher": {
|
341 |
| - "cmd": "deployment/neural_engine/launcher.py", |
| 341 | + "cmd": "huggingface/pytorch/text-classification/deployment/launcher.py", |
342 | 342 | "params": {
|
343 | 343 | "max_throughput": {
|
344 | 344 | "mode": "max_throughput",
|
|
352 | 352 | }
|
353 | 353 | },
|
354 | 354 | "distilbert_base_uncased_squad_sparse": {
|
355 |
| - "working_dir": "deployment/neural_engine/sparse/distilbert_base_uncased", |
| 355 | + "working_dir": "huggingface/pytorch/text-classification/deployment/sparse/distilbert_base_uncased", |
356 | 356 | "data_dir": "/tf_dataset2/models/deep-engine/bert_large",
|
357 | 357 | "hf_model_name": "Intel/distilbert-base-uncased-squadv1.1-sparse-80-1x4-block-pruneofa",
|
358 | 358 | "benchmark": {
|
|
370 | 370 | }
|
371 | 371 | },
|
372 | 372 | "launcher": {
|
373 |
| - "cmd": "deployment/neural_engine/launcher.py", |
| 373 | + "cmd": "huggingface/pytorch/text-classification/deployment/launcher.py", |
374 | 374 | "params": {
|
375 | 375 | "max_throughput": {
|
376 | 376 | "mode": "max_throughput",
|
|
384 | 384 | }
|
385 | 385 | },
|
386 | 386 | "length_adaptive_dynamic": {
|
387 |
| - "working_dir": "deployment/neural_engine/squad/length_adaptive_transformer", |
| 387 | + "working_dir": "huggingface/pytorch/question-answering/deployment/squad/length_adaptive_transformer", |
388 | 388 | "data_dir": "/tf_dataset2/models/deep-engine/bert_large",
|
389 | 389 | "hf_model_name": "sguskin/dynamic-minilmv2-L6-H384-squad1.1",
|
390 | 390 | "benchmark": {
|
|
402 | 402 | }
|
403 | 403 | },
|
404 | 404 | "launcher": {
|
405 |
| - "cmd": "deployment/neural_engine/launcher.py", |
| 405 | + "cmd": "huggingface/pytorch/text-classification/deployment/launcher.py", |
406 | 406 | "params": {
|
407 | 407 | "max_throughput": {
|
408 | 408 | "mode": "max_throughput",
|
|
416 | 416 | }
|
417 | 417 | },
|
418 | 418 | "vit_large": {
|
419 |
| - "working_dir": "deployment/neural_engine/imagenet/vit", |
| 419 | + "working_dir": "huggingface/pytorch/image-classification/deployment/imagenet/vit", |
420 | 420 | "data_dir": "/tf_dataset2/models/nlp_toolkit/vit/cached-2k-imagenet-1k-datasets",
|
421 | 421 | "hf_model_name": "google/vit-large-patch16-224",
|
422 | 422 | "benchmark": {
|
|
432 | 432 | }
|
433 | 433 | },
|
434 | 434 | "launcher": {
|
435 |
| - "cmd": "deployment/neural_engine/launcher.py", |
| 435 | + "cmd": "huggingface/pytorch/text-classification/deployment/launcher.py", |
436 | 436 | "params": {
|
437 | 437 | "max_throughput": {
|
438 | 438 | "mode": "max_throughput",
|
|
446 | 446 | }
|
447 | 447 | },
|
448 | 448 | "vit_base": {
|
449 |
| - "working_dir": "deployment/neural_engine/imagenet/vit", |
| 449 | + "working_dir": "huggingface/pytorch/image-classification/deployment/imagenet/vit", |
450 | 450 | "data_dir": "/tf_dataset2/models/nlp_toolkit/vit/cached-2k-imagenet-1k-datasets",
|
451 | 451 | "hf_model_name": "google/vit-base-patch16-224",
|
452 | 452 | "benchmark": {
|
|
463 | 463 | }
|
464 | 464 | },
|
465 | 465 | "launcher": {
|
466 |
| - "cmd": "deployment/neural_engine/launcher.py", |
| 466 | + "cmd": "huggingface/pytorch/text-classification/deployment/launcher.py", |
467 | 467 | "params": {
|
468 | 468 | "max_throughput": {
|
469 | 469 | "mode": "max_throughput",
|
|
477 | 477 | }
|
478 | 478 | },
|
479 | 479 | "stable_diffusion": {
|
480 |
| - "working_dir": "deployment/neural_engine/stable_diffusion", |
| 480 | + "working_dir": "huggingface/pytorch/text-to-image/deployment/stable_diffusion", |
481 | 481 | "data_dir": " ",
|
482 | 482 | "hf_model_name": "CompVis/stable-diffusion-v1-4",
|
483 | 483 | "prepare": {
|
|
498 | 498 | }
|
499 | 499 | },
|
500 | 500 | "gpt-j-6b": {
|
501 |
| - "working_dir": "deployment/neural_engine/gpt-j", |
| 501 | + "working_dir": "huggingface/pytorch/text-generation/deployment/gpt-j", |
502 | 502 | "data_dir": " ",
|
503 | 503 | "hf_model_name": "EleutherAI/gpt-j-6B",
|
504 | 504 | "prepare": {
|
505 | 505 | "cmd": "python gen_ir.py",
|
506 | 506 | "params": {
|
507 |
| - "model": "EleutherAI/gpt-j-6B", |
| 507 | + "model": "/tf_dataset2/models/pytorch/gpt-j-6B", |
508 | 508 | "dtype": "fp32/bf16/int8",
|
509 | 509 | "output_model": "ir",
|
510 | 510 | "pt_file": "pt"
|
|
0 commit comments