|
| 1 | +{ |
| 2 | + "_parent_entries": [ [ "^", "byname", "base_loadgen_experiment" ] ], |
| 3 | + |
| 4 | + "transformers_query": [ "python_package", "package_name=transformers", ["desired_python_version", ["^", "kernel_python_major_dot_minor"]] ], |
| 5 | + |
| 6 | + "_BEFORE_CODE_LOADING": [ "^^", "execute", [[ |
| 7 | + [ "get_kernel" ], |
| 8 | + [ "byquery", [[ "^^", "get", "transformers_query" ]] ], |
| 9 | + [ "use" ] |
| 10 | + ]] ], |
| 11 | + |
| 12 | + "desired_python_version": "3.10", |
| 13 | + |
| 14 | + "mlperf_inference_git_entry": [ "^", "byquery", "git_repo,repo_name=mlperf_inference_git" ], |
| 15 | + |
| 16 | + "abs_script_path": [ "^^", "execute", [[ |
| 17 | + [ "get", "mlperf_inference_git_entry" ], |
| 18 | + [ "get_path_of", "llama3_1_8b_cnndm_accuracy_script" ] |
| 19 | + ]] ], |
| 20 | + |
| 21 | + "accuracy_log_path": ["^^", "get_path", "mlperf_log_accuracy.json"], |
| 22 | + |
| 23 | + "dataset_name": "cnndm", |
| 24 | + "model_family": "llama3_1", |
| 25 | + "model_variant": "8b", |
| 26 | + |
| 27 | + "dataset_query": [ "downloaded", [ "^^", "substitute", "dataset_name=#{dataset_name}#,model_family=#{model_family}#,variant=#{model_variant}#" ]], |
| 28 | + "dataset_entry": [ "^", "byquery", [[ "^^", "get", "dataset_query" ]], {}, ["dataset_query"] ], |
| 29 | + |
| 30 | + "dataset_path": [ "^^", "execute", [[ |
| 31 | + [ "get", "dataset_entry" ], |
| 32 | + [ "get_path" ], |
| 33 | + [ "__add__", "/cnn_eval.json" ] |
| 34 | + ]] ], |
| 35 | + |
| 36 | + "checkpoint_path_query": [ "^^", "substitute", "downloaded,hf_tokeniser,model_family=#{model_family}#,variant=#{model_variant}#" ], |
| 37 | + "checkpoint_path": [ "^^", "execute", [[ |
| 38 | + [ "get_kernel" ], |
| 39 | + [ "byquery", [[ "^^", "get", "checkpoint_path_query" ]] ], |
| 40 | + [ "get_path" ] |
| 41 | + ]] ], |
| 42 | + |
| 43 | + "accuracy_log_dtype": "int32", |
| 44 | + |
| 45 | + "extract_accuracy_report": [ "^^", "execute", [[ |
| 46 | + [ "get_kernel" ], |
| 47 | + [ "byname", "python_script" ], |
| 48 | + [ "run", [], { |
| 49 | + "python_deps": [ |
| 50 | + [ "AS^IS", "^^", "python_sync_pip_package", "python_package,package_name=protobuf" ], |
| 51 | + [ "AS^IS", "^^", "python_sync_pip_package", "python_package,package_name=torch" ], |
| 52 | + [ "AS^IS", "^^", "python_sync_pip_package", "python_package,package_name=transformers" ], |
| 53 | + [ "AS^IS", "^^", "python_sync_pip_package", "python_package,package_name=nltk" ], |
| 54 | + [ "AS^IS", "^^", "python_sync_pip_package", "python_package,package_name=rouge_score" ], |
| 55 | + [ "AS^IS", "^^", "python_sync_pip_package", "python_package,package_name=sentencepiece" ], |
| 56 | + [ "AS^IS", "^^", "python_sync_pip_package", "python_package,package_name=pillow" ], |
| 57 | + [ "AS^IS", "^^", "python_sync_pip_package", "python_package,package_name=evaluate" ] |
| 58 | + ], |
| 59 | + "abs_script_path": ["^^", "get", "abs_script_path"], |
| 60 | + "script_extra_params": [ "^^", "substitute", "--mlperf-accuracy-file #{accuracy_log_path}# --dataset-file #{dataset_path}# --dtype #{accuracy_log_dtype}#" ], |
| 61 | + "desired_python_version": ["^", "kernel_python_major_dot_minor"], |
| 62 | + "capture_output": true |
| 63 | + } ], |
| 64 | + 0, |
| 65 | + [ "func", [ "ufun.rematch", "(\\{.*\\})" ] ], |
| 66 | + 0, |
| 67 | + [ "denumpify_dict" ], |
| 68 | + 0, |
| 69 | + [ "func", "str" ] |
| 70 | + ]], {} ], |
| 71 | + |
| 72 | + "accuracy_dict_full": [ "^^", "execute", [[ |
| 73 | + ["get", "accuracy_report" ], |
| 74 | + 0, |
| 75 | + [ "func", "eval" ] |
| 76 | + ]], {} ], |
| 77 | + "accuracy_dict": [ "^^", "get_accuracy_dict" ], |
| 78 | + "rouge1": [ "^^" , "dig","accuracy_dict.rouge1" ], |
| 79 | + "rouge2": [ "^^" , "dig","accuracy_dict.rouge2" ], |
| 80 | + "rougeL": [ "^^" , "dig","accuracy_dict.rougeL" ], |
| 81 | + "rougeLsum": [ "^^" , "dig","accuracy_dict.rougeLsum" ], |
| 82 | + "gen_len": [ "^^" , "dig","accuracy_dict.gen_len" ], |
| 83 | + "gen_num": [ "^^" , "dig","accuracy_dict.gen_num" ], |
| 84 | + "tokens_per_sample": [ "^^" , "dig","accuracy_dict.tokens_per_sample" ], |
| 85 | + |
| 86 | + "tokenised_accuracy_log_path": [ "^^", "get_path", "mlperf_log_accuracy.json" ], |
| 87 | + "output_log_path": [ "^^", "get_path", "detokenised_mlperf_log.json" ], |
| 88 | + |
| 89 | + "detokenised_log": [ "^^", "detokenise" ] |
| 90 | +} |
0 commit comments