[ Kernel ] Enable fp8-marlin for fbgemm-fp8 models (#6606)

This commit is contained in:
Robert Shaw
2024-07-20 14:50:10 -04:00
committed by GitHub
parent 06d6c5fe9f
commit 9364f74eee
4 changed files with 44 additions and 3 deletions

View File

@@ -0,0 +1,11 @@
# Expected GSM8K scores for the FBGEMM-quantized Llama-3-70B-Instruct checkpoint.
# Command recorded alongside these numbers (its -l / -f flags match `limit` and
# `num_fewshot` below):
# bash .buildkite/lm-eval-harness/run-lm-eval-gsm-hf-baseline.sh -m nm-testing/Meta-Llama-3-70B-Instruct-FBGEMM-nonuniform -b auto -l 1000 -f 5
model_name: "nm-testing/Meta-Llama-3-70B-Instruct-FBGEMM-nonuniform"
tasks:
  - name: "gsm8k"
    # Each metric entry pairs a metric name with its expected value.
    metrics:
      - name: "exact_match,strict-match"
        value: 0.905
      - name: "exact_match,flexible-extract"
        value: 0.905
# Run-level settings (apply to the whole evaluation, not to a single task).
limit: 1000
num_fewshot: 5