Skip to content

Commit

Permalink
Xfail 405b as sharding vmfb is unsupported
Browse files Browse the repository at this point in the history
  • Loading branch information
archana-ramalingam committed Oct 28, 2024
1 parent 09796b7 commit 8069f24
Showing 1 changed file with 4 additions and 1 deletion.
5 changes: 4 additions & 1 deletion sharktank/tests/evaluate/perplexity_vmfb_test.py
Original file line number Diff line number Diff line change
Expand Up @@ -164,6 +164,9 @@ def test_llama3_8B_fp8(self):
msg=f"Current perplexity deviates baseline by {perplexity_difference}",
)

+@pytest.mark.xfail(
+reason="Sharding is not supported yet",
+)
@longrun
def test_llama3_405B_f16_decomposed(self):

Expand Down Expand Up @@ -267,7 +270,7 @@ def test_llama3_405B_fp8_decomposed(self):
)

@pytest.mark.xfail(
-reason="Non-decomposed attention is not supported yet",
+reason="FP8 model is unsupported",
)
@longrun
def test_llama3_405B_fp8(self):
Expand Down

0 comments on commit 8069f24

Please sign in to comment.