Skip to content

Commit 8069f24

Browse files
Xfail 405b as sharding vmfb is unsupported
1 parent 09796b7 commit 8069f24

File tree

1 file changed

+4
-1
lines changed

1 file changed

+4
-1
lines changed

sharktank/tests/evaluate/perplexity_vmfb_test.py

+4 -1
Original file line number | Diff line number | Diff line change
@@ -164,6 +164,9 @@ def test_llama3_8B_fp8(self):
164164
msg=f"Current perplexity deviates baseline by {perplexity_difference}",
165165
)
166166

167+
@pytest.mark.xfail(
168+
reason="Sharding is not supported yet",
169+
)
167170
@longrun
168171
def test_llama3_405B_f16_decomposed(self):
169172

@@ -267,7 +270,7 @@ def test_llama3_405B_fp8_decomposed(self):
267270
)
268271

269272
@pytest.mark.xfail(
270-
reason="Non-decomposed attention is not supported yet",
273+
reason="FP8 model is unsupported",
271274
)
272275
@longrun
273276
def test_llama3_405B_fp8(self):

0 commit comments

Comments
 (0)