@@ -19,8 +19,8 @@ class TestClass:
1919 params = {
2020 "test_batched_w8o16_qembedding" : [
2121 dict (batch = 1 , seqlen = 33 , vocab_size = 50288 , embedding_dim = 768 ), # mamba2-130m
22- dict (batch = 16 , seqlen = 33 , vocab_size = 50288 , embedding_dim = 2560 ), # mamba2-2.7b
23- dict (batch = 16 , seqlen = 1024 , vocab_size = 256000 , embedding_dim = 4096 ), # mamba2-8b
22+ dict (batch = 8 , seqlen = 33 , vocab_size = 50288 , embedding_dim = 2560 ), # mamba2-2.7b
23+ dict (batch = 8 , seqlen = 1024 , vocab_size = 256000 , embedding_dim = 4096 ), # mamba2-8b
2424 ],
2525 "test_w8o16_qembedding" : [
2626 dict (seqlen = 33 , vocab_size = 50288 , embedding_dim = 768 ), # mamba2-130m
@@ -29,8 +29,8 @@ class TestClass:
2929 ],
3030 "test_batched_w4o16_qembedding" : [
3131 dict (batch = 1 , seqlen = 33 , vocab_size = 50288 , embedding_dim = 768 ), # mamba2-130m
32- dict (batch = 16 , seqlen = 33 , vocab_size = 50288 , embedding_dim = 2560 ), # mamba2-2.7b
33- dict (batch = 16 , seqlen = 1024 , vocab_size = 256000 , embedding_dim = 4096 ), # mamba2-8b
32+ dict (batch = 8 , seqlen = 33 , vocab_size = 50288 , embedding_dim = 2560 ), # mamba2-2.7b
33+ dict (batch = 8 , seqlen = 1024 , vocab_size = 256000 , embedding_dim = 4096 ), # mamba2-8b
3434 ],
3535 "test_w4o16_qembedding" : [
3636 dict (seqlen = 33 , vocab_size = 50288 , embedding_dim = 768 ), # mamba2-130m
0 commit comments