Remove EAGLE offline throughput performance test

sgl-project · Nov 24, 2024 · 8db243d
1 parent 30a0bab
commit 8db243d
Showing 1 changed file with 0 additions and 26 deletions.
diff --git a/test/srt/test_eagle_infer.py b/test/srt/test_eagle_infer.py
@@ -47,32 +47,6 @@ def test_eagle_accuracy(self):
         print(out2)
         self.assertEqual(out1, out2)
 
-    def test_2_eagle_offline_throughput(self):
-        server_args = ServerArgs(
-            model_path="meta-llama/Llama-2-7b-chat-hf",
-            draft_model_path="kavio/Sglang-EAGLE-llama2-chat-7B",
-            speculative_algorithm="EAGLE",
-            num_speculative_steps=3,
-            eagle_topk=4,
-            num_draft_tokens=16,
-        )
-        bench_args = BenchArgs(num_prompts=10)
-        result_eagle = throughput_test(server_args=server_args, bench_args=bench_args)
-
-        server_args = ServerArgs(
-            model_path="meta-llama/Llama-2-7b-chat-hf",
-        )
-        result_naive = throughput_test(server_args=server_args, bench_args=bench_args)
-
-        print("==== Throughput EAGLE ====")
-        print(result_eagle["total_throughput"])
-        print("==== Throughput Baseline ====")
-        print(result_naive["total_throughput"])
-
-        self.assertGreater(
-            result_eagle["total_throughput"], result_naive["total_throughput"] * 1.5
-        )
-
 
 if __name__ == "__main__":
     unittest.main()