Skip to content

Commit

Permalink
remove performance test
Browse files Browse the repository at this point in the history
  • Loading branch information
kavioyu committed Nov 24, 2024
1 parent 30a0bab commit 8db243d
Showing 1 changed file with 0 additions and 26 deletions.
26 changes: 0 additions & 26 deletions test/srt/test_eagle_infer.py
Original file line number Diff line number Diff line change
Expand Up @@ -47,32 +47,6 @@ def test_eagle_accuracy(self):
print(out2)
self.assertEqual(out1, out2)

def test_2_eagle_offline_throughput(self):
server_args = ServerArgs(
model_path="meta-llama/Llama-2-7b-chat-hf",
draft_model_path="kavio/Sglang-EAGLE-llama2-chat-7B",
speculative_algorithm="EAGLE",
num_speculative_steps=3,
eagle_topk=4,
num_draft_tokens=16,
)
bench_args = BenchArgs(num_prompts=10)
result_eagle = throughput_test(server_args=server_args, bench_args=bench_args)

server_args = ServerArgs(
model_path="meta-llama/Llama-2-7b-chat-hf",
)
result_naive = throughput_test(server_args=server_args, bench_args=bench_args)

print("==== Throughput EAGLE ====")
print(result_eagle["total_throughput"])
print("==== Throughput Baseline ====")
print(result_naive["total_throughput"])

self.assertGreater(
result_eagle["total_throughput"], result_naive["total_throughput"] * 1.5
)


if __name__ == "__main__":
unittest.main()

0 comments on commit 8db243d

Please sign in to comment.