Skip to content

Commit adc470e

Browse files
authored
Merge pull request #13 from davidz-ampere/image_2.2.1
update to docker image 2.2.1
2 parents 0c31b38 + 0c4789c commit adc470e

File tree

2 files changed, with 4 additions and 4 deletions.

benchmarks/run.py

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -12,7 +12,7 @@ def get_file_dir():
1212

1313

1414
def docker_init(node):
15-
tag = "amperecomputingai/llama.cpp:2.0.0"
15+
tag = "amperecomputingai/llama.cpp:2.2.1"
1616
if subprocess.run(
1717
["docker", "pull", tag]).returncode != 0:
1818
print("Docker pull process failed!")

benchmarks/utils/benchmark.py

Lines changed: 3 additions & 3 deletions
Original file line number | Diff line number | Diff line change
@@ -67,7 +67,7 @@ def summarize_results(logs_dir, args, start, finish):
6767
ttfts = []
6868
tg_lats = []
6969
for n in range(args.num_processes):
70-
results = open(f"{logs_dir}/log_{n}", "r").readlines()[-9].split("|")
70+
results = open(f"{logs_dir}/log_{n}", "r").readlines()[5].split("|")
7171
prompt_size = int(results[1])
7272
assert prompt_size == args.prompt_size
7373
tokens_generated = int(results[2])
@@ -142,11 +142,11 @@ def main():
142142
if mem_place == "none":
143143
cmd = ["numactl", f"--physcpubind={gen_threads_config(args.num_threads, n)}",
144144
"/llm/llama-batched-bench", "-m", args.model, "-c", str(args.kv_cache), "-b", "2048", "-ub", "512", "-npp", str(args.prompt_size), "-ntg", str(TOKENS),
145-
"-npl", str(args.batch_size), "-t", str(args.num_threads), "-tb", str(args.num_threads), "-td", str(args.num_threads)]
145+
"-npl", str(args.batch_size), "-t", str(args.num_threads), "-tb", str(args.num_threads)]
146146
else:
147147
cmd = ["numactl", f"--physcpubind={gen_threads_config(args.num_threads, n)}",str(mem_place),
148148
"/llm/llama-batched-bench", "-m", args.model, "-c", str(args.kv_cache), "-b", "2048", "-ub", "512", "-npp", str(args.prompt_size), "-ntg", str(TOKENS),
149-
"-npl", str(args.batch_size), "-t", str(args.num_threads), "-tb", str(args.num_threads), "-td", str(args.num_threads)]
149+
"-npl", str(args.batch_size), "-t", str(args.num_threads), "-tb", str(args.num_threads)]
150150

151151
else:
152152
print("FAIL: batched-bench not found!")

0 commit comments

Comments
 (0)