File tree: 1 file changed, +2 -1 lines changed
examples/qualcomm/oss_scripts/llama
1 file changed, +2 -1 lines changed
Original file line number | Diff line number | Diff line change
@@ -843,6 +843,7 @@ def post_process():
843
843
)
844
844
845
845
runner_cmd = ""
846
+ performance_output_path = "outputs/inference_speed.txt"
846
847
if args .enable_x86_64 :
847
848
# x86 emulator is intended for CI and not performance. Check only the first few tokens.
848
849
seq_len = min (seq_len , 16 )
@@ -862,6 +863,7 @@ def post_process():
862
863
f"--model_path { pte_path } " ,
863
864
f"--seq_len { seq_len } " ,
864
865
f"--output_path { args .artifact } /outputs/outputs.txt" ,
866
+ f"--performance_output_path { performance_output_path } " ,
865
867
f"--kv_updater ShiftPointer" ,
866
868
runner_args ,
867
869
]
@@ -874,7 +876,6 @@ def post_process():
874
876
)
875
877
post_process ()
876
878
else :
877
- performance_output_path = "outputs/inference_speed.txt"
878
879
runner_cmd = " " .join (
879
880
[
880
881
f"cd { workspace } &&" ,
You can’t perform that action at this time.
0 commit comments