aviator19941/llama8b_commands.txt Secret

## llama8b_commands.txt
# Benchmark the `prefill_bs4` function of the compiled module with
# iree-benchmark-module on HIP device 0, repeating the benchmark 3 times.
#
# Replace the placeholders before running:
#   {VMFB_NAME} - the compiled module file passed to --module
#   {GGUF_NAME} - the parameter file registered under the "model" scope
# Placeholders (and the values substituted for them) must not contain
# unquoted spaces, otherwise the shell splits the flag into two arguments.
#
# ROCR_VISIBLE_DEVICES=0 is set only for this one command invocation.
# The --input flags are passed to the function in the order listed; each is a
# shape-and-element-type spec (e.g. 4x32xsi64). Their meaning (tokens, lengths,
# page ids, cache) is presumed -- confirm against the exported signature.
ROCR_VISIBLE_DEVICES=0 ../iree-build-no-trace/tools/iree-benchmark-module \
  --device=hip://0 \
  --hip_use_streams=true \
  --hip_allow_inline_execution=true \
  --device_allocator=caching \
  --module={VMFB_NAME} \
  --parameters=model={GGUF_NAME} \
  --function=prefill_bs4 \
  --input=4x32xsi64 \
  --input=4xsi64 \
  --input=4x2xsi64 \
  --input=128x1048576xf16 \
  --benchmark_repetitions=3

# Benchmark the `decode_bs4` function of the compiled module with
# iree-benchmark-module on HIP device 0, repeating the benchmark 3 times.
# Substitute {VMFB_NAME} (module file) and {GGUF_NAME} (parameter file for the
# "model" scope) before running. The five --input specs are passed to the
# function in the order listed.
ROCR_VISIBLE_DEVICES=0 \
  ../iree-build-no-trace/tools/iree-benchmark-module \
    --device=hip://0 --hip_use_streams=true --hip_allow_inline_execution=true \
    --device_allocator=caching \
    --module={VMFB_NAME} --parameters=model={GGUF_NAME} \
    --function=decode_bs4 \
    --input=4x1xsi64 --input=4xsi64 --input=4xsi64 --input=4x2xsi64 \
    --input=128x1048576xf16 \
    --benchmark_repetitions=3
	# Benchmark the `prefill_bs4` function of the compiled module with
	# iree-benchmark-module on HIP device 0, repeating the benchmark 3 times.
	#
	# Replace the placeholders before running:
	#   {VMFB_NAME} - the compiled module file passed to --module
	#   {GGUF_NAME} - the parameter file registered under the "model" scope
	# Placeholders (and the values substituted for them) must not contain
	# unquoted spaces, otherwise the shell splits the flag into two arguments.
	#
	# The --input flags are passed to the function in the order listed.
	ROCR_VISIBLE_DEVICES=0 ../iree-build-no-trace/tools/iree-benchmark-module \
	--device=hip://0 \
	--hip_use_streams=true \
	--hip_allow_inline_execution=true \
	--device_allocator=caching \
	--module={VMFB_NAME} \
	--parameters=model={GGUF_NAME} \
	--function=prefill_bs4 \
	--input=4x32xsi64 \
	--input=4xsi64 \
	--input=4x2xsi64 \
	--input=128x1048576xf16 \
	--benchmark_repetitions=3

	# Benchmark the `decode_bs4` function of the compiled module with
	# iree-benchmark-module on HIP device 0, repeating the benchmark 3 times.
	# Substitute {VMFB_NAME} (module file) and {GGUF_NAME} (parameter file for
	# the "model" scope) before running. The five --input specs are passed to
	# the function in the order listed.
	ROCR_VISIBLE_DEVICES=0 \
	../iree-build-no-trace/tools/iree-benchmark-module \
	--device=hip://0 --hip_use_streams=true --hip_allow_inline_execution=true \
	--device_allocator=caching \
	--module={VMFB_NAME} --parameters=model={GGUF_NAME} \
	--function=decode_bs4 \
	--input=4x1xsi64 --input=4xsi64 --input=4xsi64 --input=4x2xsi64 \
	--input=128x1048576xf16 \
	--benchmark_repetitions=3