forked from ggml-org/llama.cpp
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathcheck_sparq.sh
executable file
·24 lines (18 loc) · 1.56 KB
/
check_sparq.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
# Copyright (c) 2024 Graphcore Ltd. All rights reserved.
# Build `main` and `tests/test-sparq`, run the SparQ unit test, then run
# `./main` on a fixed prompt with and without `--sparq` in several
# configurations.
#
# Usage: check_sparq.sh [--half]
#   --half   after the `-ctk f32 -ctv f32` runs, repeat the same set of
#            `./main` runs with `-ctk f16 -ctv f16`.
#
# Environment:
#   SPARQ_CHECK_MODEL   model file passed to `./main -m`
#                       (default: ./models/llama-2-7b.Q8_0.gguf)
#
# The first failing command aborts the script (set -e), so the final
# message is only printed when every step exited with status 0. Every
# command is traced to stderr before it runs (xtrace).
set -e
set -o xtrace

model=${SPARQ_CHECK_MODEL:-./models/llama-2-7b.Q8_0.gguf}
prompt='How tall is the Eiffel tower?'

# run_variants CACHE_TYPE
#   Runs `./main` once without `--sparq`, then for each (k1, k2) pair runs it
#   with `--sparq` and again with `--sparq --sparq-default-layout`.
#   CACHE_TYPE is passed to both `-ctk` and `-ctv`.
run_variants() {
  local cache_type=$1
  # Build the shared argv as an array so the prompt stays a single word.
  local -a base=(
    ./main -m "$model" -p "$prompt" -n 16 -e --temp 0
    -ctk "$cache_type" -ctv "$cache_type"
  )
  local pair k1 k2

  "${base[@]}"
  for pair in 0:0 32:8; do
    k1=${pair%%:*}
    k2=${pair##*:}
    "${base[@]}" --sparq -k1 "$k1" -k2 "$k2"
    "${base[@]}" --sparq -k1 "$k1" -k2 "$k2" --sparq-default-layout
  done
}

make -j main tests/test-sparq
./tests/test-sparq

run_variants f32
# ${1:-} keeps the comparison safe when no argument is given, even under set -u.
if [[ "${1:-}" == "--half" ]]; then
  run_variants f16
fi

# printf instead of `echo -e`: same bytes, no reliance on echo's escape handling.
printf '\n\n##### All checks passed! #####\n\n'