Skip to content
This repository has been archived by the owner on Aug 30, 2024. It is now read-only.

Commit

Permalink
Merge branch 'phi2' of https://github.com/intel/neural-speed into phi2
Browse files (browse the repository at this point in the history)
  • Loading branch information
intellinjun committed Jan 25, 2024
2 parents 3702d1a + 105fab6 commit 1a86d12
Show file tree
Hide file tree
Showing 3 changed files with 6 additions and 7 deletions.
1 change: 0 additions & 1 deletion requirements.txt
Original file line number Diff line number Diff line change
Expand Up @@ -13,5 +13,4 @@ tiktoken
py-cpuinfo
gguf
cmake
auto-gptq
setuptools>=61
8 changes: 4 additions & 4 deletions scripts/cal_diff.py
Original file line number Diff line number Diff line change
Expand Up @@ -35,10 +35,10 @@ def cmpData(numa, numb):
args = parser.parse_args()

woq_configs = {
"fp32": {"use_cache":True, "use_quant":False},
# "ggml_int4": {"compute_dtype":"int8", "weight_dtype":"int4", "use_cache":True, "use_ggml":True},
"jblas_int4": {"compute_dtype":"int8", "weight_dtype":"int4", "use_cache":True},
# "jblas_int8": {"compute_dtype":"bf16", "weight_dtype":"int8", "use_cache":True},
"fp32": {"use_quant":False},
# "ggml_int4": {"compute_dtype":"int8", "weight_dtype":"int4", "use_ggml":True},
"jblas_int4": {"compute_dtype":"int8", "weight_dtype":"int4"},
# "jblas_int8": {"compute_dtype":"bf16", "weight_dtype":"int8"},

}
prompt = "What is the meaning of life?"
Expand Down
4 changes: 2 additions & 2 deletions tests/model-test/cpp_graph_inference.sh
Original file line number Diff line number Diff line change
Expand Up @@ -260,9 +260,9 @@ function main() {
infer_cmd="./build/bin/run_whisper"
precision_list+=("q4_0")
elif [[ "${model}" == "phi2" ]]; then
quant_script="./build/bin/quant_phi2"
quant_script="./build/bin/quant_phi"
convert_script="${convert_script}/convert_phi.py"
infer_cmd="./build/bin/run_phi2"
infer_cmd="./build/bin/run_phi"
else
echo "Error: Unexpedted model: $model" 1>&2
exit 1
Expand Down

0 comments on commit 1a86d12

Please sign in to comment.