forked from intel/neural-compressor
-
Notifications
You must be signed in to change notification settings - Fork 1
/
run_sample.sh
executable file
·53 lines (41 loc) · 1.61 KB
/
run_sample.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
#!/bin/bash
#
# Demo driver: runs the sample's Python steps in sequence.
#   1. train_model.py        - must leave the directory model_keras.fp32
#   2. inc_quantize_model.py - must leave the directory model_pb.int8
#   3. profiling_inc.py      - run once per model (FP32, then INT8)
#   4. compare_perf.py       - compares the two profiling results
#
# Run from the directory that contains the Python scripts, with the Python
# environment already activated.
#
# Exit status: 0 when the demo completes; 1 when a model directory is missing
# after its stage, or when compare_perf.py reports failure.

echo "Note, please enable running environment before running this script."

echo "Enable Intel Optimized TensorFlow 2.6.0 and newer by setting environment variable TF_ENABLE_ONEDNN_OPTS=1"
echo "That will accelerate training and inference, and it's mandatory requirement of running Intel® Neural Compressor quantize Fp32 model or deploying the quantized model."
export TF_ENABLE_ONEDNN_OPTS=1

echo "Train Model by Keras/Tensorflow"
python train_model.py

# Success of the training stage is judged by the presence of its output
# directory rather than by the interpreter's exit status.
FP32_FILE="model_keras.fp32"
if [[ ! -d "$FP32_FILE" ]]; then
  echo "$FP32_FILE not exists."
  echo "Train model is fault, exit!"
  exit 1
else
  echo "Training is finished"
fi

echo "Quantize Model by Intel Neural Compressor"
python inc_quantize_model.py

# Same presence check for the quantized model directory.
INT8_FILE="model_pb.int8"
if [[ ! -d "$INT8_FILE" ]]; then
  echo "$INT8_FILE not exists."
  echo "Quantize FP32 model is fault, exit!"
  exit 1
else
  echo "Quantization is finished"
fi

echo "Execute the profiling_inc.py with FP32 model file"
python profiling_inc.py --input-graph="./${FP32_FILE}" --omp-num-threads=4 --num-inter-threads=1 --num-intra-threads=4 --index=32
echo "FP32 performance test is finished"

echo "Execute the profiling_inc.py with INT8 model file"
python profiling_inc.py --input-graph="./${INT8_FILE}" --omp-num-threads=4 --num-inter-threads=1 --num-intra-threads=4 --index=8
echo "INT8 performance test is finished"

echo "Compare the Performance of FP32 and INT8 Models"
python compare_perf.py
# Capture the status immediately: any later command (including echo)
# overwrites $?, which previously made the failure branch unreachable.
compare_status=$?
echo "Please check the PNG files to see the performance!"

demo_status=0
if [[ $compare_status -eq 0 ]]; then
  echo "This demo is finished successfully!"
else
  echo "This demo is fault!"
  # Report the failure to the caller, as the earlier stages do.
  demo_status=1
fi

echo "Thank you!"
exit "$demo_status"