Skip to content

Commit dc7c09e

Browse files
authored
Update SPR PyTorch RNN-T inference container packages to use model zoo scripts (#288)
* RNN-T inference updates to use model zoo scripts * Update dockerfile * script updates for log names * Add download model to the package * Update doc to fix download_model.sh path * Fix conditional to use CHECKPOINT_DIR
1 parent e7eb81a commit dc7c09e

18 files changed

+217
-443
lines changed

dockerfiles/pytorch/pytorch-spr-rnnt-inference.Dockerfile

+3-10
Original file line numberDiff line numberDiff line change
@@ -62,19 +62,13 @@ RUN chown -R root ${MODEL_WORKSPACE}/${PACKAGE_NAME} && chgrp -R root ${MODEL_WO
6262

6363
WORKDIR ${MODEL_WORKSPACE}/${PACKAGE_NAME}
6464

65-
ARG RNNT_DIR="/workspace/pytorch-spr-rnnt-inference/models/rnnt"
6665

6766
RUN source activate pytorch && \
68-
conda install intel-openmp && \
69-
yum install -y libsndfile && \
70-
cd ${RNNT_DIR} && \
71-
cd training/rnn_speech_recognition/pytorch && \
67+
cd ${MODEL_WORKSPACE}/${PACKAGE_NAME}/models/language_modeling/pytorch/rnnt/inference/cpu && \
7268
pip install -r requirements.txt && \
7369
pip install unidecode inflect && \
74-
mkdir -p /root/.local
75-
76-
RUN source activate pytorch && \
77-
cd /workspace && \
70+
yum install -y libsndfile && \
71+
mkdir -p /root/.local && \
7872
git clone https://github.com/HawkAaron/warp-transducer && \
7973
cd warp-transducer && \
8074
mkdir build && \
@@ -84,7 +78,6 @@ RUN source activate pytorch && \
8478
cd ../pytorch_binding && \
8579
python setup.py install
8680

87-
8881
FROM intel-optimized-pytorch AS release
8982
COPY --from=intel-optimized-pytorch /root/conda /root/conda
9083
COPY --from=intel-optimized-pytorch /workspace/lib/ /workspace/lib/

quickstart/language_modeling/pytorch/rnnt/inference/cpu/.docs/datasets.md

+1-1
Original file line numberDiff line numberDiff line change
@@ -16,7 +16,7 @@ docker run --rm \
1616
-w /workspace/<package dir> \
1717
-it \
1818
<docker image> \
19-
/bin/bash quickstart/download_inference_dataset.sh
19+
/bin/bash quickstart/download_dataset.sh
2020
```
2121

2222
This `DATASET_DIR` environment variable will be used again when

quickstart/language_modeling/pytorch/rnnt/inference/cpu/.docs/docker_spr.md

+7-5
Original file line numberDiff line numberDiff line change
@@ -1,10 +1,12 @@
11
## Run the model
22

3-
Download the pretrained model and set the `PRETRAINED_MODEL` environment variable
4-
to point to the file:
3+
Set the `CHECKPOINT_DIR` environment variable and run the script to download the
4+
pretrained model:
55
```
6-
wget https://zenodo.org/record/3662521/files/DistributedDataParallel_1576581068.9962234-epoch-100.pt?download=1 -O rnnt.pt
7-
export PRETRAINED_MODEL=$(pwd)/rnnt.pt
6+
export CHECKPOINT_DIR=<directory to download the pretrained model>
7+
mkdir -p $CHECKPOINT_DIR
8+
cd <package dir>
9+
bash download_model.sh
810
```
911

1012
After you've downloaded the pretrained model and followed the instructions to
@@ -22,7 +24,7 @@ cd <package dir>
2224
2325
# Set the required environment vars
2426
export DATASET_DIR=<path to the dataset>
25-
export PRETRAINED_MODEL=<path to the rnnt.pt file>
27+
export CHECKPOINT_DIR=<path to the downloaded model weights directory>
2628
export PRECISION=<specify the precision to run (fp32 or bf16)>
2729
export OUTPUT_DIR=<directory where log files will be written>
2830

quickstart/language_modeling/pytorch/rnnt/inference/cpu/.docs/quickstart.md

+1-1
Original file line numberDiff line numberDiff line change
@@ -3,7 +3,7 @@
33

44
| Script name | Description |
55
|-------------|-------------|
6-
| `download_inference_dataset.sh` | Download and prepare the LibriSpeech inference dataset. See the [datasets section](#datasets) for instructions on it's usage. |
6+
| `download_dataset.sh` | Download and prepare the LibriSpeech inference dataset. See the [datasets section](#datasets) for instructions on its usage. |
77
| `inference_realtime.sh` | Runs multi-instance inference using 4 cores per instance for the specified precision (fp32, avx-fp32, or bf16). |
88
| `inference_throughput.sh` | Runs multi-instance inference using 1 instance per socket for the specified precision (fp32, avx-fp32, or bf16). |
99
| `accuracy.sh` | Runs an inference accuracy test for the specified precision (fp32, avx-fp32, or bf16). |

quickstart/language_modeling/pytorch/rnnt/inference/cpu/README.md

+5-5
Original file line numberDiff line numberDiff line change
@@ -19,13 +19,13 @@ Follow [link](/docs/general/pytorch/BareMetalSetup.md) to install Conda and buil
1919
* Download and preprocess RNN-T dataset:
2020
```bash
2121
export DATASET_DIR=#Where_to_save_Dataset
22-
bash ${MODEL_DIR}/quickstart/language_modeling/pytorch/rnnt/inference/cpu/download_dataset_baremetal.sh
22+
bash ${MODEL_DIR}/quickstart/language_modeling/pytorch/rnnt/inference/cpu/download_dataset.sh
2323
```
2424

2525
* Download pretrained model
2626
```bash
2727
export CHECKPOINT_DIR=#Where_to_save_pretrained_model
28-
bash ${MODEL_DIR}/quickstart/language_modeling/pytorch/rnnt/inference/cpu/download_model_baremetal.sh
28+
bash ${MODEL_DIR}/quickstart/language_modeling/pytorch/rnnt/inference/cpu/download_model.sh
2929
```
3030

3131
* Set Jemalloc Preload for better performance
@@ -52,8 +52,8 @@ Follow [link](/docs/general/pytorch/BareMetalSetup.md) to install Conda and buil
5252

5353
| DataType | Throughput | Latency | Accuracy |
5454
| ----------- | ----------- | ----------- | ----------- |
55-
| FP32 | bash batch_inference_baremetal.sh fp32 | bash online_inference_baremetal.sh fp32 | bash accuracy_baremetal.sh fp32 |
56-
| BF16 | bash batch_inference_baremetal.sh bf16 | bash online_inference_baremetal.sh bf16 | bash accuracy_baremetal.sh bf16 |
55+
| FP32 | bash inference_throughput.sh fp32 | bash inference_realtime.sh fp32 | bash accuracy.sh fp32 |
56+
| BF16 | bash inference_throughput.sh bf16 | bash inference_realtime.sh bf16 | bash accuracy.sh bf16 |
5757

5858
## Run the model
5959

@@ -76,7 +76,7 @@ export DATASET_DIR=<path to the dataset>
7676
7777
# Run a quickstart script (for example, FP32 batch inference)
7878
cd ${MODEL_DIR}/quickstart/language_modeling/pytorch/rnnt/inference/cpu
79-
bash batch_inference_baremetal.sh fp32
79+
bash inference_throughput.sh fp32
8080
```
8181

8282
<!--- 80. License -->

quickstart/language_modeling/pytorch/rnnt/inference/cpu/README_SPR.md

+9-7
Original file line numberDiff line numberDiff line change
@@ -29,7 +29,7 @@ pytorch-spr-rnnt-inference
2929

3030
| Script name | Description |
3131
|-------------|-------------|
32-
| `download_inference_dataset.sh` | Download and prepare the LibriSpeech inference dataset. See the [datasets section](#datasets) for instructions on it's usage. |
32+
| `download_dataset.sh` | Download and prepare the LibriSpeech inference dataset. See the [datasets section](#datasets) for instructions on its usage. |
3333
| `inference_realtime.sh` | Runs multi-instance inference using 4 cores per instance for the specified precision (fp32, avx-fp32, or bf16). |
3434
| `inference_throughput.sh` | Runs multi-instance inference using 1 instance per socket for the specified precision (fp32, avx-fp32, or bf16). |
3535
| `accuracy.sh` | Runs an inference accuracy test for the specified precision (fp32, avx-fp32, or bf16). |
@@ -83,19 +83,21 @@ docker run --rm \
8383
-w /workspace/pytorch-spr-rnnt-inference \
8484
-it \
8585
model-zoo:pytorch-spr-rnnt-inference \
86-
/bin/bash quickstart/download_inference_dataset.sh
86+
/bin/bash quickstart/download_dataset.sh
8787
```
8888

8989
This `DATASET_DIR` environment variable will be used again when
9090
[running the model](#run-the-model).
9191

9292
## Run the model
9393

94-
Download the pretrained model and set the `PRETRAINED_MODEL` environment variable
95-
to point to the file:
94+
Set the `CHECKPOINT_DIR` environment variable and run the script to download the
95+
pretrained model:
9696
```
97-
wget https://zenodo.org/record/3662521/files/DistributedDataParallel_1576581068.9962234-epoch-100.pt?download=1 -O rnnt.pt
98-
export PRETRAINED_MODEL=$(pwd)/rnnt.pt
97+
export CHECKPOINT_DIR=<directory to download the pretrained model>
98+
mkdir -p $CHECKPOINT_DIR
99+
cd pytorch-spr-rnnt-inference
100+
bash download_model.sh
99101
```
100102

101103
After you've downloaded the pretrained model and followed the instructions to
@@ -113,7 +115,7 @@ cd pytorch-spr-rnnt-inference
113115
114116
# Set the required environment vars
115117
export DATASET_DIR=<path to the dataset>
116-
export PRETRAINED_MODEL=<path to the rnnt.pt file>
118+
export CHECKPOINT_DIR=<path to the downloaded model weights directory>
117119
export PRECISION=<specify the precision to run (fp32 or bf16)>
118120
export OUTPUT_DIR=<directory where log files will be written>
119121
Original file line numberDiff line numberDiff line change
@@ -1,6 +1,6 @@
11
#!/usr/bin/env bash
22
#
3-
# Copyright (c) 2021 Intel Corporation
3+
# Copyright (c) 2020 Intel Corporation
44
#
55
# Licensed under the Apache License, Version 2.0 (the "License");
66
# you may not use this file except in compliance with the License.
@@ -17,47 +17,62 @@
1717

1818
MODEL_DIR=${MODEL_DIR-$PWD}
1919

20-
echo "PRETRAINED_MODEL: ${PRETRAINED_MODEL}"
21-
echo "DATASET_DIR: ${DATASET_DIR}"
22-
echo "PRECISION: ${PRECISION}"
23-
echo "OUTPUT_DIR: ${OUTPUT_DIR}"
24-
25-
if [ -z "${OUTPUT_DIR}" ]; then
26-
echo "The required environment variable OUTPUT_DIR has not been set"
20+
if [ ! -e "${MODEL_DIR}/models/language_modeling/pytorch/rnnt/inference/cpu/inference.py" ]; then
21+
echo "Could not find the script of inference.py. Please set environment variable '\${MODEL_DIR}'."
22+
echo "From which the inference.py exist at the: \${MODEL_DIR}/models/language_modeling/pytorch/rnnt/inference/cpu/inference.py"
2723
exit 1
2824
fi
2925

30-
# Create the output directory in case it doesn't already exist
31-
mkdir -p ${OUTPUT_DIR}
32-
33-
if [ -z "${DATASET_DIR}" ]; then
34-
echo "The required environment variable DATASET_DIR has not been set"
26+
if [ ! -e "${CHECKPOINT_DIR}/results/rnnt.pt" ]; then
27+
echo "The pretrained model \${CHECKPOINT_DIR}/results/rnnt.pt does not exist"
3528
exit 1
3629
fi
3730

38-
if [ ! -d "${DATASET_DIR}" ]; then
39-
echo "The DATASET_DIR '${DATASET_DIR}' does not exist"
31+
if [ ! -d "${DATASET_DIR}/dataset/LibriSpeech" ]; then
32+
echo "The DATASET_DIR \${DATASET_DIR}/dataset/LibriSpeech does not exist"
4033
exit 1
4134
fi
4235

43-
if [ -z "${PRECISION}" ]; then
44-
echo "The required environment variable PRECISION has not been set"
45-
echo "Please set PRECISION to fp32, avx-fp32, or bf16."
36+
if [ ! -d "${OUTPUT_DIR}" ]; then
37+
echo "The OUTPUT_DIR '${OUTPUT_DIR}' does not exist"
4638
exit 1
4739
fi
4840

49-
cd ${MODEL_DIR}/models/rnnt/training/rnn_speech_recognition/pytorch
50-
export work_space=${OUTPUT_DIR}
51-
52-
if [[ $PRECISION == "avx-fp32" ]]; then
41+
if [[ "$1" == *"avx"* ]]; then
5342
unset DNNL_MAX_CPU_ISA
54-
PRECISION=fp32
5543
fi
5644

57-
if [[ $PRECISION == "bf16" || $PRECISION == "fp32" ]]; then
58-
bash run_inference_cpu_accuracy_ipex.sh ${DATASET_DIR} ${PRETRAINED_MODEL} ipex ${PRECISION} jit 2>&1 | tee -a ${OUTPUT_DIR}/rnnt-inference-accuracy-${PRECISION}.log
45+
ARGS=""
46+
if [ "$1" == "bf16" ]; then
47+
ARGS="$ARGS --mix-precision"
48+
echo "### running bf16 datatype"
5949
else
60-
echo "The specified precision '${PRECISION}' is unsupported."
61-
echo "Supported precisions are: fp32, avx-fp32, and bf16"
62-
exit 1
50+
echo "### running fp32 datatype"
6351
fi
52+
53+
export DNNL_PRIMITIVE_CACHE_CAPACITY=1024
54+
export KMP_BLOCKTIME=1
55+
export KMP_AFFINITY=granularity=fine,compact,1,0
56+
57+
BATCH_SIZE=64
58+
PRECISION=$1
59+
60+
rm -rf ${OUTPUT_DIR}/rnnt_${PRECISION}_inference_accuracy*
61+
62+
python -m intel_extension_for_pytorch.cpu.launch \
63+
--use_default_allocator \
64+
${MODEL_DIR}/models/language_modeling/pytorch/rnnt/inference/cpu/inference.py \
65+
--dataset_dir ${DATASET_DIR}/dataset/LibriSpeech/ \
66+
--val_manifest ${DATASET_DIR}/dataset/LibriSpeech/librispeech-dev-clean-wav.json \
67+
--model_toml ${MODEL_DIR}/models/language_modeling/pytorch/rnnt/inference/cpu/configs/rnnt.toml \
68+
--ckpt ${CHECKPOINT_DIR}/results/rnnt.pt \
69+
--batch_size $BATCH_SIZE \
70+
--ipex \
71+
--jit \
72+
$ARGS 2>&1 | tee ${OUTPUT_DIR}/rnnt_${PRECISION}_inference_accuracy.log
73+
74+
# For the summary of results
75+
wait
76+
77+
accuracy=$(grep 'Accuracy:' ${OUTPUT_DIR}/rnnt_${PRECISION}_inference_accuracy* |sed -e 's/.*Accuracy//;s/[^0-9.]//g')
78+
echo ""RNN-T";"accuracy";$1; ${BATCH_SIZE};${accuracy}" | tee -a ${OUTPUT_DIR}/summary.log

quickstart/language_modeling/pytorch/rnnt/inference/cpu/accuracy_baremetal.sh

-73
This file was deleted.

0 commit comments

Comments
 (0)