muendelezaji · February 11, 2020 13:22
diff --git a/0001-tflite-allow-fp16-for-fp32-models.patch b/0001-tflite-allow-fp16-for-fp32-models.patch
 From b5a99e2174f115f87c0cb3de9d2a2479a0193db2 Mon Sep 17 00:00:00 2001
 From: Koan-Sin Tan <[email protected]>
 Date: Sun, 18 Nov 2018 13:11:38 +0800
 Subject: [PATCH 1/3] add cmdline option to allow running fp32 models with fp16

 Add an option for TFLite benchmark_model to allow running fp32
 models with fp16. Useful when testing NNPAI accelerators with
 fp16.
 ---
 .../lite/tools/benchmark/benchmark_tflite_model.cc       | 9 ++++++++-
 1 file changed, 8 insertions(+), 1 deletion(-)

 diff --git a/tensorflow/lite/tools/benchmark/benchmark_tflite_model.cc b/tensorflow/lite/tools/benchmark/benchmark_tflite_model.cc
 index 83e0ff1f872ef7..2d8b3a198c2967 100644
 --- a/tensorflow/lite/tools/benchmark/benchmark_tflite_model.cc
 +++ b/tensorflow/lite/tools/benchmark/benchmark_tflite_model.cc
 @@ -200,6 +200,7 @@ BenchmarkParams BenchmarkTfLiteModel::DefaultParams() {
   default_params.AddParam("input_layer_shape",
                           BenchmarkParam::Create<std::string>(""));
   default_params.AddParam("use_nnapi", BenchmarkParam::Create<bool>(false));
 +  default_params.AddParam("allow_fp16", BenchmarkParam::Create<bool>(false));
   return default_params;
 }
 
 @@ -219,7 +220,8 @@ std::vector<Flag> BenchmarkTfLiteModel::GetFlags() {
       CreateFlag<std::string>("input_layer", &params_, "input layer names"),
       CreateFlag<std::string>("input_layer_shape", &params_,
                               "input layer shape"),
 -      CreateFlag<bool>("use_nnapi", &params_, "use nnapi api")};
 +      CreateFlag<bool>("use_nnapi", &params_, "use nnapi api"),
 +      CreateFlag<bool>("allow_fp16", &params_, "allow fp16")};
 
   flags.insert(flags.end(), specific_flags.begin(), specific_flags.end());
   return flags;
 @@ -233,6 +235,7 @@ void BenchmarkTfLiteModel::LogParams() {
   TFLITE_LOG(INFO) << "Input shapes: ["
                    << params_.Get<std::string>("input_layer_shape") << "]";
   TFLITE_LOG(INFO) << "Use nnapi : [" << params_.Get<bool>("use_nnapi") << "]";
 +  TFLITE_LOG(INFO) << "Allow fp16 : [" << params_.Get<bool>("allow_fp16") << "]";
 }
 
 bool BenchmarkTfLiteModel::ValidateParams() {
 @@ -328,6 +331,10 @@ void BenchmarkTfLiteModel::Init() {
   interpreter->UseNNAPI(use_nnapi);
   ApplyDelegates();
 
 +  bool allow_fp16 = params_.Get<bool>("allow_fp16");
 +
 +  interpreter->SetAllowFp16PrecisionForFp32(allow_fp16);
 +
   auto interpreter_inputs = interpreter->inputs();
 
   if (!inputs.empty()) {

 From dc4b9745b41ca7b2a00efb142bb0ab1e9895b4e0 Mon Sep 17 00:00:00 2001
 From: Koan-Sin Tan <[email protected]>
 Date: Sun, 18 Nov 2018 13:31:02 +0800
 Subject: [PATCH 2/3] add option for label_image to allow running fp32 models
 with fp16

 Add an option for TFLite label_image to allow running fp32
 models with fp16. Useful when testing NNPAI accelerators with
 fp16.
 ---
 tensorflow/lite/examples/label_image/label_image.cc | 6 ++++++
 tensorflow/lite/examples/label_image/label_image.h  | 1 +
 2 files changed, 7 insertions(+)

 diff --git a/tensorflow/lite/examples/label_image/label_image.cc b/tensorflow/lite/examples/label_image/label_image.cc
 index b8dc2840dfb49f..b83563280ec173 100644
 --- a/tensorflow/lite/examples/label_image/label_image.cc
 +++ b/tensorflow/lite/examples/label_image/label_image.cc
 @@ -113,6 +113,7 @@ void RunInference(Settings* s) {
   }
 
   interpreter->UseNNAPI(s->accel);
 +  interpreter->SetAllowFp16PrecisionForFp32(s->allow_fp16);
 
   if (s->verbose) {
     LOG(INFO) << "tensors size: " << interpreter->tensors_size() << "\n";
 @@ -253,6 +254,7 @@ void RunInference(Settings* s) {
 void display_usage() {
   LOG(INFO) << "label_image\n"
             << "--accelerated, -a: [0|1], use Android NNAPI or not\n"
 +            << "--allow_fp16, -f: [0|1], allow running fp32 models with fp16 not\n"
             << "--count, -c: loop interpreter->Invoke() for certain times\n"
             << "--input_mean, -b: input mean\n"
             << "--input_std, -s: input standard deviation\n"
 @@ -273,6 +275,7 @@ int Main(int argc, char** argv) {
   while (1) {
     static struct option long_options[] = {
         {"accelerated", required_argument, nullptr, 'a'},
 +        {"allow_fp16", required_argument, nullptr, 'f'},
         {"count", required_argument, nullptr, 'c'},
         {"verbose", required_argument, nullptr, 'v'},
         {"image", required_argument, nullptr, 'i'},
 @@ -305,6 +308,9 @@ int Main(int argc, char** argv) {
         s.loop_count =
             strtol(optarg, nullptr, 10);  // NOLINT(runtime/deprecated_fn)
         break;
 +      case 'f':
 +        s.allow_fp16 = strtol(optarg, nullptr, 10);  // NOLINT(runtime/deprecated_fn)
 +        break;
       case 'i':
         s.input_bmp_name = optarg;
         break;
 diff --git a/tensorflow/lite/examples/label_image/label_image.h b/tensorflow/lite/examples/label_image/label_image.h
 index 88b047fecc4b3e..cc46e56b64a9dc 100644
 --- a/tensorflow/lite/examples/label_image/label_image.h
 +++ b/tensorflow/lite/examples/label_image/label_image.h
 @@ -26,6 +26,7 @@ struct Settings {
   bool accel = false;
   bool input_floating = false;
   bool profiling = false;
 +  bool allow_fp16 = false;
   int loop_count = 1;
   float input_mean = 127.5f;
   float input_std = 127.5f;

 From ab7b554405dc4bf5b023522095a9b4a318327e0b Mon Sep 17 00:00:00 2001
 From: Koan-Sin Tan <[email protected]>
 Date: Tue, 12 Feb 2019 16:15:22 +0800
 Subject: [PATCH 3/3] rebase and run clang-format

 ---
 .../lite/examples/label_image/label_image.cc  | 32 ++++++++++---------
 1 file changed, 17 insertions(+), 15 deletions(-)

 diff --git a/tensorflow/lite/examples/label_image/label_image.cc b/tensorflow/lite/examples/label_image/label_image.cc
 index b83563280ec173..340fbab5c6fcc9 100644
 --- a/tensorflow/lite/examples/label_image/label_image.cc
 +++ b/tensorflow/lite/examples/label_image/label_image.cc
 @@ -252,20 +252,21 @@ void RunInference(Settings* s) {
 }
 
 void display_usage() {
 -  LOG(INFO) << "label_image\n"
 -            << "--accelerated, -a: [0|1], use Android NNAPI or not\n"
 -            << "--allow_fp16, -f: [0|1], allow running fp32 models with fp16 not\n"
 -            << "--count, -c: loop interpreter->Invoke() for certain times\n"
 -            << "--input_mean, -b: input mean\n"
 -            << "--input_std, -s: input standard deviation\n"
 -            << "--image, -i: image_name.bmp\n"
 -            << "--labels, -l: labels for the model\n"
 -            << "--tflite_model, -m: model_name.tflite\n"
 -            << "--profiling, -p: [0|1], profiling or not\n"
 -            << "--num_results, -r: number of results to show\n"
 -            << "--threads, -t: number of threads\n"
 -            << "--verbose, -v: [0|1] print more information\n"
 -            << "\n";
 +  LOG(INFO)
 +      << "label_image\n"
 +      << "--accelerated, -a: [0|1], use Android NNAPI or not\n"
 +      << "--allow_fp16, -f: [0|1], allow running fp32 models with fp16 not\n"
 +      << "--count, -c: loop interpreter->Invoke() for certain times\n"
 +      << "--input_mean, -b: input mean\n"
 +      << "--input_std, -s: input standard deviation\n"
 +      << "--image, -i: image_name.bmp\n"
 +      << "--labels, -l: labels for the model\n"
 +      << "--tflite_model, -m: model_name.tflite\n"
 +      << "--profiling, -p: [0|1], profiling or not\n"
 +      << "--num_results, -r: number of results to show\n"
 +      << "--threads, -t: number of threads\n"
 +      << "--verbose, -v: [0|1] print more information\n"
 +      << "\n";
 }
 
 int Main(int argc, char** argv) {
 @@ -309,7 +310,8 @@ int Main(int argc, char** argv) {
             strtol(optarg, nullptr, 10);  // NOLINT(runtime/deprecated_fn)
         break;
       case 'f':
 -        s.allow_fp16 = strtol(optarg, nullptr, 10);  // NOLINT(runtime/deprecated_fn)
 +        s.allow_fp16 =
 +            strtol(optarg, nullptr, 10);  // NOLINT(runtime/deprecated_fn)
         break;
       case 'i':
         s.input_bmp_name = optarg;
diff --git a/0002-tflite-label-image-log-timing-dist.patch b/0002-tflite-label-image-log-timing-dist.patch
 diff --git a/tensorflow/lite/examples/label_image/label_image.cc b/tensorflow/lite/examples/label_image/label_image.cc
 index 7c6f523..e458423 100644
 --- a/tensorflow/lite/examples/label_image/label_image.cc
 +++ b/tensorflow/lite/examples/label_image/label_image.cc
 @@ -24,6 +24,8 @@ limitations under the License.
 #include <string>
 #include <unordered_set>
 #include <vector>
 +#include <algorithm>
 +#include <functional>
 
 #include <fcntl.h>      // NOLINT(build/include_order)
 #include <getopt.h>     // NOLINT(build/include_order)
 @@ -45,7 +47,7 @@ limitations under the License.
 namespace tflite {
 namespace label_image {
 
 -double get_us(struct timeval t) { return (t.tv_sec * 1000000 + t.tv_usec); }
 +double get_us(struct timeval t) { return (t.tv_sec * 1000000.0 + (double)t.tv_usec); }
 
 // Takes a file name, and loads a list of labels from it, one per line, and
 // returns a vector of the strings. It pads with empty strings so the length
 @@ -87,6 +89,41 @@ void PrintProfilingInfo(const profiling::ProfileEvent* e, uint32_t op_index,
             << "\n";
 }
 
 +void LogTimingDistribution(std::vector<double> & timings) {
 +  int timing_count = timings.size();
 +  int p5_count = timing_count / 20;
 +  std::sort(timings.begin(), timings.end());
 +
 +  int i = 0;
 +  int c = 0;
 +  double avg = 0;
 +  for(auto t : timings) {
 +    double ms = t / 1000.0;
 +    avg += ms;
 +    ++i;
 +    ++c;
 +    if (i > p5_count || c == timing_count) {
 +      LOG(INFO) << " => " << (c*100/timing_count) << "% is " << ms <<
 +          " ms. avg within bucket: " << (avg/i) << " ms\n";
 +      i = 0;
 +      avg = 0;
 +    }
 +  }
 +}
 +
 +void LogTimings(std::vector<double> & timings) {
 +  int timing_count = timings.size();
 +
 +  int i = 0;
 +  int c = 0;
 +  double avg = 0;
 +  for(auto t : timings) {
 +    double ms = t / 1000.0;
 +    LOG(INFO) << "Iteration_" << c << "=" << ms <<" ms\n";
 +    ++c;
 +  }
 +}
 +
 void RunInference(Settings* s) {
   if (!s->model_name.c_str()) {
     LOG(ERROR) << "no model file name\n";
 @@ -188,19 +226,26 @@ void RunInference(Settings* s) {
 
   if (s->profiling) profiler->StartProfiling();
 
 -  struct timeval start_time, stop_time;
 +  struct timeval start_time, stop_time, act_time;
   gettimeofday(&start_time, nullptr);
 +  std::vector<double> timings;
 +  double prev_time_us = get_us(start_time);
   for (int i = 0; i < s->loop_count; i++) {
     if (interpreter->Invoke() != kTfLiteOk) {
       LOG(FATAL) << "Failed to invoke tflite!\n";
     }
 +    gettimeofday(&act_time, NULL);
 +    double act_time_us = get_us(act_time);
 +    timings.push_back(act_time_us - prev_time_us);
 +    prev_time_us = act_time_us;
   }
   gettimeofday(&stop_time, nullptr);
   LOG(INFO) << "invoked \n";
   LOG(INFO) << "average time: "
             << (get_us(stop_time) - get_us(start_time)) / (s->loop_count * 1000)
             << " ms \n";
 -
 +  LogTimings(timings);
 +  LogTimingDistribution(timings);
   if (s->profiling) {
     profiler->StopProfiling();
     auto profile_events = profiler->GetProfileEvents();
diff --git a/build-tflite-1.13.sh b/build-tflite-1.13.sh
 #!/usr/bin/env bash

 set -eo pipefail

 # Release tag or branch name
 TF_VERSION=${TF_VERSION:-"v1.13.1"}

 # Clone a fresh copy
 if [ -n "${TF_CLONE}" ]; then
    TF_SRCDIR=/tmp/build-tflite/tensorflow_src
    rm -rf ${TF_SRCDIR}
    mkdir -p ${TF_SRCDIR}
    if [ ! -d "${TF_SRCDIR}" ]; then
        git clone --branch ${TF_VERSION} --depth 1 https://github.com/tensorflow/tensorflow ${TF_SRCDIR}
    fi

    # Download patches
    TF_PATCH_DIR=/tmp/build-tflite/tf_patches
    TF_APPLY_PATCH="yes"
    TF_PATCHES=("0001-tflite-allow-fp16-for-fp32-models.patch" "0002-tflite-label-image-log-timing-dist.patch")
    for patch in "${TF_PATCHES[@]}"; do
        wget -q -nc --show-progress https://gist.github.com/muendelezaji/47b32812a15b622f05019b0e433de9b1/raw/${patch} -P ${TF_PATCH_DIR}
    done
 fi

 # Alternatively, provide path to cloned TensorFlow repo
 TF_SRCDIR=${1:-"$TF_SRCDIR"}
 TF_SRCDIR="$(readlink -f ${1:-"$TF_SRCDIR"})" # get absolute
 # Folder with patches
 TF_PATCH_DIR="$(readlink -f ${TF_PATCH_DIR:-"patches"})"
 TF_APPLY_PATCH=${TF_APPLY_PATCH:-"yes"}
 # Output folder
 TF_OUTDIR="$(readlink -f ${TF_OUTDIR:-"out"})"

 # Sanity checks
 if [ ! -d "${TF_SRCDIR}" ]; then
    echo "ERROR: Cannot find TensorFlow source directory. Ensure it exists or set TF_CLONE to do a new clone."
    exit 1
 elif [ ! -f "${TF_SRCDIR}/configure" -o ! -f "${TF_SRCDIR}/BUILD" ]; then
    echo "ERROR: Missing configure or BUILD file in $TF_SRCDIR. Ensure it is a valid Bazel workspace."
    exit 1
 elif [ "${TF_APPLY_PATCH}" = "yes" -a ! -d "${TF_PATCH_DIR}" ]; then
    echo "ERROR: Patches directory was not found. It must exist when TF_APPLY_PATCH is set to 'yes'."
    exit 1
 elif [ -z "${ANDROID_NDK_HOME}" -o -z "${ANDROID_SDK_HOME}" ]; then
    echo "ERROR: Cannot locate Android NDK or SDK. Ensure both ANDROID_NDK_HOME and ANDROID_SDK_HOME are set."
    exit 1
 fi

 # Apply required patches
 if [ "${TF_APPLY_PATCH}" = "yes" ]; then
    pushd ${TF_SRCDIR}
    for patch in $(find "${TF_PATCH_DIR}" -type f -name "*.patch" | sort); do
        git apply ${patch}
    done
    git config --local user.name temp
    git config --local user.email [email protected]
    git commit -am "[TFLite] Add fp16 support and log timing distribution"
    popd
 fi

 # Select features
 TF_BUILD_VARS="TF_NEED_CUDA=0"
 TF_BUILD_VARS+=" TF_NEED_OPENCL_SYCL=0"
 TF_BUILD_VARS+=" TF_NEED_ROCM=0"
 TF_BUILD_VARS+=" TF_NEED_JEMALLOC=1"
 TF_BUILD_VARS+=" TF_NEED_MPI=0"
 TF_BUILD_VARS+=" TF_ENABLE_XLA=0"
 TF_BUILD_VARS+=" TF_DOWNLOAD_CLANG=0"
 TF_BUILD_VARS+=" TF_SET_ANDROID_WORKSPACE=1"
 export ${TF_BUILD_VARS}

 # Bazel settings
 BAZEL_BIN=${BAZEL_BIN:-"$(command -v bazel || true)"}
 BAZEL_JOBS=${BAZEL_JOBS:-"4"}
 # BAZEL_PATCH="yes"
 # BAZEL_AVAIL_RAM=1536 # MB
 # BAZEL_AVAIL_CPU=4.0  # number of cpu cores (1.0 representing a single full core)
 # BAZEL_AVAIL_IO=1.0   # workstation I/O capability (with 1.0 representing average workstation)
 # if [ -n "$BAZEL_AVAIL_RAM" -a -n "$BAZEL_AVAIL_CPU" -a -n "$BAZEL_AVAIL_IO" ]; then
 #     BAZEL_RESOURCES="--local_resources ${BAZEL_AVAIL_RAM},${BAZEL_AVAIL_CPU},${BAZEL_AVAIL_IO}"
 # fi

 # Download if not present - use portable binary to avoid installation
 if [ ! -x "${BAZEL_BIN}" ]; then
    BAZEL_VERSION="0.20.0" # was 0.19.2
    BAZEL_FILE="bazel-${BAZEL_VERSION}-linux-x86_64"
    BAZEL_DIR="/tmp/build-tflite/bazel_bin/${BAZEL_VERSION}"
    mkdir -p ${BAZEL_DIR}
    wget -q -nc --show-progress https://github.com/bazelbuild/bazel/releases/download/${BAZEL_VERSION}/${BAZEL_FILE} -P ${BAZEL_DIR}
    chmod +x ${BAZEL_DIR}/${BAZEL_FILE}
    ln -sf ${BAZEL_DIR}/${BAZEL_FILE} ${BAZEL_DIR}/bazel
    export PATH="${BAZEL_DIR}:$PATH"
    BAZEL_BIN="$(command -v bazel)"
 fi

 # Build config
 # Disable default-on TensorFlow cloud features
 BAZEL_COPT_FLAGS=" --config=noaws --config=nogcp --config=nohdfs --config=nokafka --config=noignite --config=nonccl --define tensorflow_mkldnn_contraction_kernel=0"
 # Android "--config=android_arm64" is equivalent to:
 # --cpu=arm64-v8a --fat_apk_cpu=arm64-v8a --crosstool_top=//external:android/crosstool --host_crosstool_top=@bazel_tools//tools/cpp:toolchain
 BAZEL_COPT_FLAGS+=" --copt=-DTFLITE_PROFILING_ENABLED --cxxopt=-std=c++11 --config=monolithic --config=android_arm64 --action_env ANDROID_NDK_API_LEVEL=28" # was 21
 # TFLite targets for Android
 BAZEL_EXTRA_FLAGS=" //tensorflow/lite/examples/label_image:label_image"
 BAZEL_EXTRA_FLAGS+=" //tensorflow/lite/tools/benchmark:benchmark_model"

 # Python
 TF_PYTHON_VERSION=${TF_PYTHON_VERSION:-"2"}
 export PYTHON_BIN_PATH="$(command -v python${TF_PYTHON_VERSION})"
 export USE_DEFAULT_PYTHON_LIB_PATH="1"

 # GCC optimisations
 # For more info, see: https://gcc.gnu.org/onlinedocs/gcc/ARM-Options.html
 export CC_OPT_FLAGS="-march=armv8-a"
 # Add suffix to TF_OUTDIR for more specialised builds
 if [ "${TF_GCC_OPTS}" = "simd" ]; then
    CC_OPT_FLAGS="-march=armv8-a+simd"
    TF_OUTDIR="${TF_OUTDIR}-simd"
 elif [ "${TF_GCC_OPTS}" = "fp16" ]; then
    CC_OPT_FLAGS="-march=armv8.2-a+fp16"
    TF_OUTDIR="${TF_OUTDIR}-fp16"
 fi
 BAZEL_COPT_FLAGS+=" --copt=${CC_OPT_FLAGS}"

 # Android
 export NDK_ROOT="${ANDROID_NDK_HOME}"
 export ANDROID_API_LEVEL="28" # was 26
 export ANDROID_BUILD_TOOLS_VERSION="28.0.3"

 # Configure and build
 pushd ${TF_SRCDIR} && ./configure
 # Clean if not an incremental rebuild
 if [ -z "${TF_REBUILD}" ]; then
    ${BAZEL_BIN} clean
 fi

 ${BAZEL_BIN} build ${BAZEL_RESOURCES} -c opt --verbose_failures --jobs=${BAZEL_JOBS} ${BAZEL_COPT_FLAGS} ${BAZEL_EXTRA_FLAGS}

 mkdir -p ${TF_OUTDIR}
 cp -a --remove-destination -t ${TF_OUTDIR} \
    bazel-bin/tensorflow/lite/examples/label_image/label_image \
    bazel-bin/tensorflow/lite/tools/benchmark/benchmark_model

 echo "Builds saved to: ${TF_OUTDIR}"
diff --git a/build-tflite-for-arm64.jenkinsfile b/build-tflite-for-arm64.jenkinsfile
 #!/usr/bin/env groovy

 pipeline {
    agent any

    parameters {
        choice name: 'BAZEL_VERSION', choices: ['0.19.2', '0.21.0', '0.24.1'], description: 'Bazel version to use when building'
        choice name: 'NDK_VERSION', choices: ['13', '14', '18', '19'], description: 'NDK version to use when building'
        choice name: 'SDK_VERSION', choices: ['21', '28', '29'], description: 'SDK version to use when building'
        choice name: 'TF_VERSION', choices: ['v1.13.1', 'v1.14.0', 'v2.0.0-beta1'], description: 'Tagged version of TensorFlow to download'
    }

    options {
        buildDiscarder logRotator(numToKeepStr: '10')
        skipDefaultCheckout()
        skipStagesAfterUnstable()
        timeout time: 30, unit: 'MINUTES'
        timestamps()
    }

    environment {
        ANDROID_NDK_HOME = "${env.BUILD_TOOLS}/android/android-ndk-r${params.NDK_VERSION}"
        ANDROID_SDK_HOME = "${env.BUILD_TOOLS}/android/android-sdk"
        BAZEL_HOME = "${env.BUILD_TOOLS}/bazel/bazel-${params.BAZEL_VERSION}"
        VENV_HOME  = "${env.HOME}/.local"

        // Set env from params (used in build shell script)
        BAZEL_VERSION = "${params.BAZEL_VERSION}"
        NDK_VERSION   = "${params.NDK_VERSION}"
        SDK_VERSION   = "${params.SDK_VERSION}"
        TF_VERSION    = "${params.TF_VERSION}"

        TF_SRCDIR    = 'src'
        TF_OUTDIR    = 'out'
        TF_PATCH_DIR = 'patches'
        TF_PATCH     = (params.TF_VERSION ==~ '.*1.13.*') ? 'yes' : 'no'
    }

    stages {
        stage('Checkout repo') {
            steps {
                dir("${env.TF_SRCDIR}") {
                    checkout([$class: 'GitSCM', branches: [[name: "refs/tags/${params.TF_VERSION}"]], userRemoteConfigs: [[url: 'https://github.com/tensorflow/tensorflow']]])
                }
            }
        }

        stage('Build TFLite') {
            steps {
                echo '====++++ executing Build TFLite ++++===='
                withEnv([
                    "BAZEL_BIN=${env.BAZEL_HOME}/bin/bazel",
                    "PATH+BAZEL=${env.BAZEL_HOME}/bin",
                    "PATH+VENV=${env.VENV_HOME}/bin",
                ]) {
                    sh '''
                        # Create and activate Python venv
                        virtualenv .
                        virtualenv --relocatable .
                        . ./bin/activate

                        # Install pip requirements
                        # From REQUIRED_PACKAGES in tensorflow/tools/pip_package/setup.py
                        pip install -U pip six numpy wheel setuptools mock future>=0.17.1
                        pip install -U keras_applications==1.0.6 --no-deps
                        pip install -U keras_preprocessing==1.0.5 --no-deps

                        # Download patches
                        GIST_URL=https://gist.github.com/muendelezaji/47b32812a15b622f05019b0e433de9b1/raw
                        mkdir -p $TF_PATCH_DIR
                        for patch in '0001-tflite-allow-fp16-for-fp32-models.patch' '0002-tflite-label-image-log-timing-dist.patch'; do
                            curl -fsL $GIST_URL/$patch > $TF_PATCH_DIR/$patch
                        done

                        # Get build script and run it
                        BUILD_SCRIPT='build-tflite-1.13.sh'
                        curl -fsL $GIST_URL/$BUILD_SCRIPT > $BUILD_SCRIPT
                        chmod +x $BUILD_SCRIPT
                        bash -x ./$BUILD_SCRIPT

                        deactivate
                    '''
                }
            }

            post {
                success {
                    echo '====++++ Build TFLite executed succesfully ++++===='
                    archiveArtifacts artifacts: "${env.TF_OUTDIR}/*", fingerprint: true
                }

                failure {
                    echo '====++++ Build TFLite execution failed ++++===='
                }
            }
        }

        stage('Run TFLite') {
            steps {
                echo '====++++ executing Run TFLite ++++===='
            }
        }
    }

    post {
        always {
            echo '====++++ Pipeline finished ++++===='
            deleteDir() // clean up the workspace
        }
    }
 }
diff --git a/build-tflite-for-arm64.sh b/build-tflite-for-arm64.sh
 #!/bin/sh

 # Configurable build tool parameters
 BAZEL_VERSION=0.19.2
 NDK_VERSION=18
 SDK_VERSION=28
 TF_VERSION=v1.13.1
 TF_PATCH=yes
 TF_PATCH_DIR=patches

 # Setup build tools - use global config or custom tools plugin
 ANDROID_NDK_HOME=$BUILD_TOOLS/android/android-ndk-r$NDK_VERSION
 ANDROID_SDK_HOME=$BUILD_TOOLS/android/android-sdk
 BAZEL_HOME=$BUILD_TOOLS/bazel/bazel-$BAZEL_VERSION
 VENV_HOME=$HOME/.local
 # Add them to path
 PATH=$BAZEL_HOME/bin:$VENV_HOME/bin:$PATH

 # Create and activate Python venv
 virtualenv .
 virtualenv --relocatable .
 . ./bin/activate

 # Install pip requirements
 # From REQUIRED_PACKAGES in tensorflow/tools/pip_package/setup.py
 pip install -U pip six numpy wheel setuptools mock future>=0.17.1
 pip install -U keras_applications==1.0.6 --no-deps
 pip install -U keras_preprocessing==1.0.5 --no-deps

 # Download patches
 GIST_URL=https://gist.github.com/muendelezaji/47b32812a15b622f05019b0e433de9b1/raw
 mkdir -p $TF_PATCH_DIR
 for patch in '0001-tflite-allow-fp16-for-fp32-models.patch'; do
    curl -fsL $GIST_URL/$patch > $TF_PATCH_DIR/$patch
 done

 # Get build script and run it
 BUILD_SCRIPT='build-tflite.sh'
 curl -fsL $GIST_URL/$BUILD_SCRIPT > $BUILD_SCRIPT
 chmod +x $BUILD_SCRIPT
 bash -x ./$BUILD_SCRIPT

 deactivate
diff --git a/build-tflite.sh b/build-tflite.sh
 #!/usr/bin/env bash

 set -eo pipefail

 if [ "${BUILD_CONFIG}" = "2.0" ]; then
    TF_VERSION=v2.0.0-beta1
    TF_PATCH=0
    TF_CLONE=1
    BAZEL_VERSION=0.24.1
    BAZEL_BIN=none # force download
    BAZEL_COPT_FLAGS+=" --config=v2"
 elif [ "${BUILD_CONFIG}" = "1.14" ]; then
    TF_VERSION=v1.14.0
    TF_PATCH=0
    TF_CLONE=1
    BAZEL_VERSION=0.24.1
    BAZEL_BIN=none
 fi

 # Release tag or branch name
 TF_VERSION=${TF_VERSION:-"v1.13.1"}
 TF_PATCH=${TF_PATCH:-"1"}
 # Shorthand
 # : ${TF_VERSION:="v1.13.1"}
 # : ${TF_PATCH:="1"}

 # Clone a fresh copy
 if [ -n "${TF_CLONE}" ]; then
    TF_SRCDIR="/tmp/build-tflite/tensorflow/${TF_VERSION}/src"
    TF_OUTDIR="/tmp/build-tflite/tensorflow/${TF_VERSION}/out"
    if [ ! -d "${TF_SRCDIR}" ]; then
        git clone --branch ${TF_VERSION} --depth 1 https://github.com/tensorflow/tensorflow ${TF_SRCDIR}
    fi

    # Download patches
    if [ "${TF_PATCH}" = "1" ]; then
        TF_PATCH_DIR="/tmp/build-tflite/tensorflow/${TF_VERSION}/patches"
        TF_PATCHES=("0001-tflite-allow-fp16-for-fp32-models.patch" "0002-tflite-label-image-log-timing-dist.patch")
        for patch in "${TF_PATCHES[@]}"; do
            wget -q -nc --show-progress https://gist.github.com/muendelezaji/47b32812a15b622f05019b0e433de9b1/raw/${patch} -P ${TF_PATCH_DIR}
        done
    fi
 fi

 # Alternatively, provide path to cloned TensorFlow repo
 TF_SRCDIR="${TF_SRCDIR:-$(readlink -f "src")}"
 TF_OUTDIR="${TF_OUTDIR:-$(readlink -f "out")}"           # Build outputs folder
 TF_PATCH_DIR="${TF_PATCH_DIR:-$(readlink -f "patches")}" # Folder with patches
 # Shorthand
 # : ${TF_SRCDIR:=$(readlink -f "src")}
 # : ${TF_OUTDIR:=$(readlink -f "out")}
 # : ${TF_PATCH_DIR:=$(readlink -f "patches")}

 # Sanity checks
 if [ ! -d "${TF_SRCDIR}" ]; then
    echo "ERROR: Cannot find TensorFlow source directory. Ensure it exists or set TF_CLONE to do a new clone."
    exit 1
 elif [ ! -f "${TF_SRCDIR}/configure" -o ! -f "${TF_SRCDIR}/BUILD" ]; then
    echo "ERROR: Missing configure or BUILD file in ${TF_SRCDIR}. Ensure it is a valid Bazel workspace."
    exit 1
 elif [ "${TF_PATCH}" = "1" -a ! -d "${TF_PATCH_DIR}" ]; then
    echo "ERROR: Patches directory was not found. It must exist when TF_PATCH is set to 'yes'."
    exit 1
 elif [ -z "${ANDROID_NDK_HOME}" -o -z "${ANDROID_SDK_HOME}" ]; then
    echo "ERROR: Cannot locate Android NDK or SDK. Ensure both ANDROID_NDK_HOME and ANDROID_SDK_HOME are set."
    exit 1
 fi

 pushd ${TF_SRCDIR}

 # Apply required patches
 if [ "${TF_PATCH}" = "1" ]; then
    for patch in $(find ${TF_PATCH_DIR} -type f -name "*.patch" | sort); do
        git apply ${patch}
    done
    git config --local user.name temp
    git config --local user.email [email protected]
    git commit -am "[TFLite] All patched up and ready to go"
 fi

 # Bazel
 BAZEL_BIN=${BAZEL_BIN:-"$(command -v bazel || true)"}
 BAZEL_JOBS=${BAZEL_JOBS:-"4"}
 # BAZEL_PATCH="no"
 # BAZEL_AVAIL_RAM=2048 # MB
 # BAZEL_AVAIL_CPU=4.0  # number of cpu cores (1.0 representing a single full core)
 # BAZEL_AVAIL_IO=1.0   # workstation I/O capability (with 1.0 representing average workstation)
 # if [ -n "${BAZEL_AVAIL_RAM}" -a -n "${BAZEL_AVAIL_CPU}" -a -n "${BAZEL_AVAIL_IO}" ]; then
 #     BAZEL_RESOURCES="--local_resources ${BAZEL_AVAIL_RAM},${BAZEL_AVAIL_CPU},${BAZEL_AVAIL_IO}"
 # fi
 if [ -n "${BAZEL_DRYRUN}" ]; then
    BAZEL_DEBUG_FLAGS+=" --nobuild"
 fi
 if [ -n "${BAZEL_VERBOSE}" ]; then
    BAZEL_DEBUG_FLAGS+=" -s --explain=${TF_OUTDIR}/explain.log"
 fi
 if [ -n "${BAZEL_DEBUG_FLAGS}" ]; then
    set -x
 fi

 # Download portable binary if not present
 if [ ! -x "${BAZEL_BIN}" ]; then
    BAZEL_VERSION=${BAZEL_VERSION:-"0.24.1"}
    BAZEL_FILE="bazel-${BAZEL_VERSION}-linux-x86_64"
    BAZEL_DIR="/tmp/build-tflite/bazel/${BAZEL_VERSION}"

    wget -q -nc --show-progress https://github.com/bazelbuild/bazel/releases/download/${BAZEL_VERSION}/${BAZEL_FILE} -P ${BAZEL_DIR}
    chmod +x ${BAZEL_DIR}/${BAZEL_FILE}
    ln -sf ${BAZEL_DIR}/${BAZEL_FILE} ${BAZEL_DIR}/bazel
    export PATH="${BAZEL_DIR}:${PATH}"
    BAZEL_BIN="$(command -v bazel)"
 fi

 # Python
 PYTHON_VERSION=${PYTHON_VERSION:-"2"}
 export PYTHON_BIN_PATH="$(command -v python${PYTHON_VERSION})"
 export USE_DEFAULT_PYTHON_LIB_PATH="1"

 # Android
 export ANDROID_BUILD_TOOLS_VERSION="28.0.3"
 export ANDROID_API_LEVEL="28"
 export ANDROID_NDK_API_LEVEL=${ANDROID_API_LEVEL}
 NDK_VERSION="$(sed -En 's/Pkg.Revision = ([0-9]+).*/\1/p' ${ANDROID_NDK_HOME}/source.properties)"

 # Select TensorFlow features
 TF_BUILD_VARS+=" TF_NEED_CUDA=0"
 TF_BUILD_VARS+=" TF_NEED_OPENCL_SYCL=0"
 TF_BUILD_VARS+=" TF_NEED_ROCM=0"
 TF_BUILD_VARS+=" TF_NEED_JEMALLOC=1"
 TF_BUILD_VARS+=" TF_NEED_MPI=0"
 TF_BUILD_VARS+=" TF_ENABLE_XLA=0"
 TF_BUILD_VARS+=" TF_DOWNLOAD_CLANG=0"
 TF_BUILD_VARS+=" TF_SET_ANDROID_WORKSPACE=1"
 export ${TF_BUILD_VARS}

 # Build options
 # Disable unused default-on features
 BAZEL_COPT_FLAGS+=" --config=noaws --config=nogcp --config=nohdfs --config=nokafka --config=noignite --config=nonccl --define tensorflow_mkldnn_contraction_kernel=0"
 # Android config is equivalent to:
 # --cpu=arm64-v8a --fat_apk_cpu=arm64-v8a --crosstool_top=//external:android/crosstool --host_crosstool_top=@bazel_tools//tools/cpp:toolchain
 BAZEL_COPT_FLAGS+=" --config=android_arm64 --config=monolithic --config=opt --cxxopt=-std=c++11"
 # Enable RUY
 if [ "${TF_ENABLE_RUY}" = "1" ]; then
    BAZEL_COPT_FLAGS+=" --define tflite_with_ruy=true"
 else
    BAZEL_COPT_FLAGS+=" --define tflite_with_ruy=false"
 fi

 # TFLite targets for Android
 BAZEL_TARGETS+=" //tensorflow/lite:libtensorflowlite.so"
 BAZEL_TARGETS+=" //tensorflow/lite/examples/label_image:label_image"
 BAZEL_TARGETS+=" //tensorflow/lite/tools/benchmark:benchmark_model"

 build_variant() {
    local variant="${1}"
    local ccflags="${2}"
    # Output path
    local variant_name="${TF_VERSION}_ruy${TF_ENABLE_RUY}_${variant}"
    local variant_path="${TF_OUTDIR}/${variant_name}"

    # GCC build optimisations - autoloaded during Bazel config step
    # For more info, see https://gcc.gnu.org/onlinedocs/gcc/ARM-Options.html
    export CC_OPT_FLAGS=" -O3 -DTFLITE_PROFILING_ENABLED ${ccflags}"

    # Configure and build
    if [ "${BAZEL_REBUILD}" != "1" ]; then
        ${BAZEL_BIN} clean
    fi
    ./configure
    ${BAZEL_BIN} build ${BAZEL_DEBUG_FLAGS} ${BAZEL_RESOURCES} -c opt --verbose_failures --jobs=${BAZEL_JOBS} ${BAZEL_COPT_FLAGS} ${BAZEL_TARGETS}

    if [ "${BAZEL_DRYRUN}" != "1" ]; then
        # Move to output dir
        mkdir -p ${variant_path}
        mv -f -t ${variant_path} \
            bazel-bin/tensorflow/lite/libtensorflowlite.so \
            bazel-bin/tensorflow/lite/examples/label_image/label_image \
            bazel-bin/tensorflow/lite/tools/benchmark/benchmark_model
        echo "Builds saved to: ${variant_path}"
    fi
 }

 # Generic v8-a with SIMD instructions
 build_variant "v8a" "-march=armv8-a+simd"
 # Optimised FP16 instructions
 build_variant "v8.2a" "-march=armv8.2-a+fp16+dotprod"
diff --git a/run-tflite.sh b/run-tflite.sh
 #!/usr/bin/env bash

 # README FIRST:
 # ============
 # Script to run the TFLite tools benchmark_model or label_image and log results to a file.
 #
 # Environment prerequisites:
 #   1. Export ADB_SERIAL=<your_device_id> in your shell
 #   2. Copy files to the device:
 #       - binaries to /data/local/tmp/tflite/bin/
 #       - models to /data/local/tmp/tflite/models/
 #       - test data (sample images, labels file) to /data/local/tmp/tflite/data/
 #   3. Setup device CPU/GPU/etc frequencies as appropriate
 #
 # Saved results location:
 #   By default run logs are saved to '[LOGDIR]/[tool_name]-[run_date]/<model_name>.log' where:
 #     - [LOGDIR] is set as an env variable, or defaults to working dir
 #     - [tool_name] is one of 'benchmark_model' or 'label_image'
 #     - [run_date] is the start date-time in the format 'YYYYmmdd_HHMMSS'
 #
 #   Depending on selected config, the log directory and file names may include one or more of the
 #   run options such as - fp16, nnapi, ruy.

 set -o pipefail

 README_FIRST=yes  # Set this to "yes" disable readme prompt

 show_info() {
    echo "
 Script to run the TFLite tools benchmark_model or label_image and log results to a file.

 Environment prerequisites:
  1. Export ADB_SERIAL=<your_device_id> in your shell
  2. Copy files to the device:
      - binaries to /data/local/tmp/tflite/bin/
      - models to /data/local/tmp/tflite/models/
      - test data (sample images, labels file) to /data/local/tmp/tflite/data/
  3. Setup device CPU/GPU/etc frequencies as appropriate

 Saved results location:
  By default run logs are saved to '[LOGDIR]/[tool_name]-[run_date]/<model_name>.log' where:
    - [LOGDIR] is set as an env variable, or defaults to working dir
    - [tool_name] is one of 'benchmark_model' or 'label_image'
    - [run_date] is the start date-time in the format 'YYYYmmdd_HHMMSS'

  Depending on selected config, the log directory and file names may include one or more of the
  run options such as - fp16, nnapi, ruy.
 "
 }

 if [ "$1" = "-h" -o "$1" = "--help" ]; then
    show_info
    exit 0
 fi

 if [ "$README_FIRST" != "yes" ]; then
    printf "README FIRST:\n============\n"
    show_info
    read -p "Press ENTER key to continue..."
 fi

 if [ -z "$ADB_SERIAL" ]; then
    printf "\nERROR: Environment ADB_SERIAL must be set!\n"
    exit 1
 fi

 # Use taskset instead of cpufreq to select processor affinity
 if [ "$TASKSET" = "big" ]; then
    taskset_cmd="taskset f0"
 elif [ "$TASKSET" = "little" ]; then
    taskset_cmd="taskset 0f"
 fi

 # Host to which device is connected
 ADB_SERVER=${ADB_SERVER:-localhost}
 ADB_CMD=(adb -H $ADB_SERVER -s $ADB_SERIAL shell)

 warmups=${WARMUPS:-5} # benchmark_model only
 iters=${ITERS:-50}
 threads=${THREADS:-4}
 prof=${PROFILE:-0} # label_image only
 nnapi=${NNAPI:-0}
 fp16=${FP16:-0}

 # Directory for saved logs
 [[ "$RUNTOOL" == label* ]] && tool=label_image || tool=benchmark_model
 rundate=${RUNDATE:-$(date +%Y%m%d_%H%M%S)}
 logpath=${LOGDIR:-$PWD}/$tool-$rundate

 # Append config options where necessary
 [ $nnapi = 1 ] && logpath=$logpath-nnapi
 [ $fp16 = 1 ] && logpath=$logpath-fp16
 # [ ! -d "$logpath" ] && mkdir -p $logpath
 mkdir -p $(dirname $logpath) && logpath=$logpath.log

 # Log runtime config
 printf "\nDevice: $(${ADB_CMD[@]} getprop | grep -i ro.product.device)\n" | tee -a $logpath
 printf "
 Running TFLite with the following params:
  - taskset = ${taskset_cmd:-no}
  - warmups = $warmups runs (benchmark_model)
  - iterations = $iters runs
  - threads = $threads
  - profiling = $prof (label_image)
  - nnapi = $nnapi
  - fp16 = $fp16
  - logpath = $logpath
 " | tee -a $logpath

 # Folder with tflite installation (tools and data)
 BASEDIR=/data/local/tmp/tflite

 run_tool() {
    local tool=$1
    local model=$2
    if [ "$tool" = "label_image" ]; then
        # e.g. label_image --labels data/imagenet_labels.txt --image data/grace_hopper.bmp --threads 4 --count 50 --profiling 0 --accelerated 1 --allow_fp16 0 --tflite_model models/float/squeezenet.tflite
        ${ADB_CMD[@]} $taskset_cmd $BASEDIR/bin/label_image -l $BASEDIR/data/imagenet_labels.txt -i $BASEDIR/data/grace_hopper.bmp -t $threads -p $prof -c $iters -a $nnapi -f $fp16 -m $model
    else
        # e.g. benchmark_model --num_threads=4 --warmup_runs=5 --num_runs=50 --use_nnapi=0 --allow_fp16=0 --graph=models/float/squeezenet.tflite
        ${ADB_CMD[@]} $taskset_cmd $BASEDIR/bin/benchmark_model --num_threads=$threads --warmup_runs=$warmups --num_runs=$iters --use_nnapi=$nnapi --allow_fp16=$fp16 --graph=$model
    fi
 }

 for model in $(${ADB_CMD[@]} find $BASEDIR/models -type f -name "*.tflite"); do
    # logfile=$logpath/$(echo ${model##*/} | sed 's/.tflite//').log # use model name minus path dirname and extension
    run_tool $tool $model 2>&1 | tee -a $logpath
    sleep 1
 done

 printf "\nRUN COMPLETE: Saved runtime logs to: $logpath\n"
	From b5a99e2174f115f87c0cb3de9d2a2479a0193db2 Mon Sep 17 00:00:00 2001
	From: Koan-Sin Tan <[email protected]>
	Date: Sun, 18 Nov 2018 13:11:38 +0800
	Subject: [PATCH 1/3] add cmdline option to allow running fp32 models with fp16

	Add an option for TFLite benchmark_model to allow running fp32
	models with fp16. Useful when testing NNPAI accelerators with
	fp16.
	---
	.../lite/tools/benchmark/benchmark_tflite_model.cc \| 9 ++++++++-
	1 file changed, 8 insertions(+), 1 deletion(-)

	diff --git a/tensorflow/lite/tools/benchmark/benchmark_tflite_model.cc b/tensorflow/lite/tools/benchmark/benchmark_tflite_model.cc
	index 83e0ff1f872ef7..2d8b3a198c2967 100644
	--- a/tensorflow/lite/tools/benchmark/benchmark_tflite_model.cc
	+++ b/tensorflow/lite/tools/benchmark/benchmark_tflite_model.cc
	@@ -200,6 +200,7 @@ BenchmarkParams BenchmarkTfLiteModel::DefaultParams() {
	default_params.AddParam("input_layer_shape",
	BenchmarkParam::Create<std::string>(""));
	default_params.AddParam("use_nnapi", BenchmarkParam::Create<bool>(false));
	+ default_params.AddParam("allow_fp16", BenchmarkParam::Create<bool>(false));
	return default_params;
	}

	@@ -219,7 +220,8 @@ std::vector<Flag> BenchmarkTfLiteModel::GetFlags() {
	CreateFlag<std::string>("input_layer", &params_, "input layer names"),
	CreateFlag<std::string>("input_layer_shape", &params_,
	"input layer shape"),
	- CreateFlag<bool>("use_nnapi", &params_, "use nnapi api")};
	+ CreateFlag<bool>("use_nnapi", &params_, "use nnapi api"),
	+ CreateFlag<bool>("allow_fp16", &params_, "allow fp16")};

	flags.insert(flags.end(), specific_flags.begin(), specific_flags.end());
	return flags;
	@@ -233,6 +235,7 @@ void BenchmarkTfLiteModel::LogParams() {
	TFLITE_LOG(INFO) << "Input shapes: ["
	<< params_.Get<std::string>("input_layer_shape") << "]";
	TFLITE_LOG(INFO) << "Use nnapi : [" << params_.Get<bool>("use_nnapi") << "]";
	+ TFLITE_LOG(INFO) << "Allow fp16 : [" << params_.Get<bool>("allow_fp16") << "]";
	}

	bool BenchmarkTfLiteModel::ValidateParams() {
	@@ -328,6 +331,10 @@ void BenchmarkTfLiteModel::Init() {
	interpreter->UseNNAPI(use_nnapi);
	ApplyDelegates();

	+ bool allow_fp16 = params_.Get<bool>("allow_fp16");
	+
	+ interpreter->SetAllowFp16PrecisionForFp32(allow_fp16);
	+
	auto interpreter_inputs = interpreter->inputs();

	if (!inputs.empty()) {

	From dc4b9745b41ca7b2a00efb142bb0ab1e9895b4e0 Mon Sep 17 00:00:00 2001
	From: Koan-Sin Tan <[email protected]>
	Date: Sun, 18 Nov 2018 13:31:02 +0800
	Subject: [PATCH 2/3] add option for label_image to allow running fp32 models
	with fp16

	Add an option for TFLite label_image to allow running fp32
	models with fp16. Useful when testing NNPAI accelerators with
	fp16.
	---
	tensorflow/lite/examples/label_image/label_image.cc \| 6 ++++++
	tensorflow/lite/examples/label_image/label_image.h \| 1 +
	2 files changed, 7 insertions(+)

	diff --git a/tensorflow/lite/examples/label_image/label_image.cc b/tensorflow/lite/examples/label_image/label_image.cc
	index b8dc2840dfb49f..b83563280ec173 100644
	--- a/tensorflow/lite/examples/label_image/label_image.cc
	+++ b/tensorflow/lite/examples/label_image/label_image.cc
	@@ -113,6 +113,7 @@ void RunInference(Settings* s) {
	}

	interpreter->UseNNAPI(s->accel);
	+ interpreter->SetAllowFp16PrecisionForFp32(s->allow_fp16);

	if (s->verbose) {
	LOG(INFO) << "tensors size: " << interpreter->tensors_size() << "\n";
	@@ -253,6 +254,7 @@ void RunInference(Settings* s) {
	void display_usage() {
	LOG(INFO) << "label_image\n"
	<< "--accelerated, -a: [0\|1], use Android NNAPI or not\n"
	+ << "--allow_fp16, -f: [0\|1], allow running fp32 models with fp16 not\n"
	<< "--count, -c: loop interpreter->Invoke() for certain times\n"
	<< "--input_mean, -b: input mean\n"
	<< "--input_std, -s: input standard deviation\n"
	@@ -273,6 +275,7 @@ int Main(int argc, char** argv) {
	while (1) {
	static struct option long_options[] = {
	{"accelerated", required_argument, nullptr, 'a'},
	+ {"allow_fp16", required_argument, nullptr, 'f'},
	{"count", required_argument, nullptr, 'c'},
	{"verbose", required_argument, nullptr, 'v'},
	{"image", required_argument, nullptr, 'i'},
	@@ -305,6 +308,9 @@ int Main(int argc, char** argv) {
	s.loop_count =
	strtol(optarg, nullptr, 10); // NOLINT(runtime/deprecated_fn)
	break;
	+ case 'f':
	+ s.allow_fp16 = strtol(optarg, nullptr, 10); // NOLINT(runtime/deprecated_fn)
	+ break;
	case 'i':
	s.input_bmp_name = optarg;
	break;
	diff --git a/tensorflow/lite/examples/label_image/label_image.h b/tensorflow/lite/examples/label_image/label_image.h
	index 88b047fecc4b3e..cc46e56b64a9dc 100644
	--- a/tensorflow/lite/examples/label_image/label_image.h
	+++ b/tensorflow/lite/examples/label_image/label_image.h
	@@ -26,6 +26,7 @@ struct Settings {
	bool accel = false;
	bool input_floating = false;
	bool profiling = false;
	+ bool allow_fp16 = false;
	int loop_count = 1;
	float input_mean = 127.5f;
	float input_std = 127.5f;

	From ab7b554405dc4bf5b023522095a9b4a318327e0b Mon Sep 17 00:00:00 2001
	From: Koan-Sin Tan <[email protected]>
	Date: Tue, 12 Feb 2019 16:15:22 +0800
	Subject: [PATCH 3/3] rebase and run clang-format

	---
	.../lite/examples/label_image/label_image.cc \| 32 ++++++++++---------
	1 file changed, 17 insertions(+), 15 deletions(-)

	diff --git a/tensorflow/lite/examples/label_image/label_image.cc b/tensorflow/lite/examples/label_image/label_image.cc
	index b83563280ec173..340fbab5c6fcc9 100644
	--- a/tensorflow/lite/examples/label_image/label_image.cc
	+++ b/tensorflow/lite/examples/label_image/label_image.cc
	@@ -252,20 +252,21 @@ void RunInference(Settings* s) {
	}

	void display_usage() {
	- LOG(INFO) << "label_image\n"
	- << "--accelerated, -a: [0\|1], use Android NNAPI or not\n"
	- << "--allow_fp16, -f: [0\|1], allow running fp32 models with fp16 not\n"
	- << "--count, -c: loop interpreter->Invoke() for certain times\n"
	- << "--input_mean, -b: input mean\n"
	- << "--input_std, -s: input standard deviation\n"
	- << "--image, -i: image_name.bmp\n"
	- << "--labels, -l: labels for the model\n"
	- << "--tflite_model, -m: model_name.tflite\n"
	- << "--profiling, -p: [0\|1], profiling or not\n"
	- << "--num_results, -r: number of results to show\n"
	- << "--threads, -t: number of threads\n"
	- << "--verbose, -v: [0\|1] print more information\n"
	- << "\n";
	+ LOG(INFO)
	+ << "label_image\n"
	+ << "--accelerated, -a: [0\|1], use Android NNAPI or not\n"
	+ << "--allow_fp16, -f: [0\|1], allow running fp32 models with fp16 not\n"
	+ << "--count, -c: loop interpreter->Invoke() for certain times\n"
	+ << "--input_mean, -b: input mean\n"
	+ << "--input_std, -s: input standard deviation\n"
	+ << "--image, -i: image_name.bmp\n"
	+ << "--labels, -l: labels for the model\n"
	+ << "--tflite_model, -m: model_name.tflite\n"
	+ << "--profiling, -p: [0\|1], profiling or not\n"
	+ << "--num_results, -r: number of results to show\n"
	+ << "--threads, -t: number of threads\n"
	+ << "--verbose, -v: [0\|1] print more information\n"
	+ << "\n";
	}

	int Main(int argc, char** argv) {
	@@ -309,7 +310,8 @@ int Main(int argc, char** argv) {
	strtol(optarg, nullptr, 10); // NOLINT(runtime/deprecated_fn)
	break;
	case 'f':
	- s.allow_fp16 = strtol(optarg, nullptr, 10); // NOLINT(runtime/deprecated_fn)
	+ s.allow_fp16 =
	+ strtol(optarg, nullptr, 10); // NOLINT(runtime/deprecated_fn)
	break;
	case 'i':
	s.input_bmp_name = optarg;
	diff --git a/tensorflow/lite/examples/label_image/label_image.cc b/tensorflow/lite/examples/label_image/label_image.cc
	index 7c6f523..e458423 100644
	--- a/tensorflow/lite/examples/label_image/label_image.cc
	+++ b/tensorflow/lite/examples/label_image/label_image.cc
	@@ -24,6 +24,8 @@ limitations under the License.
	#include <string>
	#include <unordered_set>
	#include <vector>
	+#include <algorithm>
	+#include <functional>

	#include <fcntl.h> // NOLINT(build/include_order)
	#include <getopt.h> // NOLINT(build/include_order)
	@@ -45,7 +47,7 @@ limitations under the License.
	namespace tflite {
	namespace label_image {

	-double get_us(struct timeval t) { return (t.tv_sec * 1000000 + t.tv_usec); }
	+double get_us(struct timeval t) { return (t.tv_sec * 1000000.0 + (double)t.tv_usec); }

	// Takes a file name, and loads a list of labels from it, one per line, and
	// returns a vector of the strings. It pads with empty strings so the length
	@@ -87,6 +89,41 @@ void PrintProfilingInfo(const profiling::ProfileEvent* e, uint32_t op_index,
	<< "\n";
	}

	+void LogTimingDistribution(std::vector<double> & timings) {
	+ int timing_count = timings.size();
	+ int p5_count = timing_count / 20;
	+ std::sort(timings.begin(), timings.end());
	+
	+ int i = 0;
	+ int c = 0;
	+ double avg = 0;
	+ for(auto t : timings) {
	+ double ms = t / 1000.0;
	+ avg += ms;
	+ ++i;
	+ ++c;
	+ if (i > p5_count \|\| c == timing_count) {
	+ LOG(INFO) << " => " << (c*100/timing_count) << "% is " << ms <<
	+ " ms. avg within bucket: " << (avg/i) << " ms\n";
	+ i = 0;
	+ avg = 0;
	+ }
	+ }
	+}
	+
	+void LogTimings(std::vector<double> & timings) {
	+ int timing_count = timings.size();
	+
	+ int i = 0;
	+ int c = 0;
	+ double avg = 0;
	+ for(auto t : timings) {
	+ double ms = t / 1000.0;
	+ LOG(INFO) << "Iteration_" << c << "=" << ms <<" ms\n";
	+ ++c;
	+ }
	+}
	+
	void RunInference(Settings* s) {
	if (!s->model_name.c_str()) {
	LOG(ERROR) << "no model file name\n";
	@@ -188,19 +226,26 @@ void RunInference(Settings* s) {

	if (s->profiling) profiler->StartProfiling();

	- struct timeval start_time, stop_time;
	+ struct timeval start_time, stop_time, act_time;
	gettimeofday(&start_time, nullptr);
	+ std::vector<double> timings;
	+ double prev_time_us = get_us(start_time);
	for (int i = 0; i < s->loop_count; i++) {
	if (interpreter->Invoke() != kTfLiteOk) {
	LOG(FATAL) << "Failed to invoke tflite!\n";
	}
	+ gettimeofday(&act_time, NULL);
	+ double act_time_us = get_us(act_time);
	+ timings.push_back(act_time_us - prev_time_us);
	+ prev_time_us = act_time_us;
	}
	gettimeofday(&stop_time, nullptr);
	LOG(INFO) << "invoked \n";
	LOG(INFO) << "average time: "
	<< (get_us(stop_time) - get_us(start_time)) / (s->loop_count * 1000)
	<< " ms \n";
	-
	+ LogTimings(timings);
	+ LogTimingDistribution(timings);
	if (s->profiling) {
	profiler->StopProfiling();
	auto profile_events = profiler->GetProfileEvents();
	#!/usr/bin/env bash

	set -eo pipefail

	# Release tag or branch name
	TF_VERSION=${TF_VERSION:-"v1.13.1"}

	# Clone a fresh copy
	if [ -n "${TF_CLONE}" ]; then
	TF_SRCDIR=/tmp/build-tflite/tensorflow_src
	rm -rf ${TF_SRCDIR}
	mkdir -p ${TF_SRCDIR}
	if [ ! -d "${TF_SRCDIR}" ]; then
	git clone --branch ${TF_VERSION} --depth 1 https://github.com/tensorflow/tensorflow ${TF_SRCDIR}
	fi

	# Download patches
	TF_PATCH_DIR=/tmp/build-tflite/tf_patches
	TF_APPLY_PATCH="yes"
	TF_PATCHES=("0001-tflite-allow-fp16-for-fp32-models.patch" "0002-tflite-label-image-log-timing-dist.patch")
	for patch in "${TF_PATCHES[@]}"; do
	wget -q -nc --show-progress https://gist.github.com/muendelezaji/47b32812a15b622f05019b0e433de9b1/raw/${patch} -P ${TF_PATCH_DIR}
	done
	fi

	# Alternatively, provide path to cloned TensorFlow repo
	TF_SRCDIR=${1:-"$TF_SRCDIR"}
	TF_SRCDIR="$(readlink -f ${1:-"$TF_SRCDIR"})" # get absolute
	# Folder with patches
	TF_PATCH_DIR="$(readlink -f ${TF_PATCH_DIR:-"patches"})"
	TF_APPLY_PATCH=${TF_APPLY_PATCH:-"yes"}
	# Output folder
	TF_OUTDIR="$(readlink -f ${TF_OUTDIR:-"out"})"

	# Sanity checks
	if [ ! -d "${TF_SRCDIR}" ]; then
	echo "ERROR: Cannot find TensorFlow source directory. Ensure it exists or set TF_CLONE to do a new clone."
	exit 1
	elif [ ! -f "${TF_SRCDIR}/configure" -o ! -f "${TF_SRCDIR}/BUILD" ]; then
	echo "ERROR: Missing configure or BUILD file in $TF_SRCDIR. Ensure it is a valid Bazel workspace."
	exit 1
	elif [ "${TF_APPLY_PATCH}" = "yes" -a ! -d "${TF_PATCH_DIR}" ]; then
	echo "ERROR: Patches directory was not found. It must exist when TF_APPLY_PATCH is set to 'yes'."
	exit 1
	elif [ -z "${ANDROID_NDK_HOME}" -o -z "${ANDROID_SDK_HOME}" ]; then
	echo "ERROR: Cannot locate Android NDK or SDK. Ensure both ANDROID_NDK_HOME and ANDROID_SDK_HOME are set."
	exit 1
	fi

	# Apply required patches
	if [ "${TF_APPLY_PATCH}" = "yes" ]; then
	pushd ${TF_SRCDIR}
	for patch in $(find "${TF_PATCH_DIR}" -type f -name "*.patch" \| sort); do
	git apply ${patch}
	done
	git config --local user.name temp
	git config --local user.email [email protected]
	git commit -am "[TFLite] Add fp16 support and log timing distribution"
	popd
	fi

	# Select features
	TF_BUILD_VARS="TF_NEED_CUDA=0"
	TF_BUILD_VARS+=" TF_NEED_OPENCL_SYCL=0"
	TF_BUILD_VARS+=" TF_NEED_ROCM=0"
	TF_BUILD_VARS+=" TF_NEED_JEMALLOC=1"
	TF_BUILD_VARS+=" TF_NEED_MPI=0"
	TF_BUILD_VARS+=" TF_ENABLE_XLA=0"
	TF_BUILD_VARS+=" TF_DOWNLOAD_CLANG=0"
	TF_BUILD_VARS+=" TF_SET_ANDROID_WORKSPACE=1"
	export ${TF_BUILD_VARS}

	# Bazel settings
	BAZEL_BIN=${BAZEL_BIN:-"$(command -v bazel \|\| true)"}
	BAZEL_JOBS=${BAZEL_JOBS:-"4"}
	# BAZEL_PATCH="yes"
	# BAZEL_AVAIL_RAM=1536 # MB
	# BAZEL_AVAIL_CPU=4.0 # number of cpu cores (1.0 representing a single full core)
	# BAZEL_AVAIL_IO=1.0 # workstation I/O capability (with 1.0 representing average workstation)
	# if [ -n "$BAZEL_AVAIL_RAM" -a -n "$BAZEL_AVAIL_CPU" -a -n "$BAZEL_AVAIL_IO" ]; then
	# BAZEL_RESOURCES="--local_resources ${BAZEL_AVAIL_RAM},${BAZEL_AVAIL_CPU},${BAZEL_AVAIL_IO}"
	# fi

	# Download if not present - use portable binary to avoid installation
	if [ ! -x "${BAZEL_BIN}" ]; then
	BAZEL_VERSION="0.20.0" # was 0.19.2
	BAZEL_FILE="bazel-${BAZEL_VERSION}-linux-x86_64"
	BAZEL_DIR="/tmp/build-tflite/bazel_bin/${BAZEL_VERSION}"
	mkdir -p ${BAZEL_DIR}
	wget -q -nc --show-progress https://github.com/bazelbuild/bazel/releases/download/${BAZEL_VERSION}/${BAZEL_FILE} -P ${BAZEL_DIR}
	chmod +x ${BAZEL_DIR}/${BAZEL_FILE}
	ln -sf ${BAZEL_DIR}/${BAZEL_FILE} ${BAZEL_DIR}/bazel
	export PATH="${BAZEL_DIR}:$PATH"
	BAZEL_BIN="$(command -v bazel)"
	fi

	# Build config
	# Disable default-on TensorFlow cloud features
	BAZEL_COPT_FLAGS=" --config=noaws --config=nogcp --config=nohdfs --config=nokafka --config=noignite --config=nonccl --define tensorflow_mkldnn_contraction_kernel=0"
	# Android "--config=android_arm64" is equivalent to:
	# --cpu=arm64-v8a --fat_apk_cpu=arm64-v8a --crosstool_top=//external:android/crosstool --host_crosstool_top=@bazel_tools//tools/cpp:toolchain
	BAZEL_COPT_FLAGS+=" --copt=-DTFLITE_PROFILING_ENABLED --cxxopt=-std=c++11 --config=monolithic --config=android_arm64 --action_env ANDROID_NDK_API_LEVEL=28" # was 21
	# TFLite targets for Android
	BAZEL_EXTRA_FLAGS=" //tensorflow/lite/examples/label_image:label_image"
	BAZEL_EXTRA_FLAGS+=" //tensorflow/lite/tools/benchmark:benchmark_model"

	# Python
	TF_PYTHON_VERSION=${TF_PYTHON_VERSION:-"2"}
	export PYTHON_BIN_PATH="$(command -v python${TF_PYTHON_VERSION})"
	export USE_DEFAULT_PYTHON_LIB_PATH="1"

	# GCC optimisations
	# For more info, see: https://gcc.gnu.org/onlinedocs/gcc/ARM-Options.html
	export CC_OPT_FLAGS="-march=armv8-a"
	# Add suffix to TF_OUTDIR for more specialised builds
	if [ "${TF_GCC_OPTS}" = "simd" ]; then
	CC_OPT_FLAGS="-march=armv8-a+simd"
	TF_OUTDIR="${TF_OUTDIR}-simd"
	elif [ "${TF_GCC_OPTS}" = "fp16" ]; then
	CC_OPT_FLAGS="-march=armv8.2-a+fp16"
	TF_OUTDIR="${TF_OUTDIR}-fp16"
	fi
	BAZEL_COPT_FLAGS+=" --copt=${CC_OPT_FLAGS}"

	# Android
	export NDK_ROOT="${ANDROID_NDK_HOME}"
	export ANDROID_API_LEVEL="28" # was 26
	export ANDROID_BUILD_TOOLS_VERSION="28.0.3"

	# Configure and build
	pushd ${TF_SRCDIR} && ./configure
	# Clean if not an incremental rebuild
	if [ -z "${TF_REBUILD}" ]; then
	${BAZEL_BIN} clean
	fi

	${BAZEL_BIN} build ${BAZEL_RESOURCES} -c opt --verbose_failures --jobs=${BAZEL_JOBS} ${BAZEL_COPT_FLAGS} ${BAZEL_EXTRA_FLAGS}

	mkdir -p ${TF_OUTDIR}
	cp -a --remove-destination -t ${TF_OUTDIR} \
	bazel-bin/tensorflow/lite/examples/label_image/label_image \
	bazel-bin/tensorflow/lite/tools/benchmark/benchmark_model

	echo "Builds saved to: ${TF_OUTDIR}"
	#!/usr/bin/env groovy

	pipeline {
	agent any

	parameters {
	choice name: 'BAZEL_VERSION', choices: ['0.19.2', '0.21.0', '0.24.1'], description: 'Bazel version to use when building'
	choice name: 'NDK_VERSION', choices: ['13', '14', '18', '19'], description: 'NDK version to use when building'
	choice name: 'SDK_VERSION', choices: ['21', '28', '29'], description: 'SDK version to use when building'
	choice name: 'TF_VERSION', choices: ['v1.13.1', 'v1.14.0', 'v2.0.0-beta1'], description: 'Tagged version of TensorFlow to download'
	}

	options {
	buildDiscarder logRotator(numToKeepStr: '10')
	skipDefaultCheckout()
	skipStagesAfterUnstable()
	timeout time: 30, unit: 'MINUTES'
	timestamps()
	}

	environment {
	ANDROID_NDK_HOME = "${env.BUILD_TOOLS}/android/android-ndk-r${params.NDK_VERSION}"
	ANDROID_SDK_HOME = "${env.BUILD_TOOLS}/android/android-sdk"
	BAZEL_HOME = "${env.BUILD_TOOLS}/bazel/bazel-${params.BAZEL_VERSION}"
	VENV_HOME = "${env.HOME}/.local"

	// Set env from params (used in build shell script)
	BAZEL_VERSION = "${params.BAZEL_VERSION}"
	NDK_VERSION = "${params.NDK_VERSION}"
	SDK_VERSION = "${params.SDK_VERSION}"
	TF_VERSION = "${params.TF_VERSION}"

	TF_SRCDIR = 'src'
	TF_OUTDIR = 'out'
	TF_PATCH_DIR = 'patches'
	TF_PATCH = (params.TF_VERSION ==~ '.1.13.') ? 'yes' : 'no'
	}

	stages {
	stage('Checkout repo') {
	steps {
	dir("${env.TF_SRCDIR}") {
	checkout([$class: 'GitSCM', branches: [[name: "refs/tags/${params.TF_VERSION}"]], userRemoteConfigs: [[url: 'https://github.com/tensorflow/tensorflow']]])
	}
	}
	}

	stage('Build TFLite') {
	steps {
	echo '====++++ executing Build TFLite ++++===='
	withEnv([
	"BAZEL_BIN=${env.BAZEL_HOME}/bin/bazel",
	"PATH+BAZEL=${env.BAZEL_HOME}/bin",
	"PATH+VENV=${env.VENV_HOME}/bin",
	]) {
	sh '''
	# Create and activate Python venv
	virtualenv .
	virtualenv --relocatable .
	. ./bin/activate

	# Install pip requirements
	# From REQUIRED_PACKAGES in tensorflow/tools/pip_package/setup.py
	pip install -U pip six numpy wheel setuptools mock future>=0.17.1
	pip install -U keras_applications==1.0.6 --no-deps
	pip install -U keras_preprocessing==1.0.5 --no-deps

	# Download patches
	GIST_URL=https://gist.github.com/muendelezaji/47b32812a15b622f05019b0e433de9b1/raw
	mkdir -p $TF_PATCH_DIR
	for patch in '0001-tflite-allow-fp16-for-fp32-models.patch' '0002-tflite-label-image-log-timing-dist.patch'; do
	curl -fsL $GIST_URL/$patch > $TF_PATCH_DIR/$patch
	done

	# Get build script and run it
	BUILD_SCRIPT='build-tflite-1.13.sh'
	curl -fsL $GIST_URL/$BUILD_SCRIPT > $BUILD_SCRIPT
	chmod +x $BUILD_SCRIPT
	bash -x ./$BUILD_SCRIPT

	deactivate
	'''
	}
	}

	post {
	success {
	echo '====++++ Build TFLite executed succesfully ++++===='
	archiveArtifacts artifacts: "${env.TF_OUTDIR}/*", fingerprint: true
	}

	failure {
	echo '====++++ Build TFLite execution failed ++++===='
	}
	}
	}

	stage('Run TFLite') {
	steps {
	echo '====++++ executing Run TFLite ++++===='
	}
	}
	}

	post {
	always {
	echo '====++++ Pipeline finished ++++===='
	deleteDir() // clean up the workspace
	}
	}
	}
	#!/bin/sh

	# Configurable build tool parameters
	BAZEL_VERSION=0.19.2
	NDK_VERSION=18
	SDK_VERSION=28
	TF_VERSION=v1.13.1
	TF_PATCH=yes
	TF_PATCH_DIR=patches

	# Setup build tools - use global config or custom tools plugin
	ANDROID_NDK_HOME=$BUILD_TOOLS/android/android-ndk-r$NDK_VERSION
	ANDROID_SDK_HOME=$BUILD_TOOLS/android/android-sdk
	BAZEL_HOME=$BUILD_TOOLS/bazel/bazel-$BAZEL_VERSION
	VENV_HOME=$HOME/.local
	# Add them to path
	PATH=$BAZEL_HOME/bin:$VENV_HOME/bin:$PATH

	# Create and activate Python venv
	virtualenv .
	virtualenv --relocatable .
	. ./bin/activate

	# Install pip requirements
	# From REQUIRED_PACKAGES in tensorflow/tools/pip_package/setup.py
	pip install -U pip six numpy wheel setuptools mock future>=0.17.1
	pip install -U keras_applications==1.0.6 --no-deps
	pip install -U keras_preprocessing==1.0.5 --no-deps

	# Download patches
	GIST_URL=https://gist.github.com/muendelezaji/47b32812a15b622f05019b0e433de9b1/raw
	mkdir -p $TF_PATCH_DIR
	for patch in '0001-tflite-allow-fp16-for-fp32-models.patch'; do
	curl -fsL $GIST_URL/$patch > $TF_PATCH_DIR/$patch
	done

	# Get build script and run it
	BUILD_SCRIPT='build-tflite.sh'
	curl -fsL $GIST_URL/$BUILD_SCRIPT > $BUILD_SCRIPT
	chmod +x $BUILD_SCRIPT
	bash -x ./$BUILD_SCRIPT

	deactivate
	#!/usr/bin/env bash

	set -eo pipefail

	if [ "${BUILD_CONFIG}" = "2.0" ]; then
	TF_VERSION=v2.0.0-beta1
	TF_PATCH=0
	TF_CLONE=1
	BAZEL_VERSION=0.24.1
	BAZEL_BIN=none # force download
	BAZEL_COPT_FLAGS+=" --config=v2"
	elif [ "${BUILD_CONFIG}" = "1.14" ]; then
	TF_VERSION=v1.14.0
	TF_PATCH=0
	TF_CLONE=1
	BAZEL_VERSION=0.24.1
	BAZEL_BIN=none
	fi

	# Release tag or branch name
	TF_VERSION=${TF_VERSION:-"v1.13.1"}
	TF_PATCH=${TF_PATCH:-"1"}
	# Shorthand
	# : ${TF_VERSION:="v1.13.1"}
	# : ${TF_PATCH:="1"}

	# Clone a fresh copy
	if [ -n "${TF_CLONE}" ]; then
	TF_SRCDIR="/tmp/build-tflite/tensorflow/${TF_VERSION}/src"
	TF_OUTDIR="/tmp/build-tflite/tensorflow/${TF_VERSION}/out"
	if [ ! -d "${TF_SRCDIR}" ]; then
	git clone --branch ${TF_VERSION} --depth 1 https://github.com/tensorflow/tensorflow ${TF_SRCDIR}
	fi

	# Download patches
	if [ "${TF_PATCH}" = "1" ]; then
	TF_PATCH_DIR="/tmp/build-tflite/tensorflow/${TF_VERSION}/patches"
	TF_PATCHES=("0001-tflite-allow-fp16-for-fp32-models.patch" "0002-tflite-label-image-log-timing-dist.patch")
	for patch in "${TF_PATCHES[@]}"; do
	wget -q -nc --show-progress https://gist.github.com/muendelezaji/47b32812a15b622f05019b0e433de9b1/raw/${patch} -P ${TF_PATCH_DIR}
	done
	fi
	fi

	# Alternatively, provide path to cloned TensorFlow repo
	TF_SRCDIR="${TF_SRCDIR:-$(readlink -f "src")}"
	TF_OUTDIR="${TF_OUTDIR:-$(readlink -f "out")}" # Build outputs folder
	TF_PATCH_DIR="${TF_PATCH_DIR:-$(readlink -f "patches")}" # Folder with patches
	# Shorthand
	# : ${TF_SRCDIR:=$(readlink -f "src")}
	# : ${TF_OUTDIR:=$(readlink -f "out")}
	# : ${TF_PATCH_DIR:=$(readlink -f "patches")}

	# Sanity checks
	if [ ! -d "${TF_SRCDIR}" ]; then
	echo "ERROR: Cannot find TensorFlow source directory. Ensure it exists or set TF_CLONE to do a new clone."
	exit 1
	elif [ ! -f "${TF_SRCDIR}/configure" -o ! -f "${TF_SRCDIR}/BUILD" ]; then
	echo "ERROR: Missing configure or BUILD file in ${TF_SRCDIR}. Ensure it is a valid Bazel workspace."
	exit 1
	elif [ "${TF_PATCH}" = "1" -a ! -d "${TF_PATCH_DIR}" ]; then
	echo "ERROR: Patches directory was not found. It must exist when TF_PATCH is set to 'yes'."
	exit 1
	elif [ -z "${ANDROID_NDK_HOME}" -o -z "${ANDROID_SDK_HOME}" ]; then
	echo "ERROR: Cannot locate Android NDK or SDK. Ensure both ANDROID_NDK_HOME and ANDROID_SDK_HOME are set."
	exit 1
	fi

	pushd ${TF_SRCDIR}

	# Apply required patches
	if [ "${TF_PATCH}" = "1" ]; then
	for patch in $(find ${TF_PATCH_DIR} -type f -name "*.patch" \| sort); do
	git apply ${patch}
	done
	git config --local user.name temp
	git config --local user.email [email protected]
	git commit -am "[TFLite] All patched up and ready to go"
	fi

	# Bazel
	BAZEL_BIN=${BAZEL_BIN:-"$(command -v bazel \|\| true)"}
	BAZEL_JOBS=${BAZEL_JOBS:-"4"}
	# BAZEL_PATCH="no"
	# BAZEL_AVAIL_RAM=2048 # MB
	# BAZEL_AVAIL_CPU=4.0 # number of cpu cores (1.0 representing a single full core)
	# BAZEL_AVAIL_IO=1.0 # workstation I/O capability (with 1.0 representing average workstation)
	# if [ -n "${BAZEL_AVAIL_RAM}" -a -n "${BAZEL_AVAIL_CPU}" -a -n "${BAZEL_AVAIL_IO}" ]; then
	# BAZEL_RESOURCES="--local_resources ${BAZEL_AVAIL_RAM},${BAZEL_AVAIL_CPU},${BAZEL_AVAIL_IO}"
	# fi
	if [ -n "${BAZEL_DRYRUN}" ]; then
	BAZEL_DEBUG_FLAGS+=" --nobuild"
	fi
	if [ -n "${BAZEL_VERBOSE}" ]; then
	BAZEL_DEBUG_FLAGS+=" -s --explain=${TF_OUTDIR}/explain.log"
	fi
	if [ -n "${BAZEL_DEBUG_FLAGS}" ]; then
	set -x
	fi

	# Download portable binary if not present
	if [ ! -x "${BAZEL_BIN}" ]; then
	BAZEL_VERSION=${BAZEL_VERSION:-"0.24.1"}
	BAZEL_FILE="bazel-${BAZEL_VERSION}-linux-x86_64"
	BAZEL_DIR="/tmp/build-tflite/bazel/${BAZEL_VERSION}"

	wget -q -nc --show-progress https://github.com/bazelbuild/bazel/releases/download/${BAZEL_VERSION}/${BAZEL_FILE} -P ${BAZEL_DIR}
	chmod +x ${BAZEL_DIR}/${BAZEL_FILE}
	ln -sf ${BAZEL_DIR}/${BAZEL_FILE} ${BAZEL_DIR}/bazel
	export PATH="${BAZEL_DIR}:${PATH}"
	BAZEL_BIN="$(command -v bazel)"
	fi

	# Python
	PYTHON_VERSION=${PYTHON_VERSION:-"2"}
	export PYTHON_BIN_PATH="$(command -v python${PYTHON_VERSION})"
	export USE_DEFAULT_PYTHON_LIB_PATH="1"

	# Android
	export ANDROID_BUILD_TOOLS_VERSION="28.0.3"
	export ANDROID_API_LEVEL="28"
	export ANDROID_NDK_API_LEVEL=${ANDROID_API_LEVEL}
	NDK_VERSION="$(sed -En 's/Pkg.Revision = ([0-9]+).*/\1/p' ${ANDROID_NDK_HOME}/source.properties)"

	# Select TensorFlow features
	TF_BUILD_VARS+=" TF_NEED_CUDA=0"
	TF_BUILD_VARS+=" TF_NEED_OPENCL_SYCL=0"
	TF_BUILD_VARS+=" TF_NEED_ROCM=0"
	TF_BUILD_VARS+=" TF_NEED_JEMALLOC=1"
	TF_BUILD_VARS+=" TF_NEED_MPI=0"
	TF_BUILD_VARS+=" TF_ENABLE_XLA=0"
	TF_BUILD_VARS+=" TF_DOWNLOAD_CLANG=0"
	TF_BUILD_VARS+=" TF_SET_ANDROID_WORKSPACE=1"
	export ${TF_BUILD_VARS}

	# Build options
	# Disable unused default-on features
	BAZEL_COPT_FLAGS+=" --config=noaws --config=nogcp --config=nohdfs --config=nokafka --config=noignite --config=nonccl --define tensorflow_mkldnn_contraction_kernel=0"
	# Android config is equivalent to:
	# --cpu=arm64-v8a --fat_apk_cpu=arm64-v8a --crosstool_top=//external:android/crosstool --host_crosstool_top=@bazel_tools//tools/cpp:toolchain
	BAZEL_COPT_FLAGS+=" --config=android_arm64 --config=monolithic --config=opt --cxxopt=-std=c++11"
	# Enable RUY
	if [ "${TF_ENABLE_RUY}" = "1" ]; then
	BAZEL_COPT_FLAGS+=" --define tflite_with_ruy=true"
	else
	BAZEL_COPT_FLAGS+=" --define tflite_with_ruy=false"
	fi

	# TFLite targets for Android
	BAZEL_TARGETS+=" //tensorflow/lite:libtensorflowlite.so"
	BAZEL_TARGETS+=" //tensorflow/lite/examples/label_image:label_image"
	BAZEL_TARGETS+=" //tensorflow/lite/tools/benchmark:benchmark_model"

	build_variant() {
	local variant="${1}"
	local ccflags="${2}"
	# Output path
	local variant_name="${TF_VERSION}_ruy${TF_ENABLE_RUY}_${variant}"
	local variant_path="${TF_OUTDIR}/${variant_name}"

	# GCC build optimisations - autoloaded during Bazel config step
	# For more info, see https://gcc.gnu.org/onlinedocs/gcc/ARM-Options.html
	export CC_OPT_FLAGS=" -O3 -DTFLITE_PROFILING_ENABLED ${ccflags}"

	# Configure and build
	if [ "${BAZEL_REBUILD}" != "1" ]; then
	${BAZEL_BIN} clean
	fi
	./configure
	${BAZEL_BIN} build ${BAZEL_DEBUG_FLAGS} ${BAZEL_RESOURCES} -c opt --verbose_failures --jobs=${BAZEL_JOBS} ${BAZEL_COPT_FLAGS} ${BAZEL_TARGETS}

	if [ "${BAZEL_DRYRUN}" != "1" ]; then
	# Move to output dir
	mkdir -p ${variant_path}
	mv -f -t ${variant_path} \
	bazel-bin/tensorflow/lite/libtensorflowlite.so \
	bazel-bin/tensorflow/lite/examples/label_image/label_image \
	bazel-bin/tensorflow/lite/tools/benchmark/benchmark_model
	echo "Builds saved to: ${variant_path}"
	fi
	}

	# Generic v8-a with SIMD instructions
	build_variant "v8a" "-march=armv8-a+simd"
	# Optimised FP16 instructions
	build_variant "v8.2a" "-march=armv8.2-a+fp16+dotprod"
	#!/usr/bin/env bash

	# README FIRST:
	# ============
	# Script to run the TFLite tools benchmark_model or label_image and log results to a file.
	#
	# Environment prerequisites:
	# 1. Export ADB_SERIAL=<your_device_id> in your shell
	# 2. Copy files to the device:
	# - binaries to /data/local/tmp/tflite/bin/
	# - models to /data/local/tmp/tflite/models/
	# - test data (sample images, labels file) to /data/local/tmp/tflite/data/
	# 3. Setup device CPU/GPU/etc frequencies as appropriate
	#
	# Saved results location:
	# By default run logs are saved to '[LOGDIR]/[tool_name]-[run_date]/<model_name>.log' where:
	# - [LOGDIR] is set as an env variable, or defaults to working dir
	# - [tool_name] is one of 'benchmark_model' or 'label_image'
	# - [run_date] is the start date-time in the format 'YYYYmmdd_HHMMSS'
	#
	# Depending on selected config, the log directory and file names may include one or more of the
	# run options such as - fp16, nnapi, ruy.

	set -o pipefail

	README_FIRST=yes # Set this to "yes" disable readme prompt

	show_info() {
	echo "
	Script to run the TFLite tools benchmark_model or label_image and log results to a file.

	Environment prerequisites:
	1. Export ADB_SERIAL=<your_device_id> in your shell
	2. Copy files to the device:
	- binaries to /data/local/tmp/tflite/bin/
	- models to /data/local/tmp/tflite/models/
	- test data (sample images, labels file) to /data/local/tmp/tflite/data/
	3. Setup device CPU/GPU/etc frequencies as appropriate

	Saved results location:
	By default run logs are saved to '[LOGDIR]/[tool_name]-[run_date]/<model_name>.log' where:
	- [LOGDIR] is set as an env variable, or defaults to working dir
	- [tool_name] is one of 'benchmark_model' or 'label_image'
	- [run_date] is the start date-time in the format 'YYYYmmdd_HHMMSS'

	Depending on selected config, the log directory and file names may include one or more of the
	run options such as - fp16, nnapi, ruy.
	"
	}

	if [ "$1" = "-h" -o "$1" = "--help" ]; then
	show_info
	exit 0
	fi

	if [ "$README_FIRST" != "yes" ]; then
	printf "README FIRST:\n============\n"
	show_info
	read -p "Press ENTER key to continue..."
	fi

	if [ -z "$ADB_SERIAL" ]; then
	printf "\nERROR: Environment ADB_SERIAL must be set!\n"
	exit 1
	fi

	# Use taskset instead of cpufreq to select processor affinity
	if [ "$TASKSET" = "big" ]; then
	taskset_cmd="taskset f0"
	elif [ "$TASKSET" = "little" ]; then
	taskset_cmd="taskset 0f"
	fi

	# Host to which device is connected
	ADB_SERVER=${ADB_SERVER:-localhost}
	ADB_CMD=(adb -H $ADB_SERVER -s $ADB_SERIAL shell)

	warmups=${WARMUPS:-5} # benchmark_model only
	iters=${ITERS:-50}
	threads=${THREADS:-4}
	prof=${PROFILE:-0} # label_image only
	nnapi=${NNAPI:-0}
	fp16=${FP16:-0}

	# Directory for saved logs
	[[ "$RUNTOOL" == label* ]] && tool=label_image \|\| tool=benchmark_model
	rundate=${RUNDATE:-$(date +%Y%m%d_%H%M%S)}
	logpath=${LOGDIR:-$PWD}/$tool-$rundate

	# Append config options where necessary
	[ $nnapi = 1 ] && logpath=$logpath-nnapi
	[ $fp16 = 1 ] && logpath=$logpath-fp16
	# [ ! -d "$logpath" ] && mkdir -p $logpath
	mkdir -p $(dirname $logpath) && logpath=$logpath.log

	# Log runtime config
	printf "\nDevice: $(${ADB_CMD[@]} getprop \| grep -i ro.product.device)\n" \| tee -a $logpath
	printf "
	Running TFLite with the following params:
	- taskset = ${taskset_cmd:-no}
	- warmups = $warmups runs (benchmark_model)
	- iterations = $iters runs
	- threads = $threads
	- profiling = $prof (label_image)
	- nnapi = $nnapi
	- fp16 = $fp16
	- logpath = $logpath
	" \| tee -a $logpath

	# Folder with tflite installation (tools and data)
	BASEDIR=/data/local/tmp/tflite

	run_tool() {
	local tool=$1
	local model=$2
	if [ "$tool" = "label_image" ]; then
	# e.g. label_image --labels data/imagenet_labels.txt --image data/grace_hopper.bmp --threads 4 --count 50 --profiling 0 --accelerated 1 --allow_fp16 0 --tflite_model models/float/squeezenet.tflite
	${ADB_CMD[@]} $taskset_cmd $BASEDIR/bin/label_image -l $BASEDIR/data/imagenet_labels.txt -i $BASEDIR/data/grace_hopper.bmp -t $threads -p $prof -c $iters -a $nnapi -f $fp16 -m $model
	else
	# e.g. benchmark_model --num_threads=4 --warmup_runs=5 --num_runs=50 --use_nnapi=0 --allow_fp16=0 --graph=models/float/squeezenet.tflite
	${ADB_CMD[@]} $taskset_cmd $BASEDIR/bin/benchmark_model --num_threads=$threads --warmup_runs=$warmups --num_runs=$iters --use_nnapi=$nnapi --allow_fp16=$fp16 --graph=$model
	fi
	}

	for model in $(${ADB_CMD[@]} find $BASEDIR/models -type f -name "*.tflite"); do
	# logfile=$logpath/$(echo ${model##*/} \| sed 's/.tflite//').log # use model name minus path dirname and extension
	run_tool $tool $model 2>&1 \| tee -a $logpath
	sleep 1
	done

	printf "\nRUN COMPLETE: Saved runtime logs to: $logpath\n"