python-universe
diff --git a/‎CMakeLists.txt
Lines changed: 123 additions & 13 deletions b/‎CMakeLists.txt
Lines changed: 123 additions & 13 deletions
diff --git a/‎README.md
Lines changed: 69 additions & 0 deletions b/‎README.md
Lines changed: 69 additions & 0 deletions
diff --git a/‎src/LICENSE renamed to ‎src/tensorflow/LICENSE b/‎src/LICENSE renamed to ‎src/tensorflow/LICENSE
diff --git a/‎src/tensorflow/lite/micro/benchmarks/keyword_scrambled_model_data.cpp
Lines changed: 2845 additions & 0 deletions b/‎src/tensorflow/lite/micro/benchmarks/keyword_scrambled_model_data.cpp
Lines changed: 2845 additions & 0 deletions
diff --git a/‎src/tensorflow/lite/micro/kernels/add.cpp renamed to ‎src/tensorflow/lite/micro/kernels/cmsis-nn/add.cpp
Lines changed: 40 additions & 55 deletions b/‎src/tensorflow/lite/micro/kernels/add.cpp renamed to ‎src/tensorflow/lite/micro/kernels/cmsis-nn/add.cpp
Lines changed: 40 additions & 55 deletions
@@ -0,0 +1,69 @@
+
+# TensorFlow Lite Micro
+
+An Open Source Machine Learning Framework for Everyone.
+
+## Introduction
+
+This is a version of the [TensorFlow Lite Micro library](https://www.tensorflow.org/lite/microcontrollers)
+for the Raspberry Pi Pico microcontroller. It allows you to run machine learning models to
+do things like recognize speech, detect people in images, recognize gestures from an accelerometer,
+and perform other sensor analysis tasks.
+
+## Getting Started
+
+First you'll need to follow the Pico setup instructions to initialize the development
+environment on your machine. Once that is done, make sure that the PICO_SDK_PATH
+environment variable has been set to the location of the Pico SDK, either in the shell
+you're building in or, if you're using VS Code, in the configure environment setting
+of the CMake extension.
+
+You should then be able to build the library, tests, and examples. The easiest way to
+build is using VS Code's CMake integration, by loading the project and choosing the
+build option at the bottom of the window.
+
+## What's Included
+
+There are several example applications included. The simplest one to begin with is the
+hello_world project. This demonstrates the fundamentals of deploying an ML model on a
+device, driving the Pico's LED in a learned sine-wave pattern.
+
+Other examples include simple speech recognition, a magic wand gesture recognizer,
+and a person detector for camera images, but because they require audio, accelerometer, or
+image inputs, you'll need to write some code to hook up your own sensors, since these
+are not included with the base microcontroller.
+
+## Contributing
+
+This repository (https://github.com/raspberrypi/pico-tflmicro) is read-only, because
+it has been automatically generated from the master TensorFlow repository at
+https://github.com/tensorflow/tensorflow. This means that all issues and pull requests
+need to be filed there. You can regenerate this project yourself by running the
+following commands:
+
+```
+git clone https://github.com/tensorflow/tensorflow
+cd tensorflow
+tensorflow/lite/micro/tools/project/generate.py rp2 pico-tflmicro
+```
+
+This should create a Pico-compatible project from the latest version of the TensorFlow
+repository.
+
+## Learning More
+
+The [TensorFlow website](https://www.tensorflow.org/lite/microcontrollers) has
+information on training, tutorials, and other resources.
+
+The [TinyML Book](https://tinymlbook.com) is a guide to using TensorFlow Lite Micro
+across a variety of different systems.
+
+[TensorFlow Lite Micro: Embedded Machine Learning on TinyML Systems](https://arxiv.org/pdf/2010.08678.pdf)
+has more details on the design and implementation of the framework.
+
+## Licensing
+
+The TensorFlow source code is covered by the license described in src/tensorflow/LICENSE;
+components from other libraries have the appropriate licenses included in their
+third_party folders.
+
@@ -15,8 +15,8 @@ limitations under the License.
 
 #include "tensorflow/lite/kernels/internal/reference/add.h"
 
+#include "CMSIS/NN/Include/arm_nnfunctions.h"
 #include "tensorflow/lite/c/builtin_op_data.h"
-#include "tensorflow/lite/c/common.h"
 #include "tensorflow/lite/kernels/internal/quantization_util.h"
 #include "tensorflow/lite/kernels/internal/reference/integer_ops/add.h"
 #include "tensorflow/lite/kernels/internal/reference/process_broadcast_shapes.h"
@@ -54,10 +54,6 @@ struct OpData {
   int32_t input1_offset;
   int32_t input2_offset;
   int32_t output_offset;
-
-  // Used only for float evals:
-  float output_activation_min_f32;
-  float output_activation_max_f32;
 };
 
 TfLiteStatus CalculateOpData(TfLiteContext* context, TfLiteAddParams* params,
@@ -95,10 +91,6 @@ TfLiteStatus CalculateOpData(TfLiteContext* context, TfLiteAddParams* params,
     TF_LITE_ENSURE_STATUS(CalculateActivationRangeQuantized(
         context, params->activation, output, &data->output_activation_min,
         &data->output_activation_max));
-  } else if (output->type == kTfLiteFloat32) {
-    CalculateActivationRange(params->activation,
-                             &data->output_activation_min_f32,
-                             &data->output_activation_max_f32);
   }
 
   return kTfLiteOk;
@@ -107,25 +99,24 @@ TfLiteStatus CalculateOpData(TfLiteContext* context, TfLiteAddParams* params,
 void EvalAdd(TfLiteContext* context, TfLiteNode* node, TfLiteAddParams* params,
              const OpData* data, const TfLiteEvalTensor* input1,
              const TfLiteEvalTensor* input2, TfLiteEvalTensor* output) {
+  float output_activation_min, output_activation_max;
+  CalculateActivationRange(params->activation, &output_activation_min,
+                           &output_activation_max);
   tflite::ArithmeticParams op_params;
-  SetActivationParams(data->output_activation_min_f32,
-                      data->output_activation_max_f32, &op_params);
+  SetActivationParams(output_activation_min, output_activation_max, &op_params);
+#define TF_LITE_ADD(opname)                                               \
+  reference_ops::opname(op_params, tflite::micro::GetTensorShape(input1), \
+                        tflite::micro::GetTensorData<float>(input1),      \
+                        tflite::micro::GetTensorShape(input2),            \
+                        tflite::micro::GetTensorData<float>(input2),      \
+                        tflite::micro::GetTensorShape(output),            \
+                        tflite::micro::GetTensorData<float>(output))
   if (data->requires_broadcast) {
-    reference_ops::BroadcastAdd4DSlow(
-        op_params, tflite::micro::GetTensorShape(input1),
-        tflite::micro::GetTensorData<float>(input1),
-        tflite::micro::GetTensorShape(input2),
-        tflite::micro::GetTensorData<float>(input2),
-        tflite::micro::GetTensorShape(output),
-        tflite::micro::GetTensorData<float>(output));
+    TF_LITE_ADD(BroadcastAdd4DSlow);
   } else {
-    reference_ops::Add(op_params, tflite::micro::GetTensorShape(input1),
-                       tflite::micro::GetTensorData<float>(input1),
-                       tflite::micro::GetTensorShape(input2),
-                       tflite::micro::GetTensorData<float>(input2),
-                       tflite::micro::GetTensorShape(output),
-                       tflite::micro::GetTensorData<float>(output));
+    TF_LITE_ADD(Add);
   }
+#undef TF_LITE_ADD
 }
 
 TfLiteStatus EvalAddQuantized(TfLiteContext* context, TfLiteNode* node,
@@ -150,42 +141,39 @@ TfLiteStatus EvalAddQuantized(TfLiteContext* context, TfLiteNode* node,
     bool need_broadcast = reference_ops::ProcessBroadcastShapes(
         tflite::micro::GetTensorShape(input1),
         tflite::micro::GetTensorShape(input2), &op_params);
+#define TF_LITE_ADD(type, opname, dtype)                         \
+  type::opname(op_params, tflite::micro::GetTensorShape(input1), \
+               tflite::micro::GetTensorData<dtype>(input1),      \
+               tflite::micro::GetTensorShape(input2),            \
+               tflite::micro::GetTensorData<dtype>(input2),      \
+               tflite::micro::GetTensorShape(output),            \
+               tflite::micro::GetTensorData<dtype>(output));
     if (output->type == kTfLiteInt8) {
       if (need_broadcast) {
-        reference_integer_ops::BroadcastAdd4DSlow(
-            op_params, tflite::micro::GetTensorShape(input1),
-            tflite::micro::GetTensorData<int8_t>(input1),
-            tflite::micro::GetTensorShape(input2),
-            tflite::micro::GetTensorData<int8_t>(input2),
-            tflite::micro::GetTensorShape(output),
-            tflite::micro::GetTensorData<int8_t>(output));
+        TF_LITE_ADD(reference_integer_ops, BroadcastAdd4DSlow, int8_t);
       } else {
-        reference_integer_ops::Add(
-            op_params, tflite::micro::GetTensorShape(input1),
+        arm_elementwise_add_s8(
             tflite::micro::GetTensorData<int8_t>(input1),
-            tflite::micro::GetTensorShape(input2),
             tflite::micro::GetTensorData<int8_t>(input2),
-            tflite::micro::GetTensorShape(output),
-            tflite::micro::GetTensorData<int8_t>(output));
+            op_params.input1_offset, op_params.input1_multiplier,
+            op_params.input1_shift, op_params.input2_offset,
+            op_params.input2_multiplier, op_params.input2_shift,
+            op_params.left_shift, tflite::micro::GetTensorData<int8_t>(output),
+            op_params.output_offset, op_params.output_multiplier,
+            op_params.output_shift, op_params.quantized_activation_min,
+            op_params.quantized_activation_max,
+            MatchingElementsSize(tflite::micro::GetTensorShape(input1),
+                                 tflite::micro::GetTensorShape(input2),
+                                 tflite::micro::GetTensorShape(output)));
       }
     } else {
       if (need_broadcast) {
-        reference_ops::BroadcastAdd4DSlow(
-            op_params, tflite::micro::GetTensorShape(input1),
-            tflite::micro::GetTensorData<uint8_t>(input1),
-            tflite::micro::GetTensorShape(input2),
-            tflite::micro::GetTensorData<uint8_t>(input2),
-            tflite::micro::GetTensorShape(output),
-            tflite::micro::GetTensorData<uint8_t>(output));
+        TF_LITE_ADD(reference_ops, BroadcastAdd4DSlow, uint8_t);
       } else {
-        reference_ops::Add(op_params, tflite::micro::GetTensorShape(input1),
-                           tflite::micro::GetTensorData<uint8_t>(input1),
-                           tflite::micro::GetTensorShape(input2),
-                           tflite::micro::GetTensorData<uint8_t>(input2),
-                           tflite::micro::GetTensorShape(output),
-                           tflite::micro::GetTensorData<uint8_t>(output));
+        TF_LITE_ADD(reference_ops, Add, uint8_t);
       }
     }
+#undef TF_LITE_ADD
   }
 
   return kTfLiteOk;
@@ -201,11 +189,8 @@ TfLiteStatus Prepare(TfLiteContext* context, TfLiteNode* node) {
   TFLITE_DCHECK(node->builtin_data != nullptr);
 
   const TfLiteTensor* input1 = GetInput(context, node, kInputTensor1);
-  TF_LITE_ENSURE(context, input1 != nullptr);
   const TfLiteTensor* input2 = GetInput(context, node, kInputTensor2);
-  TF_LITE_ENSURE(context, input2 != nullptr);
   TfLiteTensor* output = GetOutput(context, node, kOutputTensor);
-  TF_LITE_ENSURE(context, output != nullptr);
 
   OpData* data = static_cast<OpData*>(node->user_data);
   auto* params = reinterpret_cast<TfLiteAddParams*>(node->builtin_data);
@@ -219,16 +204,16 @@ TfLiteStatus Prepare(TfLiteContext* context, TfLiteNode* node) {
 TfLiteStatus Eval(TfLiteContext* context, TfLiteNode* node) {
   auto* params = reinterpret_cast<TfLiteAddParams*>(node->builtin_data);
 
-  TFLITE_DCHECK(node->user_data != nullptr);
-  const OpData* data = static_cast<const OpData*>(node->user_data);
-
   const TfLiteEvalTensor* input1 =
       tflite::micro::GetEvalInput(context, node, kInputTensor1);
   const TfLiteEvalTensor* input2 =
       tflite::micro::GetEvalInput(context, node, kInputTensor2);
   TfLiteEvalTensor* output =
       tflite::micro::GetEvalOutput(context, node, kOutputTensor);
 
+  TFLITE_DCHECK(node->user_data != nullptr);
+  const OpData* data = static_cast<const OpData*>(node->user_data);
+
   if (output->type == kTfLiteFloat32) {
     EvalAdd(context, node, params, data, input1, input2, output);
   } else if (output->type == kTfLiteUInt8 || output->type == kTfLiteInt8) {