1bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang/*
2bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang * Copyright (C) 2017 The Android Open Source Project
3bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang *
4bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang * Licensed under the Apache License, Version 2.0 (the "License");
5bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang * you may not use this file except in compliance with the License.
6bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang * You may obtain a copy of the License at
7bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang *
8bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang *      http://www.apache.org/licenses/LICENSE-2.0
9bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang *
10bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang * Unless required by applicable law or agreed to in writing, software
11bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang * distributed under the License is distributed on an "AS IS" BASIS,
12bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang * See the License for the specific language governing permissions and
14bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang * limitations under the License.
15bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang */
16bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang
17bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang#include "Operations.h"
18bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang#include "OperationsUtils.h"
19bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang
20bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang#include "internal/optimized/optimized_ops.h"
21bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang
22bbfd239e43526ff969699d3fc6110395edd2108bMiao Wangnamespace android {
23bbfd239e43526ff969699d3fc6110395edd2108bMiao Wangnamespace nn {
24bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang
25bbfd239e43526ff969699d3fc6110395edd2108bMiao Wangbool fullyConnectedFloat32(const float* inputData, const Shape& inputShape,
26bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang                           const float* weightsData, const Shape& weightsShape,
27bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang                           const float* biasData, const Shape& biasShape,
28bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang                           int32_t activation,
29bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang                           float* outputData, const Shape& outputShape) {
30bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang
31bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang    #define ANDROID_NN_FULLY_CONNECTED(activation)                              \
32bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang        optimized_ops::FullyConnected<FusedActivationFunctionType::activation>( \
33bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang            inputData, convertShapeToDims(inputShape),                          \
34bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang            weightsData, convertShapeToDims(weightsShape),                      \
35bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang            biasData, convertShapeToDims(biasShape),                            \
36bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang            outputData, convertShapeToDims(outputShape))
37bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang
3855cef2193279a646292fdeb355399627dd8990c8Miao Wang    ANDROID_NN_MACRO_DISPATCH(ANDROID_NN_FULLY_CONNECTED)
39bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang    #undef ANDROID_NN_FULLY_CONNECTED
40bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang    return true;
41bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang}
42bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang
43bbfd239e43526ff969699d3fc6110395edd2108bMiao Wangbool fullyConnectedQuant8(const uint8_t* inputData, const Shape& inputShape,
44bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang                          const uint8_t* weightsData, const Shape& weightsShape,
45bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang                          const int32_t* biasData, const Shape& biasShape,
46bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang                          int32_t activation,
47bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang                          uint8_t* outputData, const Shape& outputShape) {
48bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang    int32_t inputOffset = -inputShape.offset;
49bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang    int32_t weightsOffset = -weightsShape.offset;
50bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang    int32_t outputOffset = outputShape.offset;
51bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang
52bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang    float real_multiplier = 0.0;
53bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang    int32_t output_multiplier = 0;
54bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang    int32_t output_shift = 0;
55bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang    int32_t output_activation_min = 0;
56bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang    int32_t output_activation_max = 0;
57bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang
58be2b22578baf949d7be42ba002cee94304daf53cMiao Wang    if (!GetQuantizedConvolutionMultipler(inputShape, weightsShape, biasShape,
59be2b22578baf949d7be42ba002cee94304daf53cMiao Wang                                          outputShape, &real_multiplier) ||
60be2b22578baf949d7be42ba002cee94304daf53cMiao Wang            !QuantizeMultiplierSmallerThanOne(real_multiplier, &output_multiplier,
61be2b22578baf949d7be42ba002cee94304daf53cMiao Wang                                              &output_shift)) {
62be2b22578baf949d7be42ba002cee94304daf53cMiao Wang        return false;
63be2b22578baf949d7be42ba002cee94304daf53cMiao Wang    }
64bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang    CalculateActivationRangeUint8(activation, outputShape,
65bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang                                  &output_activation_min,
66bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang                                  &output_activation_max);
67bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang
688eb598abd0e77333688e97f7ed89b0dd60d144faMiao Wang    static gemmlowp::GemmContext gemm_context;
698eb598abd0e77333688e97f7ed89b0dd60d144faMiao Wang    // Alow gemmlowp automatcally decide how many threads to use.
708eb598abd0e77333688e97f7ed89b0dd60d144faMiao Wang    gemm_context.set_max_num_threads(0);
718eb598abd0e77333688e97f7ed89b0dd60d144faMiao Wang
72bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang    #define ANDROID_NN_FULLY_CONNECTED(activation)                              \
73bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang        optimized_ops::FullyConnected<FusedActivationFunctionType::activation>( \
74bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang            inputData, convertShapeToDims(inputShape), inputOffset,             \
75bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang            weightsData, convertShapeToDims(weightsShape), weightsOffset,       \
76bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang            biasData, convertShapeToDims(biasShape),                            \
77bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang            outputOffset, output_multiplier, output_shift,                      \
78bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang            output_activation_min, output_activation_max,                       \
798eb598abd0e77333688e97f7ed89b0dd60d144faMiao Wang            outputData, convertShapeToDims(outputShape), &gemm_context)
80bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang
8155cef2193279a646292fdeb355399627dd8990c8Miao Wang    ANDROID_NN_MACRO_DISPATCH(ANDROID_NN_FULLY_CONNECTED)
82bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang    #undef ANDROID_NN_FULLY_CONNECTED
83bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang    return true;
84bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang}
85bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang}  // namespace nn
86bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang}  // namespace android
87