1bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang/* 2bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang * Copyright (C) 2017 The Android Open Source Project 3bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang * 4bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang * Licensed under the Apache License, Version 2.0 (the "License"); 5bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang * you may not use this file except in compliance with the License. 6bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang * You may obtain a copy of the License at 7bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang * 8bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang * http://www.apache.org/licenses/LICENSE-2.0 9bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang * 10bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang * Unless required by applicable law or agreed to in writing, software 11bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang * distributed under the License is distributed on an "AS IS" BASIS, 12bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 13bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang * See the License for the specific language governing permissions and 14bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang * limitations under the License. 15bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang */ 16bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang 17bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang#include "Operations.h" 18bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang#include "OperationsUtils.h" 19bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang 20bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang#include "internal/optimized/optimized_ops.h" 21bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang 22bbfd239e43526ff969699d3fc6110395edd2108bMiao Wangnamespace android { 23bbfd239e43526ff969699d3fc6110395edd2108bMiao Wangnamespace nn { 24bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang 25bbfd239e43526ff969699d3fc6110395edd2108bMiao Wangbool fullyConnectedFloat32(const float* inputData, const Shape& inputShape, 26bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang const float* weightsData, const Shape& weightsShape, 27bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang const float* biasData, const Shape& biasShape, 28bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang int32_t activation, 29bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang float* outputData, const Shape& outputShape) { 30bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang 31bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang #define ANDROID_NN_FULLY_CONNECTED(activation) \ 32bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang optimized_ops::FullyConnected<FusedActivationFunctionType::activation>( \ 33bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang inputData, convertShapeToDims(inputShape), \ 34bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang weightsData, convertShapeToDims(weightsShape), \ 35bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang biasData, convertShapeToDims(biasShape), \ 36bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang outputData, convertShapeToDims(outputShape)) 37bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang 3855cef2193279a646292fdeb355399627dd8990c8Miao Wang ANDROID_NN_MACRO_DISPATCH(ANDROID_NN_FULLY_CONNECTED) 39bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang #undef ANDROID_NN_FULLY_CONNECTED 40bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang return true; 41bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang} 42bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang 43bbfd239e43526ff969699d3fc6110395edd2108bMiao Wangbool fullyConnectedQuant8(const uint8_t* inputData, const Shape& inputShape, 44bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang const uint8_t* weightsData, const Shape& weightsShape, 45bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang const int32_t* biasData, const Shape& biasShape, 46bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang int32_t activation, 47bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang uint8_t* outputData, const Shape& outputShape) { 48bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang int32_t inputOffset = -inputShape.offset; 49bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang int32_t weightsOffset = -weightsShape.offset; 50bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang int32_t outputOffset = outputShape.offset; 51bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang 52bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang float real_multiplier = 0.0; 53bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang int32_t output_multiplier = 0; 54bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang int32_t output_shift = 0; 55bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang int32_t output_activation_min = 0; 56bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang int32_t output_activation_max = 0; 57bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang 58be2b22578baf949d7be42ba002cee94304daf53cMiao Wang if (!GetQuantizedConvolutionMultipler(inputShape, weightsShape, biasShape, 59be2b22578baf949d7be42ba002cee94304daf53cMiao Wang outputShape, &real_multiplier) || 60be2b22578baf949d7be42ba002cee94304daf53cMiao Wang !QuantizeMultiplierSmallerThanOne(real_multiplier, &output_multiplier, 61be2b22578baf949d7be42ba002cee94304daf53cMiao Wang &output_shift)) { 62be2b22578baf949d7be42ba002cee94304daf53cMiao Wang return false; 63be2b22578baf949d7be42ba002cee94304daf53cMiao Wang } 64bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang CalculateActivationRangeUint8(activation, outputShape, 65bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang &output_activation_min, 66bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang &output_activation_max); 67bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang 688eb598abd0e77333688e97f7ed89b0dd60d144faMiao Wang static gemmlowp::GemmContext gemm_context; 698eb598abd0e77333688e97f7ed89b0dd60d144faMiao Wang // Alow gemmlowp automatcally decide how many threads to use. 708eb598abd0e77333688e97f7ed89b0dd60d144faMiao Wang gemm_context.set_max_num_threads(0); 718eb598abd0e77333688e97f7ed89b0dd60d144faMiao Wang 72bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang #define ANDROID_NN_FULLY_CONNECTED(activation) \ 73bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang optimized_ops::FullyConnected<FusedActivationFunctionType::activation>( \ 74bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang inputData, convertShapeToDims(inputShape), inputOffset, \ 75bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang weightsData, convertShapeToDims(weightsShape), weightsOffset, \ 76bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang biasData, convertShapeToDims(biasShape), \ 77bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang outputOffset, output_multiplier, output_shift, \ 78bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang output_activation_min, output_activation_max, \ 798eb598abd0e77333688e97f7ed89b0dd60d144faMiao Wang outputData, convertShapeToDims(outputShape), &gemm_context) 80bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang 8155cef2193279a646292fdeb355399627dd8990c8Miao Wang ANDROID_NN_MACRO_DISPATCH(ANDROID_NN_FULLY_CONNECTED) 82bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang #undef ANDROID_NN_FULLY_CONNECTED 83bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang return true; 84bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang} 85bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang} // namespace nn 86bbfd239e43526ff969699d3fc6110395edd2108bMiao Wang} // namespace android 87