/external/tensorflow/tensorflow/contrib/fused_conv/kernels/ |
H A D | fused_conv2d_bias_activation_op.cc | 541 dnn::AlgorithmConfig algorithm_config; local 543 fused_conv_parameters, &algorithm_config)) { 583 algorithm_config.set_algorithm(best_result.algorithm()); 586 algorithm_config.set_algorithm_no_scratch( 590 algorithm_config); 600 &output_ptr, &scratch_allocator, algorithm_config,
|
/external/tensorflow/tensorflow/core/kernels/ |
H A D | conv_grad_filter_ops.cc | 907 AlgorithmConfig algorithm_config; local 909 conv_parameters, &algorithm_config)) { 947 algorithm_config.set_algorithm(best_result.algorithm()); 950 algorithm_config.set_algorithm_no_scratch( 954 algorithm_config); 963 algorithm_config, nullptr)
|
H A D | conv_grad_input_ops.cc | 956 AlgorithmConfig algorithm_config; local 958 conv_parameters, &algorithm_config)) { 995 algorithm_config.set_algorithm(best_result.algorithm()); 998 algorithm_config.set_algorithm_no_scratch( 1002 algorithm_config); 1009 algorithm_config, nullptr)
|
H A D | conv_ops.cc | 707 AlgorithmConfig algorithm_config; local 709 !AutoTuneConv::GetInstance()->Find(conv_parameters, &algorithm_config)) { 747 algorithm_config.set_algorithm(best_result.algorithm()); 750 algorithm_config.set_algorithm_no_scratch( 753 AutoTuneConv::GetInstance()->Insert(conv_parameters, algorithm_config); 762 algorithm_config, nullptr)
|
/external/tensorflow/tensorflow/stream_executor/ |
H A D | stream.cc | 580 const dnn::AlgorithmConfig &algorithm_config, 587 PARAM(algorithm_config)); 596 algorithm_config, output_profile_result); 619 const dnn::AlgorithmConfig &algorithm_config, 626 PARAM(output_descriptor), PARAM(output), PARAM(algorithm_config)); 635 algorithm_config, output_profile_result); 657 const dnn::AlgorithmConfig &algorithm_config, 664 PARAM(output_descriptor), PARAM(output), PARAM(algorithm_config)); 673 algorithm_config, output_profile_result); 692 const dnn::AlgorithmConfig &algorithm_config, 569 ThenFusedConvolveWithAlgorithm( const dnn::BatchDescriptor &conv_input_descriptor, const DeviceMemory<float> &conv_input_data, float conv_input_scale, const dnn::FilterDescriptor &filter_descriptor, const DeviceMemory<float> &filter_data, const dnn::ConvolutionDescriptor &convolution_descriptor, const DeviceMemory<float> &side_input_data, float side_input_scale, const dnn::BatchDescriptor &bias_descriptor, const DeviceMemory<float> &biases, dnn::ActivationMode activation_mode, const dnn::BatchDescriptor &output_descriptor, DeviceMemory<float> *output, ScratchAllocator *scratch_allocator, const dnn::AlgorithmConfig &algorithm_config, dnn::ProfileResult *output_profile_result) argument 607 ThenFusedConvolveWithAlgorithm( const dnn::BatchDescriptor &conv_input_descriptor, const DeviceMemory<Eigen::half> &conv_input_data, float conv_input_scale, const dnn::FilterDescriptor &filter_descriptor, const DeviceMemory<Eigen::half> &filter_data, const dnn::ConvolutionDescriptor &convolution_descriptor, const DeviceMemory<Eigen::half> &side_input_data, float side_input_scale, const dnn::BatchDescriptor &bias_descriptor, const DeviceMemory<Eigen::half> &biases, dnn::ActivationMode activation_mode, const dnn::BatchDescriptor &output_descriptor, DeviceMemory<Eigen::half> *output, ScratchAllocator *scratch_allocator, const dnn::AlgorithmConfig &algorithm_config, dnn::ProfileResult *output_profile_result) argument 646 ThenFusedConvolveWithAlgorithm( const dnn::BatchDescriptor &conv_input_descriptor, const DeviceMemory<int8> &conv_input_data, float conv_input_scale, const dnn::FilterDescriptor &filter_descriptor, const DeviceMemory<int8> &filter_data, const dnn::ConvolutionDescriptor &convolution_descriptor, const DeviceMemory<int8> &side_input_data, float side_input_scale, const dnn::BatchDescriptor &bias_descriptor, const DeviceMemory<float> &biases, dnn::ActivationMode activation_mode, const dnn::BatchDescriptor &output_descriptor, DeviceMemory<int8> *output, ScratchAllocator *scratch_allocator, const dnn::AlgorithmConfig &algorithm_config, dnn::ProfileResult *output_profile_result) argument 684 ThenConvolveWithAlgorithm( const dnn::BatchDescriptor &input_descriptor, const DeviceMemory<float> &input_data, const dnn::FilterDescriptor &filter_descriptor, const DeviceMemory<float> &filter_data, const dnn::ConvolutionDescriptor &convolution_descriptor, const dnn::BatchDescriptor &output_descriptor, DeviceMemory<float> *output, ScratchAllocator *scratch_allocator, const dnn::AlgorithmConfig &algorithm_config, dnn::ProfileResult *output_profile_result) argument 715 ThenConvolveWithAlgorithm( const dnn::BatchDescriptor &input_descriptor, const DeviceMemory<Eigen::half> &input_data, const dnn::FilterDescriptor &filter_descriptor, const DeviceMemory<Eigen::half> &filter_data, const dnn::ConvolutionDescriptor &convolution_descriptor, const dnn::BatchDescriptor &output_descriptor, DeviceMemory<Eigen::half> *output, ScratchAllocator *scratch_allocator, const dnn::AlgorithmConfig &algorithm_config, dnn::ProfileResult *output_profile_result) argument 893 ThenConvolveBackwardDataWithAlgorithm( const dnn::FilterDescriptor &filter_descriptor, const DeviceMemory<float> &filter_data, const dnn::BatchDescriptor &output_descriptor, DeviceMemory<float> backward_output_data, const dnn::ConvolutionDescriptor &convolution_descriptor, const dnn::BatchDescriptor &input_descriptor, DeviceMemory<float> *backward_input_data, ScratchAllocator *scratch_allocator, const dnn::AlgorithmConfig &algorithm_config, dnn::ProfileResult *output_profile_result) argument 926 ThenConvolveBackwardDataWithAlgorithm( const dnn::FilterDescriptor &filter_descriptor, const DeviceMemory<Eigen::half> &filter_data, const dnn::BatchDescriptor &output_descriptor, DeviceMemory<Eigen::half> backward_output_data, const dnn::ConvolutionDescriptor &convolution_descriptor, const dnn::BatchDescriptor &input_descriptor, DeviceMemory<Eigen::half> *backward_input_data, ScratchAllocator *scratch_allocator, const dnn::AlgorithmConfig &algorithm_config, dnn::ProfileResult *output_profile_result) argument 1029 ThenConvolveBackwardFilterWithAlgorithm( const dnn::BatchDescriptor &input_descriptor, const DeviceMemory<float> &input_data, const dnn::BatchDescriptor &output_descriptor, DeviceMemory<float> backward_output_data, const dnn::ConvolutionDescriptor &convolution_descriptor, const dnn::FilterDescriptor &filter_descriptor, DeviceMemory<float> *backward_filter_data, ScratchAllocator *scratch_allocator, const dnn::AlgorithmConfig &algorithm_config, dnn::ProfileResult *output_profile_result) argument 1090 ThenConvolveBackwardFilterWithAlgorithm( const dnn::BatchDescriptor &input_descriptor, const DeviceMemory<Eigen::half> &input_data, const dnn::BatchDescriptor &output_descriptor, DeviceMemory<Eigen::half> backward_output_data, const dnn::ConvolutionDescriptor &convolution_descriptor, const dnn::FilterDescriptor &filter_descriptor, DeviceMemory<Eigen::half> *backward_filter_data, ScratchAllocator *scratch_allocator, const dnn::AlgorithmConfig &algorithm_config, dnn::ProfileResult *output_profile_result) argument [all...] |
H A D | dnn.h | 1057 const dnn::AlgorithmConfig& algorithm_config, 1074 const dnn::AlgorithmConfig& algorithm_config, 1094 const dnn::AlgorithmConfig& algorithm_config, 1112 const dnn::AlgorithmConfig& algorithm_config, 1163 const dnn::AlgorithmConfig& algorithm_config, 1188 const dnn::AlgorithmConfig& algorithm_config, 1267 const dnn::AlgorithmConfig& algorithm_config, 1285 const dnn::AlgorithmConfig& algorithm_config, 1316 const dnn::AlgorithmConfig& algorithm_config, 1334 const dnn::AlgorithmConfig& algorithm_config, 1046 DoFusedConvolve( Stream* stream, const dnn::BatchDescriptor& conv_input_descriptor, const DeviceMemory<double>& conv_input_data, double conv_input_scale, const dnn::FilterDescriptor& filter_descriptor, const DeviceMemory<double>& filter_data, const dnn::ConvolutionDescriptor& convolution_descriptor, const DeviceMemory<double>& side_input_data, double side_input_scale, const dnn::BatchDescriptor& bias_descriptor, const DeviceMemory<double>& biases, dnn::ActivationMode activation_mode, const dnn::BatchDescriptor& output_descriptor, DeviceMemory<double>* output_data, ScratchAllocator* scratch_allocator, const dnn::AlgorithmConfig& algorithm_config, dnn::ProfileResult* output_profile_result) argument 1063 DoFusedConvolve( Stream* stream, const dnn::BatchDescriptor& conv_input_descriptor, const DeviceMemory<float>& conv_input_data, float conv_input_scale, const dnn::FilterDescriptor& filter_descriptor, const DeviceMemory<float>& filter_data, const dnn::ConvolutionDescriptor& convolution_descriptor, const DeviceMemory<float>& side_input_data, float side_input_scale, const dnn::BatchDescriptor& bias_descriptor, const DeviceMemory<float>& biases, dnn::ActivationMode activation_mode, const dnn::BatchDescriptor& output_descriptor, DeviceMemory<float>* output_data, ScratchAllocator* scratch_allocator, const dnn::AlgorithmConfig& algorithm_config, dnn::ProfileResult* output_profile_result) argument 1081 DoFusedConvolve( Stream* stream, const dnn::BatchDescriptor& conv_input_descriptor, const DeviceMemory<Eigen::half>& conv_input_data, float conv_input_scale, const dnn::FilterDescriptor& filter_descriptor, const DeviceMemory<Eigen::half>& filter_data, const dnn::ConvolutionDescriptor& convolution_descriptor, const DeviceMemory<Eigen::half>& side_input_data, float side_input_scale, const dnn::BatchDescriptor& bias_descriptor, const DeviceMemory<Eigen::half>& biases, dnn::ActivationMode activation_mode, const dnn::BatchDescriptor& output_descriptor, DeviceMemory<Eigen::half>* output_data, ScratchAllocator* scratch_allocator, const dnn::AlgorithmConfig& algorithm_config, dnn::ProfileResult* output_profile_result) argument 1101 DoFusedConvolve( Stream* stream, const dnn::BatchDescriptor& conv_input_descriptor, const DeviceMemory<int8>& conv_input_data, float conv_input_scale, const dnn::FilterDescriptor& filter_descriptor, const DeviceMemory<int8>& filter_data, const dnn::ConvolutionDescriptor& convolution_descriptor, const DeviceMemory<int8>& side_input_data, float side_input_scale, const dnn::BatchDescriptor& bias_descriptor, const DeviceMemory<float>& biases, dnn::ActivationMode activation_mode, const dnn::BatchDescriptor& output_descriptor, DeviceMemory<int8>* output_data, ScratchAllocator* scratch_allocator, const dnn::AlgorithmConfig& algorithm_config, dnn::ProfileResult* output_profile_result) argument [all...] |
/external/tensorflow/tensorflow/stream_executor/cuda/ |
H A D | cuda_dnn.cc | 2146 const dnn::AlgorithmConfig& algorithm_config, bool is_profiling, 2154 if (algorithm_config.algorithm().is_default()) { 2161 use_tensor_ops = algorithm_config.algorithm().tensor_ops_enabled(); 2162 algo = ToConvForwardAlgo(algorithm_config.algorithm()); 2174 << algorithm_config.algorithm().algo_id() << " " 2199 CHECK(!algorithm_config.algorithm_no_scratch().is_default()) 2205 if (algorithm_config.algorithm_no_scratch().is_default()) { 2211 use_tensor_ops = algorithm_config.algorithm().tensor_ops_enabled(); 2212 algo = ToConvForwardAlgo(algorithm_config.algorithm_no_scratch()); 2310 const dnn::AlgorithmConfig& algorithm_config, 2144 GetCudnnConvolutionForwardAlgorithm( Stream* stream, CUDAExecutor* parent, void* dnn_handle, const dnn::AlgorithmConfig& algorithm_config, bool is_profiling, const ScopedTensorDescriptor& input_nd, const ScopedFilterDescriptor& filter, const ScopedConvolutionDescriptor& conv, const ScopedTensorDescriptor& output_nd, ScratchAllocator* scratch_allocator, DeviceMemory<uint8>* scratch) argument 2302 DoConvolveImpl( Stream* stream, const BatchDescriptor& batch_descriptor, const DeviceMemory<T>& input_data, const FilterDescriptor& filter_descriptor, const DeviceMemory<T>& filter_data, const ConvolutionDescriptor& convolution_descriptor, const BatchDescriptor& output_descriptor, DeviceMemory<T>* output_data, ScratchAllocator* scratch_allocator, const dnn::AlgorithmConfig& algorithm_config, dnn::ProfileResult* output_profile_result) argument 2502 DoFusedConvolveImpl( Stream* stream, const dnn::BatchDescriptor& conv_input_descriptor, const DeviceMemory<Type>& conv_input_data, ScaleType conv_input_scale, const dnn::FilterDescriptor& filter_descriptor, const DeviceMemory<Type>& filter_data, const dnn::ConvolutionDescriptor& convolution_descriptor, const DeviceMemory<Type>& side_input_data, ScaleType side_input_scale, const dnn::BatchDescriptor& bias_descriptor, const DeviceMemory<BiasType>& biases, dnn::ActivationMode activation_mode, const dnn::BatchDescriptor& output_descriptor, DeviceMemory<Type>* output_data, ScratchAllocator* scratch_allocator, const dnn::AlgorithmConfig& algorithm_config, dnn::ProfileResult* output_profile_result) argument 2924 DoConvolve( Stream* stream, const BatchDescriptor& batch_descriptor, const DeviceMemory<float>& input_data, const FilterDescriptor& filter_descriptor, const DeviceMemory<float>& filter_data, const ConvolutionDescriptor& convolution_descriptor, const BatchDescriptor& output_descriptor, DeviceMemory<float>* output_data, ScratchAllocator* scratch_allocator, const dnn::AlgorithmConfig& algorithm_config, dnn::ProfileResult* output_profile_result) argument 2952 DoConvolve( Stream* stream, const BatchDescriptor& batch_descriptor, const DeviceMemory<Eigen::half>& input_data, const FilterDescriptor& filter_descriptor, const DeviceMemory<Eigen::half>& filter_data, const ConvolutionDescriptor& convolution_descriptor, const BatchDescriptor& output_descriptor, DeviceMemory<Eigen::half>* output_data, ScratchAllocator* scratch_allocator, const dnn::AlgorithmConfig& algorithm_config, dnn::ProfileResult* output_profile_result) argument 2968 DoFusedConvolve( Stream* stream, const dnn::BatchDescriptor& conv_input_descriptor, const DeviceMemory<double>& conv_input_data, double conv_input_scale, const dnn::FilterDescriptor& filter_descriptor, const DeviceMemory<double>& filter_data, const dnn::ConvolutionDescriptor& convolution_descriptor, const DeviceMemory<double>& side_input_data, double side_input_scale, const dnn::BatchDescriptor& bias_descriptor, const DeviceMemory<double>& biases, dnn::ActivationMode activation_mode, const dnn::BatchDescriptor& output_descriptor, DeviceMemory<double>* output_data, ScratchAllocator* scratch_allocator, const dnn::AlgorithmConfig& algorithm_config, dnn::ProfileResult* output_profile_result) argument 2990 DoFusedConvolve( Stream* stream, const dnn::BatchDescriptor& conv_input_descriptor, const DeviceMemory<float>& conv_input_data, float conv_input_scale, const dnn::FilterDescriptor& filter_descriptor, const DeviceMemory<float>& filter_data, const dnn::ConvolutionDescriptor& convolution_descriptor, const DeviceMemory<float>& side_input_data, float side_input_scale, const dnn::BatchDescriptor& bias_descriptor, const DeviceMemory<float>& biases, dnn::ActivationMode activation_mode, const dnn::BatchDescriptor& output_descriptor, DeviceMemory<float>* output_data, ScratchAllocator* scratch_allocator, const dnn::AlgorithmConfig& algorithm_config, dnn::ProfileResult* output_profile_result) argument 3012 DoFusedConvolve( Stream* stream, const dnn::BatchDescriptor& conv_input_descriptor, const DeviceMemory<Eigen::half>& conv_input_data, float conv_input_scale, const dnn::FilterDescriptor& filter_descriptor, const DeviceMemory<Eigen::half>& filter_data, const dnn::ConvolutionDescriptor& convolution_descriptor, const DeviceMemory<Eigen::half>& side_input_data, float side_input_scale, const dnn::BatchDescriptor& bias_descriptor, const DeviceMemory<Eigen::half>& biases, dnn::ActivationMode activation_mode, const dnn::BatchDescriptor& output_descriptor, DeviceMemory<Eigen::half>* output_data, ScratchAllocator* scratch_allocator, const dnn::AlgorithmConfig& algorithm_config, dnn::ProfileResult* output_profile_result) argument 3035 DoFusedConvolve( Stream* stream, const dnn::BatchDescriptor& conv_input_descriptor, const DeviceMemory<int8>& conv_input_data, float conv_input_scale, const dnn::FilterDescriptor& filter_descriptor, const DeviceMemory<int8>& filter_data, const dnn::ConvolutionDescriptor& convolution_descriptor, const DeviceMemory<int8>& side_input_data, float side_input_scale, const dnn::BatchDescriptor& bias_descriptor, const DeviceMemory<float>& biases, dnn::ActivationMode activation_mode, const dnn::BatchDescriptor& output_descriptor, DeviceMemory<int8>* output_data, ScratchAllocator* scratch_allocator, const dnn::AlgorithmConfig& algorithm_config, dnn::ProfileResult* output_profile_result) argument 3136 DoConvolveBackwardDataImpl( Stream* stream, const FilterDescriptor& filter_descriptor, const DeviceMemory<T>& filter_data, const BatchDescriptor& output_descriptor_in, DeviceMemory<T> backward_output_data, const ConvolutionDescriptor& convolution_descriptor, const BatchDescriptor& input_descriptor, DeviceMemory<T>* backward_input_data, ScratchAllocator* scratch_allocator, const dnn::AlgorithmConfig& algorithm_config, dnn::ProfileResult* output_profile_result) argument 3347 DoConvolveBackwardData( Stream* stream, const FilterDescriptor& filter_descriptor, const DeviceMemory<float>& filter_data, const BatchDescriptor& output_descriptor_in, DeviceMemory<float> backward_output_data, const ConvolutionDescriptor& convolution_descriptor, const BatchDescriptor& input_descriptor, DeviceMemory<float>* backward_input_data, ScratchAllocator* scratch_allocator, const dnn::AlgorithmConfig& algorithm_config, dnn::ProfileResult* output_profile_result) argument 3365 DoConvolveBackwardData( Stream* stream, const FilterDescriptor& filter_descriptor, const DeviceMemory<Eigen::half>& filter_data, const BatchDescriptor& output_descriptor_in, DeviceMemory<Eigen::half> backward_output_data, const ConvolutionDescriptor& convolution_descriptor, const BatchDescriptor& input_descriptor, DeviceMemory<Eigen::half>* backward_input_data, ScratchAllocator* scratch_allocator, const dnn::AlgorithmConfig& algorithm_config, dnn::ProfileResult* output_profile_result) argument 3384 DoConvolveBackwardFilterImpl( Stream* stream, const dnn::BatchDescriptor& input_descriptor, const DeviceMemory<T>& input_data, const dnn::BatchDescriptor& output_descriptor_in, DeviceMemory<T> backward_output_data, const dnn::ConvolutionDescriptor& convolution_descriptor, const dnn::FilterDescriptor& filter_descriptor, DeviceMemory<T>* backward_filter_data, ScratchAllocator* scratch_allocator, const dnn::AlgorithmConfig& algorithm_config, dnn::ProfileResult* output_profile_result) argument 3595 DoConvolveBackwardFilter( Stream* stream, const dnn::BatchDescriptor& input_descriptor, const DeviceMemory<float>& input_data, const dnn::BatchDescriptor& output_descriptor_in, DeviceMemory<float> backward_output_data, const dnn::ConvolutionDescriptor& convolution_descriptor, const dnn::FilterDescriptor& filter_descriptor, DeviceMemory<float>* backward_filter_data, ScratchAllocator* scratch_allocator, const dnn::AlgorithmConfig& algorithm_config, dnn::ProfileResult* output_profile_result) argument 3613 DoConvolveBackwardFilter( Stream* stream, const dnn::BatchDescriptor& input_descriptor, const DeviceMemory<Eigen::half>& input_data, const dnn::BatchDescriptor& output_descriptor_in, DeviceMemory<Eigen::half> backward_output_data, const dnn::ConvolutionDescriptor& convolution_descriptor, const dnn::FilterDescriptor& filter_descriptor, DeviceMemory<Eigen::half>* backward_filter_data, ScratchAllocator* scratch_allocator, const dnn::AlgorithmConfig& algorithm_config, dnn::ProfileResult* output_profile_result) argument [all...] |