Back to Cutlass

CUTLASS: reduction_operators.h Source File

docs/reduction__operators_8h_source.html

4.4.29.5 KB
Original Source

CUTLASS

CUDA Templates for Linear Algebra Subroutines and Solvers

reduction_operators.h

Go to the documentation of this file.

1 /***************************************************************************************************

2 * Copyright (c) 2017-2019, NVIDIA CORPORATION. All rights reserved.

3 *

4 * Redistribution and use in source and binary forms, with or without modification, are permitted

5 * provided that the following conditions are met:

6 * * Redistributions of source code must retain the above copyright notice, this list of

7 * conditions and the following disclaimer.

8 * * Redistributions in binary form must reproduce the above copyright notice, this list of

9 * conditions and the following disclaimer in the documentation and/or other materials

10 * provided with the distribution.

11 * * Neither the name of the NVIDIA CORPORATION nor the names of its contributors may be used

12 * to endorse or promote products derived from this software without specific prior written

13 * permission.

14 *

15 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS" AND ANY EXPRESS OR

16 * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND

17 * FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL NVIDIA CORPORATION BE LIABLE

18 * FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,

19 * BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS;

20 * OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT,

21 * STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE

22 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

23 *

24 **************************************************************************************************/

29 #pragma once

30

31 #include "cutlass/cutlass.h"

32 #include "cutlass/tensor_ref.h"

33 #include "cutlass/numeric_types.h"

34 #include "cutlass/array.h"

35 #include "cutlass/functional.h"

36 #include "cutlass/numeric_conversion.h"

37

38 namespace cutlass {

39 namespace reduction {

40 namespace thread {

41

43

45 template <

46typename ElementAccumulator_,

47typename Element_,

48int Count = 1

49 >

50 struct ReduceAdd {

51

52//

53// Type definitions

54//

55

56using ElementAccumulator = ElementAccumulator_;

57using Element = Element_;

58static int const kCount = Count;

59

60using FragmentAccumulator = cutlass::Array<ElementAccumulator, kCount>;

61using FragmentElement = cutlass::Array<Element, kCount>;

62

63struct Params { };

64

65//

66// Data members

67//

68

70Params params;

71

72//

73// Methods

74//

75

77CUTLASS_HOST_DEVICE

78ReduceAdd(Params params_ = Params()): params(params_) { }

79

81CUTLASS_HOST_DEVICE

82FragmentAccumulator operator()(

83FragmentAccumulator accumulator,

84FragmentElement element) const {

85

86plus<FragmentAccumulator> op;

87

88return op(accumulator, element);

89 }

90 };

91

93

94 } // namespace thread

95 } // namespace reduction

96 } // namespace cutlass

cutlass::reduction::thread::ReduceAdd::ReduceAdd

CUTLASS_HOST_DEVICE ReduceAdd(Params params_=Params())

Constructor.

Definition: reduction_operators.h:78

cutlass::reduction::thread::ReduceAdd::ElementAccumulator

ElementAccumulator_ ElementAccumulator

Definition: reduction_operators.h:56

cutlass

Definition: aligned_buffer.h:35

tensor_ref.h

Defines a structure containing strides, bounds, and a pointer to tensor data.

cutlass::reduction::thread::ReduceAdd

Mixed-precision reduction.

Definition: reduction_operators.h:50

cutlass::plus

Definition: functional.h:46

cutlass::reduction::thread::ReduceAdd::FragmentElement

cutlass::Array< Element, kCount > FragmentElement

Definition: reduction_operators.h:61

cutlass::reduction::thread::ReduceAdd::params

Params params

Parameters object.

Definition: reduction_operators.h:70

array.h

Statically sized array of elements that accommodates all CUTLASS-supported numeric types and is safe ...

cutlass::reduction::thread::ReduceAdd::kCount

static int const kCount

Definition: reduction_operators.h:58

numeric_conversion.h

Boost-like numeric conversion operator for CUTLASS numeric types.

CUTLASS_HOST_DEVICE

#define CUTLASS_HOST_DEVICE

Definition: cutlass.h:89

numeric_types.h

Top-level include for all CUTLASS numeric types.

cutlass::reduction::thread::ReduceAdd::Element

Element_ Element

Definition: reduction_operators.h:57

cutlass::reduction::thread::ReduceAdd::Params

Definition: reduction_operators.h:63

cutlass::reduction::thread::ReduceAdd::operator()

CUTLASS_HOST_DEVICE FragmentAccumulator operator()(FragmentAccumulator accumulator, FragmentElement element) const

Operator.

Definition: reduction_operators.h:82

cutlass::reduction::thread::ReduceAdd::FragmentAccumulator

cutlass::Array< ElementAccumulator, kCount > FragmentAccumulator

Definition: reduction_operators.h:60

cutlass.h

Basic include for CUTLASS.

functional.h

Define basic numeric operators with specializations for Array<T, N>. SIMD-ize where possible...


Generated by 1.8.11