NForge
Tensor library
Loading...
Searching...
No Matches
tensor_impl_CPU.h
1#ifndef TENSOR_IMPL_CPU_H
2#define TENSOR_IMPL_CPU_H
3
4#include "../tensor_impl.h"
5#include "nforge/core/tensor_layout.h"
6#include "nforge/core/tensor_shape.h"
7
15public:
16 CPUImpl(const Tensor::Shape& shape);
17 CPUImpl(const Tensor::Shape& shape, float value);
18 ~CPUImpl();
19
20 void fillAll(float value) override;
21 void fillRand() override;
22
23 void print() const override;
24 void print(const std::vector<size_t>& position) const override;
25
26 size_t getNumElements() const override;
27 Tensor::Shape getShape() const override;
28
30 float* dataPtr() const;
31 std::vector<float> toVector() const override;
32 std::string toString() const override;
33
34 std::unique_ptr<Tensor::Impl> clone() const override;
35
36 void copyFromHost(const float* data, size_t count) override;
37
38 void set(const TensorLayout& lhsLayout, const Tensor::Impl* rhsImpl,
39 const TensorLayout& rhsLayout) override;
40
41 bool compare(const TensorLayout& lhsLayout, const Tensor::Impl* rhsImpl,
42 const TensorLayout& rhsLayout) const override;
43
44 std::unique_ptr<Tensor::Impl> add(const TensorLayout& lhsLayout, const Tensor::Impl* rhsImpl,
45 const TensorLayout& rhsLayout,
46 const TensorLayout& outLayout) const override;
47
48 std::unique_ptr<Tensor::Impl> sub(const TensorLayout& lhsLayout, const Tensor::Impl* rhsImpl,
49 const TensorLayout& rhsLayout,
50 const TensorLayout& outLayout) const override;
51
52 std::unique_ptr<Tensor::Impl> mul(const TensorLayout& lhsLayout, const Tensor::Impl* rhsImpl,
53 const TensorLayout& rhsLayout,
54 const TensorLayout& outLayout) const override;
55
56 std::unique_ptr<Tensor::Impl> div(const TensorLayout& lhsLayout, const Tensor::Impl* rhsImpl,
57 const TensorLayout& rhsLayout,
58 const TensorLayout& outLayout) const override;
59
60 void iadd(const TensorLayout& lhsLayout, const Tensor::Impl* rhsImpl,
61 const TensorLayout& rhsLayout) override;
62
63 void isub(const TensorLayout& lhsLayout, const Tensor::Impl* rhsImpl,
64 const TensorLayout& rhsLayout) override;
65
66 void imul(const TensorLayout& lhsLayout, const Tensor::Impl* rhsImpl,
67 const TensorLayout& rhsLayout) override;
68
69 void idiv(const TensorLayout& lhsLayout, const Tensor::Impl* rhsImpl,
70 const TensorLayout& rhsLayout) override;
71
72 std::unique_ptr<Tensor::Impl> sum(const TensorLayout& layout, const TensorLayout& blockLayout,
73 const TensorLayout& outLayout) const override;
74
75 std::unique_ptr<Tensor::Impl> min(const TensorLayout& layout, const TensorLayout& blockLayout,
76 const TensorLayout& outLayout) const override;
77
78 std::unique_ptr<Tensor::Impl> max(const TensorLayout& layout, const TensorLayout& blockLayout,
79 const TensorLayout& outLayout) const override;
80
81 std::unique_ptr<Tensor::Impl> prod(const TensorLayout& layout, const TensorLayout& blockLayout,
82 const TensorLayout& outLayout) const override;
83
84 std::unique_ptr<Tensor::Impl> norm(const TensorLayout& layout) const override;
85
86
87 std::unique_ptr<Tensor::Impl> matmul(const TensorLayout& lhsLayout, const Tensor::Impl* rhsImpl,
88 const TensorLayout& rhsLayout,
89 const TensorLayout& outLayout, size_t batch, size_t m,
90 size_t k, size_t p) const override;
91
92
93 std::unique_ptr<Tensor::Impl> less(const TensorLayout& lhsLayout, const Tensor::Impl* rhsImpl,
94 const TensorLayout& rhsLayout,
95 const TensorLayout& outLayout) const override;
96
97 std::unique_ptr<Tensor::Impl> lessEqual(const TensorLayout& lhsLayout,
98 const Tensor::Impl* rhsImpl,
99 const TensorLayout& rhsLayout,
100 const TensorLayout& outLayout) const override;
101
102 std::unique_ptr<Tensor::Impl> greater(const TensorLayout& lhsLayout,
103 const Tensor::Impl* rhsImpl,
104 const TensorLayout& rhsLayout,
105 const TensorLayout& outLayout) const override;
106
107 std::unique_ptr<Tensor::Impl> greaterEqual(const TensorLayout& lhsLayout,
108 const Tensor::Impl* rhsImpl,
109 const TensorLayout& rhsLayout,
110 const TensorLayout& outLayout) const override;
111
112 std::unique_ptr<Tensor::Impl> isClose(const TensorLayout& lhsLayout,
113 const Tensor::Impl* rhsImpl,
114 const TensorLayout& rhsLayout,
115 const TensorLayout& outLayout,
116 float tolerance) const override;
117
118private:
119 Tensor::Shape m_shape;
120 std::vector<float> m_data;
121
122 template <typename BinaryOp>
123 std::unique_ptr<Tensor::Impl> applyBinaryOp(const TensorLayout& lhsLayout,
124 const Tensor::Impl* rhsImpl,
125 const TensorLayout& rhsLayout,
126 const TensorLayout& outLayout, BinaryOp op) const;
127
128 template <typename BinaryOp>
129 void applyInplaceBinaryOp(const TensorLayout& lhsLayout, const Tensor::Impl* rhsImpl,
130 const TensorLayout& rhsLayout, BinaryOp op);
131
132 // reduction must be associative
133 template <typename ReductionOp>
134 std::unique_ptr<Tensor::Impl> applyReductionOp(const TensorLayout& layout,
135 const TensorLayout& blockLayout,
136 const TensorLayout& outLayout,
137 ReductionOp op) const;
138};
139
140#endif // TENSOR_IMPL_CPU_H
Definition tensor_impl_CPU.h:14
Tensor::Shape getShape() const override
Returns the tensor shape.
Definition tensor_impl_CPU.cpp:101
bool compare(const TensorLayout &lhsLayout, const Tensor::Impl *rhsImpl, const TensorLayout &rhsLayout) const override
Returns true if the data with lhsLayout matches rhsImpl with rhsLayout.
Definition tensor_impl_CPU.cpp:151
std::unique_ptr< Tensor::Impl > add(const TensorLayout &lhsLayout, const Tensor::Impl *rhsImpl, const TensorLayout &rhsLayout, const TensorLayout &outLayout) const override
Elementwise addition. Returns a new Impl with the result with outLayout.
Definition tensor_impl_CPU.cpp:198
std::unique_ptr< Tensor::Impl > div(const TensorLayout &lhsLayout, const Tensor::Impl *rhsImpl, const TensorLayout &rhsLayout, const TensorLayout &outLayout) const override
Elementwise division. Returns a new Impl with the result with outLayout.
Definition tensor_impl_CPU.cpp:222
void idiv(const TensorLayout &lhsLayout, const Tensor::Impl *rhsImpl, const TensorLayout &rhsLayout) override
In-place elementwise division. Modifies lhsLayout in place.
Definition tensor_impl_CPU.cpp:263
std::unique_ptr< Tensor::Impl > lessEqual(const TensorLayout &lhsLayout, const Tensor::Impl *rhsImpl, const TensorLayout &rhsLayout, const TensorLayout &outLayout) const override
Elementwise less or equal. Returns a tensor of 0.0 / 1.0 with outLayout.
Definition tensor_impl_CPU.cpp:385
std::unique_ptr< Tensor::Impl > greater(const TensorLayout &lhsLayout, const Tensor::Impl *rhsImpl, const TensorLayout &rhsLayout, const TensorLayout &outLayout) const override
Elementwise greater than. Returns a tensor of 0.0 / 1.0 with outLayout.
Definition tensor_impl_CPU.cpp:393
void isub(const TensorLayout &lhsLayout, const Tensor::Impl *rhsImpl, const TensorLayout &rhsLayout) override
In-place elementwise subtraction. Modifies lhsLayout in place.
Definition tensor_impl_CPU.cpp:253
std::unique_ptr< Tensor::Impl > max(const TensorLayout &layout, const TensorLayout &blockLayout, const TensorLayout &outLayout) const override
Reduces dimensions [dim, rank) by taking the maximum. Output with outLayout.
Definition tensor_impl_CPU.cpp:311
void fillRand() override
Fills all elements with random values in [-1, 1].
Definition tensor_impl_CPU.cpp:24
std::unique_ptr< Tensor::Impl > prod(const TensorLayout &layout, const TensorLayout &blockLayout, const TensorLayout &outLayout) const override
Reduces dimensions [dim, rank) by taking the product. Output with outLayout.
Definition tensor_impl_CPU.cpp:318
std::unique_ptr< Tensor::Impl > isClose(const TensorLayout &lhsLayout, const Tensor::Impl *rhsImpl, const TensorLayout &rhsLayout, const TensorLayout &outLayout, float tolerance) const override
Elementwise closeness within tolerance. Returns a tensor of 0.0 / 1.0 with outLayout.
Definition tensor_impl_CPU.cpp:409
std::string toString() const override
Returns a string representation of the data.
Definition tensor_impl_CPU.cpp:103
void print() const override
Prints the entire tensor to stdout.
Definition tensor_impl_CPU.cpp:33
void set(const TensorLayout &lhsLayout, const Tensor::Impl *rhsImpl, const TensorLayout &rhsLayout) override
Copies data from rhsImpl with rhsLayout into this with lhsLayout.
Definition tensor_impl_CPU.cpp:136
float * dataPtr() const
Returns a raw pointer to the internal data buffer.
Definition tensor_impl_CPU.cpp:130
std::unique_ptr< Tensor::Impl > clone() const override
Deep copies this implementation.
Definition tensor_impl_CPU.cpp:132
void copyFromHost(const float *data, size_t count) override
Definition tensor_impl_CPU.cpp:126
std::unique_ptr< Tensor::Impl > mul(const TensorLayout &lhsLayout, const Tensor::Impl *rhsImpl, const TensorLayout &rhsLayout, const TensorLayout &outLayout) const override
Elementwise multiplication. Returns a new Impl with the result with outLayout.
Definition tensor_impl_CPU.cpp:214
std::unique_ptr< Tensor::Impl > less(const TensorLayout &lhsLayout, const Tensor::Impl *rhsImpl, const TensorLayout &rhsLayout, const TensorLayout &outLayout) const override
Elementwise less than. Returns a tensor of 0.0 / 1.0 with outLayout.
Definition tensor_impl_CPU.cpp:377
std::unique_ptr< Tensor::Impl > greaterEqual(const TensorLayout &lhsLayout, const Tensor::Impl *rhsImpl, const TensorLayout &rhsLayout, const TensorLayout &outLayout) const override
Elementwise greater or equal. Returns a tensor of 0.0 / 1.0 with outLayout.
Definition tensor_impl_CPU.cpp:401
std::unique_ptr< Tensor::Impl > sum(const TensorLayout &layout, const TensorLayout &blockLayout, const TensorLayout &outLayout) const override
Reduces dimensions [dim, rank) by summation. Output with outLayout.
Definition tensor_impl_CPU.cpp:298
void imul(const TensorLayout &lhsLayout, const Tensor::Impl *rhsImpl, const TensorLayout &rhsLayout) override
In-place elementwise multiplication. Modifies lhsLayout in place.
Definition tensor_impl_CPU.cpp:258
std::unique_ptr< Tensor::Impl > sub(const TensorLayout &lhsLayout, const Tensor::Impl *rhsImpl, const TensorLayout &rhsLayout, const TensorLayout &outLayout) const override
Elementwise subtraction. Returns a new Impl with the result with outLayout.
Definition tensor_impl_CPU.cpp:206
void fillAll(float value) override
Fills all elements with value.
Definition tensor_impl_CPU.cpp:22
size_t getNumElements() const override
Returns the total number of elements.
Definition tensor_impl_CPU.cpp:115
std::unique_ptr< Tensor::Impl > min(const TensorLayout &layout, const TensorLayout &blockLayout, const TensorLayout &outLayout) const override
Reduces dimensions [dim, rank) by taking the minimum. Output with outLayout.
Definition tensor_impl_CPU.cpp:304
std::unique_ptr< Tensor::Impl > matmul(const TensorLayout &lhsLayout, const Tensor::Impl *rhsImpl, const TensorLayout &rhsLayout, const TensorLayout &outLayout, size_t batch, size_t m, size_t k, size_t p) const override
Definition tensor_impl_CPU.cpp:343
void iadd(const TensorLayout &lhsLayout, const Tensor::Impl *rhsImpl, const TensorLayout &rhsLayout) override
In-place elementwise addition. Modifies lhsLayout in place.
Definition tensor_impl_CPU.cpp:248
std::vector< float > toVector() const override
Copies all elements into a flat vector (row-major order).
Definition tensor_impl_CPU.cpp:124
Definition tensor_impl.h:15
Definition tensor_shape.h:15
Tensor norm() const
L2 norm (scalar tensor equal to sqrt(sum(x^2))).
Definition tensor.cpp:223
Definition tensor_layout.h:15