Jean-Luc Brouillet | a09d699 | 2017-07-12 01:37:27 -0700 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (C) 2017 The Android Open Source Project |
| 3 | * |
| 4 | * Licensed under the Apache License, Version 2.0 (the "License"); |
| 5 | * you may not use this file except in compliance with the License. |
| 6 | * You may obtain a copy of the License at |
| 7 | * |
| 8 | * http://www.apache.org/licenses/LICENSE-2.0 |
| 9 | * |
| 10 | * Unless required by applicable law or agreed to in writing, software |
| 11 | * distributed under the License is distributed on an "AS IS" BASIS, |
| 12 | * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 13 | * See the License for the specific language governing permissions and |
| 14 | * limitations under the License. |
| 15 | */ |
| 16 | |
| 17 | #define LOG_TAG "OperationsUtils" |
| 18 | |
| 19 | #include "OperationsUtils.h" |
Lev Proleev | 0ca9520 | 2019-10-23 11:40:41 +0100 | [diff] [blame] | 20 | |
| 21 | #include <algorithm> |
| 22 | #include <cmath> |
| 23 | #include <limits> |
| 24 | #include <sstream> |
| 25 | #include <vector> |
| 26 | |
Miao Wang | cd67a3c | 2017-08-02 18:58:17 -0700 | [diff] [blame] | 27 | #include "Operations.h" |
Jean-Luc Brouillet | a09d699 | 2017-07-12 01:37:27 -0700 | [diff] [blame] | 28 | #include "Utils.h" |
| 29 | |
| 30 | namespace android { |
| 31 | namespace nn { |
| 32 | |
Slava Shklyaev | a694425 | 2018-11-06 15:32:44 +0000 | [diff] [blame] | 33 | namespace { |
| 34 | |
Michael Butler | 6bf05b2 | 2019-07-11 11:45:01 -0700 | [diff] [blame] | 35 | using namespace hal; |
| 36 | |
Slava Shklyaev | a694425 | 2018-11-06 15:32:44 +0000 | [diff] [blame] | 37 | bool validateOperandTypes(const std::vector<OperandType>& expectedTypes, const char* tag, |
| 38 | uint32_t operandCount, |
| 39 | std::function<OperandType(uint32_t)> getOperandType) { |
| 40 | NN_RET_CHECK_EQ(operandCount, expectedTypes.size()); |
| 41 | for (uint32_t i = 0; i < operandCount; ++i) { |
| 42 | OperandType type = getOperandType(i); |
| 43 | NN_RET_CHECK(type == expectedTypes[i]) |
| 44 | << "Invalid " << tag << " tensor type " << toString(type) << " for " << tag << " " |
| 45 | << i << ", expected " << toString(expectedTypes[i]); |
| 46 | } |
| 47 | return true; |
| 48 | } |
| 49 | |
Lev Proleev | bdf5841 | 2019-10-23 17:24:57 +0100 | [diff] [blame] | 50 | void CalculateActivationRangeImpl(int32_t activation, const Shape& outputShape, int32_t qmin, |
| 51 | int32_t qmax, int32_t* act_min, int32_t* act_max) { |
| 52 | const auto scale = outputShape.scale; |
| 53 | const auto zero_point = outputShape.offset; |
| 54 | |
| 55 | auto quantize = [scale, zero_point](float f) { |
| 56 | return zero_point + static_cast<int32_t>(std::round(f / scale)); |
| 57 | }; |
| 58 | |
| 59 | if (activation == kActivationRelu) { |
| 60 | *act_min = std::max(qmin, quantize(0.0)); |
| 61 | *act_max = qmax; |
| 62 | } else if (activation == kActivationRelu6) { |
| 63 | *act_min = std::max(qmin, quantize(0.0)); |
| 64 | *act_max = std::min(qmax, quantize(6.0)); |
| 65 | } else if (activation == kActivationRelu1) { |
| 66 | *act_min = std::max(qmin, quantize(-1.0)); |
| 67 | *act_max = std::min(qmax, quantize(1.0)); |
| 68 | } else if (activation == kActivationNone) { |
| 69 | *act_min = qmin; |
| 70 | *act_max = qmax; |
| 71 | } else { |
| 72 | LOG(ERROR) << "Unsupported fused activation function."; |
| 73 | } |
| 74 | } |
| 75 | |
Slava Shklyaev | a694425 | 2018-11-06 15:32:44 +0000 | [diff] [blame] | 76 | } // namespace |
| 77 | |
| 78 | bool validateInputTypes(const IOperationValidationContext* context, |
| 79 | const std::vector<OperandType>& expectedTypes) { |
| 80 | return validateOperandTypes(expectedTypes, "input", context->getNumInputs(), |
| 81 | [context](uint32_t index) { return context->getInputType(index); }); |
| 82 | } |
| 83 | |
| 84 | bool validateOutputTypes(const IOperationValidationContext* context, |
| 85 | const std::vector<OperandType>& expectedTypes) { |
| 86 | return validateOperandTypes( |
| 87 | expectedTypes, "output", context->getNumOutputs(), |
| 88 | [context](uint32_t index) { return context->getOutputType(index); }); |
| 89 | } |
| 90 | |
| 91 | bool validateHalVersion(const IOperationValidationContext* context, |
| 92 | HalVersion minSupportedHalVersion) { |
| 93 | if (context->getHalVersion() < minSupportedHalVersion) { |
Slava Shklyaev | 57f2c71 | 2019-09-30 16:04:43 +0100 | [diff] [blame] | 94 | std::ostringstream message; |
| 95 | message << "Operation " << context->getOperationName() << " with inputs {"; |
| 96 | for (uint32_t i = 0, n = context->getNumInputs(); i < n; ++i) { |
| 97 | if (i != 0) { |
| 98 | message << ", "; |
| 99 | } |
| 100 | message << toString(context->getInputType(i)); |
| 101 | } |
| 102 | message << "} and outputs {"; |
| 103 | for (uint32_t i = 0, n = context->getNumOutputs(); i < n; ++i) { |
| 104 | if (i != 0) { |
| 105 | message << ", "; |
| 106 | } |
| 107 | message << toString(context->getOutputType(i)); |
| 108 | } |
| 109 | message << "} is only supported since " << toString(minSupportedHalVersion) |
| 110 | << " (validating using " << toString(context->getHalVersion()) << ")"; |
| 111 | NN_RET_CHECK_FAIL() << message.str(); |
Slava Shklyaev | a694425 | 2018-11-06 15:32:44 +0000 | [diff] [blame] | 112 | } |
| 113 | return true; |
| 114 | } |
| 115 | |
Jean-Luc Brouillet | a09d699 | 2017-07-12 01:37:27 -0700 | [diff] [blame] | 116 | bool SameShape(const Shape& in1, const Shape& in2) { |
Miao Wang | 9d04c2d | 2017-07-25 17:06:18 -0700 | [diff] [blame] | 117 | if (in1.type != in2.type || in1.dimensions.size() != in2.dimensions.size()) { |
Jean-Luc Brouillet | a09d699 | 2017-07-12 01:37:27 -0700 | [diff] [blame] | 118 | return false; |
| 119 | } |
Miao Wang | 9d04c2d | 2017-07-25 17:06:18 -0700 | [diff] [blame] | 120 | for (size_t i = 0; i < in1.dimensions.size(); i++) { |
Jean-Luc Brouillet | a09d699 | 2017-07-12 01:37:27 -0700 | [diff] [blame] | 121 | if (in1.dimensions[i] != in2.dimensions[i]) { |
| 122 | return false; |
| 123 | } |
| 124 | } |
| 125 | return true; |
| 126 | } |
| 127 | |
Miao Wang | 9d04c2d | 2017-07-25 17:06:18 -0700 | [diff] [blame] | 128 | bool SetShape(const Shape& in, Shape* out) { |
Xusong Wang | 603ebb6 | 2018-11-07 15:03:29 -0800 | [diff] [blame] | 129 | if (in.type != out->type) { |
Jean-Luc Brouillet | a09d699 | 2017-07-12 01:37:27 -0700 | [diff] [blame] | 130 | return false; |
| 131 | } |
Miao Wang | 9d04c2d | 2017-07-25 17:06:18 -0700 | [diff] [blame] | 132 | out->dimensions = in.dimensions; |
Jean-Luc Brouillet | a09d699 | 2017-07-12 01:37:27 -0700 | [diff] [blame] | 133 | return true; |
| 134 | } |
| 135 | |
| 136 | uint32_t getNumberOfElements(const Shape& shape) { |
| 137 | uint32_t count = 1; |
Miao Wang | 9d04c2d | 2017-07-25 17:06:18 -0700 | [diff] [blame] | 138 | for (size_t i = 0; i < shape.dimensions.size(); i++) { |
Jean-Luc Brouillet | a09d699 | 2017-07-12 01:37:27 -0700 | [diff] [blame] | 139 | count *= shape.dimensions[i]; |
| 140 | } |
| 141 | return count; |
| 142 | } |
| 143 | |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 144 | uint32_t getNumberOfElements(const Shape& shape, size_t firstAxisInclusive, |
Slava Shklyaev | a2c9a10 | 2018-09-17 11:58:40 +0100 | [diff] [blame] | 145 | size_t lastAxisExclusive) { |
Slava Shklyaev | e9e0c43 | 2018-10-22 12:04:16 +0100 | [diff] [blame] | 146 | nnAssert(0 <= firstAxisInclusive); |
| 147 | nnAssert(firstAxisInclusive <= lastAxisExclusive); |
| 148 | nnAssert(lastAxisExclusive <= shape.dimensions.size()); |
Slava Shklyaev | a2c9a10 | 2018-09-17 11:58:40 +0100 | [diff] [blame] | 149 | uint32_t count = 1; |
| 150 | for (size_t i = firstAxisInclusive; i < lastAxisExclusive; i++) { |
| 151 | count *= shape.dimensions[i]; |
| 152 | } |
| 153 | return count; |
| 154 | } |
| 155 | |
Jean-Luc Brouillet | 873c008 | 2017-07-25 00:17:50 -0700 | [diff] [blame] | 156 | uint32_t getNumberOfDimensions(const Shape& shape) { |
Miao Wang | 9d04c2d | 2017-07-25 17:06:18 -0700 | [diff] [blame] | 157 | return shape.dimensions.size(); |
Jean-Luc Brouillet | 873c008 | 2017-07-25 00:17:50 -0700 | [diff] [blame] | 158 | } |
| 159 | |
| 160 | uint32_t getSizeOfDimension(const Shape& shape, uint32_t dimensionIdx) { |
Slava Shklyaev | e9e0c43 | 2018-10-22 12:04:16 +0100 | [diff] [blame] | 161 | nnAssert(0 <= dimensionIdx && dimensionIdx < shape.dimensions.size()); |
Jean-Luc Brouillet | 873c008 | 2017-07-25 00:17:50 -0700 | [diff] [blame] | 162 | return shape.dimensions[dimensionIdx]; |
| 163 | } |
| 164 | |
// Returns a non-zero value iff the shape's rank is known (i.e. it has at
// least one recorded dimension; an empty dimension vector denotes unknown
// rank). NOTE(review): semantically a predicate, but the return type is
// uint32_t — declared that way in the header, so it is kept here for
// interface compatibility.
uint32_t hasKnownRank(const Shape& shape) {
    return !shape.dimensions.empty();
}
| 168 | |
Slava Shklyaev | e9e0c43 | 2018-10-22 12:04:16 +0100 | [diff] [blame] | 169 | bool handleNegativeAxis(int32_t numberOfDimensions, int32_t* axis) { |
| 170 | NN_CHECK(-numberOfDimensions <= *axis && *axis < numberOfDimensions); |
| 171 | if (*axis < 0) { |
| 172 | *axis += numberOfDimensions; |
Slava Shklyaev | 3970918 | 2018-09-27 18:25:43 +0100 | [diff] [blame] | 173 | } |
Slava Shklyaev | e9e0c43 | 2018-10-22 12:04:16 +0100 | [diff] [blame] | 174 | return true; |
Slava Shklyaev | 9057e9f | 2018-09-27 15:13:47 +0100 | [diff] [blame] | 175 | } |
| 176 | |
// Decomposes a real multiplier into a Q31 fixed-point mantissa plus a binary
// exponent, so that double_multiplier ~= quantized_multiplier * 2^(shift-31).
// A zero multiplier maps to (0, 0); values so small that the shift would be
// below -31 are flushed to zero (see the comment below). Returns false via
// NN_RET_CHECK if the internal invariants are violated.
bool QuantizeMultiplier(double double_multiplier, int32_t* quantized_multiplier, int32_t* shift) {
    if (double_multiplier == 0.) {
        *quantized_multiplier = 0;
        *shift = 0;
        return true;
    }
    // frexp yields q in [0.5, 1) with double_multiplier = q * 2^(*shift).
    const double q = std::frexp(double_multiplier, shift);
    // Scale the mantissa to Q31 with round-to-nearest.
    auto q_fixed = static_cast<int64_t>(std::round(q * (1ll << 31)));
    NN_RET_CHECK(q_fixed <= (1ll << 31));
    // Rounding may push q up to exactly 1.0; renormalize by halving the
    // mantissa and bumping the exponent.
    if (q_fixed == (1ll << 31)) {
        q_fixed /= 2;
        ++*shift;
    }
    NN_RET_CHECK_LE(q_fixed, std::numeric_limits<int32_t>::max());
    // A shift amount smaller than -31 would cause all bits to be shifted out
    // and thus all results would be zero. We implement that instead with
    // q_fixed==0, so as to avoid hitting issues with right-shift
    // operations with shift amounts greater than 31. Note that this happens
    // roughly when abs(double_multiplier) < 2^-31 and the present handling means
    // that we're effectively flushing tiny double_multiplier's to zero.
    // We could conceivably handle values in the range (roughly) [32, 63]
    // as 'denormals' i.e. (shift==0, q_fixed < 2^30). In that point of view
    // the present handling is just doing 'flush denormals to zero'. We could
    // reconsider and actually generate nonzero denormals if a need arises.
    if (*shift < -31) {
        *shift = 0;
        q_fixed = 0;
    }
    *quantized_multiplier = static_cast<int32_t>(q_fixed);
    return true;
}
| 208 | |
// Like QuantizeMultiplier, but restricted to multipliers in the open interval
// (0, 1); consequently the resulting exponent (`left_shift`) must be <= 0.
// Fails (returns false) if the preconditions or the post-condition on the
// shift do not hold.
bool QuantizeMultiplierSmallerThanOneExp(double double_multiplier, int32_t* quantized_multiplier,
                                         int32_t* left_shift) {
    NN_RET_CHECK(double_multiplier > 0.);
    NN_RET_CHECK(double_multiplier < 1.);
    NN_RET_CHECK(QuantizeMultiplier(double_multiplier, quantized_multiplier, left_shift));
    // A multiplier < 1 must decompose with a non-positive exponent.
    NN_RET_CHECK(*left_shift <= 0);
    return true;
}
| 217 | |
// Decomposes a multiplier in [0, 1) into a Q31 fixed-point mantissa and a
// *right* shift, so that double_multiplier ~= quantized_multiplier * 2^-31
// * 2^-right_shift. Zero maps to (0, 0). Returns false via NN_OPS_CHECK if
// the preconditions do not hold.
bool QuantizeMultiplierSmallerThanOne(double double_multiplier, int32_t* quantized_multiplier,
                                      int32_t* right_shift) {
    NN_OPS_CHECK(double_multiplier >= 0.);
    NN_OPS_CHECK(double_multiplier < 1.);
    if (double_multiplier == 0.) {
        *quantized_multiplier = 0;
        *right_shift = 0;
        return true;
    }
    NN_OPS_CHECK(double_multiplier > 0.);
    // frexp yields q in [0.5, 1) with a non-positive exponent here; negate it
    // so it is expressed as a right shift.
    const double q = std::frexp(double_multiplier, right_shift);
    *right_shift *= -1;
    // Scale the mantissa to Q31 with round-to-nearest.
    int64_t q_fixed = static_cast<int64_t>(std::round(q * (1LL << 31)));
    NN_OPS_CHECK(q_fixed <= (1LL << 31));
    // Rounding may push q up to exactly 1.0; renormalize.
    if (q_fixed == (1LL << 31)) {
        q_fixed /= 2;
        --*right_shift;
    }
    NN_OPS_CHECK(*right_shift >= 0);
    NN_OPS_CHECK(q_fixed <= std::numeric_limits<int32_t>::max());
    *quantized_multiplier = static_cast<int32_t>(q_fixed);
    return true;
}
| 241 | |
// Decomposes a multiplier > 1 into a Q31 fixed-point mantissa and a *left*
// shift, so that double_multiplier ~= quantized_multiplier * 2^-31
// * 2^left_shift. Returns false via NN_OPS_CHECK if the precondition does
// not hold.
bool QuantizeMultiplierGreaterThanOne(double double_multiplier, int32_t* quantized_multiplier,
                                      int* left_shift) {
    NN_OPS_CHECK(double_multiplier > 1.);
    // frexp yields q in [0.5, 1) with double_multiplier = q * 2^(*left_shift);
    // the exponent is positive since the multiplier exceeds 1.
    const double q = std::frexp(double_multiplier, left_shift);
    // Scale the mantissa to Q31 with round-to-nearest.
    int64_t q_fixed = static_cast<int64_t>(std::round(q * (1LL << 31)));
    NN_OPS_CHECK(q_fixed <= (1LL << 31));
    // Rounding may push q up to exactly 1.0; renormalize.
    if (q_fixed == (1LL << 31)) {
        q_fixed /= 2;
        ++*left_shift;
    }
    NN_OPS_CHECK(*left_shift >= 0);
    NN_OPS_CHECK(q_fixed <= std::numeric_limits<int32_t>::max());
    *quantized_multiplier = static_cast<int32_t>(q_fixed);
    return true;
}
| 257 | |
// Computes the real multiplier (input_scale * filter_scale / output_scale)
// used to rescale the accumulator of quantized convolution-like ops.
// Requires the bias scale to match input_scale * filter_scale to within a
// relative tolerance. NOTE(review): "Multipler" is a historical misspelling
// kept because the name is part of the public interface.
bool GetQuantizedConvolutionMultipler(const Shape& inputShape, const Shape& filterShape,
                                      const Shape& biasShape, const Shape& outputShape,
                                      double* multiplier) {
    // Upcast bias and input_product to double
    const double input_product_scale = inputShape.scale * filterShape.scale;
    const double bias_scale = biasShape.scale;

    // The following conditions must be guaranteed by the training pipeline.
    NN_OPS_CHECK(std::abs(input_product_scale - bias_scale) <=
                 1e-6 * std::min(input_product_scale, bias_scale));
    NN_OPS_CHECK(input_product_scale >= 0);
    *multiplier = input_product_scale / outputShape.scale;
    return true;
}
| 272 | |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 273 | void CalculateActivationRangeUint8(int32_t activation, const Shape& outputShape, int32_t* act_min, |
Miao Wang | cd67a3c | 2017-08-02 18:58:17 -0700 | [diff] [blame] | 274 | int32_t* act_max) { |
| 275 | const int32_t qmin = std::numeric_limits<uint8_t>::min(); |
| 276 | const int32_t qmax = std::numeric_limits<uint8_t>::max(); |
| 277 | |
Lev Proleev | bdf5841 | 2019-10-23 17:24:57 +0100 | [diff] [blame] | 278 | CalculateActivationRangeImpl(activation, outputShape, qmin, qmax, act_min, act_max); |
| 279 | } |
Miao Wang | cd67a3c | 2017-08-02 18:58:17 -0700 | [diff] [blame] | 280 | |
Lev Proleev | bdf5841 | 2019-10-23 17:24:57 +0100 | [diff] [blame] | 281 | void CalculateActivationRangeInt8(int32_t activation, const Shape& outputShape, int32_t* act_min, |
| 282 | int32_t* act_max) { |
| 283 | const int32_t qmin = std::numeric_limits<int8_t>::min(); |
| 284 | const int32_t qmax = std::numeric_limits<int8_t>::max(); |
Miao Wang | cd67a3c | 2017-08-02 18:58:17 -0700 | [diff] [blame] | 285 | |
Lev Proleev | bdf5841 | 2019-10-23 17:24:57 +0100 | [diff] [blame] | 286 | CalculateActivationRangeImpl(activation, outputShape, qmin, qmax, act_min, act_max); |
Miao Wang | 658dc37 | 2017-12-14 15:01:31 -0800 | [diff] [blame] | 287 | } |
| 288 | |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 289 | void CalculateActivationRangeFloat(int32_t activation, float* activation_min, |
Miao Wang | 658dc37 | 2017-12-14 15:01:31 -0800 | [diff] [blame] | 290 | float* activation_max) { |
| 291 | if (activation == kActivationRelu) { |
| 292 | *activation_min = 0.f; |
| 293 | *activation_max = std::numeric_limits<float>::max(); |
| 294 | } else if (activation == kActivationRelu6) { |
| 295 | *activation_min = 0.f; |
| 296 | *activation_max = 6.f; |
| 297 | } else if (activation == kActivationRelu1) { |
| 298 | *activation_min = -1.f; |
| 299 | *activation_max = 1.f; |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 300 | } else if (activation == kActivationNone) { |
Miao Wang | 658dc37 | 2017-12-14 15:01:31 -0800 | [diff] [blame] | 301 | *activation_min = std::numeric_limits<float>::lowest(); |
| 302 | *activation_max = std::numeric_limits<float>::max(); |
| 303 | } else { |
| 304 | LOG(ERROR) << "Unsupported fused activation function."; |
Miao Wang | cd67a3c | 2017-08-02 18:58:17 -0700 | [diff] [blame] | 305 | } |
| 306 | } |
| 307 | |
// Returns the largest representable input magnitude ("radius") for a
// fixed-point representation with `input_integer_bits` integer bits after
// applying a left shift of `input_left_shift`.
int32_t CalculateInputRadius(int input_integer_bits, int input_left_shift) {
    const double maxIntegerValue = static_cast<double>((1 << input_integer_bits) - 1);
    const double maxInputRescaled =
            maxIntegerValue * (1LL << (31 - input_integer_bits)) / (1LL << input_left_shift);
    // Tighten bound using floor. Suppose that we could use the exact value.
    // After scaling the difference, the result would be at the maximum. Thus we
    // must ensure that our value has lower magnitude.
    return static_cast<int32_t>(std::floor(maxInputRescaled));
}
| 317 | |
Xusong Wang | d0cc11f | 2019-04-12 13:38:49 -0700 | [diff] [blame] | 318 | void calculateExplicitPaddingImpl(int32_t in_size, int32_t stride, int32_t dilation_factor, |
| 319 | int32_t filter_size, int32_t padding_implicit, |
| 320 | bool isTransposeConv, int32_t* padding_head, |
| 321 | int32_t* padding_tail) { |
| 322 | *padding_head = 0; |
| 323 | *padding_tail = 0; |
| 324 | |
| 325 | int32_t effective_filter_size = (filter_size - 1) * dilation_factor + 1; |
| 326 | |
| 327 | if (padding_implicit == kPaddingSame) { |
| 328 | int32_t out_size = (in_size + stride - 1) / stride; |
| 329 | int32_t tmp = (out_size - 1) * stride + effective_filter_size; |
| 330 | if (tmp > in_size) { |
| 331 | *padding_head = (tmp - in_size) / 2; |
| 332 | *padding_tail = (tmp - in_size) - *padding_head; |
| 333 | } |
| 334 | // For transpose conv, make padding tail fit tightly to the end of the last stride. |
| 335 | if (isTransposeConv) { |
| 336 | *padding_tail = (tmp - in_size) - *padding_head; |
| 337 | } |
| 338 | } |
| 339 | } |
| 340 | |
Lev Proleev | 8e3e09f | 2018-10-18 14:33:39 +0100 | [diff] [blame] | 341 | bool calculateBroadcastedShape(const Shape& in1, const Shape& in2, Shape* out) { |
Xusong Wang | ced4b70 | 2019-03-14 13:55:20 -0700 | [diff] [blame] | 342 | NN_RET_CHECK(in1.type == in2.type); |
Lev Proleev | 8e3e09f | 2018-10-18 14:33:39 +0100 | [diff] [blame] | 343 | uint32_t numberOfDims1 = getNumberOfDimensions(in1); |
| 344 | uint32_t numberOfDims2 = getNumberOfDimensions(in2); |
| 345 | uint32_t maxDims = std::max(numberOfDims1, numberOfDims2); |
| 346 | out->dimensions = std::vector<uint32_t>(maxDims); |
| 347 | for (uint32_t i = 1; i <= maxDims; i++) { |
| 348 | uint32_t dim1 = 1; |
| 349 | if (i <= numberOfDims1) { |
| 350 | dim1 = getSizeOfDimension(in1, numberOfDims1 - i); |
| 351 | } |
| 352 | uint32_t dim2 = 1; |
| 353 | if (i <= numberOfDims2) { |
| 354 | dim2 = getSizeOfDimension(in2, numberOfDims2 - i); |
| 355 | } |
| 356 | if (dim1 != dim2 && dim1 != 1 && dim2 != 1) { |
| 357 | LOG(ERROR) << "Dimensions mismatch for broadcast:\n" |
| 358 | << "First tensor: dimension " << numberOfDims1 - i << " of size " << dim1 |
David Gross | 94597f0 | 2020-08-14 15:30:49 -0700 | [diff] [blame^] | 359 | << "\nSecond tensor: dimension " << numberOfDims2 - i << " of size " << dim2; |
Lev Proleev | 8e3e09f | 2018-10-18 14:33:39 +0100 | [diff] [blame] | 360 | return false; |
| 361 | } |
Xusong Wang | ced4b70 | 2019-03-14 13:55:20 -0700 | [diff] [blame] | 362 | out->dimensions[maxDims - i] = (dim1 == 1) ? dim2 : dim1; |
Lev Proleev | 8e3e09f | 2018-10-18 14:33:39 +0100 | [diff] [blame] | 363 | } |
| 364 | return true; |
| 365 | } |
| 366 | |
Przemyslaw Szczepaniak | 14c1213 | 2019-11-28 11:25:21 +0000 | [diff] [blame] | 367 | template <> |
| 368 | uint8_t requantize<uint8_t>(uint8_t value, const Shape& oldShape, const Shape& newShape) { |
Lev Proleev | 5d7c6b4 | 2018-12-10 11:47:19 +0000 | [diff] [blame] | 369 | double doubleValue = (value - oldShape.offset) * oldShape.scale; |
Xusong Wang | 9a8dde7 | 2019-04-24 12:49:07 -0700 | [diff] [blame] | 370 | double doubleRet = doubleValue / newShape.scale + newShape.offset; |
| 371 | if (doubleRet < 0) return 0; |
| 372 | if (doubleRet > 255) return 255; |
Xusong Wang | 7c1bc2c | 2019-05-30 18:23:33 -0700 | [diff] [blame] | 373 | return static_cast<uint8_t>(std::round(doubleRet)); |
Lev Proleev | 5d7c6b4 | 2018-12-10 11:47:19 +0000 | [diff] [blame] | 374 | } |
| 375 | |
Przemyslaw Szczepaniak | 14c1213 | 2019-11-28 11:25:21 +0000 | [diff] [blame] | 376 | template <> |
| 377 | int8_t requantize<int8_t>(int8_t value, const Shape& oldShape, const Shape& newShape) { |
Lev Proleev | 0ca9520 | 2019-10-23 11:40:41 +0100 | [diff] [blame] | 378 | double doubleValue = (value - oldShape.offset) * oldShape.scale; |
| 379 | double doubleRet = doubleValue / newShape.scale + newShape.offset; |
| 380 | if (doubleRet < -128) return -128; |
| 381 | if (doubleRet > 127) return 127; |
| 382 | return static_cast<int8_t>(std::round(doubleRet)); |
| 383 | } |
| 384 | |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 385 | bool reshapePrepare(const Shape& input, const int32_t* targetDims, const int32_t targetDimsSize, |
Miao Wang | 13048b9 | 2017-09-11 14:16:14 -0700 | [diff] [blame] | 386 | Shape* output) { |
| 387 | // Reshape allows one of the targetDims components to have the |
| 388 | // special -1 value, meaning it will be calculated automatically based on the |
| 389 | // input. Here we calculate what that dimension should be so that the number |
| 390 | // of output elements in the same as the number of input elements. |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 391 | int32_t numInputElements = (int32_t)getNumberOfElements(input); |
Miao Wang | 13048b9 | 2017-09-11 14:16:14 -0700 | [diff] [blame] | 392 | |
| 393 | std::vector<uint32_t> outDims(targetDimsSize); |
| 394 | int32_t numOutputElements = 1; |
| 395 | int32_t strechDim = -1; |
| 396 | for (int32_t i = 0; i < targetDimsSize; ++i) { |
| 397 | int32_t value = targetDims[i]; |
| 398 | if (value == -1) { |
Miao Wang | 4d96fa4 | 2017-09-21 17:04:31 -0700 | [diff] [blame] | 399 | NN_OPS_CHECK(strechDim == -1); |
Miao Wang | 13048b9 | 2017-09-11 14:16:14 -0700 | [diff] [blame] | 400 | strechDim = i; |
| 401 | } else { |
| 402 | numOutputElements *= value; |
| 403 | outDims[i] = (uint32_t)value; |
| 404 | } |
| 405 | } |
| 406 | if (strechDim != -1) { |
| 407 | int32_t strechValue = numInputElements / numOutputElements; |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 408 | outDims[strechDim] = (uint32_t)strechValue; |
Miao Wang | 13048b9 | 2017-09-11 14:16:14 -0700 | [diff] [blame] | 409 | numOutputElements *= strechValue; |
| 410 | } |
| 411 | |
Miao Wang | 4d96fa4 | 2017-09-21 17:04:31 -0700 | [diff] [blame] | 412 | NN_OPS_CHECK(numInputElements == numOutputElements); |
Miao Wang | 13048b9 | 2017-09-11 14:16:14 -0700 | [diff] [blame] | 413 | |
| 414 | output->type = input.type; |
| 415 | output->dimensions = outDims; |
| 416 | output->offset = input.offset; |
| 417 | output->scale = input.scale; |
| 418 | |
| 419 | return true; |
| 420 | } |
| 421 | |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 422 | bool depthToSpacePrepare(const Shape& input, int32_t blockSize, Shape* output) { |
Miao Wang | 4d96fa4 | 2017-09-21 17:04:31 -0700 | [diff] [blame] | 423 | NN_OPS_CHECK(getNumberOfDimensions(input) == 4); |
| 424 | NN_OPS_CHECK(blockSize > 0); |
Miao Wang | 13048b9 | 2017-09-11 14:16:14 -0700 | [diff] [blame] | 425 | |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 426 | uint32_t batches = getSizeOfDimension(input, 0); |
| 427 | uint32_t height = getSizeOfDimension(input, 1); |
| 428 | uint32_t width = getSizeOfDimension(input, 2); |
Miao Wang | 13048b9 | 2017-09-11 14:16:14 -0700 | [diff] [blame] | 429 | uint32_t channels = getSizeOfDimension(input, 3); |
| 430 | |
Miao Wang | 4d96fa4 | 2017-09-21 17:04:31 -0700 | [diff] [blame] | 431 | NN_OPS_CHECK(channels % (blockSize * blockSize) == 0); |
Miao Wang | 13048b9 | 2017-09-11 14:16:14 -0700 | [diff] [blame] | 432 | output->type = input.type; |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 433 | output->dimensions = {batches, height * blockSize, width * blockSize, |
Miao Wang | 13048b9 | 2017-09-11 14:16:14 -0700 | [diff] [blame] | 434 | channels / (blockSize * blockSize)}; |
| 435 | output->offset = input.offset; |
| 436 | output->scale = input.scale; |
| 437 | |
| 438 | return true; |
| 439 | } |
| 440 | |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 441 | bool spaceToDepthPrepare(const Shape& input, int32_t blockSize, Shape* output) { |
Miao Wang | 4d96fa4 | 2017-09-21 17:04:31 -0700 | [diff] [blame] | 442 | NN_OPS_CHECK(getNumberOfDimensions(input) == 4); |
| 443 | NN_OPS_CHECK(blockSize > 0); |
Miao Wang | 13048b9 | 2017-09-11 14:16:14 -0700 | [diff] [blame] | 444 | |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 445 | uint32_t batches = getSizeOfDimension(input, 0); |
| 446 | uint32_t height = getSizeOfDimension(input, 1); |
| 447 | uint32_t width = getSizeOfDimension(input, 2); |
Miao Wang | 13048b9 | 2017-09-11 14:16:14 -0700 | [diff] [blame] | 448 | uint32_t channels = getSizeOfDimension(input, 3); |
| 449 | |
Miao Wang | 4d96fa4 | 2017-09-21 17:04:31 -0700 | [diff] [blame] | 450 | NN_OPS_CHECK(height % blockSize == 0); |
| 451 | NN_OPS_CHECK(width % blockSize == 0); |
Miao Wang | 13048b9 | 2017-09-11 14:16:14 -0700 | [diff] [blame] | 452 | |
| 453 | output->type = input.type; |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 454 | output->dimensions = {batches, height / blockSize, width / blockSize, |
Miao Wang | 13048b9 | 2017-09-11 14:16:14 -0700 | [diff] [blame] | 455 | channels * (blockSize * blockSize)}; |
| 456 | output->offset = input.offset; |
| 457 | output->scale = input.scale; |
| 458 | |
| 459 | return true; |
| 460 | } |
| 461 | |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 462 | bool embeddingLookupPrepare(const Shape& valueShape, const Shape& lookupShape, Shape* outputShape) { |
Yang Ni | e3cc73d | 2017-09-27 10:26:52 -0700 | [diff] [blame] | 463 | NN_OPS_CHECK(getNumberOfDimensions(valueShape) >= 2); |
| 464 | NN_OPS_CHECK(getNumberOfDimensions(lookupShape) == 1); |
| 465 | |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 466 | const uint32_t columns = getSizeOfDimension(valueShape, 1); |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 467 | const uint32_t lookups = getSizeOfDimension(lookupShape, 0); |
Yang Ni | e3cc73d | 2017-09-27 10:26:52 -0700 | [diff] [blame] | 468 | |
| 469 | outputShape->type = valueShape.type; |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 470 | outputShape->dimensions = {lookups, columns}; |
Yang Ni | e3cc73d | 2017-09-27 10:26:52 -0700 | [diff] [blame] | 471 | for (uint32_t i = 2; i < getNumberOfDimensions(valueShape); i++) { |
Miao Wang | 0cc3223 | 2017-10-09 10:43:21 -0700 | [diff] [blame] | 472 | outputShape->dimensions.push_back(getSizeOfDimension(valueShape, i)); |
Yang Ni | e3cc73d | 2017-09-27 10:26:52 -0700 | [diff] [blame] | 473 | } |
| 474 | outputShape->offset = valueShape.offset; |
| 475 | outputShape->scale = valueShape.scale; |
| 476 | |
| 477 | return true; |
| 478 | } |
| 479 | |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 480 | bool hashtableLookupPrepare(const Shape& lookupShape, const Shape& keyShape, |
| 481 | const Shape& valueShape, Shape* outputShape, Shape* hitShape) { |
Yang Ni | e3cc73d | 2017-09-27 10:26:52 -0700 | [diff] [blame] | 482 | NN_OPS_CHECK(getNumberOfDimensions(lookupShape) == 1); |
| 483 | NN_OPS_CHECK(getNumberOfDimensions(keyShape) == 1); |
| 484 | NN_OPS_CHECK(getNumberOfDimensions(valueShape) >= 1); |
| 485 | |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 486 | const uint32_t lookups = getSizeOfDimension(lookupShape, 0); |
Yang Ni | e3cc73d | 2017-09-27 10:26:52 -0700 | [diff] [blame] | 487 | outputShape->type = valueShape.type; |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 488 | outputShape->dimensions = {lookups}; |
Yang Ni | e3cc73d | 2017-09-27 10:26:52 -0700 | [diff] [blame] | 489 | for (uint32_t i = 1; i < getNumberOfDimensions(valueShape); i++) { |
Miao Wang | 0cc3223 | 2017-10-09 10:43:21 -0700 | [diff] [blame] | 490 | outputShape->dimensions.push_back(getSizeOfDimension(valueShape, i)); |
Yang Ni | e3cc73d | 2017-09-27 10:26:52 -0700 | [diff] [blame] | 491 | } |
| 492 | outputShape->offset = valueShape.offset; |
| 493 | outputShape->scale = valueShape.scale; |
| 494 | |
| 495 | hitShape->type = OperandType::TENSOR_QUANT8_ASYMM; |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 496 | hitShape->dimensions = {lookups}; |
Yang Ni | e3cc73d | 2017-09-27 10:26:52 -0700 | [diff] [blame] | 497 | hitShape->offset = 0; |
| 498 | hitShape->scale = 1.f; |
| 499 | |
| 500 | return true; |
| 501 | } |
| 502 | |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 503 | bool padPrepare(const Shape& input, const int32_t* paddingsData, const Shape& paddingsShape, |
Miao Wang | 15395d6 | 2018-01-21 02:39:41 -0800 | [diff] [blame] | 504 | Shape* output) { |
Miao Wang | 15395d6 | 2018-01-21 02:39:41 -0800 | [diff] [blame] | 505 | uint32_t numInputDims = getNumberOfDimensions(input); |
Miao Wang | 15395d6 | 2018-01-21 02:39:41 -0800 | [diff] [blame] | 506 | |
| 507 | // paddings need to be provided as a 2-D int32 tensor. |
| 508 | NN_OPS_CHECK(paddingsShape.type == OperandType::TENSOR_INT32); |
| 509 | NN_OPS_CHECK(getNumberOfDimensions(paddingsShape) == 2); |
| 510 | NN_OPS_CHECK(getSizeOfDimension(paddingsShape, 0) == numInputDims); |
| 511 | NN_OPS_CHECK(getSizeOfDimension(paddingsShape, 1) == 2); |
| 512 | |
| 513 | std::vector<uint32_t> outDims(numInputDims); |
| 514 | for (uint32_t i = 0; i < numInputDims; ++i) { |
| 515 | int32_t beforePadding = *paddingsData++; |
| 516 | int32_t afterPadding = *paddingsData++; |
| 517 | // Pad value has to be greater than equal to 0. |
| 518 | NN_OPS_CHECK(beforePadding >= 0 && afterPadding >= 0); |
| 519 | outDims[i] = beforePadding + getSizeOfDimension(input, i) + afterPadding; |
| 520 | } |
| 521 | output->type = input.type; |
| 522 | output->dimensions = outDims; |
| 523 | output->offset = input.offset; |
| 524 | output->scale = input.scale; |
| 525 | |
| 526 | return true; |
| 527 | } |
| 528 | |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 529 | bool batchToSpacePrepare(const Shape& input, const int32_t* blockSizeData, |
| 530 | const Shape& blockSizeShape, Shape* output) { |
Miao Wang | 15395d6 | 2018-01-21 02:39:41 -0800 | [diff] [blame] | 531 | // Only 4D NHWC tensors are supported. |
| 532 | NN_OPS_CHECK(getNumberOfDimensions(input) == 4); |
| 533 | |
| 534 | // blockSize need to be provided as a 1-D int32 tensor. |
| 535 | NN_OPS_CHECK(blockSizeShape.type == OperandType::TENSOR_INT32); |
| 536 | NN_OPS_CHECK(getNumberOfDimensions(blockSizeShape) == 1); |
| 537 | // Only applies to spatial dimensions. |
| 538 | NN_OPS_CHECK(getSizeOfDimension(blockSizeShape, 0) == 2); |
| 539 | |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 540 | uint32_t batches = getSizeOfDimension(input, 0); |
| 541 | uint32_t height = getSizeOfDimension(input, 1); |
| 542 | uint32_t width = getSizeOfDimension(input, 2); |
Miao Wang | 15395d6 | 2018-01-21 02:39:41 -0800 | [diff] [blame] | 543 | uint32_t channels = getSizeOfDimension(input, 3); |
| 544 | |
| 545 | NN_OPS_CHECK(batches % (blockSizeData[0] * blockSizeData[1]) == 0); |
| 546 | output->type = input.type; |
| 547 | output->dimensions = {batches / (blockSizeData[0] * blockSizeData[1]), |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 548 | height * blockSizeData[0], width * blockSizeData[1], channels}; |
Miao Wang | 15395d6 | 2018-01-21 02:39:41 -0800 | [diff] [blame] | 549 | output->offset = input.offset; |
| 550 | output->scale = input.scale; |
| 551 | |
| 552 | return true; |
| 553 | } |
| 554 | |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 555 | bool spaceToBatchPrepare(const Shape& input, const int32_t* blockSizeData, |
| 556 | const Shape& blockSizeShape, const int32_t* paddingsData, |
| 557 | const Shape& paddingsShape, Shape* output) { |
Miao Wang | 15395d6 | 2018-01-21 02:39:41 -0800 | [diff] [blame] | 558 | // Only 4D NHWC tensors are supported. |
| 559 | NN_OPS_CHECK(getNumberOfDimensions(input) == 4); |
| 560 | |
| 561 | // blockSize need to be provided as a 1-D int32 tensor. |
| 562 | NN_OPS_CHECK(blockSizeShape.type == OperandType::TENSOR_INT32); |
| 563 | NN_OPS_CHECK(getNumberOfDimensions(blockSizeShape) == 1); |
| 564 | // Only applies to spatial dimensions. |
| 565 | NN_OPS_CHECK(getSizeOfDimension(blockSizeShape, 0) == 2); |
| 566 | |
| 567 | // paddings need to be provided as a 2-D int32 tensor. |
| 568 | NN_OPS_CHECK(paddingsShape.type == OperandType::TENSOR_INT32); |
| 569 | NN_OPS_CHECK(getNumberOfDimensions(paddingsShape) == 2); |
| 570 | NN_OPS_CHECK(getSizeOfDimension(paddingsShape, 0) == 2); |
| 571 | NN_OPS_CHECK(getSizeOfDimension(paddingsShape, 1) == 2); |
| 572 | |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 573 | uint32_t batches = getSizeOfDimension(input, 0); |
| 574 | uint32_t height = getSizeOfDimension(input, 1); |
| 575 | uint32_t width = getSizeOfDimension(input, 2); |
Miao Wang | 15395d6 | 2018-01-21 02:39:41 -0800 | [diff] [blame] | 576 | uint32_t channels = getSizeOfDimension(input, 3); |
| 577 | |
| 578 | uint32_t paddedHeight = paddingsData[0] + height + paddingsData[1]; |
| 579 | uint32_t paddedWidth = paddingsData[2] + width + paddingsData[3]; |
| 580 | |
| 581 | NN_OPS_CHECK(paddedHeight % blockSizeData[0] == 0); |
Miao Wang | 5fbe3e1 | 2018-02-20 14:34:00 -0800 | [diff] [blame] | 582 | NN_OPS_CHECK(paddedWidth % blockSizeData[1] == 0); |
Miao Wang | 15395d6 | 2018-01-21 02:39:41 -0800 | [diff] [blame] | 583 | |
| 584 | output->type = input.type; |
| 585 | output->dimensions = {batches * (blockSizeData[0] * blockSizeData[1]), |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 586 | paddedHeight / blockSizeData[0], paddedWidth / blockSizeData[1], |
Miao Wang | 15395d6 | 2018-01-21 02:39:41 -0800 | [diff] [blame] | 587 | channels}; |
| 588 | output->offset = input.offset; |
| 589 | output->scale = input.scale; |
| 590 | |
| 591 | return true; |
| 592 | } |
| 593 | |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 594 | bool meanPrepare(const Shape& input, const int32_t* axisData, const Shape& axisShape, bool keepDims, |
Miao Wang | 15395d6 | 2018-01-21 02:39:41 -0800 | [diff] [blame] | 595 | Shape* output) { |
Miao Wang | 15395d6 | 2018-01-21 02:39:41 -0800 | [diff] [blame] | 596 | // perm need to be provided as a 1-D int32 tensor. |
| 597 | NN_OPS_CHECK(axisShape.type == OperandType::TENSOR_INT32); |
| 598 | NN_OPS_CHECK(getNumberOfDimensions(axisShape) == 1); |
| 599 | |
| 600 | int32_t numInputDims = static_cast<int32_t>(getNumberOfDimensions(input)); |
| 601 | int32_t axisSize = static_cast<int32_t>(getSizeOfDimension(axisShape, 0)); |
| 602 | |
| 603 | // Determines size of output tensor. |
| 604 | if (keepDims) { |
| 605 | std::vector<uint32_t> outDims(numInputDims); |
| 606 | for (int32_t idx = 0; idx < numInputDims; ++idx) { |
| 607 | bool isAxis = false; |
| 608 | for (int32_t axisIdx = 0; axisIdx < axisSize; ++axisIdx) { |
| 609 | if (axisData[axisIdx] == idx || axisData[axisIdx] + numInputDims == idx) { |
| 610 | isAxis = true; |
| 611 | break; |
| 612 | } |
| 613 | } |
| 614 | if (isAxis) { |
| 615 | outDims[idx] = 1; |
| 616 | } else { |
| 617 | outDims[idx] = getSizeOfDimension(input, idx); |
| 618 | } |
| 619 | } |
| 620 | output->dimensions = outDims; |
| 621 | } else { |
| 622 | // Calculates size of reducing axis. |
| 623 | int32_t numReduceAxis = axisSize; |
| 624 | for (int32_t i = 0; i < axisSize; ++i) { |
| 625 | int32_t current = axisData[i]; |
| 626 | if (current < 0) { |
| 627 | current += numInputDims; |
| 628 | } |
| 629 | NN_OPS_CHECK(current >= 0 && current < numInputDims); |
| 630 | for (int32_t j = 0; j < i; ++j) { |
| 631 | int32_t previous = axisData[j]; |
| 632 | if (previous < 0) { |
| 633 | previous += numInputDims; |
| 634 | } |
| 635 | if (current == previous) { |
| 636 | --numReduceAxis; |
| 637 | break; |
| 638 | } |
| 639 | } |
| 640 | } |
| 641 | // Determines output dimensions. |
| 642 | std::vector<uint32_t> outDims(numInputDims - numReduceAxis); |
| 643 | int32_t numSkipAxis = 0; |
| 644 | for (int32_t idx = 0; idx < numInputDims; ++idx) { |
| 645 | bool isAxis = false; |
| 646 | for (int32_t axisIdx = 0; axisIdx < axisSize; ++axisIdx) { |
| 647 | if (axisData[axisIdx] == idx || axisData[axisIdx] + numInputDims == idx) { |
| 648 | ++numSkipAxis; |
| 649 | isAxis = true; |
| 650 | break; |
| 651 | } |
| 652 | } |
| 653 | if (!isAxis) { |
| 654 | outDims[idx - numSkipAxis] = getSizeOfDimension(input, idx); |
| 655 | } |
| 656 | } |
Lev Proleev | 7391083 | 2020-05-05 17:26:26 +0100 | [diff] [blame] | 657 | // Handle the case when all dimensions are removed |
| 658 | if (outDims.empty()) { |
| 659 | outDims.push_back(1); |
| 660 | } |
Miao Wang | 15395d6 | 2018-01-21 02:39:41 -0800 | [diff] [blame] | 661 | output->dimensions = outDims; |
| 662 | } |
| 663 | |
| 664 | output->type = input.type; |
| 665 | output->offset = input.offset; |
| 666 | output->scale = input.scale; |
| 667 | |
| 668 | return true; |
| 669 | } |
| 670 | |
Slava Shklyaev | a2c9a10 | 2018-09-17 11:58:40 +0100 | [diff] [blame] | 671 | bool argMinMaxPrepare(const Shape& input, int32_t axis, Shape* output) { |
Slava Shklyaev | e9e0c43 | 2018-10-22 12:04:16 +0100 | [diff] [blame] | 672 | NN_CHECK(handleNegativeAxis(input, &axis)); |
Slava Shklyaev | a2c9a10 | 2018-09-17 11:58:40 +0100 | [diff] [blame] | 673 | |
| 674 | output->type = OperandType::TENSOR_INT32; |
| 675 | |
| 676 | // Copy the input dimensions, omitting the axis dimension. |
| 677 | output->dimensions.clear(); |
Lev Proleev | 7391083 | 2020-05-05 17:26:26 +0100 | [diff] [blame] | 678 | if (getNumberOfDimensions(input) > 1) { |
| 679 | output->dimensions.reserve(getNumberOfDimensions(input) - 1); |
| 680 | output->dimensions.insert(output->dimensions.end(), input.dimensions.begin(), |
| 681 | input.dimensions.begin() + axis); |
| 682 | output->dimensions.insert(output->dimensions.end(), input.dimensions.begin() + axis + 1, |
| 683 | input.dimensions.end()); |
| 684 | } else { |
| 685 | output->dimensions.push_back(1); |
| 686 | } |
Slava Shklyaev | a2c9a10 | 2018-09-17 11:58:40 +0100 | [diff] [blame] | 687 | |
| 688 | return true; |
| 689 | } |
Lev Proleev | dfc2f41 | 2018-09-13 16:17:58 +0100 | [diff] [blame] | 690 | |
| 691 | bool splitPrepare(const Shape& input, int32_t axis, int32_t numOutputs, |
| 692 | std::vector<Shape>* output) { |
Slava Shklyaev | e9e0c43 | 2018-10-22 12:04:16 +0100 | [diff] [blame] | 693 | NN_CHECK(handleNegativeAxis(input, &axis)); |
Lev Proleev | dfc2f41 | 2018-09-13 16:17:58 +0100 | [diff] [blame] | 694 | |
| 695 | const int32_t sizeOfAxisToSplit = input.dimensions[axis]; |
| 696 | NN_OPS_CHECK(sizeOfAxisToSplit % numOutputs == 0); |
| 697 | const int32_t sliceSize = sizeOfAxisToSplit / numOutputs; |
| 698 | |
| 699 | for (int i = 0; i < numOutputs; ++i) { |
| 700 | output->at(i).type = input.type; |
| 701 | output->at(i).dimensions = input.dimensions; |
| 702 | output->at(i).dimensions[axis] = sliceSize; |
| 703 | output->at(i).offset = input.offset; |
| 704 | output->at(i).scale = input.scale; |
| 705 | } |
| 706 | return true; |
| 707 | } |
| 708 | |
Xusong Wang | 5339dc3 | 2018-08-17 15:38:32 -0700 | [diff] [blame] | 709 | bool groupedConvPrepare(const Shape& input, const Shape& filter, const Shape& bias, |
| 710 | int32_t padding_left, int32_t padding_right, int32_t padding_top, |
| 711 | int32_t padding_bottom, int32_t stride_width, int32_t stride_height, |
| 712 | int32_t numGroups, Shape* output) { |
Przemyslaw Szczepaniak | a4e6a65 | 2018-12-28 11:52:32 +0000 | [diff] [blame] | 713 | if (filter.type == OperandType::TENSOR_QUANT8_SYMM_PER_CHANNEL) { |
Lev Proleev | 5976d73 | 2019-12-18 14:50:37 +0000 | [diff] [blame] | 714 | NN_OPS_CHECK(input.type == OperandType::TENSOR_QUANT8_ASYMM || |
| 715 | input.type == OperandType::TENSOR_QUANT8_ASYMM_SIGNED); |
Przemyslaw Szczepaniak | a4e6a65 | 2018-12-28 11:52:32 +0000 | [diff] [blame] | 716 | } else { |
| 717 | NN_OPS_CHECK(input.type == filter.type); |
| 718 | } |
Lev Proleev | 5976d73 | 2019-12-18 14:50:37 +0000 | [diff] [blame] | 719 | if (input.type == OperandType::TENSOR_QUANT8_ASYMM || |
| 720 | input.type == OperandType::TENSOR_QUANT8_ASYMM_SIGNED) { |
Xusong Wang | 5339dc3 | 2018-08-17 15:38:32 -0700 | [diff] [blame] | 721 | NN_OPS_CHECK(bias.type == OperandType::TENSOR_INT32); |
| 722 | } else { |
| 723 | NN_OPS_CHECK(input.type == bias.type); |
| 724 | } |
| 725 | NN_OPS_CHECK(getNumberOfDimensions(input) == 4); |
| 726 | NN_OPS_CHECK(getNumberOfDimensions(filter) == 4); |
| 727 | NN_OPS_CHECK(getNumberOfDimensions(bias) == 1); |
| 728 | |
| 729 | NN_OPS_CHECK(getSizeOfDimension(filter, 0) == getSizeOfDimension(bias, 0)); |
| 730 | |
| 731 | NN_OPS_CHECK(getSizeOfDimension(filter, 3) * numGroups == getSizeOfDimension(input, 3)); |
| 732 | NN_OPS_CHECK(getSizeOfDimension(filter, 0) % numGroups == 0); |
| 733 | |
| 734 | uint32_t channels_out = getSizeOfDimension(filter, 0); |
| 735 | uint32_t width = getSizeOfDimension(input, 2); |
| 736 | uint32_t height = getSizeOfDimension(input, 1); |
| 737 | uint32_t filterWidth = getSizeOfDimension(filter, 2); |
| 738 | uint32_t filterHeight = getSizeOfDimension(filter, 1); |
| 739 | uint32_t batches = getSizeOfDimension(input, 0); |
| 740 | |
Xusong Wang | d0cc11f | 2019-04-12 13:38:49 -0700 | [diff] [blame] | 741 | NN_RET_CHECK_GT(static_cast<int32_t>(filterWidth), padding_left); |
| 742 | NN_RET_CHECK_GT(static_cast<int32_t>(filterWidth), padding_right); |
| 743 | NN_RET_CHECK_GT(static_cast<int32_t>(filterHeight), padding_top); |
| 744 | NN_RET_CHECK_GT(static_cast<int32_t>(filterHeight), padding_bottom); |
Xusong Wang | fa3b942 | 2019-02-27 14:44:14 -0800 | [diff] [blame] | 745 | |
Xusong Wang | 5339dc3 | 2018-08-17 15:38:32 -0700 | [diff] [blame] | 746 | uint32_t outWidth = |
| 747 | computeOutSize(width, filterWidth, stride_width, padding_left, padding_right); |
| 748 | uint32_t outHeight = |
| 749 | computeOutSize(height, filterHeight, stride_height, padding_top, padding_bottom); |
| 750 | |
| 751 | output->type = input.type; |
| 752 | output->dimensions = {batches, outHeight, outWidth, channels_out}; |
| 753 | return true; |
| 754 | } |
Xusong Wang | 4588d3c | 2018-08-20 14:18:15 -0700 | [diff] [blame] | 755 | |
Michael Butler | f20c5b5 | 2019-07-22 18:59:46 -0700 | [diff] [blame] | 756 | } // namespace nn |
| 757 | } // namespace android |