forked from pytorch/FBGEMM
-
Notifications
You must be signed in to change notification settings - Fork 0
/
spmmUtilsAvx2.h
36 lines (34 loc) · 1.06 KB
/
spmmUtilsAvx2.h
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
/*
* Copyright (c) Meta Platforms, Inc. and affiliates.
* All rights reserved.
* This source code is licensed under the BSD-style license found in the
* LICENSE file in the root directory of this source tree.
*/
#pragma once
#include <cstdint>
#include "./FbgemmBuild.h"
#include "fbgemm/UtilsAvx2.h"
namespace fbgemm {
/**
 * @brief Parameter bundle taken (by const reference) by trRequantizeOpt.
 *
 * Plain aggregate of scalar quantization parameters and raw pointers to
 * read-only arrays. This header does not show who owns the pointed-to data
 * or how long each array must be — presumably the caller owns them and they
 * must outlive the call (TODO confirm against the definition/callers).
 */
struct FBGEMM_API trRequantizationParams_t {
std::int32_t act_zero_point; // activation zero point
// Presumably one entry or several depending on the quantization
// granularity — TODO confirm the expected length.
const std::int32_t* weight_zero_points; // weight zero point(s)
// Presumably the zero point of the requantized output C — TODO confirm.
std::int32_t C_zero_point;
// Presumably the scale of the requantized output C — TODO confirm.
// NOTE(review): this is the only const-qualified data member; it makes the
// implicit copy-assignment operator deleted and forces the value to be
// supplied at initialization. Confirm this is intentional.
const float C_scale;
// Names suggest precomputed per-row weight offsets and per-column
// activation offsets; exact semantics are not visible here — verify.
const std::int32_t* weight_row_offsets;
const std::int32_t* act_col_offsets;
// Presumably only read when the HAS_BIAS template flag is set — confirm.
const float* bias;
// Presumably the product of activation scale and weight scale(s) — confirm.
const float* act_times_w_scale;
};
/**
 * @brief Requantization routine that reads 32-bit integer input and writes
 *        8-bit unsigned output, configured by compile-time flags.
 *
 * Only the declaration lives in this header; the definition is not visible
 * here, so the notes below marked "presumably" should be confirmed against
 * the implementation.
 *
 * @tparam FUSE_RELU        Name suggests a ReLU is fused into the
 *                          requantization — TODO confirm.
 * @tparam ACT_SYMMETRIC    Whether the activation matrix is symmetric.
 * @tparam WEIGHT_SYMMETRIC Whether the weight matrix is symmetric.
 * @tparam HAS_BIAS         Presumably whether rParams.bias is applied.
 * @tparam Q_GRAN           Quantization granularity selector.
 *
 * @param out     Destination buffer of 8-bit unsigned values.
 * @param inp     Read-only source buffer of 32-bit signed values.
 * @param block   Block descriptor; presumably the sub-region of the matrix
 *                to process — verify against block_type_t.
 * @param ld_out  Presumably the leading dimension (row stride, in elements)
 *                of @p out — TODO confirm.
 * @param ld_in   Presumably the leading dimension (row stride, in elements)
 *                of @p inp — TODO confirm.
 * @param rParams Zero points, scales, offsets and bias used for
 *                requantization (see trRequantizationParams_t).
 */
template <
    bool FUSE_RELU,
    bool ACT_SYMMETRIC, // whether activation matrix is symmetric
    bool WEIGHT_SYMMETRIC, // whether weight matrix is symmetric
    bool HAS_BIAS,
    QuantizationGranularity Q_GRAN>
FBGEMM_API void trRequantizeOpt(
    // Fixed-width types are std::-qualified to match the struct above;
    // they name the same types, so the signature is unchanged.
    std::uint8_t* out,
    const std::int32_t* inp,
    const block_type_t& block,
    int ld_out,
    int ld_in,
    const trRequantizationParams_t& rParams);
} // namespace fbgemm