forked from pytorch/FBGEMM
-
Notifications
You must be signed in to change notification settings - Fork 0
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Add support for AVX512-256(YMM) in FBGEMM16 (pytorch#209)
Summary: Pull Request resolved: pytorch#209. Add AVX512-256 support to the FBGEMM operation. This benefits Intel(R) Xeon(R) D processors by letting them run at a higher turbo frequency. Reviewed By: jianyuh. Differential Revision: D18138146. fbshipit-source-id: 7f25247b92e62a058797b2a44ba57b147cb7f5f6
- Loading branch information
1 parent
3839cba
commit 6394aab
Showing
14 changed files
with
3,431 additions
and
1,716 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,35 @@ | ||
/* | ||
* Copyright (c) Facebook, Inc. and its affiliates. | ||
* All rights reserved. | ||
* This source code is licensed under the BSD-style license found in the | ||
* LICENSE file in the root directory of this source tree. | ||
*/ | ||
#pragma once | ||
|
||
#include <array> | ||
#include <fbgemm/Types.h> | ||
#include <fbgemm/Utils.h> | ||
|
||
namespace fbgemm { | ||
// Fixed-size lookup-table type: 121 entries, each a 2x2 array of int. | ||
// NOTE(review): presumably holds one precomputed partitioning entry per | ||
// index value -- confirm against the tables declared with this type. | ||
using partition_array_t = std::array<std::array<std::array<int, 2>, 2>, 121>; | ||
|
||
// Plain aggregate bundling the arguments of one GEMM kernel call; functions | ||
// of type funcptr_t<T> receive a pointer to it. T is the element type of B. | ||
// NOTE(review): the per-field meanings below are inferred from the names and | ||
// the usual BLAS conventions -- confirm against the kernels that read them. | ||
// NOTE(review): generated kernels may depend on this exact field order and | ||
// layout; verify before reordering, resizing or adding members. | ||
template<typename T> | ||
struct GemmParams { | ||
// Presumably the shared (reduction) dimension K -- TODO confirm. | ||
uint64_t k; | ||
// Mutable float pointer; presumably the A operand -- TODO confirm. | ||
float* A; | ||
// Read-only pointer to elements of type T; presumably the B operand. | ||
const T* B; | ||
// Presumably the scale applied to the existing contents of C -- TODO confirm. | ||
float beta; | ||
// Mutable float pointer; presumably the output matrix C. | ||
float* C; | ||
// Presumably the leading dimension (row stride) of C; units not visible here. | ||
uint64_t ldc; | ||
// Presumably the number of column blocks of B to process -- TODO confirm. | ||
uint64_t b_block_cols; | ||
// Presumably the size of one block of B; units not visible here. | ||
uint64_t b_block_size; | ||
}; | ||
|
||
// Pointer to a function that takes a GemmParams<T>* and returns nothing. | ||
// NOTE(review): presumably the entry-point signature shared by the GEMM | ||
// kernels for element type T -- confirm against the call sites. | ||
template<typename T> | ||
using funcptr_t = void(*)(GemmParams<T>*); | ||
|
||
// Short element-type names. float16 is not declared in this header; | ||
// presumably it comes from <fbgemm/Types.h> -- confirm. | ||
using fp16 = float16; | ||
using fp32 = float; | ||
// GemmParams instantiated with fp16 as the B element type. | ||
using GemmParamsFP16 = GemmParams<fp16>; | ||
|
||
} |
Oops, something went wrong.