Skip to content

Commit

Permalink
+add AMX-BF16 optimizations of class SynetDeconvolution16bNhwcGemm.
Browse files Browse the repository at this point in the history
  • Loading branch information
ermig1979 committed Sep 12, 2024
1 parent 0f893d4 commit d7d69b1
Show file tree
Hide file tree
Showing 11 changed files with 500 additions and 10 deletions.
2 changes: 1 addition & 1 deletion docs/2024.html
Original file line number Diff line number Diff line change
Expand Up @@ -40,7 +40,7 @@ <h4>Algorithms</h4>
<h5>New features</h5>
<ul>
<li>Base implementation of class SynetDeconvolution16bGemm.</li>
<li>Base implementation, SSE4.1, AVX2, AVX-512BW optimizations of class SynetDeconvolution16bNhwcGemm.</li>
<li>Base implementation, SSE4.1, AVX2, AVX-512BW, AMX-BF16 optimizations of class SynetDeconvolution16bNhwcGemm.</li>
</ul>

<h4>Test framework</h4>
Expand Down
3 changes: 3 additions & 0 deletions prj/vs2019/AmxBf16.vcxproj
Original file line number Diff line number Diff line change
Expand Up @@ -52,6 +52,7 @@
<ClInclude Include="..\..\src\Simd\SimdSynetConvolution8i.h" />
<ClInclude Include="..\..\src\Simd\SimdSynetConvolution8iCommon.h" />
<ClInclude Include="..\..\src\Simd\SimdSynetConvParam.h" />
<ClInclude Include="..\..\src\Simd\SimdSynetDeconvolution16b.h" />
<ClInclude Include="..\..\src\Simd\SimdSynetInnerProduct16b.h" />
<ClInclude Include="..\..\src\Simd\SimdSynetMergedConvolution16b.h" />
<ClInclude Include="..\..\src\Simd\SimdSynetMergedConvolution32f.h" />
Expand All @@ -78,6 +79,8 @@
<ClCompile Include="..\..\src\Simd\SimdAmxBf16SynetConvolution8iDirect.cpp" />
<ClCompile Include="..\..\src\Simd\SimdAmxBf16SynetConvolution8iDirect1x1.cpp" />
<ClCompile Include="..\..\src\Simd\SimdAmxBf16SynetConvolution8iDirectAny.cpp" />
<ClCompile Include="..\..\src\Simd\SimdAmxBf16SynetDeconvolution16b.cpp" />
<ClCompile Include="..\..\src\Simd\SimdAmxBf16SynetDeconvolution16bNhwcGemm.cpp" />
<ClCompile Include="..\..\src\Simd\SimdAmxBf16SynetInnerProduct16b.cpp" />
<ClCompile Include="..\..\src\Simd\SimdAmxBf16SynetInnerProduct16bGemmNN.cpp" />
<ClCompile Include="..\..\src\Simd\SimdAmxBf16SynetMergedConvolution16b.cpp" />
Expand Down
9 changes: 9 additions & 0 deletions prj/vs2019/AmxBf16.vcxproj.filters
Original file line number Diff line number Diff line change
Expand Up @@ -154,6 +154,9 @@
<ClInclude Include="..\..\src\Simd\SimdSynetActivation.h">
<Filter>Inc</Filter>
</ClInclude>
<ClInclude Include="..\..\src\Simd\SimdSynetDeconvolution16b.h">
<Filter>Inc</Filter>
</ClInclude>
</ItemGroup>
<ItemGroup>
<Filter Include="AmxBf16">
Expand Down Expand Up @@ -248,5 +251,11 @@
<ClCompile Include="..\..\src\Simd\SimdAmxBf16SynetConvolution16bNchwGemm.cpp">
<Filter>AmxBf16</Filter>
</ClCompile>
<ClCompile Include="..\..\src\Simd\SimdAmxBf16SynetDeconvolution16bNhwcGemm.cpp">
<Filter>AmxBf16</Filter>
</ClCompile>
<ClCompile Include="..\..\src\Simd\SimdAmxBf16SynetDeconvolution16b.cpp">
<Filter>AmxBf16</Filter>
</ClCompile>
</ItemGroup>
</Project>
3 changes: 3 additions & 0 deletions prj/vs2022/AmxBf16.vcxproj
Original file line number Diff line number Diff line change
Expand Up @@ -52,6 +52,7 @@
<ClInclude Include="..\..\src\Simd\SimdSynetConvolution8i.h" />
<ClInclude Include="..\..\src\Simd\SimdSynetConvolution8iCommon.h" />
<ClInclude Include="..\..\src\Simd\SimdSynetConvParam.h" />
<ClInclude Include="..\..\src\Simd\SimdSynetDeconvolution16b.h" />
<ClInclude Include="..\..\src\Simd\SimdSynetInnerProduct16b.h" />
<ClInclude Include="..\..\src\Simd\SimdSynetMergedConvolution16b.h" />
<ClInclude Include="..\..\src\Simd\SimdSynetMergedConvolution32f.h" />
Expand All @@ -78,6 +79,8 @@
<ClCompile Include="..\..\src\Simd\SimdAmxBf16SynetConvolution8iDirect.cpp" />
<ClCompile Include="..\..\src\Simd\SimdAmxBf16SynetConvolution8iDirect1x1.cpp" />
<ClCompile Include="..\..\src\Simd\SimdAmxBf16SynetConvolution8iDirectAny.cpp" />
<ClCompile Include="..\..\src\Simd\SimdAmxBf16SynetDeconvolution16b.cpp" />
<ClCompile Include="..\..\src\Simd\SimdAmxBf16SynetDeconvolution16bNhwcGemm.cpp" />
<ClCompile Include="..\..\src\Simd\SimdAmxBf16SynetInnerProduct16b.cpp" />
<ClCompile Include="..\..\src\Simd\SimdAmxBf16SynetInnerProduct16bGemmNN.cpp" />
<ClCompile Include="..\..\src\Simd\SimdAmxBf16SynetMergedConvolution16b.cpp" />
Expand Down
9 changes: 9 additions & 0 deletions prj/vs2022/AmxBf16.vcxproj.filters
Original file line number Diff line number Diff line change
Expand Up @@ -154,6 +154,9 @@
<ClInclude Include="..\..\src\Simd\SimdSynetActivation.h">
<Filter>Inc</Filter>
</ClInclude>
<ClInclude Include="..\..\src\Simd\SimdSynetDeconvolution16b.h">
<Filter>Inc</Filter>
</ClInclude>
</ItemGroup>
<ItemGroup>
<Filter Include="AmxBf16">
Expand Down Expand Up @@ -248,5 +251,11 @@
<ClCompile Include="..\..\src\Simd\SimdAmxBf16SynetConvolution16bNchwGemm.cpp">
<Filter>AmxBf16</Filter>
</ClCompile>
<ClCompile Include="..\..\src\Simd\SimdAmxBf16SynetDeconvolution16bNhwcGemm.cpp">
<Filter>AmxBf16</Filter>
</ClCompile>
<ClCompile Include="..\..\src\Simd\SimdAmxBf16SynetDeconvolution16b.cpp">
<Filter>AmxBf16</Filter>
</ClCompile>
</ItemGroup>
</Project>
42 changes: 42 additions & 0 deletions src/Simd/SimdAmxBf16SynetDeconvolution16b.cpp
Original file line number Diff line number Diff line change
@@ -0,0 +1,42 @@
/*
* Simd Library (http://ermig1979.github.io/Simd).
*
* Copyright (c) 2011-2024 Yermalayeu Ihar.
*
* Permission is hereby granted, free of charge, to any person obtaining a copy
* of this software and associated documentation files (the "Software"), to deal
* in the Software without restriction, including without limitation the rights
* to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
* copies of the Software, and to permit persons to whom the Software is
* furnished to do so, subject to the following conditions:
*
* The above copyright notice and this permission notice shall be included in
* all copies or substantial portions of the Software.
*
* THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
* IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
* FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
* AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
* LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
* OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
* SOFTWARE.
*/
#include "Simd/SimdSynetDeconvolution16b.h"

namespace Simd
{
#if (defined(SIMD_AMXBF16_ENABLE) || (defined(SIMD_AVX512BW_ENABLE) && defined(SIMD_AMX_EMULATE)))
namespace AmxBf16
{
// Factory for the 16-bit deconvolution context on the AMX-BF16 code path.
//
// Builds a DeconvParam from (batch, conv, compatibility) and checks it with
// Valid(SimdTensorData32f, SimdTensorData16b). When the check fails, NULL is
// returned. Otherwise the NHWC GEMM implementation of this namespace is chosen
// if it reports itself as preferable for the parameters; the Base GEMM
// implementation is the fallback.
//
// The returned object is allocated with `new` and handed back as an opaque
// pointer. NOTE(review): the caller presumably has to release it through the
// library's matching release routine - confirm against the public API.
void* SynetDeconvolution16bInit(size_t batch, const SimdConvolutionParameters* conv, SimdSynetCompatibilityType compatibility)
{
    DeconvParam param(batch, conv, compatibility);
    if (param.Valid(SimdTensorData32f, SimdTensorData16b))
    {
        // Prefer the AMX-BF16 NHWC GEMM kernel; fall back to the generic one.
        if (SynetDeconvolution16bNhwcGemm::Preferable(param))
        {
            return new AmxBf16::SynetDeconvolution16bNhwcGemm(param);
        }
        else
        {
            return new Base::SynetDeconvolution16bGemm(param);
        }
    }
    // Unsupported parameter combination.
    return NULL;
}
}
#endif
}
Loading

0 comments on commit d7d69b1

Please sign in to comment.