We read every piece of feedback, and take your input very seriously.
To see all available qualifiers, see our documentation.
There was an error while loading. Please reload this page.
1 parent 623de33 commit 93091ba Copy full SHA for 93091ba
modules/dnn/src/layers/layers_common.avx2.cpp
@@ -50,6 +50,8 @@
50
namespace cv {
51
namespace dnn {
52
53
+#define _mm256_load_ps _mm256_loadu_ps // "weights" in fastConv_avx2 is not always aligned to 32 bytes, so every _mm256_load_ps written after this line expands to the unaligned-load intrinsic _mm256_loadu_ps
54
+
55
void fastConv_avx2( const float* weights, size_t wstep, const float* bias,
56
const float* rowbuf, float* output, const int* outShape,
57
int blockSize, int vecsize, int vecsize_aligned,
0 commit comments