core: fix missing vec_cvfo on POWER9 due to unavailable VSX float64 conversion

hillwoodroc · hillwoodroc · commit f7b67b85d494 · 2025-08-06T22:39:17.000+08:00
Some POWER9 systems fail to build downstream projects (e.g. ncnn) due to
undefined references to `vec_cvfo`. This happens because POWER9 does not
support the VSX float64 conversion instructions introduced in POWER10.

This patch introduces a scalar fallback for `vec_cvfo` that is selected when
both `__PPC64__` and `__power9__` are defined. All other targets (including
POWER10, x86, ARM) keep using the existing `vec_floate`/`vec_doubleo` redirects.

Fixes: undefined symbol vec_cvfo on POWER9 with OpenCV 4.12.0

Tested on:
- POWER9 (fallback used, links correctly)
- POWER10 and x86 (optimized path used as expected)
diff --git a/modules/core/include/opencv2/core/vsx_utils.hpp b/modules/core/include/opencv2/core/vsx_utils.hpp
@@ -5,6 +5,12 @@
 #ifndef OPENCV_HAL_VSX_UTILS_HPP
 #define OPENCV_HAL_VSX_UTILS_HPP
 
+#if !defined(__PPC64__) || !defined(__power9__)  // everything except 64-bit PowerPC builds that define __power9__
+#define CV_VSX_HAS_FLOAT64_CONVERT 1  // vec_cvfo is redirected to vec_floate / vec_doubleo
+#else  // NOTE(review): confirm the toolchain really predefines __power9__; GCC/Clang document _ARCH_PWR9
+#define CV_VSX_HAS_FLOAT64_CONVERT 0  // vec_cvfo is provided by the scalar fallback instead
+#endif
+
 #include "opencv2/core/cvdef.h"
 
 #ifndef SKIP_INCLUDES
@@ -257,8 +263,27 @@ VSX_IMPL_1VRG(vec_udword2, vec_udword2, vpopcntd, vec_popcntu)
 VSX_IMPL_1VRG(vec_udword2, vec_dword2,  vpopcntd, vec_popcntu)
 
 // converts between single and double-precision
-VSX_REDIRECT_1RG(vec_float4,  vec_double2, vec_cvfo, vec_floate)
-VSX_REDIRECT_1RG(vec_double2, vec_float4,  vec_cvfo, vec_doubleo)
+
+#if CV_VSX_HAS_FLOAT64_CONVERT
+//  Use the VSX double<->float conversion built-ins (if supported by the architecture)
+    VSX_REDIRECT_1RG(vec_float4,  vec_double2, vec_cvfo, vec_floate)
+    VSX_REDIRECT_1RG(vec_double2, vec_float4,  vec_cvfo, vec_doubleo)
+#else
+//  Scalar fallback; lane layout mirrors vec_floate / vec_doubleo above, not a packed 0..1 layout.
+//  double -> float: results belong in even lanes 0/2; they are also copied to lanes 1/3, which vec_floate leaves undefined.
+    static inline vec_float4 vec_cvfo(const vec_double2& a)
+    {
+        const float r0 = static_cast<float>(reinterpret_cast<const double*>(&a)[0]);
+        const float r1 = static_cast<float>(reinterpret_cast<const double*>(&a)[1]);
+        return (vec_float4){r0, r0, r1, r1};
+    }
+//  float -> double: vec_doubleo converts the odd input lanes (1 and 3), so read those rather than lanes 0 and 1.
+    static inline vec_double2 vec_cvfo(const vec_float4& a)
+    {
+        const float* lanes = reinterpret_cast<const float*>(&a);
+        return (vec_double2){static_cast<double>(lanes[1]), static_cast<double>(lanes[3])};
+    }
+#endif
 
 // converts word and doubleword to double-precision
 #undef vec_ctd