serge-sans-paille · serge-sans-paille · Dec 14, 2021 · Dec 8, 2021 · Dec 12, 2021 · Dec 6, 2021
diff --git a/Changelog b/Changelog
@@ -1,3 +1,18 @@
+2021-12-08 Serge Guelton <serge.guelton@telecom-bretagne.eu>
+
+	* Upgrade xsimd version to 8.0.5
+
+	* Performance fix on np.dot with transposed parameters
+
+	* Raise an error when no specs are given and we want to generate a native module
+
+	* Support more complex transpose expressions
+
+	* Honor quotes in config files for *FLAGS
+
+	* Add pythran option -ftime-report to print out the time spent on optimizations
+	* Support isinstance when second argument is a tuple
+
 2021-09-08 Serge Guelton <serge.guelton@telecom-bretagne.eu>
 
 	* Fix performance issue with assert handling

diff --git a/docs/CLI.rst b/docs/CLI.rst
@@ -29,7 +29,7 @@ The generated native ``.so`` module can then be used with the Python interpreter
 Pythran version can be dumped through ``--version``::
 
   $> pythran --version 2>&1
-  0.11.0.dev0
+  0.11.0
 
 The module-level ``__pythran__`` variable indicates that the module loaded has been pythranized::
 

diff --git a/pythran/pythonic/include/numpy/conjugate.hpp b/pythran/pythonic/include/numpy/conjugate.hpp
@@ -7,6 +7,16 @@
 
 #include <xsimd/xsimd.hpp>
 
+// Inject an extra symbol into the xsimd namespace until that's fixed upstream
+#if XSIMD_VERSION_MAJOR < 8 ||                                                 \
+    (XSIMD_VERSION_MAJOR == 8 && XSIMD_VERSION_MINOR == 0 &&                   \
+     XSIMD_VERSION_PATCH <= 5)
+namespace xsimd
+{
+  using std::conj;
+}
+#endif
+
 PYTHONIC_NS_BEGIN
 
 namespace numpy

diff --git a/pythran/version.py b/pythran/version.py
@@ -1,3 +1,3 @@
-__version__ = '0.11.0.dev0'
+__version__ = '0.11.0'
 __url__ = 'https://github.com/serge-sans-paille/pythran'
 __descr__ = 'Ahead of Time compiler for numeric kernels'
diff --git a/third_party/xsimd/arch/generic/xsimd_generic_arithmetic.hpp b/third_party/xsimd/arch/generic/xsimd_generic_arithmetic.hpp
@@ -1,13 +1,13 @@
 /***************************************************************************
-* Copyright (c) Johan Mabille, Sylvain Corlay, Wolf Vollprecht and         *
-* Martin Renou                                                             *
-* Copyright (c) QuantStack                                                 *
-* Copyright (c) Serge Guelton                                              *
-*                                                                          *
-* Distributed under the terms of the BSD 3-Clause License.                 *
-*                                                                          *
-* The full license is in the file LICENSE, distributed with this software. *
-****************************************************************************/
+ * Copyright (c) Johan Mabille, Sylvain Corlay, Wolf Vollprecht and         *
+ * Martin Renou                                                             *
+ * Copyright (c) QuantStack                                                 *
+ * Copyright (c) Serge Guelton                                              *
+ *                                                                          *
+ * Distributed under the terms of the BSD 3-Clause License.                 *
+ *                                                                          *
+ * The full license is in the file LICENSE, distributed with this software. *
+ ****************************************************************************/
 
 #ifndef XSIMD_GENERIC_ARITHMETIC_HPP
 #define XSIMD_GENERIC_ARITHMETIC_HPP
@@ -17,85 +17,112 @@
 
 #include "./xsimd_generic_details.hpp"
 
-namespace xsimd {
+namespace xsimd
+{
+
+    namespace kernel
+    {
+
+        using namespace types;
+
+        // bitwise_lshift
+        template <class A, class T, class /*=typename std::enable_if<std::is_integral<T>::value, void>::type*/>
+        inline batch<T, A> bitwise_lshift(batch<T, A> const& self, batch<T, A> const& other, requires_arch<generic>) noexcept
+        {
+            return detail::apply([](T x, T y) noexcept
+                                 { return x << y; },
+                                 self, other);
+        }
+
+        // bitwise_rshift
+        template <class A, class T, class /*=typename std::enable_if<std::is_integral<T>::value, void>::type*/>
+        inline batch<T, A> bitwise_rshift(batch<T, A> const& self, batch<T, A> const& other, requires_arch<generic>) noexcept
+        {
+            return detail::apply([](T x, T y) noexcept
+                                 { return x >> y; },
+                                 self, other);
+        }
+
+        // div
+        template <class A, class T, class = typename std::enable_if<std::is_integral<T>::value, void>::type>
+        inline batch<T, A> div(batch<T, A> const& self, batch<T, A> const& other, requires_arch<generic>) noexcept
+        {
+            return detail::apply([](T x, T y) noexcept -> T
+                                 { return x / y; },
+                                 self, other);
+        }
+
+        // fma
+        template <class A, class T>
+        inline batch<T, A> fma(batch<T, A> const& x, batch<T, A> const& y, batch<T, A> const& z, requires_arch<generic>) noexcept
+        {
+            return x * y + z;
+        }
+
+        template <class A, class T>
+        inline batch<std::complex<T>, A> fma(batch<std::complex<T>, A> const& x, batch<std::complex<T>, A> const& y, batch<std::complex<T>, A> const& z, requires_arch<generic>) noexcept
+        {
+            auto res_r = fms(x.real(), y.real(), fms(x.imag(), y.imag(), z.real()));
+            auto res_i = fma(x.real(), y.imag(), fma(x.imag(), y.real(), z.imag()));
+            return { res_r, res_i };
+        }
+
+        // fms
+        template <class A, class T>
+        inline batch<T, A> fms(batch<T, A> const& x, batch<T, A> const& y, batch<T, A> const& z, requires_arch<generic>) noexcept
+        {
+            return x * y - z;
+        }
+
+        template <class A, class T>
+        inline batch<std::complex<T>, A> fms(batch<std::complex<T>, A> const& x, batch<std::complex<T>, A> const& y, batch<std::complex<T>, A> const& z, requires_arch<generic>) noexcept
+        {
+            auto res_r = fms(x.real(), y.real(), fma(x.imag(), y.imag(), z.real()));
+            auto res_i = fma(x.real(), y.imag(), fms(x.imag(), y.real(), z.imag()));
+            return { res_r, res_i };
+        }
+
+        // fnma
+        template <class A, class T>
+        inline batch<T, A> fnma(batch<T, A> const& x, batch<T, A> const& y, batch<T, A> const& z, requires_arch<generic>) noexcept
+        {
+            return -x * y + z;
+        }
+
+        template <class A, class T>
+        inline batch<std::complex<T>, A> fnma(batch<std::complex<T>, A> const& x, batch<std::complex<T>, A> const& y, batch<std::complex<T>, A> const& z, requires_arch<generic>) noexcept
+        {
+            auto res_r = -fms(x.real(), y.real(), fma(x.imag(), y.imag(), z.real()));
+            auto res_i = -fma(x.real(), y.imag(), fms(x.imag(), y.real(), z.imag()));
+            return { res_r, res_i };
+        }
+
+        // fnms
+        template <class A, class T>
+        inline batch<T, A> fnms(batch<T, A> const& x, batch<T, A> const& y, batch<T, A> const& z, requires_arch<generic>) noexcept
+        {
+            return -x * y - z;
+        }
+
+        template <class A, class T>
+        inline batch<std::complex<T>, A> fnms(batch<std::complex<T>, A> const& x, batch<std::complex<T>, A> const& y, batch<std::complex<T>, A> const& z, requires_arch<generic>) noexcept
+        {
+            auto res_r = -fms(x.real(), y.real(), fms(x.imag(), y.imag(), z.real()));
+            auto res_i = -fma(x.real(), y.imag(), fma(x.imag(), y.real(), z.imag()));
+            return { res_r, res_i };
+        }
+
+        // mul
+        template <class A, class T, class /*=typename std::enable_if<std::is_integral<T>::value, void>::type*/>
+        inline batch<T, A> mul(batch<T, A> const& self, batch<T, A> const& other, requires_arch<generic>) noexcept
+        {
+            return detail::apply([](T x, T y) noexcept -> T
+                                 { return x * y; },
+                                 self, other);
+        }
 
-  namespace kernel {
-
-    using namespace types;
-
-    // bitwise_lshift
-    template<class A, class T, class/*=typename std::enable_if<std::is_integral<T>::value, void>::type*/>
-    batch<T, A> bitwise_lshift(batch<T, A> const& self, batch<T, A> const& other, requires_arch<generic>) {
-      return detail::apply([](T x, T y) { return x << y;}, self, other);
-    }
-
-    // bitwise_rshift
-    template<class A, class T, class/*=typename std::enable_if<std::is_integral<T>::value, void>::type*/>
-    batch<T, A> bitwise_rshift(batch<T, A> const& self, batch<T, A> const& other, requires_arch<generic>) {
-      return detail::apply([](T x, T y) { return x >> y;}, self, other);
-    }
-
-    // div
-    template<class A, class T, class=typename std::enable_if<std::is_integral<T>::value, void>::type>
-    batch<T, A> div(batch<T, A> const& self, batch<T, A> const& other, requires_arch<generic>) {
-      return detail::apply([](T x, T y) -> T { return x / y;}, self, other);
-    }
-
-    // fma
-    template<class A, class T> batch<T, A> fma(batch<T, A> const& x, batch<T, A> const& y, batch<T, A> const& z, requires_arch<generic>) {
-      return x * y + z;
-    }
-
-    template<class A, class T> batch<std::complex<T>, A> fma(batch<std::complex<T>, A> const& x, batch<std::complex<T>, A> const& y, batch<std::complex<T>, A> const& z, requires_arch<generic>) {
-      auto res_r = fms(x.real(), y.real(), fms(x.imag(), y.imag(), z.real()));
-      auto res_i = fma(x.real(), y.imag(), fma(x.imag(), y.real(), z.imag()));
-      return {res_r, res_i};
-    }
-
-    // fms
-    template<class A, class T> batch<T, A> fms(batch<T, A> const& x, batch<T, A> const& y, batch<T, A> const& z, requires_arch<generic>) {
-      return x * y - z;
-    }
-
-    template<class A, class T> batch<std::complex<T>, A> fms(batch<std::complex<T>, A> const& x, batch<std::complex<T>, A> const& y, batch<std::complex<T>, A> const& z, requires_arch<generic>) {
-      auto res_r = fms(x.real(), y.real(), fma(x.imag(), y.imag(), z.real()));
-      auto res_i = fma(x.real(), y.imag(), fms(x.imag(), y.real(), z.imag()));
-      return {res_r, res_i};
     }
 
-    // fnma
-    template<class A, class T> batch<T, A> fnma(batch<T, A> const& x, batch<T, A> const& y, batch<T, A> const& z, requires_arch<generic>) {
-      return -x * y + z;
-    }
-
-    template<class A, class T> batch<std::complex<T>, A> fnma(batch<std::complex<T>, A> const& x, batch<std::complex<T>, A> const& y, batch<std::complex<T>, A> const& z, requires_arch<generic>) {
-      auto res_r = - fms(x.real(), y.real(), fma(x.imag(), y.imag(), z.real()));
-      auto res_i = - fma(x.real(), y.imag(), fms(x.imag(), y.real(), z.imag()));
-      return {res_r, res_i};
-    }
-
-    // fnms
-    template<class A, class T> batch<T, A> fnms(batch<T, A> const& x, batch<T, A> const& y, batch<T, A> const& z, requires_arch<generic>) {
-      return -x * y - z;
-    }
-
-    template<class A, class T> batch<std::complex<T>, A> fnms(batch<std::complex<T>, A> const& x, batch<std::complex<T>, A> const& y, batch<std::complex<T>, A> const& z, requires_arch<generic>) {
-      auto res_r = - fms(x.real(), y.real(), fms(x.imag(), y.imag(), z.real()));
-      auto res_i = - fma(x.real(), y.imag(), fma(x.imag(), y.real(), z.imag()));
-      return {res_r, res_i};
-    }
-
-
-
-    // mul
-    template<class A, class T, class/*=typename std::enable_if<std::is_integral<T>::value, void>::type*/>
-    batch<T, A> mul(batch<T, A> const& self, batch<T, A> const& other, requires_arch<generic>) {
-      return detail::apply([](T x, T y) -> T { return x * y;}, self, other);
-    }
-
-  }
-
 }
 
 #endif
-