if (src_offset < PAYLOAD_OFFSET) {
                while (bytes >= 4) {
-                       *dst = le32_to_cpu(__raw_readl(src));
+                       *dst = readl_relaxed(src);
                        bytes -= 4;
                        src++;
                        dst++;
         * allocated.
         */
        if (src_offset < PAYLOAD_OFFSET)
-               val = le32_to_cpu(__raw_readl(src));
+               val = readl_relaxed(src);
        else
                val = __raw_readl(src);
 
 
        if (dst_offset < PAYLOAD_OFFSET) {
                while (bytes >= 4) {
-                       __raw_writel(cpu_to_le32(*src), dst);
+                       writel_relaxed(*src, dst);
                        bytes -= 4;
                        src++;
                        dst++;
         */
 
        if (dst_offset < PAYLOAD_OFFSET)
-               __raw_writel(cpu_to_le32(*src), dst);
+               writel_relaxed(*src, dst);
        else
                __raw_writel(*src, dst);
 }