struct netdev_rx_queue *rxqueue;
                struct rps_dev_flow_table *flow_table;
                struct rps_dev_flow *old_rflow;
-               u32 flow_id;
+               u32 flow_id, head;
                u16 rxq_index;
                int rc;
 
                        old_rflow->filter = RPS_NO_FILTER;
        out:
 #endif
-               rflow->last_qtail =
-                       READ_ONCE(per_cpu(softnet_data, next_cpu).input_queue_head);
+               head = READ_ONCE(per_cpu(softnet_data, next_cpu).input_queue_head);
+               rps_input_queue_tail_save(&rflow->last_qtail, head);
        }
 
        rflow->cpu = next_cpu;
                if (unlikely(tcpu != next_cpu) &&
                    (tcpu >= nr_cpu_ids || !cpu_online(tcpu) ||
                     ((int)(READ_ONCE(per_cpu(softnet_data, tcpu).input_queue_head) -
-                     READ_ONCE(rflow->last_qtail))) >= 0)) {
+                     rflow->last_qtail)) >= 0)) {
                        tcpu = next_cpu;
                        rflow = set_rps_cpu(dev, skb, rflow, next_cpu);
                }