spinlock_t lock;
 
        void __iomem *base;
+       struct spi_engine_message_state msg_state;
        struct completion msg_complete;
        unsigned int int_enable;
 };
        return IRQ_HANDLED;
 }
 
-static int spi_engine_prepare_message(struct spi_controller *host,
-                                     struct spi_message *msg)
+static int spi_engine_optimize_message(struct spi_message *msg)
 {
        struct spi_engine_program p_dry, *p;
-       struct spi_engine_message_state *st;
        size_t size;
 
-       st = kzalloc(sizeof(*st), GFP_KERNEL);
-       if (!st)
-               return -ENOMEM;
-
        spi_engine_precompile_message(msg);
 
        p_dry.length = 0;
 
        size = sizeof(*p->instructions) * (p_dry.length + 1);
        p = kzalloc(sizeof(*p) + size, GFP_KERNEL);
-       if (!p) {
-               kfree(st);
+       if (!p)
                return -ENOMEM;
-       }
 
        spi_engine_compile_message(msg, false, p);
 
        spi_engine_program_add_cmd(p, false, SPI_ENGINE_CMD_SYNC(
                                                AXI_SPI_ENGINE_CUR_MSG_SYNC_ID));
 
-       st->p = p;
-       st->cmd_buf = p->instructions;
-       st->cmd_length = p->length;
-       msg->state = st;
+       msg->opt_state = p;
 
        return 0;
 }
 
-static int spi_engine_unprepare_message(struct spi_controller *host,
-                                       struct spi_message *msg)
+static int spi_engine_unoptimize_message(struct spi_message *msg)
 {
-       struct spi_engine_message_state *st = msg->state;
-
-       kfree(st->p);
-       kfree(st);
+       kfree(msg->opt_state);
 
        return 0;
 }
        struct spi_message *msg)
 {
        struct spi_engine *spi_engine = spi_controller_get_devdata(host);
-       struct spi_engine_message_state *st = msg->state;
+       struct spi_engine_message_state *st = &spi_engine->msg_state;
+       struct spi_engine_program *p = msg->opt_state;
        unsigned int int_enable = 0;
        unsigned long flags;
 
+       /* reinitialize message state for this transfer */
+       memset(st, 0, sizeof(*st));
+       st->p = p;
+       st->cmd_buf = p->instructions;
+       st->cmd_length = p->length;
+       msg->state = st;
+
        reinit_completion(&spi_engine->msg_complete);
 
        spin_lock_irqsave(&spi_engine->lock, flags);
        host->bits_per_word_mask = SPI_BPW_RANGE_MASK(1, 32);
        host->max_speed_hz = clk_get_rate(spi_engine->ref_clk) / 2;
        host->transfer_one_message = spi_engine_transfer_one_message;
-       host->prepare_message = spi_engine_prepare_message;
-       host->unprepare_message = spi_engine_unprepare_message;
+       host->optimize_message = spi_engine_optimize_message;
+       host->unoptimize_message = spi_engine_unoptimize_message;
        host->num_chipselect = 8;
 
        if (host->max_speed_hz == 0)