u8 enable_dma;
        u8 bits_per_word;       /* 8 or 16 */
        u8 cs_change_per_word;
-       u8 cs_chg_udelay;
+       u16 cs_chg_udelay;      /* Some devices require > 255usec delay */
        void (*write) (struct driver_data *);
        void (*read) (struct driver_data *);
        void (*duplex) (struct driver_data *);
        flag |= (chip->flag << 8);
 
        write_FLAG(drv_data, flag);
+
+       /* Move delay here for consistency */
+       if (chip->cs_chg_udelay)
+               udelay(chip->cs_chg_udelay);
 }
 
 #define MAX_SPI_SSEL   7
                write_TDBR(drv_data, (*(u8 *) (drv_data->tx)));
                while (read_STAT(drv_data) & BIT_STAT_TXS)
                        continue;
+
                cs_deactive(drv_data, chip);
 
-               if (chip->cs_chg_udelay)
-                       udelay(chip->cs_chg_udelay);
                ++drv_data->tx;
        }
 }
        while (drv_data->rx < drv_data->rx_end - 1) {
                cs_deactive(drv_data, chip);
 
-               if (chip->cs_chg_udelay)
-                       udelay(chip->cs_chg_udelay);
-
                while (!(read_STAT(drv_data) & BIT_STAT_RXS))
                        continue;
                cs_active(drv_data, chip);
                while (!(read_STAT(drv_data) & BIT_STAT_RXS))
                        continue;
                *(u8 *) (drv_data->rx) = read_RDBR(drv_data);
+
                cs_deactive(drv_data, chip);
 
-               if (chip->cs_chg_udelay)
-                       udelay(chip->cs_chg_udelay);
                ++drv_data->rx;
                ++drv_data->tx;
        }
                write_TDBR(drv_data, (*(u16 *) (drv_data->tx)));
                while ((read_STAT(drv_data) & BIT_STAT_TXS))
                        continue;
+
                cs_deactive(drv_data, chip);
 
-               if (chip->cs_chg_udelay)
-                       udelay(chip->cs_chg_udelay);
                drv_data->tx += 2;
        }
 }
        while (drv_data->rx < drv_data->rx_end - 2) {
                cs_deactive(drv_data, chip);
 
-               if (chip->cs_chg_udelay)
-                       udelay(chip->cs_chg_udelay);
-
                while (!(read_STAT(drv_data) & BIT_STAT_RXS))
                        continue;
                cs_active(drv_data, chip);
                while (!(read_STAT(drv_data) & BIT_STAT_RXS))
                        continue;
                *(u16 *) (drv_data->rx) = read_RDBR(drv_data);
+
                cs_deactive(drv_data, chip);
 
-               if (chip->cs_chg_udelay)
-                       udelay(chip->cs_chg_udelay);
                drv_data->rx += 2;
                drv_data->tx += 2;
        }