u8 *dst, const u8 *src,
                                       int nrounds, unsigned int nbytes);
 asmlinkage void hchacha_block_arm(const struct chacha_state *state,
-                                 u32 *out, int nrounds);
+                                 u32 out[HCHACHA_OUT_WORDS], int nrounds);
 asmlinkage void hchacha_block_neon(const struct chacha_state *state,
-                                  u32 *out, int nrounds);
+                                  u32 out[HCHACHA_OUT_WORDS], int nrounds);
 
 asmlinkage void chacha_doarm(u8 *dst, const u8 *src, unsigned int bytes,
                             const struct chacha_state *state, int nrounds);
        }
 }
 
-void hchacha_block_arch(const struct chacha_state *state, u32 *stream,
-                       int nrounds)
+void hchacha_block_arch(const struct chacha_state *state,
+                       u32 out[HCHACHA_OUT_WORDS], int nrounds)
 {
        if (!IS_ENABLED(CONFIG_KERNEL_MODE_NEON) || !neon_usable()) {
-               hchacha_block_arm(state, stream, nrounds);
+               hchacha_block_arm(state, out, nrounds); /* NEON not built in or !neon_usable() */
        } else {
                kernel_neon_begin();
-               hchacha_block_neon(state, stream, nrounds);
+               hchacha_block_neon(state, out, nrounds); /* bracketed by kernel_neon_begin()/end() */
                kernel_neon_end();
        }
 }
 
 
 /*
  * void hchacha_block_arm(const struct chacha_state *state,
- *                       u32 out[8], int nrounds);
+ *                       u32 out[HCHACHA_OUT_WORDS], int nrounds);
  */
 ENTRY(hchacha_block_arm)
        push            {r1,r4-r11,lr}
 
                                       u8 *dst, const u8 *src,
                                       int nrounds, int bytes);
 asmlinkage void hchacha_block_neon(const struct chacha_state *state,
-                                  u32 *out, int nrounds);
+                                  u32 out[HCHACHA_OUT_WORDS], int nrounds);
 
 static __ro_after_init DEFINE_STATIC_KEY_FALSE(have_neon);
 
        }
 }
 
-void hchacha_block_arch(const struct chacha_state *state, u32 *stream,
-                       int nrounds)
+void hchacha_block_arch(const struct chacha_state *state,
+                       u32 out[HCHACHA_OUT_WORDS], int nrounds)
 {
        if (!static_branch_likely(&have_neon) || !crypto_simd_usable()) {
-               hchacha_block_generic(state, stream, nrounds);
+               hchacha_block_generic(state, out, nrounds); /* have_neon off or !crypto_simd_usable() */
        } else {
                kernel_neon_begin();
-               hchacha_block_neon(state, stream, nrounds);
+               hchacha_block_neon(state, out, nrounds); /* bracketed by kernel_neon_begin()/end() */
                kernel_neon_end();
        }
 }
 
 EXPORT_SYMBOL(chacha_crypt_arch);
 
 asmlinkage void hchacha_block_arch(const struct chacha_state *state,
-                                  u32 *stream, int nrounds);
+                                  u32 out[HCHACHA_OUT_WORDS], int nrounds);
 EXPORT_SYMBOL(hchacha_block_arch);
 
 bool chacha_is_arch_optimized(void)
 
 }
 
 void hchacha_block_arch(const struct chacha_state *state,
-                       u32 *stream, int nrounds)
+                       u32 out[HCHACHA_OUT_WORDS], int nrounds)
 {
-       hchacha_block_generic(state, stream, nrounds);
+       hchacha_block_generic(state, out, nrounds); /* only path: the generic implementation */
 }
 EXPORT_SYMBOL(hchacha_block_arch);
 
 
 asmlinkage void chacha_zvkb(struct chacha_state *state, const u8 *in, u8 *out,
                            size_t nblocks, int nrounds);
 
-void hchacha_block_arch(const struct chacha_state *state, u32 *out, int nrounds)
+void hchacha_block_arch(const struct chacha_state *state,
+                       u32 out[HCHACHA_OUT_WORDS], int nrounds) /* args forwarded unchanged below */
 {
        hchacha_block_generic(state, out, nrounds);
 }
 
 #include "chacha-s390.h"
 
 void hchacha_block_arch(const struct chacha_state *state,
-                       u32 *stream, int nrounds)
+                       u32 out[HCHACHA_OUT_WORDS], int nrounds)
 {
        /* TODO: implement hchacha_block_arch() in assembly */
-       hchacha_block_generic(state, stream, nrounds);
+       hchacha_block_generic(state, out, nrounds); /* generic code stands in until the TODO is done */
 }
 EXPORT_SYMBOL(hchacha_block_arch);
 
 
                                        u8 *dst, const u8 *src,
                                        unsigned int len, int nrounds);
 asmlinkage void hchacha_block_ssse3(const struct chacha_state *state,
-                                   u32 *out, int nrounds);
+                                   u32 out[HCHACHA_OUT_WORDS], int nrounds);
 
 asmlinkage void chacha_2block_xor_avx2(const struct chacha_state *state,
                                       u8 *dst, const u8 *src,
 }
 
 void hchacha_block_arch(const struct chacha_state *state,
-                       u32 *stream, int nrounds)
+                       u32 out[HCHACHA_OUT_WORDS], int nrounds)
 {
        if (!static_branch_likely(&chacha_use_simd)) {
-               hchacha_block_generic(state, stream, nrounds);
+               hchacha_block_generic(state, out, nrounds); /* chacha_use_simd key is off */
        } else {
                kernel_fpu_begin();
-               hchacha_block_ssse3(state, stream, nrounds);
+               hchacha_block_ssse3(state, out, nrounds); /* bracketed by kernel_fpu_begin()/end() */
                kernel_fpu_end();
        }
 }
 
 }
 
 static int chacha_stream_xor(struct skcipher_request *req,
-                            const struct chacha_ctx *ctx, const u8 *iv,
-                            bool arch)
+                            const struct chacha_ctx *ctx,
+                            const u8 iv[CHACHA_IV_SIZE], bool arch)
 {
        struct skcipher_walk walk;
        struct chacha_state state;
 
 #define CHACHA_BLOCK_SIZE      64
 #define CHACHAPOLY_IV_SIZE     12
 
-#define CHACHA_STATE_WORDS     (CHACHA_BLOCK_SIZE / sizeof(u32))
+#define CHACHA_KEY_WORDS       8  /* expected to equal CHACHA_KEY_SIZE / sizeof(u32) - TODO confirm */
+#define CHACHA_STATE_WORDS     16 /* CHACHA_BLOCK_SIZE / sizeof(u32), i.e. 64 / 4 */
+#define HCHACHA_OUT_WORDS      8  /* u32 words written by the hchacha_block_*() functions */
 
 /* 192-bit nonce, then 64-bit stream position */
 #define XCHACHA_IV_SIZE                32
        u32 x[CHACHA_STATE_WORDS];
 };
 
-void chacha_block_generic(struct chacha_state *state, u8 *stream, int nrounds);
-static inline void chacha20_block(struct chacha_state *state, u8 *stream)
+void chacha_block_generic(struct chacha_state *state,
+                         u8 out[CHACHA_BLOCK_SIZE], int nrounds);
+static inline void chacha20_block(struct chacha_state *state,
+                                 u8 out[CHACHA_BLOCK_SIZE])
 {
-       chacha_block_generic(state, stream, 20);
+       chacha_block_generic(state, out, 20); /* nrounds fixed at 20 */
 }
 
-void hchacha_block_arch(const struct chacha_state *state, u32 *out,
-                       int nrounds);
-void hchacha_block_generic(const struct chacha_state *state, u32 *out,
-                          int nrounds);
+void hchacha_block_arch(const struct chacha_state *state,
+                       u32 out[HCHACHA_OUT_WORDS], int nrounds);
+void hchacha_block_generic(const struct chacha_state *state,
+                          u32 out[HCHACHA_OUT_WORDS], int nrounds);
 
-static inline void hchacha_block(const struct chacha_state *state, u32 *out,
-                                int nrounds)
+static inline void hchacha_block(const struct chacha_state *state,
+                                u32 out[HCHACHA_OUT_WORDS], int nrounds)
 {
        if (IS_ENABLED(CONFIG_CRYPTO_ARCH_HAVE_LIB_CHACHA))
                hchacha_block_arch(state, out, nrounds);
 }
 
 static inline void chacha_init(struct chacha_state *state,
-                              const u32 *key, const u8 *iv)
+                              const u32 key[CHACHA_KEY_WORDS],
+                              const u8 iv[CHACHA_IV_SIZE])
 {
        chacha_init_consts(state);
        state->x[4]  = key[0];
 
 /**
  * chacha_block_generic - generate one keystream block and increment block counter
  * @state: input state matrix
- * @stream: output keystream block (64 bytes)
+ * @out: output keystream block; all CHACHA_BLOCK_SIZE bytes are written, one
+ *       state word at a time, each stored little-endian via
+ *       put_unaligned_le32()
  * @nrounds: number of rounds (20 or 12; 20 is recommended)
  *
  * This is the ChaCha core, a function from 64-byte strings to 64-byte strings.
  * The caller has already converted the endianness of the input.  This function
  * also handles incrementing the block counter in the input matrix.
  */
-void chacha_block_generic(struct chacha_state *state, u8 *stream, int nrounds)
+void chacha_block_generic(struct chacha_state *state,
+                         u8 out[CHACHA_BLOCK_SIZE], int nrounds)
 {
        struct chacha_state permuted_state = *state;
        int i;
 
        for (i = 0; i < ARRAY_SIZE(state->x); i++)
                put_unaligned_le32(permuted_state.x[i] + state->x[i],
-                                  &stream[i * sizeof(u32)]);
+                                  &out[i * sizeof(u32)]); /* word i -> bytes 4i..4i+3 */
 
        state->x[12]++;
 }
 /**
  * hchacha_block_generic - abbreviated ChaCha core, for XChaCha
  * @state: input state matrix
- * @stream: output (8 32-bit words)
+ * @out: the output words: words 0-3 of the permuted state go to out[0..3] and
+ *       words 12-15 go to out[4..7]
  * @nrounds: number of rounds (20 or 12; 20 is recommended)
  *
  * HChaCha is the ChaCha equivalent of HSalsa and is an intermediate step
  * of the state.  It should not be used for streaming directly.
  */
 void hchacha_block_generic(const struct chacha_state *state,
-                          u32 *stream, int nrounds)
+                          u32 out[HCHACHA_OUT_WORDS], int nrounds)
 {
        struct chacha_state permuted_state = *state;
 
        chacha_permute(&permuted_state, nrounds);
 
-       memcpy(&stream[0], &permuted_state.x[0], 16);
-       memcpy(&stream[4], &permuted_state.x[12], 16);
+       memcpy(&out[0], &permuted_state.x[0], 16);  /* 16 bytes: x[0..3] -> out[0..3] */
+       memcpy(&out[4], &permuted_state.x[12], 16); /* 16 bytes: x[12..15] -> out[4..7] */
 }
 EXPORT_SYMBOL(hchacha_block_generic);
 
 #include <linux/mm.h>
 #include <linux/module.h>
 
-#define CHACHA_KEY_WORDS       (CHACHA_KEY_SIZE / sizeof(u32))
-
 static void chacha_load_key(u32 *k, const u8 *in)
 {
        k[0] = get_unaligned_le32(in);