| /* |
| * Ultra Wide Band |
| * AES-128 CCM Encryption |
| * |
| * Copyright (C) 2007 Intel Corporation |
| * Inaky Perez-Gonzalez <inaky.perez-gonzalez@intel.com> |
| * |
| * This program is free software; you can redistribute it and/or |
| * modify it under the terms of the GNU General Public License version |
| * 2 as published by the Free Software Foundation. |
| * |
| * This program is distributed in the hope that it will be useful, |
| * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
| * GNU General Public License for more details. |
| * |
| * You should have received a copy of the GNU General Public License |
| * along with this program; if not, write to the Free Software |
| * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA |
| * 02110-1301, USA. |
| * |
| * |
| * We don't do any encryption here; we use the Linux Kernel's AES-128 |
| * crypto modules to construct keys and payload blocks in a way |
| * defined by WUSB1.0[6]. Check the erratas, as typos are are patched |
| * there. |
| * |
| * Thanks a zillion to John Keys for his help and clarifications over |
| * the designed-by-a-committee text. |
| * |
| * So the idea is that there is this basic Pseudo-Random-Function |
| * defined in WUSB1.0[6.5] which is the core of everything. It works |
| * by tweaking some blocks, AES crypting them and then xoring |
| * something else with them (this seems to be called CBC(AES) -- can |
| * you tell I know jack about crypto?). So we just funnel it into the |
| * Linux Crypto API. |
| * |
| * We leave a crypto test module so we can verify that vectors match, |
| * every now and then. |
| * |
| * Block size: 16 bytes -- AES seems to do things in 'block sizes'. I |
| * am learning a lot... |
| * |
| * Conveniently, some data structures that need to be |
| * funneled through AES are...16 bytes in size! |
| */ |
| |
| #include <linux/crypto.h> |
| #include <linux/module.h> |
| #include <linux/err.h> |
| #include <linux/uwb.h> |
| #include <linux/slab.h> |
| #include <linux/usb/wusb.h> |
| #include <linux/scatterlist.h> |
| |
| static int debug_crypto_verify = 0; |
| |
| module_param(debug_crypto_verify, int, 0); |
| MODULE_PARM_DESC(debug_crypto_verify, "verify the key generation algorithms"); |
| |
| static void wusb_key_dump(const void *buf, size_t len) |
| { |
| print_hex_dump(KERN_ERR, " ", DUMP_PREFIX_OFFSET, 16, 1, |
| buf, len, 0); |
| } |
| |
| /* |
| * Block of data, as understood by AES-CCM |
| * |
| * The code assumes this structure is nothing but a 16 byte array |
| * (packed in a struct to avoid common mess ups that I usually do with |
| * arrays and enforcing type checking). |
| */ |
| struct aes_ccm_block { |
| u8 data[16]; |
| } __attribute__((packed)); |
| |
| /* |
| * Counter-mode Blocks (WUSB1.0[6.4]) |
| * |
| * According to CCM (or so it seems), for the purpose of calculating |
| * the MIC, the message is broken in N counter-mode blocks, B0, B1, |
| * ... BN. |
| * |
| * B0 contains flags, the CCM nonce and l(m). |
| * |
| * B1 contains l(a), the MAC header, the encryption offset and padding. |
| * |
| * If EO is nonzero, additional blocks are built from payload bytes |
| * until EO is exhausted (FIXME: padding to 16 bytes, I guess). The |
| * padding is not xmitted. |
| */ |
| |
| /* WUSB1.0[T6.4] */ |
| struct aes_ccm_b0 { |
| u8 flags; /* 0x59, per CCM spec */ |
| struct aes_ccm_nonce ccm_nonce; |
| __be16 lm; |
| } __attribute__((packed)); |
| |
| /* WUSB1.0[T6.5] */ |
| struct aes_ccm_b1 { |
| __be16 la; |
| u8 mac_header[10]; |
| __le16 eo; |
| u8 security_reserved; /* This is always zero */ |
| u8 padding; /* 0 */ |
| } __attribute__((packed)); |
| |
| /* |
| * Encryption Blocks (WUSB1.0[6.4.4]) |
| * |
| * CCM uses Ax blocks to generate a keystream with which the MIC and |
| * the message's payload are encoded. A0 always encrypts/decrypts the |
| * MIC. Ax (x>0) are used for the successive payload blocks. |
| * |
| * The x is the counter, and is increased for each block. |
| */ |
| struct aes_ccm_a { |
| u8 flags; /* 0x01, per CCM spec */ |
| struct aes_ccm_nonce ccm_nonce; |
| __be16 counter; /* Value of x */ |
| } __attribute__((packed)); |
| |
| static void bytewise_xor(void *_bo, const void *_bi1, const void *_bi2, |
| size_t size) |
| { |
| u8 *bo = _bo; |
| const u8 *bi1 = _bi1, *bi2 = _bi2; |
| size_t itr; |
| for (itr = 0; itr < size; itr++) |
| bo[itr] = bi1[itr] ^ bi2[itr]; |
| } |
| |
| /* |
| * CC-MAC function WUSB1.0[6.5] |
| * |
| * Take a data string and produce the encrypted CBC Counter-mode MIC |
| * |
| * Note the names for most function arguments are made to (more or |
| * less) match those used in the pseudo-function definition given in |
| * WUSB1.0[6.5]. |
| * |
| * @tfm_cbc: CBC(AES) blkcipher handle (initialized) |
| * |
| * @tfm_aes: AES cipher handle (initialized) |
| * |
| * @mic: buffer for placing the computed MIC (Message Integrity |
| * Code). This is exactly 8 bytes, and we expect the buffer to |
| * be at least eight bytes in length. |
| * |
| * @key: 128 bit symmetric key |
| * |
| * @n: CCM nonce |
| * |
| * @a: ASCII string, 14 bytes long (I guess zero padded if needed; |
| * we use exactly 14 bytes). |
| * |
| * @b: data stream to be processed; cannot be a global or const local |
| * (will confuse the scatterlists) |
| * |
| * @blen: size of b... |
| * |
| * Still not very clear how this is done, but looks like this: we |
| * create block B0 (as WUSB1.0[6.5] says), then we AES-crypt it with |
| * @key. We bytewise xor B0 with B1 (1) and AES-crypt that. Then we |
| * take the payload and divide it in blocks (16 bytes), xor them with |
| * the previous crypto result (16 bytes) and crypt it, repeat the next |
| * block with the output of the previous one, rinse wash (I guess this |
| * is what AES CBC mode means...but I truly have no idea). So we use |
| * the CBC(AES) blkcipher, that does precisely that. The IV (Initial |
| * Vector) is 16 bytes and is set to zero, so |
| * |
| * See rfc3610. Linux crypto has a CBC implementation, but the |
| * documentation is scarce, to say the least, and the example code is |
| * so intricated that is difficult to understand how things work. Most |
| * of this is guess work -- bite me. |
| * |
| * (1) Created as 6.5 says, again, using as l(a) 'Blen + 14', and |
| * using the 14 bytes of @a to fill up |
| * b1.{mac_header,e0,security_reserved,padding}. |
| * |
| * NOTE: The definition of l(a) in WUSB1.0[6.5] vs the definition of |
| * l(m) is orthogonal, they bear no relationship, so it is not |
| * in conflict with the parameter's relation that |
| * WUSB1.0[6.4.2]) defines. |
| * |
| * NOTE: WUSB1.0[A.1]: Host Nonce is missing a nibble? (1e); fixed in |
| * first errata released on 2005/07. |
| * |
| * NOTE: we need to clean IV to zero at each invocation to make sure |
| * we start with a fresh empty Initial Vector, so that the CBC |
| * works ok. |
| * |
| * NOTE: blen is not aligned to a block size, we'll pad zeros, that's |
| * what sg[4] is for. Maybe there is a smarter way to do this. |
| */ |
| static int wusb_ccm_mac(struct crypto_blkcipher *tfm_cbc, |
| struct crypto_cipher *tfm_aes, void *mic, |
| const struct aes_ccm_nonce *n, |
| const struct aes_ccm_label *a, const void *b, |
| size_t blen) |
| { |
| int result = 0; |
| struct blkcipher_desc desc; |
| struct aes_ccm_b0 b0; |
| struct aes_ccm_b1 b1; |
| struct aes_ccm_a ax; |
| struct scatterlist sg[4], sg_dst; |
| void *iv, *dst_buf; |
| size_t ivsize, dst_size; |
| const u8 bzero[16] = { 0 }; |
| size_t zero_padding; |
| |
| /* |
| * These checks should be compile time optimized out |
| * ensure @a fills b1's mac_header and following fields |
| */ |
| WARN_ON(sizeof(*a) != sizeof(b1) - sizeof(b1.la)); |
| WARN_ON(sizeof(b0) != sizeof(struct aes_ccm_block)); |
| WARN_ON(sizeof(b1) != sizeof(struct aes_ccm_block)); |
| WARN_ON(sizeof(ax) != sizeof(struct aes_ccm_block)); |
| |
| result = -ENOMEM; |
| zero_padding = blen % sizeof(struct aes_ccm_block); |
| if (zero_padding) |
| zero_padding = sizeof(struct aes_ccm_block) - zero_padding; |
| dst_size = blen + sizeof(b0) + sizeof(b1) + zero_padding; |
| dst_buf = kzalloc(dst_size, GFP_KERNEL); |
| if (dst_buf == NULL) { |
| printk(KERN_ERR "E: can't alloc destination buffer\n"); |
| goto error_dst_buf; |
| } |
| |
| iv = crypto_blkcipher_crt(tfm_cbc)->iv; |
| ivsize = crypto_blkcipher_ivsize(tfm_cbc); |
| memset(iv, 0, ivsize); |
| |
| /* Setup B0 */ |
| b0.flags = 0x59; /* Format B0 */ |
| b0.ccm_nonce = *n; |
| b0.lm = cpu_to_be16(0); /* WUSB1.0[6.5] sez l(m) is 0 */ |
| |
| /* Setup B1 |
| * |
| * The WUSB spec is anything but clear! WUSB1.0[6.5] |
| * says that to initialize B1 from A with 'l(a) = blen + |
| * 14'--after clarification, it means to use A's contents |
| * for MAC Header, EO, sec reserved and padding. |
| */ |
| b1.la = cpu_to_be16(blen + 14); |
| memcpy(&b1.mac_header, a, sizeof(*a)); |
| |
| sg_init_table(sg, ARRAY_SIZE(sg)); |
| sg_set_buf(&sg[0], &b0, sizeof(b0)); |
| sg_set_buf(&sg[1], &b1, sizeof(b1)); |
| sg_set_buf(&sg[2], b, blen); |
| /* 0 if well behaved :) */ |
| sg_set_buf(&sg[3], bzero, zero_padding); |
| sg_init_one(&sg_dst, dst_buf, dst_size); |
| |
| desc.tfm = tfm_cbc; |
| desc.flags = 0; |
| result = crypto_blkcipher_encrypt(&desc, &sg_dst, sg, dst_size); |
| if (result < 0) { |
| printk(KERN_ERR "E: can't compute CBC-MAC tag (MIC): %d\n", |
| result); |
| goto error_cbc_crypt; |
| } |
| |
| /* Now we crypt the MIC Tag (*iv) with Ax -- values per WUSB1.0[6.5] |
| * The procedure is to AES crypt the A0 block and XOR the MIC |
| * Tag against it; we only do the first 8 bytes and place it |
| * directly in the destination buffer. |
| * |
| * POS Crypto API: size is assumed to be AES's block size. |
| * Thanks for documenting it -- tip taken from airo.c |
| */ |
| ax.flags = 0x01; /* as per WUSB 1.0 spec */ |
| ax.ccm_nonce = *n; |
| ax.counter = 0; |
| crypto_cipher_encrypt_one(tfm_aes, (void *)&ax, (void *)&ax); |
| bytewise_xor(mic, &ax, iv, 8); |
| result = 8; |
| error_cbc_crypt: |
| kfree(dst_buf); |
| error_dst_buf: |
| return result; |
| } |
| |
| /* |
| * WUSB Pseudo Random Function (WUSB1.0[6.5]) |
| * |
| * @b: buffer to the source data; cannot be a global or const local |
| * (will confuse the scatterlists) |
| */ |
| ssize_t wusb_prf(void *out, size_t out_size, |
| const u8 key[16], const struct aes_ccm_nonce *_n, |
| const struct aes_ccm_label *a, |
| const void *b, size_t blen, size_t len) |
| { |
| ssize_t result, bytes = 0, bitr; |
| struct aes_ccm_nonce n = *_n; |
| struct crypto_blkcipher *tfm_cbc; |
| struct crypto_cipher *tfm_aes; |
| u64 sfn = 0; |
| __le64 sfn_le; |
| |
| tfm_cbc = crypto_alloc_blkcipher("cbc(aes)", 0, CRYPTO_ALG_ASYNC); |
| if (IS_ERR(tfm_cbc)) { |
| result = PTR_ERR(tfm_cbc); |
| printk(KERN_ERR "E: can't load CBC(AES): %d\n", (int)result); |
| goto error_alloc_cbc; |
| } |
| result = crypto_blkcipher_setkey(tfm_cbc, key, 16); |
| if (result < 0) { |
| printk(KERN_ERR "E: can't set CBC key: %d\n", (int)result); |
| goto error_setkey_cbc; |
| } |
| |
| tfm_aes = crypto_alloc_cipher("aes", 0, CRYPTO_ALG_ASYNC); |
| if (IS_ERR(tfm_aes)) { |
| result = PTR_ERR(tfm_aes); |
| printk(KERN_ERR "E: can't load AES: %d\n", (int)result); |
| goto error_alloc_aes; |
| } |
| result = crypto_cipher_setkey(tfm_aes, key, 16); |
| if (result < 0) { |
| printk(KERN_ERR "E: can't set AES key: %d\n", (int)result); |
| goto error_setkey_aes; |
| } |
| |
| for (bitr = 0; bitr < (len + 63) / 64; bitr++) { |
| sfn_le = cpu_to_le64(sfn++); |
| memcpy(&n.sfn, &sfn_le, sizeof(n.sfn)); /* n.sfn++... */ |
| result = wusb_ccm_mac(tfm_cbc, tfm_aes, out + bytes, |
| &n, a, b, blen); |
| if (result < 0) |
| goto error_ccm_mac; |
| bytes += result; |
| } |
| result = bytes; |
| error_ccm_mac: |
| error_setkey_aes: |
| crypto_free_cipher(tfm_aes); |
| error_alloc_aes: |
| error_setkey_cbc: |
| crypto_free_blkcipher(tfm_cbc); |
| error_alloc_cbc: |
| return result; |
| } |
| |
| /* WUSB1.0[A.2] test vectors */ |
| static const u8 stv_hsmic_key[16] = { |
| 0x4b, 0x79, 0xa3, 0xcf, 0xe5, 0x53, 0x23, 0x9d, |
| 0xd7, 0xc1, 0x6d, 0x1c, 0x2d, 0xab, 0x6d, 0x3f |
| }; |
| |
| static const struct aes_ccm_nonce stv_hsmic_n = { |
| .sfn = { 0 }, |
| .tkid = { 0x76, 0x98, 0x01, }, |
| .dest_addr = { .data = { 0xbe, 0x00 } }, |
| .src_addr = { .data = { 0x76, 0x98 } }, |
| }; |
| |
| /* |
| * Out-of-band MIC Generation verification code |
| * |
| */ |
| static int wusb_oob_mic_verify(void) |
| { |
| int result; |
| u8 mic[8]; |
| /* WUSB1.0[A.2] test vectors |
| * |
| * Need to keep it in the local stack as GCC 4.1.3something |
| * messes up and generates noise. |
| */ |
| struct usb_handshake stv_hsmic_hs = { |
| .bMessageNumber = 2, |
| .bStatus = 00, |
| .tTKID = { 0x76, 0x98, 0x01 }, |
| .bReserved = 00, |
| .CDID = { 0x30, 0x31, 0x32, 0x33, 0x34, 0x35, |
| 0x36, 0x37, 0x38, 0x39, 0x3a, 0x3b, |
| 0x3c, 0x3d, 0x3e, 0x3f }, |
| .nonce = { 0x20, 0x21, 0x22, 0x23, 0x24, 0x25, |
| 0x26, 0x27, 0x28, 0x29, 0x2a, 0x2b, |
| 0x2c, 0x2d, 0x2e, 0x2f }, |
| .MIC = { 0x75, 0x6a, 0x97, 0x51, 0x0c, 0x8c, |
| 0x14, 0x7b } , |
| }; |
| size_t hs_size; |
| |
| result = wusb_oob_mic(mic, stv_hsmic_key, &stv_hsmic_n, &stv_hsmic_hs); |
| if (result < 0) |
| printk(KERN_ERR "E: WUSB OOB MIC test: failed: %d\n", result); |
| else if (memcmp(stv_hsmic_hs.MIC, mic, sizeof(mic))) { |
| printk(KERN_ERR "E: OOB MIC test: " |
| "mismatch between MIC result and WUSB1.0[A2]\n"); |
| hs_size = sizeof(stv_hsmic_hs) - sizeof(stv_hsmic_hs.MIC); |
| printk(KERN_ERR "E: Handshake2 in: (%zu bytes)\n", hs_size); |
| wusb_key_dump(&stv_hsmic_hs, hs_size); |
| printk(KERN_ERR "E: CCM Nonce in: (%zu bytes)\n", |
| sizeof(stv_hsmic_n)); |
| wusb_key_dump(&stv_hsmic_n, sizeof(stv_hsmic_n)); |
| printk(KERN_ERR "E: MIC out:\n"); |
| wusb_key_dump(mic, sizeof(mic)); |
| printk(KERN_ERR "E: MIC out (from WUSB1.0[A.2]):\n"); |
| wusb_key_dump(stv_hsmic_hs.MIC, sizeof(stv_hsmic_hs.MIC)); |
| result = -EINVAL; |
| } else |
| result = 0; |
| return result; |
| } |
| |
| /* |
| * Test vectors for Key derivation |
| * |
| * These come from WUSB1.0[6.5.1], the vectors in WUSB1.0[A.1] |
| * (errata corrected in 2005/07). |
| */ |
| static const u8 stv_key_a1[16] __attribute__ ((__aligned__(4))) = { |
| 0xf0, 0xe1, 0xd2, 0xc3, 0xb4, 0xa5, 0x96, 0x87, |
| 0x78, 0x69, 0x5a, 0x4b, 0x3c, 0x2d, 0x1e, 0x0f |
| }; |
| |
| static const struct aes_ccm_nonce stv_keydvt_n_a1 = { |
| .sfn = { 0 }, |
| .tkid = { 0x76, 0x98, 0x01, }, |
| .dest_addr = { .data = { 0xbe, 0x00 } }, |
| .src_addr = { .data = { 0x76, 0x98 } }, |
| }; |
| |
| static const struct wusb_keydvt_out stv_keydvt_out_a1 = { |
| .kck = { |
| 0x4b, 0x79, 0xa3, 0xcf, 0xe5, 0x53, 0x23, 0x9d, |
| 0xd7, 0xc1, 0x6d, 0x1c, 0x2d, 0xab, 0x6d, 0x3f |
| }, |
| .ptk = { |
| 0xc8, 0x70, 0x62, 0x82, 0xb6, 0x7c, 0xe9, 0x06, |
| 0x7b, 0xc5, 0x25, 0x69, 0xf2, 0x36, 0x61, 0x2d |
| } |
| }; |
| |
| /* |
| * Performa a test to make sure we match the vectors defined in |
| * WUSB1.0[A.1](Errata2006/12) |
| */ |
| static int wusb_key_derive_verify(void) |
| { |
| int result = 0; |
| struct wusb_keydvt_out keydvt_out; |
| /* These come from WUSB1.0[A.1] + 2006/12 errata |
| * NOTE: can't make this const or global -- somehow it seems |
| * the scatterlists for crypto get confused and we get |
| * bad data. There is no doc on this... */ |
| struct wusb_keydvt_in stv_keydvt_in_a1 = { |
| .hnonce = { |
| 0x10, 0x11, 0x12, 0x13, 0x14, 0x15, 0x16, 0x17, |
| 0x18, 0x19, 0x1a, 0x1b, 0x1c, 0x1d, 0x1e, 0x1f |
| }, |
| .dnonce = { |
| 0x20, 0x21, 0x22, 0x23, 0x24, 0x25, 0x26, 0x27, |
| 0x28, 0x29, 0x2a, 0x2b, 0x2c, 0x2d, 0x2e, 0x2f |
| } |
| }; |
| |
| result = wusb_key_derive(&keydvt_out, stv_key_a1, &stv_keydvt_n_a1, |
| &stv_keydvt_in_a1); |
| if (result < 0) |
| printk(KERN_ERR "E: WUSB key derivation test: " |
| "derivation failed: %d\n", result); |
| if (memcmp(&stv_keydvt_out_a1, &keydvt_out, sizeof(keydvt_out))) { |
| printk(KERN_ERR "E: WUSB key derivation test: " |
| "mismatch between key derivation result " |
| "and WUSB1.0[A1] Errata 2006/12\n"); |
| printk(KERN_ERR "E: keydvt in: key\n"); |
| wusb_key_dump(stv_key_a1, sizeof(stv_key_a1)); |
| printk(KERN_ERR "E: keydvt in: nonce\n"); |
| wusb_key_dump( &stv_keydvt_n_a1, sizeof(stv_keydvt_n_a1)); |
| printk(KERN_ERR "E: keydvt in: hnonce & dnonce\n"); |
| wusb_key_dump(&stv_keydvt_in_a1, sizeof(stv_keydvt_in_a1)); |
| printk(KERN_ERR "E: keydvt out: KCK\n"); |
| wusb_key_dump(&keydvt_out.kck, sizeof(keydvt_out.kck)); |
| printk(KERN_ERR "E: keydvt out: PTK\n"); |
| wusb_key_dump(&keydvt_out.ptk, sizeof(keydvt_out.ptk)); |
| result = -EINVAL; |
| } else |
| result = 0; |
| return result; |
| } |
| |
| /* |
| * Initialize crypto system |
| * |
| * FIXME: we do nothing now, other than verifying. Later on we'll |
| * cache the encryption stuff, so that's why we have a separate init. |
| */ |
| int wusb_crypto_init(void) |
| { |
| int result; |
| |
| if (debug_crypto_verify) { |
| result = wusb_key_derive_verify(); |
| if (result < 0) |
| return result; |
| return wusb_oob_mic_verify(); |
| } |
| return 0; |
| } |
| |
| void wusb_crypto_exit(void) |
| { |
| /* FIXME: free cached crypto transforms */ |
| } |