1/* Copyright (c) 2018, Mellanox Technologies All rights reserved.
2 *
3 * This software is available to you under a choice of one of two
4 * licenses.  You may choose to be licensed under the terms of the GNU
5 * General Public License (GPL) Version 2, available from the file
6 * COPYING in the main directory of this source tree, or the
7 * OpenIB.org BSD license below:
8 *
9 *     Redistribution and use in source and binary forms, with or
10 *     without modification, are permitted provided that the following
11 *     conditions are met:
12 *
13 *      - Redistributions of source code must retain the above
14 *        copyright notice, this list of conditions and the following
15 *        disclaimer.
16 *
17 *      - Redistributions in binary form must reproduce the above
18 *        copyright notice, this list of conditions and the following
19 *        disclaimer in the documentation and/or other materials
20 *        provided with the distribution.
21 *
22 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
23 * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
24 * MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
25 * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS
26 * BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN
27 * ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN
28 * CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
29 * SOFTWARE.
30 */
31
32#include <net/tls.h>
33#include <crypto/aead.h>
34#include <crypto/scatterwalk.h>
35#include <net/ip6_checksum.h>
36
37#include "tls.h"
38
39static void chain_to_walk(struct scatterlist *sg, struct scatter_walk *walk)
40{
41	struct scatterlist *src = walk->sg;
42	int diff = walk->offset - src->offset;
43
44	sg_set_page(sg, sg_page(src),
45		    src->length - diff, walk->offset);
46
47	scatterwalk_crypto_chain(sg, sg_next(src), 2);
48}
49
50static int tls_enc_record(struct aead_request *aead_req,
51			  struct crypto_aead *aead, char *aad,
52			  char *iv, __be64 rcd_sn,
53			  struct scatter_walk *in,
54			  struct scatter_walk *out, int *in_len,
55			  struct tls_prot_info *prot)
56{
57	unsigned char buf[TLS_HEADER_SIZE + MAX_IV_SIZE];
58	const struct tls_cipher_desc *cipher_desc;
59	struct scatterlist sg_in[3];
60	struct scatterlist sg_out[3];
61	unsigned int buf_size;
62	u16 len;
63	int rc;
64
65	switch (prot->cipher_type) {
66	case TLS_CIPHER_AES_GCM_128:
67	case TLS_CIPHER_AES_GCM_256:
68		break;
69	default:
70		return -EINVAL;
71	}
72	cipher_desc = get_cipher_desc(prot->cipher_type);
73
74	buf_size = TLS_HEADER_SIZE + cipher_desc->iv;
75	len = min_t(int, *in_len, buf_size);
76
77	scatterwalk_copychunks(buf, in, len, 0);
78	scatterwalk_copychunks(buf, out, len, 1);
79
80	*in_len -= len;
81	if (!*in_len)
82		return 0;
83
84	scatterwalk_pagedone(in, 0, 1);
85	scatterwalk_pagedone(out, 1, 1);
86
87	len = buf[4] | (buf[3] << 8);
88	len -= cipher_desc->iv;
89
90	tls_make_aad(aad, len - cipher_desc->tag, (char *)&rcd_sn, buf[0], prot);
91
92	memcpy(iv + cipher_desc->salt, buf + TLS_HEADER_SIZE, cipher_desc->iv);
93
94	sg_init_table(sg_in, ARRAY_SIZE(sg_in));
95	sg_init_table(sg_out, ARRAY_SIZE(sg_out));
96	sg_set_buf(sg_in, aad, TLS_AAD_SPACE_SIZE);
97	sg_set_buf(sg_out, aad, TLS_AAD_SPACE_SIZE);
98	chain_to_walk(sg_in + 1, in);
99	chain_to_walk(sg_out + 1, out);
100
101	*in_len -= len;
102	if (*in_len < 0) {
103		*in_len += cipher_desc->tag;
104		/* the input buffer doesn't contain the entire record.
105		 * trim len accordingly. The resulting authentication tag
106		 * will contain garbage, but we don't care, so we won't
107		 * include any of it in the output skb
108		 * Note that we assume the output buffer length
109		 * is larger then input buffer length + tag size
110		 */
111		if (*in_len < 0)
112			len += *in_len;
113
114		*in_len = 0;
115	}
116
117	if (*in_len) {
118		scatterwalk_copychunks(NULL, in, len, 2);
119		scatterwalk_pagedone(in, 0, 1);
120		scatterwalk_copychunks(NULL, out, len, 2);
121		scatterwalk_pagedone(out, 1, 1);
122	}
123
124	len -= cipher_desc->tag;
125	aead_request_set_crypt(aead_req, sg_in, sg_out, len, iv);
126
127	rc = crypto_aead_encrypt(aead_req);
128
129	return rc;
130}
131
132static void tls_init_aead_request(struct aead_request *aead_req,
133				  struct crypto_aead *aead)
134{
135	aead_request_set_tfm(aead_req, aead);
136	aead_request_set_ad(aead_req, TLS_AAD_SPACE_SIZE);
137}
138
139static struct aead_request *tls_alloc_aead_request(struct crypto_aead *aead,
140						   gfp_t flags)
141{
142	unsigned int req_size = sizeof(struct aead_request) +
143		crypto_aead_reqsize(aead);
144	struct aead_request *aead_req;
145
146	aead_req = kzalloc(req_size, flags);
147	if (aead_req)
148		tls_init_aead_request(aead_req, aead);
149	return aead_req;
150}
151
152static int tls_enc_records(struct aead_request *aead_req,
153			   struct crypto_aead *aead, struct scatterlist *sg_in,
154			   struct scatterlist *sg_out, char *aad, char *iv,
155			   u64 rcd_sn, int len, struct tls_prot_info *prot)
156{
157	struct scatter_walk out, in;
158	int rc;
159
160	scatterwalk_start(&in, sg_in);
161	scatterwalk_start(&out, sg_out);
162
163	do {
164		rc = tls_enc_record(aead_req, aead, aad, iv,
165				    cpu_to_be64(rcd_sn), &in, &out, &len, prot);
166		rcd_sn++;
167
168	} while (rc == 0 && len);
169
170	scatterwalk_done(&in, 0, 0);
171	scatterwalk_done(&out, 1, 0);
172
173	return rc;
174}
175
176/* Can't use icsk->icsk_af_ops->send_check here because the ip addresses
177 * might have been changed by NAT.
178 */
179static void update_chksum(struct sk_buff *skb, int headln)
180{
181	struct tcphdr *th = tcp_hdr(skb);
182	int datalen = skb->len - headln;
183	const struct ipv6hdr *ipv6h;
184	const struct iphdr *iph;
185
186	/* We only changed the payload so if we are using partial we don't
187	 * need to update anything.
188	 */
189	if (likely(skb->ip_summed == CHECKSUM_PARTIAL))
190		return;
191
192	skb->ip_summed = CHECKSUM_PARTIAL;
193	skb->csum_start = skb_transport_header(skb) - skb->head;
194	skb->csum_offset = offsetof(struct tcphdr, check);
195
196	if (skb->sk->sk_family == AF_INET6) {
197		ipv6h = ipv6_hdr(skb);
198		th->check = ~csum_ipv6_magic(&ipv6h->saddr, &ipv6h->daddr,
199					     datalen, IPPROTO_TCP, 0);
200	} else {
201		iph = ip_hdr(skb);
202		th->check = ~csum_tcpudp_magic(iph->saddr, iph->daddr, datalen,
203					       IPPROTO_TCP, 0);
204	}
205}
206
207static void complete_skb(struct sk_buff *nskb, struct sk_buff *skb, int headln)
208{
209	struct sock *sk = skb->sk;
210	int delta;
211
212	skb_copy_header(nskb, skb);
213
214	skb_put(nskb, skb->len);
215	memcpy(nskb->data, skb->data, headln);
216
217	nskb->destructor = skb->destructor;
218	nskb->sk = sk;
219	skb->destructor = NULL;
220	skb->sk = NULL;
221
222	update_chksum(nskb, headln);
223
224	/* sock_efree means skb must gone through skb_orphan_partial() */
225	if (nskb->destructor == sock_efree)
226		return;
227
228	delta = nskb->truesize - skb->truesize;
229	if (likely(delta < 0))
230		WARN_ON_ONCE(refcount_sub_and_test(-delta, &sk->sk_wmem_alloc));
231	else if (delta)
232		refcount_add(delta, &sk->sk_wmem_alloc);
233}
234
235/* This function may be called after the user socket is already
236 * closed so make sure we don't use anything freed during
237 * tls_sk_proto_close here
238 */
239
240static int fill_sg_in(struct scatterlist *sg_in,
241		      struct sk_buff *skb,
242		      struct tls_offload_context_tx *ctx,
243		      u64 *rcd_sn,
244		      s32 *sync_size,
245		      int *resync_sgs)
246{
247	int tcp_payload_offset = skb_tcp_all_headers(skb);
248	int payload_len = skb->len - tcp_payload_offset;
249	u32 tcp_seq = ntohl(tcp_hdr(skb)->seq);
250	struct tls_record_info *record;
251	unsigned long flags;
252	int remaining;
253	int i;
254
255	spin_lock_irqsave(&ctx->lock, flags);
256	record = tls_get_record(ctx, tcp_seq, rcd_sn);
257	if (!record) {
258		spin_unlock_irqrestore(&ctx->lock, flags);
259		return -EINVAL;
260	}
261
262	*sync_size = tcp_seq - tls_record_start_seq(record);
263	if (*sync_size < 0) {
264		int is_start_marker = tls_record_is_start_marker(record);
265
266		spin_unlock_irqrestore(&ctx->lock, flags);
267		/* This should only occur if the relevant record was
268		 * already acked. In that case it should be ok
269		 * to drop the packet and avoid retransmission.
270		 *
271		 * There is a corner case where the packet contains
272		 * both an acked and a non-acked record.
273		 * We currently don't handle that case and rely
274		 * on TCP to retransmit a packet that doesn't contain
275		 * already acked payload.
276		 */
277		if (!is_start_marker)
278			*sync_size = 0;
279		return -EINVAL;
280	}
281
282	remaining = *sync_size;
283	for (i = 0; remaining > 0; i++) {
284		skb_frag_t *frag = &record->frags[i];
285
286		__skb_frag_ref(frag);
287		sg_set_page(sg_in + i, skb_frag_page(frag),
288			    skb_frag_size(frag), skb_frag_off(frag));
289
290		remaining -= skb_frag_size(frag);
291
292		if (remaining < 0)
293			sg_in[i].length += remaining;
294	}
295	*resync_sgs = i;
296
297	spin_unlock_irqrestore(&ctx->lock, flags);
298	if (skb_to_sgvec(skb, &sg_in[i], tcp_payload_offset, payload_len) < 0)
299		return -EINVAL;
300
301	return 0;
302}
303
304static void fill_sg_out(struct scatterlist sg_out[3], void *buf,
305			struct tls_context *tls_ctx,
306			struct sk_buff *nskb,
307			int tcp_payload_offset,
308			int payload_len,
309			int sync_size,
310			void *dummy_buf)
311{
312	const struct tls_cipher_desc *cipher_desc =
313		get_cipher_desc(tls_ctx->crypto_send.info.cipher_type);
314
315	sg_set_buf(&sg_out[0], dummy_buf, sync_size);
316	sg_set_buf(&sg_out[1], nskb->data + tcp_payload_offset, payload_len);
317	/* Add room for authentication tag produced by crypto */
318	dummy_buf += sync_size;
319	sg_set_buf(&sg_out[2], dummy_buf, cipher_desc->tag);
320}
321
322static struct sk_buff *tls_enc_skb(struct tls_context *tls_ctx,
323				   struct scatterlist sg_out[3],
324				   struct scatterlist *sg_in,
325				   struct sk_buff *skb,
326				   s32 sync_size, u64 rcd_sn)
327{
328	struct tls_offload_context_tx *ctx = tls_offload_ctx_tx(tls_ctx);
329	int tcp_payload_offset = skb_tcp_all_headers(skb);
330	int payload_len = skb->len - tcp_payload_offset;
331	const struct tls_cipher_desc *cipher_desc;
332	void *buf, *iv, *aad, *dummy_buf, *salt;
333	struct aead_request *aead_req;
334	struct sk_buff *nskb = NULL;
335	int buf_len;
336
337	aead_req = tls_alloc_aead_request(ctx->aead_send, GFP_ATOMIC);
338	if (!aead_req)
339		return NULL;
340
341	switch (tls_ctx->crypto_send.info.cipher_type) {
342	case TLS_CIPHER_AES_GCM_128:
343		salt = tls_ctx->crypto_send.aes_gcm_128.salt;
344		break;
345	case TLS_CIPHER_AES_GCM_256:
346		salt = tls_ctx->crypto_send.aes_gcm_256.salt;
347		break;
348	default:
349		goto free_req;
350	}
351	cipher_desc = get_cipher_desc(tls_ctx->crypto_send.info.cipher_type);
352	buf_len = cipher_desc->salt + cipher_desc->iv + TLS_AAD_SPACE_SIZE +
353		  sync_size + cipher_desc->tag;
354	buf = kmalloc(buf_len, GFP_ATOMIC);
355	if (!buf)
356		goto free_req;
357
358	iv = buf;
359	memcpy(iv, salt, cipher_desc->salt);
360	aad = buf + cipher_desc->salt + cipher_desc->iv;
361	dummy_buf = aad + TLS_AAD_SPACE_SIZE;
362
363	nskb = alloc_skb(skb_headroom(skb) + skb->len, GFP_ATOMIC);
364	if (!nskb)
365		goto free_buf;
366
367	skb_reserve(nskb, skb_headroom(skb));
368
369	fill_sg_out(sg_out, buf, tls_ctx, nskb, tcp_payload_offset,
370		    payload_len, sync_size, dummy_buf);
371
372	if (tls_enc_records(aead_req, ctx->aead_send, sg_in, sg_out, aad, iv,
373			    rcd_sn, sync_size + payload_len,
374			    &tls_ctx->prot_info) < 0)
375		goto free_nskb;
376
377	complete_skb(nskb, skb, tcp_payload_offset);
378
379	/* validate_xmit_skb_list assumes that if the skb wasn't segmented
380	 * nskb->prev will point to the skb itself
381	 */
382	nskb->prev = nskb;
383
384free_buf:
385	kfree(buf);
386free_req:
387	kfree(aead_req);
388	return nskb;
389free_nskb:
390	kfree_skb(nskb);
391	nskb = NULL;
392	goto free_buf;
393}
394
395static struct sk_buff *tls_sw_fallback(struct sock *sk, struct sk_buff *skb)
396{
397	int tcp_payload_offset = skb_tcp_all_headers(skb);
398	struct tls_context *tls_ctx = tls_get_ctx(sk);
399	struct tls_offload_context_tx *ctx = tls_offload_ctx_tx(tls_ctx);
400	int payload_len = skb->len - tcp_payload_offset;
401	struct scatterlist *sg_in, sg_out[3];
402	struct sk_buff *nskb = NULL;
403	int sg_in_max_elements;
404	int resync_sgs = 0;
405	s32 sync_size = 0;
406	u64 rcd_sn;
407
408	/* worst case is:
409	 * MAX_SKB_FRAGS in tls_record_info
410	 * MAX_SKB_FRAGS + 1 in SKB head and frags.
411	 */
412	sg_in_max_elements = 2 * MAX_SKB_FRAGS + 1;
413
414	if (!payload_len)
415		return skb;
416
417	sg_in = kmalloc_array(sg_in_max_elements, sizeof(*sg_in), GFP_ATOMIC);
418	if (!sg_in)
419		goto free_orig;
420
421	sg_init_table(sg_in, sg_in_max_elements);
422	sg_init_table(sg_out, ARRAY_SIZE(sg_out));
423
424	if (fill_sg_in(sg_in, skb, ctx, &rcd_sn, &sync_size, &resync_sgs)) {
425		/* bypass packets before kernel TLS socket option was set */
426		if (sync_size < 0 && payload_len <= -sync_size)
427			nskb = skb_get(skb);
428		goto put_sg;
429	}
430
431	nskb = tls_enc_skb(tls_ctx, sg_out, sg_in, skb, sync_size, rcd_sn);
432
433put_sg:
434	while (resync_sgs)
435		put_page(sg_page(&sg_in[--resync_sgs]));
436	kfree(sg_in);
437free_orig:
438	if (nskb)
439		consume_skb(skb);
440	else
441		kfree_skb(skb);
442	return nskb;
443}
444
445struct sk_buff *tls_validate_xmit_skb(struct sock *sk,
446				      struct net_device *dev,
447				      struct sk_buff *skb)
448{
449	if (dev == rcu_dereference_bh(tls_get_ctx(sk)->netdev) ||
450	    netif_is_bond_master(dev))
451		return skb;
452
453	return tls_sw_fallback(sk, skb);
454}
455EXPORT_SYMBOL_GPL(tls_validate_xmit_skb);
456
457struct sk_buff *tls_validate_xmit_skb_sw(struct sock *sk,
458					 struct net_device *dev,
459					 struct sk_buff *skb)
460{
461	return tls_sw_fallback(sk, skb);
462}
463
464struct sk_buff *tls_encrypt_skb(struct sk_buff *skb)
465{
466	return tls_sw_fallback(skb->sk, skb);
467}
468EXPORT_SYMBOL_GPL(tls_encrypt_skb);
469
470int tls_sw_fallback_init(struct sock *sk,
471			 struct tls_offload_context_tx *offload_ctx,
472			 struct tls_crypto_info *crypto_info)
473{
474	const struct tls_cipher_desc *cipher_desc;
475	int rc;
476
477	cipher_desc = get_cipher_desc(crypto_info->cipher_type);
478	if (!cipher_desc || !cipher_desc->offloadable)
479		return -EINVAL;
480
481	offload_ctx->aead_send =
482	    crypto_alloc_aead(cipher_desc->cipher_name, 0, CRYPTO_ALG_ASYNC);
483	if (IS_ERR(offload_ctx->aead_send)) {
484		rc = PTR_ERR(offload_ctx->aead_send);
485		pr_err_ratelimited("crypto_alloc_aead failed rc=%d\n", rc);
486		offload_ctx->aead_send = NULL;
487		goto err_out;
488	}
489
490	rc = crypto_aead_setkey(offload_ctx->aead_send,
491				crypto_info_key(crypto_info, cipher_desc),
492				cipher_desc->key);
493	if (rc)
494		goto free_aead;
495
496	rc = crypto_aead_setauthsize(offload_ctx->aead_send, cipher_desc->tag);
497	if (rc)
498		goto free_aead;
499
500	return 0;
501free_aead:
502	crypto_free_aead(offload_ctx->aead_send);
503err_out:
504	return rc;
505}
506