/*
 * AMD Cryptographic Coprocessor (CCP) driver
 *
 * Copyright (C) 2013,2016 Advanced Micro Devices, Inc.
 *
 * Author: Tom Lendacky <thomas.lendacky@amd.com>
 * Author: Gary R Hook <gary.hook@amd.com>
 *
 * This program is free software; you can redistribute it and/or modify
 * it under the terms of the GNU General Public License version 2 as
 * published by the Free Software Foundation.
 */
13
14#ifndef __CCP_DEV_H__
15#define __CCP_DEV_H__
16
17#include <linux/device.h>
18#include <linux/pci.h>
19#include <linux/spinlock.h>
20#include <linux/mutex.h>
21#include <linux/list.h>
22#include <linux/wait.h>
23#include <linux/dmapool.h>
24#include <linux/hw_random.h>
Tom Lendacky8db88462015-02-03 13:07:05 -060025#include <linux/bitops.h>
Gary R Hook58ea8ab2016-04-18 09:21:44 -050026#include <linux/interrupt.h>
27#include <linux/irqreturn.h>
28#include <linux/dmaengine.h>
Tom Lendacky63b94502013-11-12 11:46:16 -060029
/* Size of the name[] and rngname[] buffers in struct ccp_device */
#define MAX_CCP_NAME_LEN		16
#define MAX_DMAPOOL_NAME_LEN		32

/* Number of entries in the cmd_q[] array of struct ccp_device */
#define MAX_HW_QUEUES			5
#define MAX_CMD_QLEN			100

#define TRNG_RETRIES			10

#define CACHE_NONE			0x00
#define CACHE_WB_NO_ALLOC		0xb7
40
/****** Register Mappings ******/
#define Q_MASK_REG			0x000
#define TRNG_OUT_REG			0x00c
#define IRQ_MASK_REG			0x040
#define IRQ_STATUS_REG			0x200

#define DEL_CMD_Q_JOB			0x124
#define DEL_Q_ACTIVE			0x00000200
#define DEL_Q_ID_SHIFT			6

#define CMD_REQ0			0x180
#define CMD_REQ_INCR			0x04

#define CMD_Q_STATUS_BASE		0x210
#define CMD_Q_INT_STATUS_BASE		0x214
#define CMD_Q_STATUS_INCR		0x20

#define CMD_Q_CACHE_BASE		0x228
#define CMD_Q_CACHE_INC			0x20

/* Field extractors: CMD_Q_ERROR yields bits 5:0 of its argument,
 * CMD_Q_DEPTH yields bits 15:12.
 */
#define CMD_Q_ERROR(__qs)		((__qs) & 0x0000003f)
#define CMD_Q_DEPTH(__qs)		(((__qs) >> 12) & 0x0000000f)
Tom Lendacky63b94502013-11-12 11:46:16 -060063
/****** REQ0 Related Values ******/
#define REQ0_WAIT_FOR_WRITE		0x00000004
#define REQ0_INT_ON_COMPLETE		0x00000002
#define REQ0_STOP_ON_COMPLETE		0x00000001

#define REQ0_CMD_Q_SHIFT		9
#define REQ0_JOBID_SHIFT		3

/****** REQ1 Related Values ******/
#define REQ1_PROTECT_SHIFT		27
#define REQ1_ENGINE_SHIFT		23
#define REQ1_KEY_KSB_SHIFT		2

#define REQ1_EOM			0x00000002
#define REQ1_INIT			0x00000001

/* AES Related Values */
#define REQ1_AES_TYPE_SHIFT		21
#define REQ1_AES_MODE_SHIFT		18
#define REQ1_AES_ACTION_SHIFT		17
#define REQ1_AES_CFB_SIZE_SHIFT		10

/* XTS-AES Related Values */
#define REQ1_XTS_AES_SIZE_SHIFT		10

/* SHA Related Values */
#define REQ1_SHA_TYPE_SHIFT		21

/* RSA Related Values */
#define REQ1_RSA_MOD_SIZE_SHIFT		10

/* Pass-Through Related Values */
#define REQ1_PT_BW_SHIFT		12
#define REQ1_PT_BS_SHIFT		10

/* ECC Related Values */
#define REQ1_ECC_AFFINE_CONVERT		0x00200000
#define REQ1_ECC_FUNCTION_SHIFT		18

/****** REQ4 Related Values ******/
#define REQ4_KSB_SHIFT			18
#define REQ4_MEMTYPE_SHIFT		16

/****** REQ6 Related Values ******/
#define REQ6_MEMTYPE_SHIFT		16
109
/****** Key Storage Block ******/
#define KSB_START			77
#define KSB_END				127
/* Inclusive range, hence the +1 */
#define KSB_COUNT			(KSB_END - KSB_START + 1)
#define CCP_SB_BITS			256

#define CCP_JOBID_MASK			0x0000003f

#define CCP_DMAPOOL_MAX_SIZE		64
#define CCP_DMAPOOL_ALIGN		BIT(5)

#define CCP_REVERSE_BUF_SIZE		64

#define CCP_AES_KEY_SB_COUNT		1
#define CCP_AES_CTX_SB_COUNT		1

#define CCP_XTS_AES_KEY_SB_COUNT	1
#define CCP_XTS_AES_CTX_SB_COUNT	1

#define CCP_SHA_SB_COUNT		1

#define CCP_RSA_MAX_WIDTH		4096

#define CCP_PASSTHRU_BLOCKSIZE		256
#define CCP_PASSTHRU_MASKSIZE		32
#define CCP_PASSTHRU_SB_COUNT		1

#define CCP_ECC_MODULUS_BYTES		48      /* 384-bits */
#define CCP_ECC_MAX_OPERANDS		6
#define CCP_ECC_MAX_OUTPUTS		3
#define CCP_ECC_SRC_BUF_SIZE		448
#define CCP_ECC_DST_BUF_SIZE		192
#define CCP_ECC_OPERAND_SIZE		64
#define CCP_ECC_OUTPUT_SIZE		64
#define CCP_ECC_RESULT_OFFSET		60
#define CCP_ECC_RESULT_SUCCESS		0x0001

/* Byte equivalent of CCP_SB_BITS (256 / 8) */
#define CCP_SB_BYTES			32
148
/* Forward declarations for types referenced before (or outside) their
 * definition in this header.
 */
struct ccp_op;
struct ccp_device;
struct ccp_cmd;
152
Gary R Hook58ea8ab2016-04-18 09:21:44 -0500153struct ccp_dma_cmd {
154 struct list_head entry;
155
156 struct ccp_cmd ccp_cmd;
157};
158
159struct ccp_dma_desc {
160 struct list_head entry;
161
162 struct ccp_device *ccp;
163
164 struct list_head pending;
165 struct list_head active;
166
167 enum dma_status status;
168 struct dma_async_tx_descriptor tx_desc;
169 size_t len;
170};
171
172struct ccp_dma_chan {
173 struct ccp_device *ccp;
174
175 spinlock_t lock;
176 struct list_head pending;
177 struct list_head active;
178 struct list_head complete;
179
180 struct tasklet_struct cleanup_tasklet;
181
182 enum dma_status status;
183 struct dma_chan dma_chan;
184};
185
Tom Lendacky63b94502013-11-12 11:46:16 -0600186struct ccp_cmd_queue {
187 struct ccp_device *ccp;
188
189 /* Queue identifier */
190 u32 id;
191
192 /* Queue dma pool */
193 struct dma_pool *dma_pool;
194
Gary R Hook956ee212016-07-26 19:09:40 -0500195 /* Per-queue reserved storage block(s) */
196 u32 sb_key;
197 u32 sb_ctx;
Tom Lendacky63b94502013-11-12 11:46:16 -0600198
199 /* Queue processing thread */
200 struct task_struct *kthread;
201 unsigned int active;
202 unsigned int suspended;
203
204 /* Number of free command slots available */
205 unsigned int free_slots;
206
207 /* Interrupt masks */
208 u32 int_ok;
209 u32 int_err;
210
211 /* Register addresses for queue */
212 void __iomem *reg_status;
213 void __iomem *reg_int_status;
214
215 /* Status values from job */
216 u32 int_status;
217 u32 q_status;
218 u32 q_int_status;
219 u32 cmd_error;
220
221 /* Interrupt wait queue */
222 wait_queue_head_t int_queue;
223 unsigned int int_rcvd;
224} ____cacheline_aligned;
225
226struct ccp_device {
Gary R Hook553d2372016-03-01 13:49:04 -0600227 struct list_head entry;
228
Gary R Hookc7019c42016-03-01 13:49:15 -0600229 struct ccp_vdata *vdata;
Gary R Hook553d2372016-03-01 13:49:04 -0600230 unsigned int ord;
231 char name[MAX_CCP_NAME_LEN];
232 char rngname[MAX_CCP_NAME_LEN];
233
Tom Lendacky63b94502013-11-12 11:46:16 -0600234 struct device *dev;
235
Gary R Hookfa242e82016-07-26 18:09:46 -0500236 /* Bus specific device information
Tom Lendacky63b94502013-11-12 11:46:16 -0600237 */
238 void *dev_specific;
239 int (*get_irq)(struct ccp_device *ccp);
240 void (*free_irq)(struct ccp_device *ccp);
Tom Lendacky3d775652014-06-05 10:17:45 -0500241 unsigned int irq;
Tom Lendacky63b94502013-11-12 11:46:16 -0600242
Gary R Hookfa242e82016-07-26 18:09:46 -0500243 /* I/O area used for device communication. The register mapping
Tom Lendacky63b94502013-11-12 11:46:16 -0600244 * starts at an offset into the mapped bar.
245 * The CMD_REQx registers and the Delete_Cmd_Queue_Job register
246 * need to be protected while a command queue thread is accessing
247 * them.
248 */
249 struct mutex req_mutex ____cacheline_aligned;
250 void __iomem *io_map;
251 void __iomem *io_regs;
252
Gary R Hookfa242e82016-07-26 18:09:46 -0500253 /* Master lists that all cmds are queued on. Because there can be
Tom Lendacky63b94502013-11-12 11:46:16 -0600254 * more than one CCP command queue that can process a cmd a separate
255 * backlog list is neeeded so that the backlog completion call
256 * completes before the cmd is available for execution.
257 */
258 spinlock_t cmd_lock ____cacheline_aligned;
259 unsigned int cmd_count;
260 struct list_head cmd;
261 struct list_head backlog;
262
Gary R Hookfa242e82016-07-26 18:09:46 -0500263 /* The command queues. These represent the queues available on the
Tom Lendacky63b94502013-11-12 11:46:16 -0600264 * CCP that are available for processing cmds
265 */
266 struct ccp_cmd_queue cmd_q[MAX_HW_QUEUES];
267 unsigned int cmd_q_count;
268
Gary R Hookfa242e82016-07-26 18:09:46 -0500269 /* Support for the CCP True RNG
Tom Lendacky63b94502013-11-12 11:46:16 -0600270 */
271 struct hwrng hwrng;
272 unsigned int hwrng_retries;
273
Gary R Hookfa242e82016-07-26 18:09:46 -0500274 /* Support for the CCP DMA capabilities
Gary R Hook58ea8ab2016-04-18 09:21:44 -0500275 */
276 struct dma_device dma_dev;
277 struct ccp_dma_chan *ccp_dma_chan;
278 struct kmem_cache *dma_cmd_cache;
279 struct kmem_cache *dma_desc_cache;
280
Gary R Hookfa242e82016-07-26 18:09:46 -0500281 /* A counter used to generate job-ids for cmds submitted to the CCP
Tom Lendacky63b94502013-11-12 11:46:16 -0600282 */
283 atomic_t current_id ____cacheline_aligned;
284
Gary R Hook58a690b2016-07-26 19:09:50 -0500285 /* The v3 CCP uses key storage blocks (SB) to maintain context for
286 * certain operations. To prevent multiple cmds from using the same
287 * SB range a command queue reserves an SB range for the duration of
288 * the cmd. Each queue, will however, reserve 2 SB blocks for
289 * operations that only require single SB entries (eg. AES context/iv
290 * and key) in order to avoid allocation contention. This will reserve
291 * at most 10 SB entries, leaving 40 SB entries available for dynamic
292 * allocation.
293 *
294 * The v5 CCP Local Storage Block (LSB) is broken up into 8
295 * memrory ranges, each of which can be enabled for access by one
296 * or more queues. Device initialization takes this into account,
297 * and attempts to assign one region for exclusive use by each
298 * available queue; the rest are then aggregated as "public" use.
299 * If there are fewer regions than queues, all regions are shared
300 * amongst all queues.
Tom Lendacky63b94502013-11-12 11:46:16 -0600301 */
Gary R Hook956ee212016-07-26 19:09:40 -0500302 struct mutex sb_mutex ____cacheline_aligned;
303 DECLARE_BITMAP(sb, KSB_COUNT);
304 wait_queue_head_t sb_queue;
305 unsigned int sb_avail;
306 unsigned int sb_count;
307 u32 sb_start;
Tom Lendacky63b94502013-11-12 11:46:16 -0600308
309 /* Suspend support */
310 unsigned int suspending;
311 wait_queue_head_t suspend_queue;
Tom Lendacky126ae9a2014-07-10 10:58:35 -0500312
313 /* DMA caching attribute support */
314 unsigned int axcache;
Tom Lendacky63b94502013-11-12 11:46:16 -0600315};
316
/* Memory type selector stored in struct ccp_mem.type.
 * Values are sequential from 0; CCP_MEMTYPE__LAST is the terminating
 * entry.
 */
enum ccp_memtype {
	CCP_MEMTYPE_SYSTEM = 0,
	CCP_MEMTYPE_SB,
	CCP_MEMTYPE_LOCAL,
	CCP_MEMTYPE__LAST,
};
323
324struct ccp_dma_info {
325 dma_addr_t address;
326 unsigned int offset;
327 unsigned int length;
328 enum dma_data_direction dir;
329};
330
331struct ccp_dm_workarea {
332 struct device *dev;
333 struct dma_pool *dma_pool;
334 unsigned int length;
335
336 u8 *address;
337 struct ccp_dma_info dma;
338};
339
340struct ccp_sg_workarea {
341 struct scatterlist *sg;
342 int nents;
343
344 struct scatterlist *dma_sg;
345 struct device *dma_dev;
346 unsigned int dma_count;
347 enum dma_data_direction dma_dir;
348
349 unsigned int sg_used;
350
351 u64 bytes_left;
352};
353
354struct ccp_data {
355 struct ccp_sg_workarea sg_wa;
356 struct ccp_dm_workarea dm_wa;
357};
358
359struct ccp_mem {
360 enum ccp_memtype type;
361 union {
362 struct ccp_dma_info dma;
Gary R Hook956ee212016-07-26 19:09:40 -0500363 u32 sb;
Gary R Hookea0375a2016-03-01 13:49:25 -0600364 } u;
365};
366
367struct ccp_aes_op {
368 enum ccp_aes_type type;
369 enum ccp_aes_mode mode;
370 enum ccp_aes_action action;
371};
372
373struct ccp_xts_aes_op {
374 enum ccp_aes_action action;
375 enum ccp_xts_aes_unit_size unit_size;
376};
377
378struct ccp_sha_op {
379 enum ccp_sha_type type;
380 u64 msg_bits;
381};
382
383struct ccp_rsa_op {
384 u32 mod_size;
385 u32 input_len;
386};
387
388struct ccp_passthru_op {
389 enum ccp_passthru_bitwise bit_mod;
390 enum ccp_passthru_byteswap byte_swap;
391};
392
393struct ccp_ecc_op {
394 enum ccp_ecc_function function;
395};
396
397struct ccp_op {
398 struct ccp_cmd_queue *cmd_q;
399
400 u32 jobid;
401 u32 ioc;
402 u32 soc;
Gary R Hook956ee212016-07-26 19:09:40 -0500403 u32 sb_key;
404 u32 sb_ctx;
Gary R Hookea0375a2016-03-01 13:49:25 -0600405 u32 init;
406 u32 eom;
407
408 struct ccp_mem src;
409 struct ccp_mem dst;
410
411 union {
412 struct ccp_aes_op aes;
413 struct ccp_xts_aes_op xts;
414 struct ccp_sha_op sha;
415 struct ccp_rsa_op rsa;
416 struct ccp_passthru_op passthru;
417 struct ccp_ecc_op ecc;
418 } u;
419};
420
421static inline u32 ccp_addr_lo(struct ccp_dma_info *info)
422{
423 return lower_32_bits(info->address + info->offset);
424}
425
426static inline u32 ccp_addr_hi(struct ccp_dma_info *info)
427{
428 return upper_32_bits(info->address + info->offset) & 0x0000ffff;
429}
430
/* PCI bus glue entry points (defined outside this header) */
int ccp_pci_init(void);
void ccp_pci_exit(void);

/* Platform bus glue entry points (defined outside this header) */
int ccp_platform_init(void);
void ccp_platform_exit(void);
436
/* Device registration (defined outside this header) */
void ccp_add_device(struct ccp_device *ccp);
void ccp_del_device(struct ccp_device *ccp);

/* Device allocation, suspend query and the queue thread entry point */
struct ccp_device *ccp_alloc_struct(struct device *dev);
bool ccp_queues_suspended(struct ccp_device *ccp);
int ccp_cmd_queue_thread(void *data);

/* Run one cmd on the given command queue */
int ccp_run_cmd(struct ccp_cmd_queue *cmd_q, struct ccp_cmd *cmd);
445
/* dmaengine registration for a CCP device (defined outside this header) */
int ccp_dmaengine_register(struct ccp_device *ccp);
void ccp_dmaengine_unregister(struct ccp_device *ccp);
448
Gary R Hook58a690b2016-07-26 19:09:50 -0500449/* Structure for computation functions that are device-specific */
450struct ccp_actions {
451 int (*aes)(struct ccp_op *);
452 int (*xts_aes)(struct ccp_op *);
453 int (*sha)(struct ccp_op *);
454 int (*rsa)(struct ccp_op *);
455 int (*passthru)(struct ccp_op *);
456 int (*ecc)(struct ccp_op *);
457 u32 (*sballoc)(struct ccp_cmd_queue *, unsigned int);
458 void (*sbfree)(struct ccp_cmd_queue *, unsigned int,
459 unsigned int);
460 int (*init)(struct ccp_device *);
461 void (*destroy)(struct ccp_device *);
462 irqreturn_t (*irqhandler)(int, void *);
463};
464
/* Structure to hold CCP version-specific values: a version number, an
 * init hook, the table of device-specific actions, and the bar/offset
 * pair.
 * NOTE(review): bar/offset presumably locate the register block within
 * the mapped BAR (see io_map/io_regs in struct ccp_device) - confirm.
 */
struct ccp_vdata {
	unsigned int version;
	int (*init)(struct ccp_device *);
	const struct ccp_actions *perform;
	const unsigned int bar;
	const unsigned int offset;
};
473
/* Version data instance named ccpv3; defined outside this header */
extern struct ccp_vdata ccpv3;
475
Tom Lendacky63b94502013-11-12 11:46:16 -0600476#endif