b244682e38
Signed-off-by: Felix Fietkau <nbd@openwrt.org> SVN-Revision: 37769
515 lines
13 KiB
C
515 lines
13 KiB
C
/*
|
|
* A loadable module that benchmarks the OCF crypto speed from kernel space.
|
|
*
|
|
* Copyright (C) 2004-2010 David McCullough <david_mccullough@mcafee.com>
|
|
*
|
|
* LICENSE TERMS
|
|
*
|
|
* The free distribution and use of this software in both source and binary
|
|
* form is allowed (with or without changes) provided that:
|
|
*
|
|
* 1. distributions of this source code include the above copyright
|
|
* notice, this list of conditions and the following disclaimer;
|
|
*
|
|
* 2. distributions in binary form include the above copyright
|
|
* notice, this list of conditions and the following disclaimer
|
|
* in the documentation and/or other associated materials;
|
|
*
|
|
* 3. the copyright holder's name is not used to endorse products
|
|
* built using this software without specific written permission.
|
|
*
|
|
* ALTERNATIVELY, provided that this notice is retained in full, this product
|
|
* may be distributed under the terms of the GNU General Public License (GPL),
|
|
* in which case the provisions of the GPL apply INSTEAD OF those given above.
|
|
*
|
|
* DISCLAIMER
|
|
*
|
|
* This software is provided 'as is' with no explicit or implied warranties
|
|
* in respect of its properties, including, but not limited to, correctness
|
|
* and/or fitness for purpose.
|
|
*/
|
|
|
|
|
|
#include <linux/version.h>
|
|
#if LINUX_VERSION_CODE < KERNEL_VERSION(2,6,38) && !defined(AUTOCONF_INCLUDED)
|
|
#include <linux/config.h>
|
|
#endif
|
|
#include <linux/module.h>
|
|
#include <linux/init.h>
|
|
#include <linux/list.h>
|
|
#include <linux/slab.h>
|
|
#include <linux/wait.h>
|
|
#include <linux/sched.h>
|
|
#include <linux/spinlock.h>
|
|
#include <linux/interrupt.h>
|
|
#include <cryptodev.h>
|
|
|
|
#ifdef I_HAVE_AN_XSCALE_WITH_INTEL_SDK
|
|
#define BENCH_IXP_ACCESS_LIB 1
|
|
#endif
|
|
#ifdef BENCH_IXP_ACCESS_LIB
|
|
#include <IxTypes.h>
|
|
#include <IxOsBuffMgt.h>
|
|
#include <IxNpeDl.h>
|
|
#include <IxCryptoAcc.h>
|
|
#include <IxQMgr.h>
|
|
#include <IxOsServices.h>
|
|
#include <IxOsCacheMMU.h>
|
|
#endif
|
|
|
|
/*
|
|
* support for access lib version 1.4
|
|
*/
|
|
#ifndef IX_MBUF_PRIV
|
|
#define IX_MBUF_PRIV(x) ((x)->priv)
|
|
#endif
|
|
|
|
/*
|
|
* the number of simultaneously active requests
|
|
*/
|
|
static int request_q_len = 40;
|
|
module_param(request_q_len, int, 0);
|
|
MODULE_PARM_DESC(request_q_len, "Number of outstanding requests");
|
|
|
|
/*
|
|
* how many requests we want to have processed
|
|
*/
|
|
static int request_num = 1024;
|
|
module_param(request_num, int, 0);
|
|
MODULE_PARM_DESC(request_num, "run for at least this many requests");
|
|
|
|
/*
|
|
* the size of each request
|
|
*/
|
|
static int request_size = 1488;
|
|
module_param(request_size, int, 0);
|
|
MODULE_PARM_DESC(request_size, "size of each request");
|
|
|
|
/*
|
|
* OCF batching of requests
|
|
*/
|
|
static int request_batch = 1;
|
|
module_param(request_batch, int, 0);
|
|
MODULE_PARM_DESC(request_batch, "enable OCF request batching");
|
|
|
|
/*
|
|
* OCF immediate callback on completion
|
|
*/
|
|
static int request_cbimm = 1;
|
|
module_param(request_cbimm, int, 0);
|
|
MODULE_PARM_DESC(request_cbimm, "enable OCF immediate callback on completion");
|
|
|
|
/*
|
|
* a structure for each request
|
|
*/
|
|
typedef struct {
|
|
struct work_struct work;
|
|
#ifdef BENCH_IXP_ACCESS_LIB
|
|
IX_MBUF mbuf;
|
|
#endif
|
|
unsigned char *buffer;
|
|
} request_t;
|
|
|
|
static request_t *requests;
|
|
|
|
static spinlock_t ocfbench_counter_lock;
|
|
static int outstanding;
|
|
static int total;
|
|
|
|
/*************************************************************************/
|
|
/*
|
|
* OCF benchmark routines
|
|
*/
|
|
|
|
static uint64_t ocf_cryptoid;
|
|
static unsigned long jstart, jstop;
|
|
|
|
static int ocf_init(void);
|
|
static int ocf_cb(struct cryptop *crp);
|
|
static void ocf_request(void *arg);
|
|
#if LINUX_VERSION_CODE >= KERNEL_VERSION(2,6,20)
|
|
static void ocf_request_wq(struct work_struct *work);
|
|
#endif
|
|
|
|
static int
|
|
ocf_init(void)
|
|
{
|
|
int error;
|
|
struct cryptoini crie, cria;
|
|
struct cryptodesc crda, crde;
|
|
|
|
memset(&crie, 0, sizeof(crie));
|
|
memset(&cria, 0, sizeof(cria));
|
|
memset(&crde, 0, sizeof(crde));
|
|
memset(&crda, 0, sizeof(crda));
|
|
|
|
cria.cri_alg = CRYPTO_SHA1_HMAC;
|
|
cria.cri_klen = 20 * 8;
|
|
cria.cri_key = "0123456789abcdefghij";
|
|
|
|
//crie.cri_alg = CRYPTO_3DES_CBC;
|
|
crie.cri_alg = CRYPTO_AES_CBC;
|
|
crie.cri_klen = 24 * 8;
|
|
crie.cri_key = "0123456789abcdefghijklmn";
|
|
|
|
crie.cri_next = &cria;
|
|
|
|
error = crypto_newsession(&ocf_cryptoid, &crie,
|
|
CRYPTOCAP_F_HARDWARE | CRYPTOCAP_F_SOFTWARE);
|
|
if (error) {
|
|
printk("crypto_newsession failed %d\n", error);
|
|
return -1;
|
|
}
|
|
return 0;
|
|
}
|
|
|
|
static int
|
|
ocf_cb(struct cryptop *crp)
|
|
{
|
|
request_t *r = (request_t *) crp->crp_opaque;
|
|
unsigned long flags;
|
|
|
|
if (crp->crp_etype)
|
|
printk("Error in OCF processing: %d\n", crp->crp_etype);
|
|
crypto_freereq(crp);
|
|
crp = NULL;
|
|
|
|
/* do all requests but take at least 1 second */
|
|
spin_lock_irqsave(&ocfbench_counter_lock, flags);
|
|
total++;
|
|
if (total > request_num && jstart + HZ < jiffies) {
|
|
outstanding--;
|
|
spin_unlock_irqrestore(&ocfbench_counter_lock, flags);
|
|
return 0;
|
|
}
|
|
spin_unlock_irqrestore(&ocfbench_counter_lock, flags);
|
|
|
|
schedule_work(&r->work);
|
|
return 0;
|
|
}
|
|
|
|
|
|
static void
|
|
ocf_request(void *arg)
|
|
{
|
|
request_t *r = arg;
|
|
struct cryptop *crp = crypto_getreq(2);
|
|
struct cryptodesc *crde, *crda;
|
|
unsigned long flags;
|
|
|
|
if (!crp) {
|
|
spin_lock_irqsave(&ocfbench_counter_lock, flags);
|
|
outstanding--;
|
|
spin_unlock_irqrestore(&ocfbench_counter_lock, flags);
|
|
return;
|
|
}
|
|
|
|
crde = crp->crp_desc;
|
|
crda = crde->crd_next;
|
|
|
|
crda->crd_skip = 0;
|
|
crda->crd_flags = 0;
|
|
crda->crd_len = request_size;
|
|
crda->crd_inject = request_size;
|
|
crda->crd_alg = CRYPTO_SHA1_HMAC;
|
|
crda->crd_key = "0123456789abcdefghij";
|
|
crda->crd_klen = 20 * 8;
|
|
|
|
crde->crd_skip = 0;
|
|
crde->crd_flags = CRD_F_IV_EXPLICIT | CRD_F_ENCRYPT;
|
|
crde->crd_len = request_size;
|
|
crde->crd_inject = request_size;
|
|
//crde->crd_alg = CRYPTO_3DES_CBC;
|
|
crde->crd_alg = CRYPTO_AES_CBC;
|
|
crde->crd_key = "0123456789abcdefghijklmn";
|
|
crde->crd_klen = 24 * 8;
|
|
|
|
crp->crp_ilen = request_size + 64;
|
|
crp->crp_flags = 0;
|
|
if (request_batch)
|
|
crp->crp_flags |= CRYPTO_F_BATCH;
|
|
if (request_cbimm)
|
|
crp->crp_flags |= CRYPTO_F_CBIMM;
|
|
crp->crp_buf = (caddr_t) r->buffer;
|
|
crp->crp_callback = ocf_cb;
|
|
crp->crp_sid = ocf_cryptoid;
|
|
crp->crp_opaque = (caddr_t) r;
|
|
crypto_dispatch(crp);
|
|
}
|
|
|
|
#if LINUX_VERSION_CODE >= KERNEL_VERSION(2,6,20)
|
|
static void
|
|
ocf_request_wq(struct work_struct *work)
|
|
{
|
|
request_t *r = container_of(work, request_t, work);
|
|
ocf_request(r);
|
|
}
|
|
#endif
|
|
|
|
static void
|
|
ocf_done(void)
|
|
{
|
|
crypto_freesession(ocf_cryptoid);
|
|
}
|
|
|
|
/*************************************************************************/
|
|
#ifdef BENCH_IXP_ACCESS_LIB
|
|
/*************************************************************************/
|
|
/*
|
|
* CryptoAcc benchmark routines
|
|
*/
|
|
|
|
static IxCryptoAccCtx ixp_ctx;
|
|
static UINT32 ixp_ctx_id;
|
|
static IX_MBUF ixp_pri;
|
|
static IX_MBUF ixp_sec;
|
|
static int ixp_registered = 0;
|
|
|
|
static void ixp_register_cb(UINT32 ctx_id, IX_MBUF *bufp,
|
|
IxCryptoAccStatus status);
|
|
static void ixp_perform_cb(UINT32 ctx_id, IX_MBUF *sbufp, IX_MBUF *dbufp,
|
|
IxCryptoAccStatus status);
|
|
static void ixp_request(void *arg);
|
|
#if LINUX_VERSION_CODE >= KERNEL_VERSION(2,6,20)
|
|
static void ixp_request_wq(struct work_struct *work);
|
|
#endif
|
|
|
|
static int
|
|
ixp_init(void)
|
|
{
|
|
IxCryptoAccStatus status;
|
|
|
|
ixp_ctx.cipherCtx.cipherAlgo = IX_CRYPTO_ACC_CIPHER_3DES;
|
|
ixp_ctx.cipherCtx.cipherMode = IX_CRYPTO_ACC_MODE_CBC;
|
|
ixp_ctx.cipherCtx.cipherKeyLen = 24;
|
|
ixp_ctx.cipherCtx.cipherBlockLen = IX_CRYPTO_ACC_DES_BLOCK_64;
|
|
ixp_ctx.cipherCtx.cipherInitialVectorLen = IX_CRYPTO_ACC_DES_IV_64;
|
|
memcpy(ixp_ctx.cipherCtx.key.cipherKey, "0123456789abcdefghijklmn", 24);
|
|
|
|
ixp_ctx.authCtx.authAlgo = IX_CRYPTO_ACC_AUTH_SHA1;
|
|
ixp_ctx.authCtx.authDigestLen = 12;
|
|
ixp_ctx.authCtx.aadLen = 0;
|
|
ixp_ctx.authCtx.authKeyLen = 20;
|
|
memcpy(ixp_ctx.authCtx.key.authKey, "0123456789abcdefghij", 20);
|
|
|
|
ixp_ctx.useDifferentSrcAndDestMbufs = 0;
|
|
ixp_ctx.operation = IX_CRYPTO_ACC_OP_ENCRYPT_AUTH ;
|
|
|
|
IX_MBUF_MLEN(&ixp_pri) = IX_MBUF_PKT_LEN(&ixp_pri) = 128;
|
|
IX_MBUF_MDATA(&ixp_pri) = (unsigned char *) kmalloc(128, SLAB_ATOMIC);
|
|
IX_MBUF_MLEN(&ixp_sec) = IX_MBUF_PKT_LEN(&ixp_sec) = 128;
|
|
IX_MBUF_MDATA(&ixp_sec) = (unsigned char *) kmalloc(128, SLAB_ATOMIC);
|
|
|
|
status = ixCryptoAccCtxRegister(&ixp_ctx, &ixp_pri, &ixp_sec,
|
|
ixp_register_cb, ixp_perform_cb, &ixp_ctx_id);
|
|
|
|
if (IX_CRYPTO_ACC_STATUS_SUCCESS == status) {
|
|
while (!ixp_registered)
|
|
schedule();
|
|
return ixp_registered < 0 ? -1 : 0;
|
|
}
|
|
|
|
printk("ixp: ixCryptoAccCtxRegister failed %d\n", status);
|
|
return -1;
|
|
}
|
|
|
|
static void
|
|
ixp_register_cb(UINT32 ctx_id, IX_MBUF *bufp, IxCryptoAccStatus status)
|
|
{
|
|
if (bufp) {
|
|
IX_MBUF_MLEN(bufp) = IX_MBUF_PKT_LEN(bufp) = 0;
|
|
kfree(IX_MBUF_MDATA(bufp));
|
|
IX_MBUF_MDATA(bufp) = NULL;
|
|
}
|
|
|
|
if (IX_CRYPTO_ACC_STATUS_WAIT == status)
|
|
return;
|
|
if (IX_CRYPTO_ACC_STATUS_SUCCESS == status)
|
|
ixp_registered = 1;
|
|
else
|
|
ixp_registered = -1;
|
|
}
|
|
|
|
static void
|
|
ixp_perform_cb(
|
|
UINT32 ctx_id,
|
|
IX_MBUF *sbufp,
|
|
IX_MBUF *dbufp,
|
|
IxCryptoAccStatus status)
|
|
{
|
|
request_t *r = NULL;
|
|
unsigned long flags;
|
|
|
|
/* do all requests but take at least 1 second */
|
|
spin_lock_irqsave(&ocfbench_counter_lock, flags);
|
|
total++;
|
|
if (total > request_num && jstart + HZ < jiffies) {
|
|
outstanding--;
|
|
spin_unlock_irqrestore(&ocfbench_counter_lock, flags);
|
|
return;
|
|
}
|
|
|
|
if (!sbufp || !(r = IX_MBUF_PRIV(sbufp))) {
|
|
printk("crappo %p %p\n", sbufp, r);
|
|
outstanding--;
|
|
spin_unlock_irqrestore(&ocfbench_counter_lock, flags);
|
|
return;
|
|
}
|
|
spin_unlock_irqrestore(&ocfbench_counter_lock, flags);
|
|
|
|
schedule_work(&r->work);
|
|
}
|
|
|
|
static void
|
|
ixp_request(void *arg)
|
|
{
|
|
request_t *r = arg;
|
|
IxCryptoAccStatus status;
|
|
unsigned long flags;
|
|
|
|
memset(&r->mbuf, 0, sizeof(r->mbuf));
|
|
IX_MBUF_MLEN(&r->mbuf) = IX_MBUF_PKT_LEN(&r->mbuf) = request_size + 64;
|
|
IX_MBUF_MDATA(&r->mbuf) = r->buffer;
|
|
IX_MBUF_PRIV(&r->mbuf) = r;
|
|
status = ixCryptoAccAuthCryptPerform(ixp_ctx_id, &r->mbuf, NULL,
|
|
0, request_size, 0, request_size, request_size, r->buffer);
|
|
if (IX_CRYPTO_ACC_STATUS_SUCCESS != status) {
|
|
printk("status1 = %d\n", status);
|
|
spin_lock_irqsave(&ocfbench_counter_lock, flags);
|
|
outstanding--;
|
|
spin_unlock_irqrestore(&ocfbench_counter_lock, flags);
|
|
return;
|
|
}
|
|
return;
|
|
}
|
|
|
|
#if LINUX_VERSION_CODE >= KERNEL_VERSION(2,6,20)
|
|
static void
|
|
ixp_request_wq(struct work_struct *work)
|
|
{
|
|
request_t *r = container_of(work, request_t, work);
|
|
ixp_request(r);
|
|
}
|
|
#endif
|
|
|
|
static void
|
|
ixp_done(void)
|
|
{
|
|
/* we should free the session here but I am lazy :-) */
|
|
}
|
|
|
|
/*************************************************************************/
|
|
#endif /* BENCH_IXP_ACCESS_LIB */
|
|
/*************************************************************************/
|
|
|
|
int
|
|
ocfbench_init(void)
|
|
{
|
|
int i;
|
|
unsigned long mbps;
|
|
unsigned long flags;
|
|
|
|
printk("Crypto Speed tests\n");
|
|
|
|
requests = kmalloc(sizeof(request_t) * request_q_len, GFP_KERNEL);
|
|
if (!requests) {
|
|
printk("malloc failed\n");
|
|
return -EINVAL;
|
|
}
|
|
|
|
for (i = 0; i < request_q_len; i++) {
|
|
/* +64 for return data */
|
|
#if LINUX_VERSION_CODE >= KERNEL_VERSION(2,6,20)
|
|
INIT_WORK(&requests[i].work, ocf_request_wq);
|
|
#else
|
|
INIT_WORK(&requests[i].work, ocf_request, &requests[i]);
|
|
#endif
|
|
requests[i].buffer = kmalloc(request_size + 128, GFP_DMA);
|
|
if (!requests[i].buffer) {
|
|
printk("malloc failed\n");
|
|
return -EINVAL;
|
|
}
|
|
memset(requests[i].buffer, '0' + i, request_size + 128);
|
|
}
|
|
|
|
/*
|
|
* OCF benchmark
|
|
*/
|
|
printk("OCF: testing ...\n");
|
|
if (ocf_init() == -1)
|
|
return -EINVAL;
|
|
|
|
spin_lock_init(&ocfbench_counter_lock);
|
|
total = outstanding = 0;
|
|
jstart = jiffies;
|
|
for (i = 0; i < request_q_len; i++) {
|
|
spin_lock_irqsave(&ocfbench_counter_lock, flags);
|
|
outstanding++;
|
|
spin_unlock_irqrestore(&ocfbench_counter_lock, flags);
|
|
ocf_request(&requests[i]);
|
|
}
|
|
while (outstanding > 0)
|
|
schedule();
|
|
jstop = jiffies;
|
|
|
|
mbps = 0;
|
|
if (jstop > jstart) {
|
|
mbps = (unsigned long) total * (unsigned long) request_size * 8;
|
|
mbps /= ((jstop - jstart) * 1000) / HZ;
|
|
}
|
|
printk("OCF: %d requests of %d bytes in %d jiffies (%d.%03d Mbps)\n",
|
|
total, request_size, (int)(jstop - jstart),
|
|
((int)mbps) / 1000, ((int)mbps) % 1000);
|
|
ocf_done();
|
|
|
|
#ifdef BENCH_IXP_ACCESS_LIB
|
|
/*
|
|
* IXP benchmark
|
|
*/
|
|
printk("IXP: testing ...\n");
|
|
ixp_init();
|
|
total = outstanding = 0;
|
|
jstart = jiffies;
|
|
for (i = 0; i < request_q_len; i++) {
|
|
#if LINUX_VERSION_CODE >= KERNEL_VERSION(2,6,20)
|
|
INIT_WORK(&requests[i].work, ixp_request_wq);
|
|
#else
|
|
INIT_WORK(&requests[i].work, ixp_request, &requests[i]);
|
|
#endif
|
|
spin_lock_irqsave(&ocfbench_counter_lock, flags);
|
|
outstanding++;
|
|
spin_unlock_irqrestore(&ocfbench_counter_lock, flags);
|
|
ixp_request(&requests[i]);
|
|
}
|
|
while (outstanding > 0)
|
|
schedule();
|
|
jstop = jiffies;
|
|
|
|
mbps = 0;
|
|
if (jstop > jstart) {
|
|
mbps = (unsigned long) total * (unsigned long) request_size * 8;
|
|
mbps /= ((jstop - jstart) * 1000) / HZ;
|
|
}
|
|
printk("IXP: %d requests of %d bytes in %d jiffies (%d.%03d Mbps)\n",
|
|
total, request_size, jstop - jstart,
|
|
((int)mbps) / 1000, ((int)mbps) % 1000);
|
|
ixp_done();
|
|
#endif /* BENCH_IXP_ACCESS_LIB */
|
|
|
|
for (i = 0; i < request_q_len; i++)
|
|
kfree(requests[i].buffer);
|
|
kfree(requests);
|
|
return -EINVAL; /* always fail to load so it can be re-run quickly ;-) */
|
|
}
|
|
|
|
static void __exit ocfbench_exit(void)
|
|
{
|
|
}
|
|
|
|
module_init(ocfbench_init);
|
|
module_exit(ocfbench_exit);
|
|
|
|
MODULE_LICENSE("Dual BSD/GPL");
|
|
MODULE_AUTHOR("David McCullough <david_mccullough@mcafee.com>");
|
|
MODULE_DESCRIPTION("Benchmark various in-kernel crypto speeds");
|