/****************************************************************************** * function: * qat_engine_init(ENGINE *e) * * @param e [IN] - OpenSSL engine pointer * * description: * Qat engine init function, associated with Crypto memory setup * and cpaStartInstance setups. ******************************************************************************/ static int qat_engine_init(ENGINE *e) { int instNum, err, checkLimitStatus; CpaStatus status = CPA_STATUS_SUCCESS; CpaBoolean limitDevAccess = CPA_FALSE; pthread_mutex_lock(&qat_engine_mutex); if(engine_inited) { pthread_mutex_unlock(&qat_engine_mutex); return 1; } DEBUG("[%s] ---- Engine Initing\n\n", __func__); CRYPTO_INIT_QAT_LOG(); if ((err = pthread_key_create(&qatInstanceForThread, NULL)) != 0) { fprintf(stderr, "pthread_key_create: %s\n", strerror(err)); pthread_mutex_unlock(&qat_engine_mutex); return 0; } checkLimitStatus = checkLimitDevAccessValue((int *)&limitDevAccess, ICPConfigSectionName_libcrypto); if (!checkLimitStatus) { WARN("Assuming LimitDevAccess = 0\n"); } /* Initialise the QAT hardware */ if (CPA_STATUS_SUCCESS != icp_sal_userStartMultiProcess(ICPConfigSectionName_libcrypto, limitDevAccess)) { WARN("icp_sal_userStart failed\n"); pthread_mutex_unlock(&qat_engine_mutex); return 0; } /* Get the number of available instances */ status = cpaCyGetNumInstances(&numInstances); if (CPA_STATUS_SUCCESS != status) { WARN("cpaCyGetNumInstances failed, status=%d\n", status); pthread_mutex_unlock(&qat_engine_mutex); qat_engine_finish(e); return 0; } if (!numInstances) { WARN("No crypto instances found\n"); pthread_mutex_unlock(&qat_engine_mutex); qat_engine_finish(e); return 0; } DEBUG("%s: %d Cy instances got\n", __func__, numInstances); /* Allocate memory for the instance handle array */ qatInstanceHandles = (CpaInstanceHandle *) OPENSSL_zalloc(((int)numInstances) * sizeof(CpaInstanceHandle)); if (NULL == qatInstanceHandles) { WARN("OPENSSL_zalloc() failed for instance handles.\n"); pthread_mutex_unlock(&qat_engine_mutex); qat_engine_finish(e); return 0; } /* Get the Cy instances */ status = cpaCyGetInstances(numInstances, qatInstanceHandles); if (CPA_STATUS_SUCCESS != status) { WARN("cpaCyGetInstances failed, status=%d\n", status); pthread_mutex_unlock(&qat_engine_mutex); qat_engine_finish(e); return 0; } if (0 == enable_external_polling) { if (qat_is_event_driven()) { CpaStatus status; int flags; int engine_fd; icp_polling_threads = (pthread_t *) OPENSSL_zalloc(sizeof(pthread_t)); /* Add the file descriptor to an epoll event list */ internal_efd = epoll_create1(0); if (-1 == internal_efd) { WARN("Error creating epoll fd\n"); pthread_mutex_unlock(&qat_engine_mutex); qat_engine_finish(e); return 0; } for (instNum = 0; instNum < numInstances; instNum++) { /* Get the file descriptor for the instance */ status = icp_sal_CyGetFileDescriptor(qatInstanceHandles[instNum], &engine_fd); if (CPA_STATUS_FAIL == status) { WARN("Error getting file descriptor for instance\n"); pthread_mutex_unlock(&qat_engine_mutex); qat_engine_finish(e); return 0; } /* Make the file descriptor non-blocking */ eng_poll_st[instNum].eng_fd = engine_fd; eng_poll_st[instNum].inst_index = instNum; flags = fcntl(engine_fd, F_GETFL, 0); fcntl(engine_fd, F_SETFL, flags | O_NONBLOCK); eng_epoll_events[instNum].data.ptr = &eng_poll_st[instNum]; eng_epoll_events[instNum].events = EPOLLIN | EPOLLET; if (-1 == epoll_ctl(internal_efd, EPOLL_CTL_ADD, engine_fd, &eng_epoll_events[instNum])) { WARN("Error adding fd to epoll\n"); pthread_mutex_unlock(&qat_engine_mutex); qat_engine_finish(e); return 0; } } } else { icp_polling_threads = (pthread_t *) OPENSSL_zalloc(((int)numInstances) * sizeof(pthread_t)); } if (NULL == icp_polling_threads) { WARN("OPENSSL_malloc() failed for icp_polling_threads.\n"); pthread_mutex_unlock(&qat_engine_mutex); qat_engine_finish(e); return 0; } } /* Set translation function and start each instance */ for (instNum = 0; instNum < numInstances; instNum++) { /* Set the address translation function */ status = cpaCySetAddressTranslation(qatInstanceHandles[instNum], virtualToPhysical); if (CPA_STATUS_SUCCESS != status) { WARN("cpaCySetAddressTranslation failed, status=%d\n", status); pthread_mutex_unlock(&qat_engine_mutex); qat_engine_finish(e); return 0; } /* Start the instances */ status = cpaCyStartInstance(qatInstanceHandles[instNum]); if (CPA_STATUS_SUCCESS != status) { WARN("cpaCyStartInstance failed, status=%d\n", status); pthread_mutex_unlock(&qat_engine_mutex); qat_engine_finish(e); return 0; } if (0 == enable_external_polling && !qat_is_event_driven()) { /* Create the polling threads */ if (qat_create_thread(&icp_polling_threads[instNum], NULL, sendPoll_ns, qatInstanceHandles[instNum])) { WARN("Polling thread create failed\n"); instance_started[instNum] = 1; pthread_mutex_unlock(&qat_engine_mutex); qat_engine_finish(e); return 0; } if (qat_adjust_thread_affinity(icp_polling_threads[instNum]) == 0) { instance_started[instNum] = 1; pthread_mutex_unlock(&qat_engine_mutex); qat_engine_finish(e); return 0; } } instance_started[instNum] = 1; } if (0 == enable_external_polling && qat_is_event_driven()) { if (qat_create_thread(&icp_polling_threads[0], NULL, eventPoll_ns, NULL)) { WARN("Epoll thread create failed\n"); pthread_mutex_unlock(&qat_engine_mutex); qat_engine_finish(e); return 0; } if (qat_adjust_thread_affinity(icp_polling_threads[0]) == 0) { pthread_mutex_unlock(&qat_engine_mutex); qat_engine_finish(e); return 0; } } /* Reset currInst */ currInst = 0; engine_inited = 1; pthread_mutex_unlock(&qat_engine_mutex); return 1; }
/** ***************************************************************************** * @ingroup dsaPerformance * dsaPerformance * * @description * This function is called by the framework to execute the dsaPerform * thread * *****************************************************************************/ void dsaPerformance(single_thread_test_data_t* testSetup) { dsa_test_params_t dsaSetup; Cpa16U numInstances = 0; CpaInstanceHandle *cyInstances = NULL; CpaStatus status = CPA_STATUS_FAIL; dsa_test_params_t* params = (dsa_test_params_t*)testSetup->setupPtr; CpaInstanceInfo2 instanceInfo = {0}; /*this barrier is to halt this thread when run in user space context, the * startThreads function releases this barrier, in kernel space it does * nothing, but kernel space threads do not start until we call startThreads * anyway */ startBarrier(); /*give our thread a unique memory location to store performance stats */ dsaSetup.threadID = testSetup->threadID; dsaSetup.performanceStats = testSetup->performanceStats; dsaSetup.hashAlg= params->hashAlg; dsaSetup.pLenInBytes= params->pLenInBytes; dsaSetup.qLenInBytes= params->qLenInBytes; dsaSetup.numBuffers = params->numBuffers; dsaSetup.numLoops = params->numLoops; dsaSetup.syncMode = params->syncMode; /*get the instance handles so that we can start our thread on the selected * instance */ status = cpaCyGetNumInstances(&numInstances); if(CPA_STATUS_SUCCESS != status || numInstances == 0) { PRINT_ERR("Could not get any instances\n"); PRINT_ERR("DSA Thread FAILED\n"); dsaSetup.performanceStats->threadReturnStatus = CPA_STATUS_FAIL; sampleCodeThreadExit(); } cyInstances = qaeMemAlloc(sizeof(CpaInstanceHandle) * numInstances); if(NULL == cyInstances) { PRINT_ERR("Could not allocate memory for logical instances\n"); dsaSetup.performanceStats->threadReturnStatus = CPA_STATUS_FAIL; sampleCodeThreadExit(); } cpaCyGetInstances(numInstances, cyInstances); /* give our thread a logical crypto instance to use * use % to wrap around the max number of instances */ dsaSetup.cyInstanceHandle = cyInstances[(testSetup->logicalQaInstance)%numInstances]; status = cpaCyInstanceGetInfo2(dsaSetup.cyInstanceHandle, &instanceInfo); if(CPA_STATUS_SUCCESS != status) { PRINT_ERR("%s::%d cpaCyInstanceGetInfo2 failed", __func__,__LINE__); qaeMemFree((void**)&cyInstances); dsaSetup.performanceStats->threadReturnStatus = CPA_STATUS_FAIL; sampleCodeThreadExit(); } if(instanceInfo.physInstId.packageId > packageIdCount_g) { packageIdCount_g = instanceInfo.physInstId.packageId; } /*launch function that does all the work */ status = dsaPerform(&dsaSetup); if(CPA_STATUS_SUCCESS != status) { PRINT("DSA Thread %u FAILED\n", testSetup->threadID); dsaSetup.performanceStats->threadReturnStatus = CPA_STATUS_FAIL; } else { /*set the print function that can be used to print stats at the end of * the test */ testSetup->statsPrintFunc=(stats_print_func_t)dsaPrintStats; } qaeMemFree((void**)&cyInstances); sampleCodeThreadExit(); }
/***************************************************************************** *@ingroup cryptoThreads * * @description * This function sets up an IKE-RSA thread ******************************************************************************/ void ikeRsaPerformance(single_thread_test_data_t* testSetup) { asym_test_params_t ikeRsaSetup; asym_test_params_t* setup = (asym_test_params_t*)testSetup->setupPtr; Cpa16U numInstances = 0; CpaInstanceHandle *cyInstances = NULL; CpaStatus status = CPA_STATUS_FAIL; /* This barrier is to halt this thread when run in user space context, the * startThreads function releases this barrier, in kernel space it does * nothing, but kernel space threads do not start until we call startThreads * anyway*/ startBarrier(); /*give our thread a unique memory location to store performance stats*/ ikeRsaSetup.performanceStats = testSetup->performanceStats; /*get the instance handles so that we can start our thread on the selected * instance*/ status = cpaCyGetNumInstances(&numInstances); if( CPA_STATUS_SUCCESS != status || numInstances == 0) { PRINT_ERR("cpaCyGetNumInstances error, status:%d, numInstanaces:%d\n", status, numInstances); ikeRsaSetup.performanceStats->threadReturnStatus = CPA_STATUS_FAIL; sampleCodeThreadExit(); } cyInstances = qaeMemAlloc(sizeof(CpaInstanceHandle)*numInstances); if(cyInstances == NULL) { PRINT_ERR("Error allocating memory for instance handles\n"); ikeRsaSetup.performanceStats->threadReturnStatus = CPA_STATUS_FAIL; sampleCodeThreadExit(); } if(cpaCyGetInstances(numInstances, cyInstances) != CPA_STATUS_SUCCESS) { PRINT_ERR("Failed to get instances\n"); ikeRsaSetup.performanceStats->threadReturnStatus = CPA_STATUS_FAIL; qaeMemFree((void**)&cyInstances); sampleCodeThreadExit(); } if(testSetup->logicalQaInstance > numInstances) { PRINT_ERR("%u is Invalid Logical QA Instance, max is: %u\n", testSetup->logicalQaInstance, numInstances); ikeRsaSetup.performanceStats->threadReturnStatus = CPA_STATUS_FAIL; qaeMemFree((void**)&cyInstances); sampleCodeThreadExit(); } /* give our thread a logical crypto instance to use * use % to wrap around the max number of instances*/ ikeRsaSetup.cyInstanceHandle = cyInstances[testSetup->logicalQaInstance]; ikeRsaSetup.modulusSizeInBytes = setup->modulusSizeInBytes; ikeRsaSetup.exponentSizeInBytes = setup->exponentSizeInBytes; ikeRsaSetup.numBuffers = setup->numBuffers; ikeRsaSetup.numLoops = setup->numLoops; ikeRsaSetup.rsaKeyRepType = setup->rsaKeyRepType; ikeRsaSetup.syncMode = ASYNC; /*launch function that does all the work*/ status = ikeRsaPerform(&ikeRsaSetup); if(CPA_STATUS_SUCCESS != status) { PRINT("ikeRsa Thread FAILED with status: %d\n", status); ikeRsaSetup.performanceStats->threadReturnStatus = CPA_STATUS_FAIL; } else { /*set the print function that can be used to print stats at the end of * the test*/ testSetup->statsPrintFunc=(stats_print_func_t)ikeRsaPrintStats; } qaeMemFree((void**)&cyInstances); sampleCodeThreadExit(); }
int qat_engine_init(ENGINE *e) { int instNum, err; CpaStatus status = CPA_STATUS_SUCCESS; CpaBoolean limitDevAccess = CPA_FALSE; int ret_pthread_sigmask; pthread_mutex_lock(&qat_engine_mutex); if(engine_inited) { pthread_mutex_unlock(&qat_engine_mutex); return 1; } DEBUG("QAT Engine initialization:\n"); DEBUG("- External polling: %s\n", enable_external_polling ? "ON": "OFF"); DEBUG("- Inline polling: %s\n", enable_inline_polling ? "ON": "OFF"); DEBUG("- Internal poll interval: %dns\n", qat_poll_interval); DEBUG("- Epoll timeout: %dms\n", qat_epoll_timeout); DEBUG("- Event driven polling mode: %s\n", enable_event_driven_polling ? "ON": "OFF"); DEBUG("- Instance for thread: %s\n", enable_instance_for_thread ? "ON": "OFF"); DEBUG("- Max retry count: %d\n", qat_max_retry_count); CRYPTO_INIT_QAT_LOG(); polling_thread = pthread_self(); if ((err = pthread_key_create(&qatInstanceForThread, NULL)) != 0) { WARN("pthread_key_create failed: %s\n", strerror(err)); QATerr(QAT_F_QAT_ENGINE_INIT, QAT_R_PTHREAD_CREATE_FAILURE); pthread_mutex_unlock(&qat_engine_mutex); return 0; } #ifndef OPENSSL_ENABLE_QAT_UPSTREAM_DRIVER /* limitDevAccess is passed as an input to icp_sal_userStartMultiProcess(). * However, in upstream driver the value is ignored and read directly from * the configuration file -> No need to parse the file here. */ if (!checkLimitDevAccessValue((int *)&limitDevAccess, ICPConfigSectionName_libcrypto)) { WARN("Could not load driver config file. Assuming LimitDevAccess = 0\n"); } #endif /* Initialise the QAT hardware */ if (CPA_STATUS_SUCCESS != icp_sal_userStartMultiProcess(ICPConfigSectionName_libcrypto, limitDevAccess)) { WARN("icp_sal_userStart failed\n"); QATerr(QAT_F_QAT_ENGINE_INIT, QAT_R_ICP_SAL_USERSTART_FAIL); pthread_mutex_unlock(&qat_engine_mutex); return 0; } /* Get the number of available instances */ status = cpaCyGetNumInstances(&qat_num_instances); if (CPA_STATUS_SUCCESS != status) { WARN("cpaCyGetNumInstances failed, status=%d\n", status); QATerr(QAT_F_QAT_ENGINE_INIT, QAT_R_GET_NUM_INSTANCE_FAILURE); pthread_mutex_unlock(&qat_engine_mutex); qat_engine_finish(e); return 0; } if (!qat_num_instances) { WARN("No crypto instances found\n"); QATerr(QAT_F_QAT_ENGINE_INIT, QAT_R_INSTANCE_UNAVAILABLE); pthread_mutex_unlock(&qat_engine_mutex); qat_engine_finish(e); return 0; } DEBUG("Found %d Cy instances\n", qat_num_instances); /* Allocate memory for the instance handle array */ qat_instance_handles = (CpaInstanceHandle *) OPENSSL_zalloc(((int)qat_num_instances) * sizeof(CpaInstanceHandle)); if (NULL == qat_instance_handles) { WARN("OPENSSL_zalloc() failed for instance handles.\n"); QATerr(QAT_F_QAT_ENGINE_INIT, QAT_R_INSTANCE_HANDLE_MALLOC_FAILURE); pthread_mutex_unlock(&qat_engine_mutex); qat_engine_finish(e); return 0; } /* Get the Cy instances */ status = cpaCyGetInstances(qat_num_instances, qat_instance_handles); if (CPA_STATUS_SUCCESS != status) { WARN("cpaCyGetInstances failed, status=%d\n", status); QATerr(QAT_F_QAT_ENGINE_INIT, QAT_R_GET_INSTANCE_FAILURE); pthread_mutex_unlock(&qat_engine_mutex); qat_engine_finish(e); return 0; } if (!enable_external_polling && !enable_inline_polling) { if (qat_is_event_driven()) { CpaStatus status; int flags; int engine_fd; /* Add the file descriptor to an epoll event list */ internal_efd = epoll_create1(0); if (-1 == internal_efd) { WARN("Error creating epoll fd\n"); QATerr(QAT_F_QAT_ENGINE_INIT, QAT_R_EPOLL_CREATE_FAILURE); pthread_mutex_unlock(&qat_engine_mutex); qat_engine_finish(e); return 0; } for (instNum = 0; instNum < qat_num_instances; instNum++) { /* Get the file descriptor for the instance */ status = icp_sal_CyGetFileDescriptor(qat_instance_handles[instNum], &engine_fd); if (CPA_STATUS_FAIL == status) { WARN("Error getting file descriptor for instance\n"); QATerr(QAT_F_QAT_ENGINE_INIT, QAT_R_GET_FILE_DESCRIPTOR_FAILURE); pthread_mutex_unlock(&qat_engine_mutex); qat_engine_finish(e); return 0; } /* Make the file descriptor non-blocking */ eng_poll_st[instNum].eng_fd = engine_fd; eng_poll_st[instNum].inst_index = instNum; flags = fcntl(engine_fd, F_GETFL, 0); fcntl(engine_fd, F_SETFL, flags | O_NONBLOCK); eng_epoll_events[instNum].data.ptr = &eng_poll_st[instNum]; eng_epoll_events[instNum].events = EPOLLIN | EPOLLET; if (-1 == epoll_ctl(internal_efd, EPOLL_CTL_ADD, engine_fd, &eng_epoll_events[instNum])) { WARN("Error adding fd to epoll\n"); QATerr(QAT_F_QAT_ENGINE_INIT, QAT_R_EPOLL_CTL_FAILURE); pthread_mutex_unlock(&qat_engine_mutex); qat_engine_finish(e); return 0; } } } } /* Set translation function and start each instance */ for (instNum = 0; instNum < qat_num_instances; instNum++) { /* Set the address translation function */ status = cpaCySetAddressTranslation(qat_instance_handles[instNum], virtualToPhysical); if (CPA_STATUS_SUCCESS != status) { WARN("cpaCySetAddressTranslation failed, status=%d\n", status); QATerr(QAT_F_QAT_ENGINE_INIT, QAT_R_SET_ADDRESS_TRANSLATION_FAILURE); pthread_mutex_unlock(&qat_engine_mutex); qat_engine_finish(e); return 0; } /* Start the instances */ status = cpaCyStartInstance(qat_instance_handles[instNum]); if (CPA_STATUS_SUCCESS != status) { WARN("cpaCyStartInstance failed, status=%d\n", status); QATerr(QAT_F_QAT_ENGINE_INIT, QAT_R_START_INSTANCE_FAILURE); pthread_mutex_unlock(&qat_engine_mutex); qat_engine_finish(e); return 0; } instance_started[instNum] = 1; } if (!enable_external_polling && !enable_inline_polling) { if (!qat_is_event_driven()) { sigemptyset(&set); sigaddset(&set, SIGUSR1); ret_pthread_sigmask = pthread_sigmask(SIG_BLOCK, &set, NULL); if (ret_pthread_sigmask != 0) { WARN("pthread_sigmask error\n"); QATerr(QAT_F_QAT_ENGINE_INIT, QAT_R_POLLING_THREAD_SIGMASK_FAILURE); pthread_mutex_unlock(&qat_engine_mutex); qat_engine_finish(e); return 0; } } if (qat_create_thread(&polling_thread, NULL, qat_is_event_driven() ? event_poll_func : timer_poll_func, NULL)) { WARN("Creation of polling thread failed\n"); QATerr(QAT_F_QAT_ENGINE_INIT, QAT_R_POLLING_THREAD_CREATE_FAILURE); polling_thread = pthread_self(); pthread_mutex_unlock(&qat_engine_mutex); qat_engine_finish(e); return 0; } if (qat_adjust_thread_affinity(polling_thread) == 0) { WARN("Setting polling thread affinity failed\n"); QATerr(QAT_F_QAT_ENGINE_INIT, QAT_R_SET_POLLING_THREAD_AFFINITY_FAILURE); pthread_mutex_unlock(&qat_engine_mutex); qat_engine_finish(e); return 0; } if (!qat_is_event_driven()) { while (!cleared_to_start) sleep(1); } } /* Reset curr_inst */ curr_inst = 0; engine_inited = 1; pthread_mutex_unlock(&qat_engine_mutex); return 1; }