Example #1
0
int main()
{
    Timer timer;

	cout << "sleeping for 1 second and reporting:\n";
	timer.Start();
	sleep(1);
	timer.Pause();
	cout << "timed %lf secs\n", timer.ElapsedTime();

    timer.Clear();
	cout << "sleeping 2 times for 1 second and reporting:\n";
	timer.Start();
	sleep(1);
	timer.Pause();

	sleep(1);

	timer.Start();
	sleep(1);
	timer.Pause();
	cout << "timed %lf secs\n", timer.ElapsedTime();
	
	return 0;
}
Example #2
0
/* SpMV kernel implemented with Intel MKL */
void mkl_spmv(spx_index_t *rowptr, spx_index_t *colind, spx_value_t *values,
              spx_index_t nrows, spx_index_t ncols, spx_index_t nnz,
              spx_value_t *x, spx_value_t *y,
              spx_value_t ALPHA, spx_value_t BETA)
{
    /* 1. Matrix loading phase */
    MKL_INT *pointerB, *pointerE;
    char    transa;
    char    matdescra[6];

    transa = 'n';
    matdescra[0] = 'g';
    matdescra[1] = '-';
    matdescra[2] = '-';
    matdescra[3] = 'c';

	pointerB = (MKL_INT *) malloc(sizeof(MKL_INT) * nrows);
	pointerE = (MKL_INT *) malloc(sizeof(MKL_INT) * nrows);
    for (int i = 0; i < nrows; i++) {
        pointerB[i] = rowptr[i];
        pointerE[i] = rowptr[i+1];
    }
    
    /* 2. SpMV benchmarking phase */
    vector<double> mt(OUTER_LOOPS);
    for (size_t i = 0; i < OUTER_LOOPS; i++) {
        t.Clear();
        t.Start();
        for (size_t j = 0; j < LOOPS; j++) {
            mkl_dcsrmv(&transa, &nrows, &ncols, &ALPHA, matdescra, values,
                       colind, pointerB, pointerE, x, &BETA, y);            
        }
        t.Pause();
        mt[i] = t.ElapsedTime();
    }

    sort(mt.begin(), mt.end());
    double mt_median = 
        (OUTER_LOOPS % 2) ? mt[((OUTER_LOOPS+1)/2)-1]
        : ((mt[OUTER_LOOPS/2-1] + mt[OUTER_LOOPS/2])/2);  
    double flops = (double)(LOOPS*nnz*2)/((double)1000*1000*mt_median);
    cout << "m: " << MATRIX
         << " mt(median): " << mt_median
         << " flops: " << flops << endl;

    /* 3. Cleanup */
    free(pointerB);
    free(pointerE);
}
Example #3
0
/* SpMV kernel implemented with pOSKI */
void poski_spmv(spx_index_t *Aptr, spx_index_t *Aind, spx_value_t *Aval,
                spx_index_t nrows, spx_index_t ncols, spx_index_t nnz,
                spx_value_t *x, spx_value_t *y,
                spx_value_t ALPHA, spx_value_t BETA)
{
  poski_Init();

  /* 1. Matrix loading phase */
  poski_threadarg_t *poski_thread = poski_InitThreads();
  poski_ThreadHints(poski_thread, NULL, POSKI_THREADPOOL, NR_THREADS);
  // poski_ThreadHints(poski_thread, NULL, POSKI_PTHREAD, NR_THREADS);
  poski_partitionarg_t *partitionMat = poski_partitionMatHints(OneD, NR_THREADS,
							       KERNEL_MatMult,
							       OP_NORMAL);
  poski_mat_t A_tunable = 
    poski_CreateMatCSR(Aptr, Aind, Aval, nrows, ncols, nnz, SHARE_INPUTMAT,
		       poski_thread, partitionMat, 2, INDEX_ZERO_BASED, 
		       MAT_GENERAL);

  /* 2. Vector loading */
  poski_partitionvec_t *partitionVecX = 
    poski_PartitionVecHints(A_tunable, KERNEL_MatMult, OP_NORMAL, INPUTVEC);
  poski_vec_t x_view = poski_CreateVec(x, ncols, STRIDE_UNIT, partitionVecX);
  poski_partitionvec_t *partitionVecY = 
    poski_PartitionVecHints(A_tunable, KERNEL_MatMult, OP_NORMAL, OUTPUTVEC);
  poski_vec_t y_view = poski_CreateVec(y, nrows, STRIDE_UNIT, partitionVecY);

  /* 3. Tuning phase */
  t.Clear();
  t.Start();
  poski_TuneHint_MatMult(A_tunable, OP_NORMAL, ALPHA, x_view, BETA, 
			 y_view, ALWAYS_TUNE_AGGRESSIVELY);
  poski_TuneMat(A_tunable);
  t.Pause();
  double pt = t.ElapsedTime();

  /* 4. SpMV benchmarking phase */
  vector<double> mt(OUTER_LOOPS);
  for (size_t i = 0; i < OUTER_LOOPS; i++) {
    t.Clear();
    t.Start();
    for (size_t  j = 0; j < LOOPS; j++) {
      poski_MatMult(A_tunable, OP_NORMAL, ALPHA, x_view, BETA, y_view);
    }
    t.Pause();
    mt[i] = t.ElapsedTime();
  }

  sort(mt.begin(), mt.end());
  double mt_median = 
    (OUTER_LOOPS % 2) ? mt[((OUTER_LOOPS+1)/2)-1]
    : ((mt[OUTER_LOOPS/2-1] + mt[OUTER_LOOPS/2])/2);  
  double flops = (double)(LOOPS*nnz*2)/((double)1000*1000*mt_median);
  cout << "m: " << MATRIX 
       << " pt: " << pt 
       << " mt(median): " << mt_median
       << " flops: " << flops << endl;

  /* 4. Cleanup */
  poski_DestroyPartitionVec(partitionVecX);
  poski_DestroyPartitionVec(partitionVecY);
  poski_DestroyVec(x_view);
  poski_DestroyVec(y_view);
  poski_DestroyPartitionMat(partitionMat);
  poski_DestroyMat(A_tunable);
  poski_DestroyThreads(poski_thread);
  poski_Close();
}