int TestMaxwell2D() { bool test = true; field f; init_empty_field(&f); f.model.cfl = 0.05; f.model.m = 7; // num of conservative variables f.model.NumFlux = Maxwell2DNumFlux_uncentered; //f.model.NumFlux = Maxwell2DNumFlux_centered; f.model.BoundaryFlux = Maxwell2DBoundaryFlux_uncentered; f.model.InitData = Maxwell2DInitData; f.model.ImposedData = Maxwell2DImposedData; f.varindex = GenericVarindex; f.model.Source = Maxwell2DSource; f.interp.interp_param[0] = f.model.m; f.interp.interp_param[1] = 3; // x direction degree f.interp.interp_param[2] = 3; // y direction degree f.interp.interp_param[3] = 0; // z direction degree f.interp.interp_param[4] = 4; // x direction refinement f.interp.interp_param[5] = 4; // y direction refinement f.interp.interp_param[6] = 1; // z direction refinement ReadMacroMesh(&(f.macromesh), "../test/testcube.msh"); Detect2DMacroMesh(&(f.macromesh)); assert(f.macromesh.is2d); BuildConnectivity(&(f.macromesh)); char buf[1000]; sprintf(buf, "-D _M=%d", f.model.m); strcat(cl_buildoptions, buf); set_source_CL(&f, "Maxwell2DSource"); sprintf(numflux_cl_name, "%s", "Maxwell2DNumFlux_uncentered"); sprintf(buf," -D NUMFLUX="); strcat(buf, numflux_cl_name); strcat(cl_buildoptions, buf); sprintf(buf, " -D BOUNDARYFLUX=%s", "Maxwell2DBoundaryFlux_uncentered"); strcat(cl_buildoptions, buf); Initfield(&f); CheckMacroMesh(&(f.macromesh), f.interp.interp_param + 1); real tmax = 0.1; f.vmax = 1; real dt = set_dt(&f); #if 0 // C version RK2(&f, tmax, dt); #else // OpenCL version CopyfieldtoGPU(&f); RK2_CL(&f, tmax, dt, 0, 0, 0); CopyfieldtoCPU(&f); printf("\nOpenCL Kernel time:\n"); show_cl_timing(&f); printf("\n"); #endif // Save the results and the error /* Plotfield(0, false, &f, NULL, "dgvisu.msh"); */ /* Plotfield(0, true, &f, "error", "dgerror.msh"); */ real dd = L2error(&f); real tolerance = 1.1e-2; test = test && (dd < tolerance); printf("L2 error: %f\n", dd); return test; }
int TestDtfield_CL(void){ bool test = true; if(!cldevice_is_acceptable(nplatform_cl, ndevice_cl)) { printf("OpenCL device not acceptable.\n"); return true; } field f; // 2D meshes: // test/disque2d.msh // test/testdisque2d.msh // test/testmacromesh.msh // test/unit-cube.msh char *mshname = "test/disque2d.msh"; ReadMacroMesh(&(f.macromesh), mshname); Detect2DMacroMesh(&f.macromesh); BuildConnectivity(&f.macromesh); #if 1 // 2D version assert(f.macromesh.is2d); f.model.cfl = 0.05; f.model.m = 1; m = f.model.m; f.model.NumFlux = TransNumFlux2d; f.model.BoundaryFlux = TransBoundaryFlux2d; f.model.InitData = TransInitData2d; f.model.ImposedData = TransImposedData2d; f.varindex = GenericVarindex; f.interp.interp_param[0] = f.model.m; f.interp.interp_param[1] = 2; // x direction degree f.interp.interp_param[2] = 2; // y direction degree f.interp.interp_param[3] = 0; // z direction degree f.interp.interp_param[4] = 4; // x direction refinement f.interp.interp_param[5] = 4; // y direction refinement f.interp.interp_param[6] = 1; // z direction refinement #else // 3D version f.model.cfl = 0.05; f.model.m = 1; f.model.NumFlux = TransNumFlux; f.model.BoundaryFlux = TestTransBoundaryFlux; f.model.InitData = TestTransInitData; f.model.ImposedData = TestTransImposedData; f.varindex = GenericVarindex; f.interp.interp_param[0] = f.model.m; f.interp.interp_param[1] = 2; // x direction degree f.interp.interp_param[2] = 2; // y direction degree f.interp.interp_param[3] = 2; // z direction degree f.interp.interp_param[4] = 3; // x direction refinement f.interp.interp_param[5] = 3; // y direction refinement f.interp.interp_param[6] = 3; // z direction refinement #endif set_global_m(f.model.m); set_source_CL(&f, "OneSource"); Initfield(&f); cl_event clv_dtfield = clCreateUserEvent(f.cli.context, NULL); dtfield_CL(&f, &f.wn_cl, 0, NULL, &clv_dtfield); clWaitForEvents(1, &clv_dtfield); CopyfieldtoCPU(&f); // Displayfield(&f); show_cl_timing(&f); real *saveptr = f.dtwn; f.dtwn = calloc(f.wsize, sizeof(real)); f.model.Source = OneSource; dtfield(&f, f.wn, f.dtwn); real maxerr = 0; for(int i = 0; i < f.wsize; i++) { real error = f.dtwn[i] - saveptr[i]; //printf("error= \t%f\t%f\t%f\n", error, f.dtwn[i], saveptr[i]); maxerr = fmax(fabs(error), maxerr); } printf("max error: %f\n", maxerr); test = (maxerr < 1e-8); return test; }
int TestKernelFlux() { bool test=true; if(!cldevice_is_acceptable(nplatform_cl, ndevice_cl)) { printf("OpenCL device not acceptable.\n"); return true; } field f; init_empty_field(&f); f.model.cfl = 0.05; f.model.m = 1; // only one conservative variable f.model.NumFlux = TransNumFlux2d; f.model.BoundaryFlux = TransBoundaryFlux2d; f.model.InitData = TransInitData2d; f.model.ImposedData = TransImposedData2d; f.varindex = GenericVarindex; f.interp.interp_param[0] = f.model.m; f.interp.interp_param[1] = 2; // x direction degree f.interp.interp_param[2] = 2; // y direction degree f.interp.interp_param[3] = 0; // z direction degree f.interp.interp_param[4] = 3; // x direction refinement f.interp.interp_param[5] = 3; // y direction refinement f.interp.interp_param[6] = 1; // z direction refinement ReadMacroMesh(&f.macromesh,"../test/testmacromesh.msh"); //ReadMacroMesh(&f.macromesh,"test/testcube.msh"); Detect2DMacroMesh(&f.macromesh); assert(f.macromesh.is2d); BuildConnectivity(&f.macromesh); Initfield(&f); CopyfieldtoGPU(&f); clFinish(f.cli.commandqueue); for(int ie = 0; ie < f.macromesh.nbelems; ++ie) { MacroCell *mcell = f.mcell + ie; DGFlux_CL(mcell, &f, 0, f.wn_cl + ie, 0, NULL, NULL); clFinish(f.cli.commandqueue); DGFlux_CL(mcell, &f, 1, f.wn_cl + ie, 0, NULL, NULL); clFinish(f.cli.commandqueue); if(!f.macromesh.is2d) { DGFlux_CL(mcell, &f, 2, f.wn_cl + ie, 0, NULL, NULL); clFinish(f.cli.commandqueue); } } CopyfieldtoCPU(&f); //Displayfield(&f); // save the dtwn pointer real *dtwn_cl = f.dtwn; // malloc a new dtwn. f.dtwn = calloc(f.wsize, sizeof(real)); for(int ie = 0; ie < f.macromesh.nbelems; ++ie) { MacroCell *mcell = f.mcell + ie; real *wmc = f.wn + mcell->woffset; real *dtwmc = f.dtwn + mcell->woffset; DGSubCellInterface(f.mcell + ie, &f, wmc, dtwmc); //DGVolume((void*) &f.mcell[ie], &f, f.wn, f.dtwn); } //Displayfield(&f); //check that the results are the same real maxerr = 0.0; printf("\nDifference\tC\t\tOpenCL\n"); for(int i = 0; i < f.wsize; ++i) { printf("%f\t%f\t%f\n", f.dtwn[i] - dtwn_cl[i], f.dtwn[i], dtwn_cl[i]); maxerr = fmax(fabs(f.dtwn[i] - dtwn_cl[i]), maxerr); } printf("max error: %f\n",maxerr); real tolerance; if(sizeof(real) == sizeof(double)) tolerance = 1e-8; else tolerance = 1e-4; test = (maxerr < tolerance); return test; }
int TestMHD(int argc, char *argv[]) { real cfl = 0.1; real tmax = 0.1; bool writemsh = false; real vmax = 6.0; bool usegpu = true; real dt = 0.0; real periodsize = 6.2831853; for (;;) { int cc = getopt(argc, argv, "c:t:w:D:P:g:s:"); if (cc == -1) break; switch (cc) { case 0: break; case 'c': cfl = atof(optarg); break; case 'g': usegpu = atoi(optarg); break; case 't': tmax = atof(optarg); break; case 'w': writemsh = true; break; case 'D': ndevice_cl= atoi(optarg); break; case 'P': nplatform_cl = atoi(optarg); break; default: printf("Error: invalid option.\n"); printf("Usage:\n"); printf("./testmanyv -c <cfl> -d <deg> -n <nraf> -t <tmax> -C\n -P <cl platform number> -D <cl device number> FIXME"); exit(1); } } bool test = true; field f; init_empty_field(&f); f.varindex = GenericVarindex; f.model.m = 9; f.model.cfl = cfl; strcpy(f.model.name,"MHD"); f.model.NumFlux=MHDNumFluxP2; f.model.BoundaryFlux=MHDBoundaryFlux; f.model.InitData=MHDInitData; f.model.ImposedData=MHDImposedData; char buf[1000]; sprintf(buf, "-D _M=%d -D _PERIODX=%f -D _PERIODY=%f", f.model.m, periodsize, periodsize); strcat(cl_buildoptions, buf); sprintf(numflux_cl_name, "%s", "MHDNumFluxP2"); sprintf(buf," -D NUMFLUX="); strcat(buf, numflux_cl_name); strcat(cl_buildoptions, buf); sprintf(buf, " -D BOUNDARYFLUX=%s", "MHDBoundaryFlux"); strcat(cl_buildoptions, buf); // Set the global parameters for the Vlasov equation f.interp.interp_param[0] = f.model.m; // _M f.interp.interp_param[1] = 1; // x direction degree f.interp.interp_param[2] = 1; // y direction degree f.interp.interp_param[3] = 0; // z direction degree f.interp.interp_param[4] = 4; // x direction refinement f.interp.interp_param[5] = 4; // y direction refinement f.interp.interp_param[6] = 1; // z direction refinement //set_vlasov_params(&(f.model)); // Read the gmsh file //ReadMacroMesh(&(f.macromesh), "test/testcartesiangrid2d2.msh"); ReadMacroMesh(&(f.macromesh), "../test/testOTgrid.msh"); //ReadMacroMesh(&(f.macromesh), "test/testcube.msh"); // Try to detect a 2d mesh Detect2DMacroMesh(&(f.macromesh)); bool is2d=f.macromesh.is2d; assert(is2d); f.macromesh.period[0]=periodsize; f.macromesh.period[1]=periodsize; // Mesh preparation BuildConnectivity(&(f.macromesh)); // Prepare the initial fields Initfield(&f); // Prudence... CheckMacroMesh(&(f.macromesh), f.interp.interp_param + 1); //Plotfield(0, (1==0), &f, "Rho", "dginit.msh"); f.vmax=vmax; real executiontime; if(usegpu) { printf("Using OpenCL:\n"); //executiontime = seconds(); //assert(1==2); RK4_CL(&f, tmax, dt, 0, NULL, NULL); CopyfieldtoCPU(&f); show_cl_timing(&f); //executiontime = seconds() - executiontime; show_cl_timing(&f); } else { printf("Using C:\n"); //executiontime = seconds(); RK4(&f, tmax, dt); //executiontime = seconds() - executiontime; } //Plotfield(0,false,&f, "Rho", "rho.msh"); //Plotfield(2,false,&f, "P", "p.msh"); //Gnuplot(&f,0,0.0,"data1D.dat"); printf("tmax: %f, cfl: %f\n", tmax, f.model.cfl); printf("deltax:\n"); printf("%f\n", f.hmin); printf("deltat:\n"); printf("%f\n", dt); printf("DOF:\n"); printf("%d\n", f.wsize); printf("executiontime (s):\n"); printf("%f\n", executiontime); printf("time per RK2 (s):\n"); printf("%f\n", executiontime / (real)f.itermax); return test; }
int TestKernelVolume(void){ bool test=true; if(!cldevice_is_acceptable(nplatform_cl, ndevice_cl)) { printf("OpenCL device not acceptable.\n"); return true; } field f; init_empty_field(&f); f.model.cfl = 0.05; f.model.m = 1; // only one conservative variable f.model.NumFlux = TransNumFlux2d; f.model.BoundaryFlux = TransBoundaryFlux2d; f.model.InitData = TransInitData2d; f.model.ImposedData = TransImposedData2d; f.varindex = GenericVarindex; f.interp.interp_param[0] = 1; // _M f.interp.interp_param[1] = 1; // x direction degree f.interp.interp_param[2] = 1; // y direction degree f.interp.interp_param[3] = 0; // z direction degree f.interp.interp_param[4] = 3; // x direction refinement f.interp.interp_param[5] = 3; // y direction refinement f.interp.interp_param[6] = 1; // z direction refinement ReadMacroMesh(&f.macromesh,"../test/testmacromesh.msh"); //ReadMacroMesh(&f.macromesh,"test/testcube.msh"); Detect2DMacroMesh(&f.macromesh); assert(f.macromesh.is2d); BuildConnectivity(&f.macromesh); //PrintMacroMesh(&f.macromesh); //AffineMapMacroMesh(&f.macromesh); Initfield(&f); CopyfieldtoGPU(&f); /* // set dtwn to 1 for testing */ /* void* chkptr; */ /* cl_int status; */ /* chkptr=clEnqueueMapBuffer(f.cli.commandqueue, */ /* f.dtwn_cl, // buffer to copy from */ /* CL_TRUE, // block until the buffer is available */ /* CL_MAP_WRITE, */ /* 0, // offset */ /* sizeof(real)*(f.wsize), // buffersize */ /* 0,NULL,NULL, // events management */ /* &status); */ /* assert(status == CL_SUCCESS); */ /* assert(chkptr == f.dtwn); */ /* for(int i=0;i<f.wsize;i++){ */ /* f.dtwn[i]=1; */ /* } */ /* status=clEnqueueUnmapMemObject (f.cli.commandqueue, */ /* f.dtwn_cl, */ /* f.dtwn, */ /* 0,NULL,NULL); */ /* assert(status == CL_SUCCESS); */ /* status=clFinish(f.cli.commandqueue); */ /* assert(status == CL_SUCCESS); */ clFinish(f.cli.commandqueue); for(int ie = 0; ie < f.macromesh.nbelems; ++ie) { DGVolume_CL(f.mcell + ie, &f, f.wn_cl + ie, 0, NULL, NULL); clFinish(f.cli.commandqueue); } clFinish(f.cli.commandqueue); CopyfieldtoCPU(&f); //Displayfield(&f); // save the dtwn pointer real *dtwn_cl = f.dtwn; // malloc a new dtwn. f.dtwn = calloc(f.wsize, sizeof(real)); for(int ie = 0; ie < f.macromesh.nbelems; ++ie) { MacroCell *mcell = f.mcell + ie; real *dtwmc = f.dtwn + mcell->woffset; real *wmc = f.wn + mcell->woffset; DGVolume(f.mcell + ie, &f, wmc, dtwmc); } //Displayfield(&f); //check that the results are the same real maxerr = 0.0; //printf("\nDifference\tC\t\tOpenCL\n"); for(int i = 0; i < f.wsize; ++i) { real err = fabs(f.dtwn[i] - dtwn_cl[i]); //printf("%f\t%f\t%f\n", err, f.dtwn[i], dtwn_cl[i]); maxerr = fmax(err, maxerr); } printf("max error: %f\n",maxerr); real tolerance; if(sizeof(real) == sizeof(double)) tolerance = 1e-8; else tolerance = 1e-4; test = (maxerr < tolerance); return test; }