Beispiel #1
0
/*
 * Load edges from a comma-separated text file into the graph S.
 *
 * Every line is split by readCSVLineDynamic() and its columns are addressed
 * through the FIELD_* constants: source, destination and weight are required,
 * time and edge type are optional (they default to 0).
 *
 *   S             graph that receives the edges
 *   filename      path of the CSV file to read
 *   use_numerics  non-zero: source, destination and type are parsed as
 *                 integers with atol();
 *                 zero: source and destination are strings mapped through
 *                 stinger_mapping_create() and the type is an edge-type name
 *                 that is looked up and created when missing
 *
 * Lines with at most one field are skipped silently; lines with exactly two
 * fields are reported through E_A and skipped.
 *
 * Returns 0.  Terminates the process with exit(-1) when the file cannot be
 * opened or an edge type cannot be created.
 */
int
load_csv_graph (struct stinger * S, char * filename, int use_numerics)
{
  FILE * fp = fopen (filename, "r");
  if (!fp)
  {
    /* snprintf always NUL-terminates, so no manual terminator is needed. */
    char errmsg[256];
    snprintf (errmsg, sizeof (errmsg), "Opening \"%s\" failed", filename);
    perror (errmsg);
    exit (-1);
  }

  /* Scratch storage handed to readCSVLineDynamic() and reused for every line. */
  char * buf = NULL;
  char ** fields = NULL;
  uint64_t bufSize = 0;
  uint64_t * lengths = NULL;
  uint64_t fieldsSize = 0;
  uint64_t count = 0;
  int64_t line = 0;

  /* Also stop on a stream error: in that state EOF is never flagged and the
   * loop would otherwise spin forever. */
  while (!feof (fp) && !ferror (fp))
  {
    int64_t src = 0;
    int64_t dst = 0;
    int64_t wgt = 0;
    int64_t time = 0;
    int64_t type = 0;

    line++;
    readCSVLineDynamic (',', fp, &buf, &bufSize, &fields, &lengths, &fieldsSize, &count);

    /* Blank line (or the empty read at end of file). */
    if (count <= 1)
      continue;
    if (count < 3) {
      E_A("ERROR: too few elemnts on line %ld", (long) line);
      continue;
    }

    /* From here on count >= 3, so the weight column is always present. */
    if (!use_numerics)
    {
      /* values are strings */
      stinger_mapping_create (S, fields[FIELD_SOURCE], lengths[FIELD_SOURCE], &src);
      stinger_mapping_create (S, fields[FIELD_DEST], lengths[FIELD_DEST], &dst);
      wgt = atol (fields[FIELD_WEIGHT]);
      if (count > 3)
        time = atol (fields[FIELD_TIME]);
      if (count > 4)
      {
        type = stinger_etype_names_lookup_type (S, fields[FIELD_TYPE]);
        if (type == -1) {
          /* Unknown type name: try to register it. */
          stinger_etype_names_create_type (S, fields[FIELD_TYPE], &type);
        }
        if (type == -1) {
          perror ("Failed to create new edge type");
          exit (-1);
        }
      }
    }
    else
    {
      /* values are integers */
      src = atol (fields[FIELD_SOURCE]);
      dst = atol (fields[FIELD_DEST]);
      wgt = atol (fields[FIELD_WEIGHT]);
      if (count > 3)
        time = atol (fields[FIELD_TIME]);
      if (count > 4)
        type = atol (fields[FIELD_TYPE]);
    }

    stinger_insert_edge (S, type, src, dst, wgt, time);
  }

  /* Release the line-parsing scratch buffers (free(NULL) is a no-op when no
   * line was ever read).
   * NOTE(review): assumes readCSVLineDynamic() obtains these with
   * malloc()/realloc() and that the entries of `fields` point into `buf`
   * rather than owning separate allocations -- confirm against its
   * implementation. */
  free (lengths);
  free (fields);
  free (buf);

  fclose (fp);

  return 0;
}
Beispiel #2
0
/*
 * PageRank algorithm client.
 *
 * Parses the command line, registers with the server on "localhost" through
 * stinger_register_alg(), runs one PageRank pass inside the init phase, and
 * then re-runs PageRank in the post-processing phase of each loop iteration
 * while alg->enabled is set.
 *
 * Options:
 *   -t <str>  restrict PageRank to one edge type (also renames the algorithm
 *             to "pagerank_<str>")
 *   -d        use the directed-graph variants
 *   -e <val>  epsilon
 *   -f <val>  damping factor
 *   -i <val>  maximum number of iterations
 *   -?, -h    print usage
 *
 * Returns 0 after the streaming loop ends, -1 when registration fails or the
 * -t argument does not fit the internal buffers, and the option character
 * after printing the usage text.
 */
int
main(int argc, char *argv[])
{
  /* ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ *
   * Setup and register algorithm with the server
   * ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ */
  char name[1024];
  char type_str[1024];

  int type_specified = 0;
  int directed = 0;

  double epsilon = EPSILON_DEFAULT;
  double dampingfactor = DAMPINGFACTOR_DEFAULT;
  int64_t maxiter = MAXITER_DEFAULT;

  int opt = 0;
  while(-1 != (opt = getopt(argc, argv, "t:e:f:i:d?h"))) {
    switch(opt) {
      case 't': {
        /* optarg comes straight from the command line, so bound both copies
         * and refuse a value that would be truncated: a shortened type name
         * would silently select the wrong edge type. */
        int name_len = snprintf(name, sizeof(name), "pagerank_%s", optarg);
        int type_len = snprintf(type_str, sizeof(type_str), "%s", optarg);
        if(name_len < 0 || (size_t)name_len >= sizeof(name) ||
           type_len < 0 || (size_t)type_len >= sizeof(type_str)) {
          LOG_E("Edge type given to -t is too long.  Exiting");
          return -1;
        }
        type_specified = 1;
      } break;
      case 'd': {
        directed = 1;
      } break;
      case 'e': {
        epsilon = atof(optarg);
      } break;
      case 'f': {
        dampingfactor = atof(optarg);
      } break;
      case 'i': {
        maxiter = atol(optarg);
      } break;
      default:
        printf("Unknown option '%c'\n", opt);
        /* fallthrough: show the usage text as well */
      case '?':
      case 'h': {
        /* The casts make the argument types match the conversion specifiers
         * regardless of how the *_DEFAULT macros are spelled. */
        printf(
          "PageRank\n"
          "==================================\n"
          "\n"
          "  -t <str>  Specify an edge type to run page rank over\n"
          "  -d        Use a PageRank that is safe on directed graphs\n"
          "  -e        Set PageRank Epsilon (default: %0.1e)\n"
          "  -f        Set PageRank Damping Factor (default: %lf)\n"
          "  -i        Set PageRank Max Iterations (default: %ld)\n"
          "\n",
          (double)EPSILON_DEFAULT,
          (double)DAMPINGFACTOR_DEFAULT,
          (long)MAXITER_DEFAULT);
        return(opt);
      }
    }
  }

  stinger_registered_alg * alg =
    stinger_register_alg(
      .name=type_specified ? name : "pagerank",
      .data_per_vertex=sizeof(double),
      .data_description="d pagerank",
      .host="localhost",
    );

  if(!alg) {
    LOG_E("Registering algorithm failed.  Exiting");
    return -1;
  }

  /* The per-vertex result array lives in alg->alg_data; start every vertex
   * at the uniform value 1 / max_nv. */
  double * pr = (double *)alg->alg_data;
  OMP("omp parallel for")
  for(uint64_t v = 0; v < alg->stinger->max_nv; v++) {
    pr[v] = 1 / ((double)alg->stinger->max_nv);
  }

  /* Zero-initialised scratch array passed to every page_rank* call. */
  double * tmp_pr = (double *)xcalloc(alg->stinger->max_nv, sizeof(double));

  /* Named `elapsed` rather than `time` to avoid shadowing time(). */
  double elapsed;
  init_timer();

  /* ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ *
   * Initial static computation
   * ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ */
  stinger_alg_begin_init(alg); {
    int64_t type = -1;
    if(type_specified) {
      type = stinger_etype_names_lookup_type(alg->stinger, type_str);
    }
    if(type_specified && type > -1) {
      if (directed) {
        page_rank_type_directed(alg->stinger, stinger_mapping_nv(alg->stinger), pr, tmp_pr, epsilon, dampingfactor, maxiter, type);
      } else {
        page_rank_type(alg->stinger, stinger_mapping_nv(alg->stinger), pr, tmp_pr, epsilon, dampingfactor, maxiter, type);
      }
    } else if (!type_specified) {
      if (directed) {
        page_rank_directed(alg->stinger, stinger_mapping_nv(alg->stinger), pr, tmp_pr, epsilon, dampingfactor, maxiter);
      } else {
        page_rank(alg->stinger, stinger_mapping_nv(alg->stinger), pr, tmp_pr, epsilon, dampingfactor, maxiter);
      }
    }
    /* A requested type that does not exist yet is skipped here without a
     * message; the streaming phase below looks it up again on every pass. */
  } stinger_alg_end_init(alg);

  /* ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ *
   * Streaming Phase
   * ~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~~ */
  while(alg->enabled) {
    /* Pre processing */
    if(stinger_alg_begin_pre(alg)) {
      /* nothing to do */
      elapsed = timer();
      stinger_alg_end_pre(alg);
      elapsed = timer() - elapsed;
      LOG_I_A("Pre time : %20.15e", elapsed);
    }

    /* Post processing: the timed span includes stinger_alg_begin_post(). */
    elapsed = timer();
    if(stinger_alg_begin_post(alg)) {
      int64_t type = -1;
      if(type_specified) {
        type = stinger_etype_names_lookup_type(alg->stinger, type_str);
        if(type > -1) {
          if (directed) {
            page_rank_type_directed(alg->stinger, stinger_mapping_nv(alg->stinger), pr, tmp_pr, epsilon, dampingfactor, maxiter, type);
          } else {
            page_rank_type(alg->stinger, stinger_mapping_nv(alg->stinger), pr, tmp_pr, epsilon, dampingfactor, maxiter, type);
          }
        } else {
          LOG_W_A("TYPE DOES NOT EXIST %s", type_str);
          LOG_W("Existing types:");
          // TODO: Don't go through the loop if LOG_W isn't enabled
          for(int64_t t = 0; t < stinger_etype_names_count(alg->stinger); t++) {
            LOG_W_A("  > %ld %s", (long) t, stinger_etype_names_lookup_name(alg->stinger, t));
          }
        }
      } else {
        if (directed) {
          page_rank_directed(alg->stinger, stinger_mapping_nv(alg->stinger), pr, tmp_pr, epsilon, dampingfactor, maxiter);
        } else {
          page_rank(alg->stinger, stinger_mapping_nv(alg->stinger), pr, tmp_pr, epsilon, dampingfactor, maxiter);
        }
      }
      stinger_alg_end_post(alg);
    }
    elapsed = timer() - elapsed;
    LOG_I_A("Post time : %20.15e", elapsed);
  }

  LOG_I("Algorithm complete... shutting down");

  free(tmp_pr);

  return 0;
}