void crfsuite_attribute_set(crfsuite_attribute_t* cont, int aid, floatval_t value) { crfsuite_attribute_init(cont); cont->aid = aid; cont->value = value; }
int read_data(FILE *fpi, FILE *fpo, crfsuite_data_t* data, int group) { int i = 0; int n = 0; int lid = -1; int * lids = NULL; crfsuite_instance_t inst; crfsuite_item_t item; crfsuite_attribute_t cont; crfsuite_fuzzy_labels_t fuzzy; iwa_t* iwa = NULL; crfsuite_dictionary_t *attrs = data->attrs; crfsuite_dictionary_t *labels = data->labels; const iwa_token_t *token = NULL; long filesize = 0, begin = 0, offset = 0; int prev = 0, current = 0; /* Initialize the instance.*/ crfsuite_instance_init(&inst); inst.group = group; /* Obtain the file size. */ begin = ftell(fpi); fseek(fpi, 0, SEEK_END); filesize = ftell(fpi) - begin; fseek(fpi, begin, SEEK_SET); /* */ fprintf(fpo, "0"); fflush(fpo); prev = 0; /* allocate a lid from the data*/ iwa = iwa_reader(fpi); while (token = iwa_read(iwa), token != NULL) { /* Progress report. */ offset = ftell(fpi); current = (int)((offset - begin) * 100.0 / (double)filesize); prev = progress(fpo, prev, current); switch (token->type) { case IWA_BOI: /* Initialize an item. */ lid = -1; crfsuite_item_init(&item); break; case IWA_EOI: /* Append the item to the instance. */ if (0 <= lid) { crfsuite_instance_append(&inst, &item, &fuzzy, lid); } crfsuite_item_finish(&item); break; case IWA_ITEM: if (lid == -1) { if (strncmp(token->attr, "@", 1) == 0) { /* Declaration. */ if (strcmp(token->attr, "@weight") == 0) { /* Instance weighting. */ inst.weight = atof(token->value); } else { /* Unrecognized declaration. */ fprintf(fpo, "\n"); fprintf(fpo, "ERROR: unrecognized declaration: %s\n", token->attr); iwa_delete(iwa); return -1; } } else { /* Label. */ crfsuite_fuzzy_labels_init(&fuzzy); parse_fuzzy_labels(token->attr, &fuzzy, labels); if (1 == fuzzy.num_labels) { lid = fuzzy.labels[0]; } else if (1 < fuzzy.num_labels) { lid = 0; /* Just a Pseudo label */ } else { fprintf(stderr, "?\n"); } } } else { crfsuite_attribute_init(&cont); cont.aid = attrs->get(attrs, token->attr); if (token->value && *token->value) { cont.value = atof(token->value); } else { cont.value = 1.0; } crfsuite_item_append_attribute(&item, &cont); } break; case IWA_NONE: case IWA_EOF: /* Put the training instance. */ crfsuite_data_append(data, &inst); crfsuite_instance_finish(&inst); inst.group = group; inst.weight = 1.; ++n; break; } } progress(fpo, prev, 100); fprintf(fpo, "\n"); iwa_delete(iwa); return n; }