void ct_extract(struct ct_global_state *state, struct ct_op *op) { struct ct_extract_args *cea = op->op_args; const char *ctfile = cea->cea_local_ctfile; char **filelist = cea->cea_filelist; int match_mode = cea->cea_matchmode; struct ct_extract_priv *ex_priv = op->op_priv; int ret; struct ct_trans *trans; char shat[SHA_DIGEST_STRING_LENGTH]; /* if we were woken up due to fatal, just clean up local state */ if (state->ct_dying != 0) goto dying; CNDBG(CT_LOG_TRANS, "entry"); switch (ct_get_file_state(state)) { case CT_S_STARTING: if (ex_priv == NULL) { ex_priv = e_calloc(1, sizeof(*ex_priv)); TAILQ_INIT(&ex_priv->extract_head); if ((ret = ct_match_compile(&ex_priv->inc_match, match_mode, filelist)) != 0) { ct_fatal(state, "failed to compile include pattern", ret); goto dying; } if (cea->cea_excllist != NULL && (ret = ct_match_compile(&ex_priv->ex_match, match_mode, cea->cea_excllist)) != 0) { ct_fatal(state, "failed to compile exclude pattern", ret); goto dying; } op->op_priv = ex_priv; RB_INIT(&ex_priv->pending_tree); } if ((ret = ct_file_extract_init(&state->extract_state, cea->cea_tdir, cea->cea_attr, cea->cea_follow_symlinks, ex_priv->allfiles, cea->cea_log_state, cea->cea_log_chown_failed)) != 0) { ct_fatal(state, "Can not initialize extract state", ret); goto dying; } if (ct_extract_calculate_total(state, cea, ex_priv->inc_match, ex_priv->ex_match) != 0) { CWARNX("failed to calculate stats"); goto dying; } if ((ret = ct_extract_setup(&ex_priv->extract_head, &ex_priv->xdr_ctx, ctfile, cea->cea_ctfile_basedir, &ex_priv->allfiles)) != 0) { ct_fatal(state, "can't setup extract queue", ret); goto dying; } state->ct_print_ctfile_info(state->ct_print_state, ex_priv->xdr_ctx.xs_filename, &ex_priv->xdr_ctx.xs_gh); /* XXX we should handle this better */ if (state->ct_max_block_size < ex_priv->xdr_ctx.xs_gh.cmg_chunk_size) CABORTX("block size negotiated with server %d is " "smaller than file max block size %d", state->ct_max_block_size, ex_priv->xdr_ctx.xs_gh.cmg_chunk_size); /* create rb tree head, prepare to start inserting */ if (ex_priv->allfiles) { ex_priv->fillrb = 1; } break; case CT_S_FINISHED: return; default: break; } ct_set_file_state(state, CT_S_RUNNING); while (1) { trans = ct_trans_alloc(state); if (trans == NULL) { /* system busy, return */ CNDBG(CT_LOG_TRANS, "ran out of transactions, waiting"); ct_set_file_state(state, CT_S_WAITING_TRANS); return; } trans->tr_statemachine = ct_state_extract; switch ((ret = ctfile_parse(&ex_priv->xdr_ctx))) { case XS_RET_FILE: if (ex_priv->fillrb == 0 && ex_priv->xdr_ctx.xs_hdr.cmh_nr_shas == -1) { if (ex_priv->allfiles == 0) CINFO("file %s has negative shas " "and backup is not allfiles", ex_priv->xdr_ctx.xs_hdr.cmh_filename); ex_priv->doextract = 0; goto skip; /* skip ze file for now */ } trans = ct_trans_realloc_local(state, trans); trans->tr_fl_node = ex_priv->fl_ex_node = ct_alloc_fnode(); ct_populate_fnode(state->extract_state, &ex_priv->xdr_ctx, trans->tr_fl_node, &trans->tr_state, ex_priv->allfiles, cea->cea_strip_slash); if (trans->tr_state == TR_S_EX_SPECIAL) { trans->tr_complete = ct_extract_complete_special; } else { trans->tr_complete = ct_extract_complete_file_start; } trans->tr_cleanup = ct_extract_cleanup_fnode; if (ex_priv->haverb) { struct ct_pending_file *cpf; if ((cpf = ct_extract_find_entry( &ex_priv->pending_tree, trans->tr_fl_node->fn_fullname)) != NULL) { struct fnode *hardlink; /* copy permissions over */ trans->tr_fl_node->fn_uid = cpf->cpf_uid; trans->tr_fl_node->fn_gid = cpf->cpf_gid; trans->tr_fl_node->fn_mode = cpf->cpf_mode; trans->tr_fl_node->fn_mtime = cpf->cpf_mtime; trans->tr_fl_node->fn_atime = cpf->cpf_atime; /* copy list of pending links over */ while ((hardlink = TAILQ_FIRST(&cpf->cpf_links))) { TAILQ_REMOVE(&cpf->cpf_links, hardlink, fn_list); TAILQ_INSERT_TAIL( &trans->tr_fl_node->fn_hardlinks, hardlink, fn_list); } ex_priv->doextract = 1; ct_extract_free_entry( &ex_priv->pending_tree, cpf); } else { ex_priv->doextract = 0; } } else { ex_priv->doextract = !ct_match(ex_priv->inc_match, trans->tr_fl_node->fn_fullname); if (ex_priv->doextract && ex_priv->ex_match != NULL && !ct_match(ex_priv->ex_match, trans->tr_fl_node->fn_fullname)) { ex_priv->doextract = 0; } } if (ex_priv->doextract && trans->tr_fl_node->fn_hardlink) { struct ct_pending_file *file; if ((file = ct_extract_find_entry( &ex_priv->pending_tree, trans->tr_fl_node->fn_hlname)) != NULL) { CNDBG(CT_LOG_FILE, "adding pending link for %s to %s", file->cpf_name, trans->tr_fl_node->fn_fullname); /* our reference to node passed */ ct_pending_file_add_link(file, trans->tr_fl_node); ex_priv->doextract = 0; goto skip; } } /* * If we're on the first ctfile in an allfiles backup * put the matches with -1 on the rb tree so we'll * remember to extract it from older files. */ if (ex_priv->doextract == 1 && ex_priv->fillrb && ex_priv->xdr_ctx.xs_hdr.cmh_nr_shas == -1) { ct_extract_insert_entry(&ex_priv->pending_tree, trans->tr_fl_node); ex_priv->doextract = 0; /* XXX reconsider the freeing */ } if (ex_priv->doextract == 0) { ct_free_fnode(trans->tr_fl_node); skip: ex_priv->fl_ex_node = NULL; ct_trans_free(state, trans); continue; } CNDBG(CT_LOG_CTFILE, "file %s numshas %" PRId64, trans->tr_fl_node->fn_fullname, ex_priv->xdr_ctx.xs_hdr.cmh_nr_shas); /* * special files we give our refcount up * regular files we need a new one since we need to * keep ours. */ if (trans->tr_state != TR_S_EX_SPECIAL) { ct_ref_fnode(trans->tr_fl_node); } else { ex_priv->fl_ex_node = NULL; } ct_queue_first(state, trans); break; case XS_RET_SHA: if (ex_priv->doextract == 0 || ex_priv->fl_ex_node->fn_skip_file != 0) { if (ctfile_parse_seek(&ex_priv->xdr_ctx)) { ct_fatal(state, "Can't seek past shas", ex_priv->xdr_ctx.xs_errno); goto dying; } ct_trans_free(state, trans); continue; } /* use saved fnode */ trans->tr_fl_node = ex_priv->fl_ex_node; if (memcmp(zerosha, ex_priv->xdr_ctx.xs_sha, SHA_DIGEST_LENGTH) == 0) { CWARNX("\"%s\" truncated during backup", trans->tr_fl_node->fn_fullname); if (ctfile_parse_seek(&ex_priv->xdr_ctx)) { ct_fatal(state, "Can't seek past " "truncation shas", ex_priv->xdr_ctx.xs_errno); goto dying; } ct_trans_free(state, trans); continue; } if (ex_priv->xdr_ctx.xs_gh.cmg_flags & CT_MD_CRYPTO) { /* * yes csha and sha are reversed, we want * to download csha, but putting it in sha * simplifies the code */ bcopy(ex_priv->xdr_ctx.xs_sha, trans->tr_csha, sizeof(trans->tr_csha)); bcopy(ex_priv->xdr_ctx.xs_csha, trans->tr_sha, sizeof(trans->tr_sha)); bcopy(ex_priv->xdr_ctx.xs_iv, trans->tr_iv, sizeof(trans->tr_iv)); } else { bcopy(ex_priv->xdr_ctx.xs_sha, trans->tr_sha, sizeof(trans->tr_sha)); } if (clog_mask_is_set(CT_LOG_SHA)) { ct_sha1_encode(trans->tr_sha, shat); CNDBG(CT_LOG_SHA, "extracting sha %s", shat); } trans->tr_state = TR_S_EX_SHA; trans->tr_complete = ct_extract_complete_file_read; trans->tr_dataslot = 0; ct_ref_fnode(trans->tr_fl_node); trans->tr_cleanup = ct_extract_cleanup_fnode; ct_queue_first(state, trans); break; case XS_RET_FILE_END: trans = ct_trans_realloc_local(state, trans); if (ex_priv->doextract == 0 || ex_priv->fl_ex_node->fn_skip_file != 0) { /* release our reference done with file */ if (ex_priv->fl_ex_node) { ct_free_fnode(ex_priv->fl_ex_node); ex_priv->fl_ex_node = NULL; } ct_trans_free(state, trans); continue; } /* use saved fnode from state */ trans->tr_fl_node = ex_priv->fl_ex_node; bcopy(ex_priv->xdr_ctx.xs_trl.cmt_sha, trans->tr_sha, sizeof(trans->tr_sha)); trans->tr_state = TR_S_EX_FILE_END; trans->tr_complete = ct_extract_complete_file_end; trans->tr_cleanup = ct_extract_cleanup_fnode; trans->tr_fl_node->fn_size = ex_priv->xdr_ctx.xs_trl.cmt_orig_size; /* * no reference here since we give our reference to the * last transaction on that file. We are done with it. */ ex_priv->fl_ex_node = NULL; ct_queue_first(state, trans); break; case XS_RET_EOF: CNDBG(CT_LOG_CTFILE, "Hit end of ctfile"); ctfile_parse_close(&ex_priv->xdr_ctx); /* if rb tree and rb is empty, goto end state */ if ((ex_priv->haverb || ex_priv->fillrb) && ct_extract_rb_empty(&ex_priv->pending_tree)) { /* * Cleanup extract queue, in case we had files * left. */ ct_extract_cleanup_queue( &ex_priv->extract_head); goto we_re_done_here; } if (!TAILQ_EMPTY(&ex_priv->extract_head)) { /* * if allfiles and this was the first pass. * free the current match lists * switch to rb tree mode */ if (ex_priv->fillrb) { ct_match_unwind(ex_priv->inc_match); if (ex_priv->ex_match) ct_match_unwind( ex_priv->ex_match); ex_priv->ex_match = NULL; ex_priv->inc_match = NULL; ex_priv->haverb = 1; ex_priv->fillrb = 0; } ct_trans_free(state, trans); /* reinits ex_priv->xdr_ctx */ if ((ret = ct_extract_open_next(&ex_priv->extract_head, &ex_priv->xdr_ctx)) != 0) { ct_fatal(state, "Can't open next ctfile", ret); goto dying; } state->ct_print_ctfile_info( state->ct_print_state, ex_priv->xdr_ctx.xs_filename, &ex_priv->xdr_ctx.xs_gh); /* poke file into action */ ct_wakeup_file(state->event_state); } else { /* * If rb tree and it is still has entries, * bitch about it */ /* XXX print out missing files */ if ((ex_priv->haverb || ex_priv->fillrb) && ct_extract_rb_empty( &ex_priv->pending_tree)) { CWARNX("out of ctfiles but some " "files are not found"); } we_re_done_here: if (ex_priv->inc_match) ct_match_unwind(ex_priv->inc_match); if (ex_priv->ex_match) ct_match_unwind( ex_priv->ex_match); ct_extract_pending_cleanup( &ex_priv->pending_tree); e_free(&ex_priv); op->op_priv = NULL; trans->tr_state = TR_S_DONE; trans->tr_complete = ct_extract_complete_done; trans->tr_cleanup = ct_extract_cleanup_done; /* * Technically this should be a local * transaction. However, since we are done * it doesn't really matter either way. */ ct_queue_first(state, trans); CNDBG(CT_LOG_TRANS, "extract finished"); ct_set_file_state(state, CT_S_FINISHED); } return; break; case XS_RET_FAIL: ct_fatal(state, "Failed to parse ctfile", ex_priv->xdr_ctx.xs_errno); goto dying; break; } } return; dying: /* only if we hadn't sent the final transaction yet */ if (ex_priv != NULL) { ct_extract_cleanup_queue(&ex_priv->extract_head); if (ex_priv->inc_match) ct_match_unwind(ex_priv->inc_match); if (ex_priv->ex_match) ct_match_unwind(ex_priv->ex_match); if (!ct_extract_rb_empty(&ex_priv->pending_tree)) { ct_extract_pending_cleanup(&ex_priv->pending_tree); } if (ex_priv->fl_ex_node != NULL) { ct_free_fnode(ex_priv->fl_ex_node); } /* XXX what about ex_priv->xdr_ctx ? */ e_free(&ex_priv); op->op_priv = NULL; /* if ex_priv is gone then the trans will clean this up */ if (state->extract_state) ct_file_extract_cleanup(state->extract_state); } return; }
/* * Extract an individual file that has been passed into the op by op_priv. */ void ct_extract_file(struct ct_global_state *state, struct ct_op *op) { struct ct_extract_file_args *cefa = op->op_args; struct ct_file_extract_priv *ex_priv = op->op_priv; const char *localfile = cefa->cefa_filename; struct ct_trans *trans; int ret; char shat[SHA_DIGEST_STRING_LENGTH]; if (state->ct_dying != 0) goto dying; CNDBG(CT_LOG_TRANS, "entry"); switch (ct_get_file_state(state)) { case CT_S_STARTING: CNDBG(CT_LOG_TRANS, "starting"); ex_priv = e_calloc(1, sizeof(*ex_priv)); /* open file and seek to beginning of file */ if ((ret = ctfile_parse_init_at(&ex_priv->xdr_ctx, cefa->cefa_ctfile, NULL, cefa->cefa_ctfile_off)) != 0) { /* XXX add pathname */ ct_fatal(state, "Can't open ctfile", ret); e_free(&ex_priv); goto dying; } /* XXX we should handle this better */ if (state->ct_max_block_size < ex_priv->xdr_ctx.xs_gh.cmg_chunk_size) CABORTX("block size negotiated with server %d is " "smaller than file max block size %d", state->ct_max_block_size, ex_priv->xdr_ctx.xs_gh.cmg_chunk_size); if ((ret = ct_file_extract_init(&state->extract_state, NULL, 0, 0, 0, NULL, NULL)) != 0) { ct_fatal(state, "Can not initialise extract state", ret); e_free(&ex_priv); goto dying; } op->op_priv = ex_priv; break; case CT_S_FINISHED: return; default: break; } ct_set_file_state(state, CT_S_RUNNING); while (1) { if ((trans = ct_trans_alloc(state)) == NULL) { CNDBG(CT_LOG_TRANS, "ran out of transactions, waiting"); ct_set_file_state(state, CT_S_WAITING_TRANS); return; } trans->tr_statemachine = ct_state_extract; if (ex_priv->done) { CNDBG(CT_LOG_CTFILE, "Hit end of ctfile"); ctfile_parse_close(&ex_priv->xdr_ctx); e_free(&ex_priv); op->op_priv = NULL; trans->tr_state = TR_S_DONE; trans->tr_complete = ct_extract_complete_done; trans->tr_cleanup = ct_extract_cleanup_done; ct_queue_first(state, trans); CNDBG(CT_LOG_TRANS, "extract finished"); ct_set_file_state(state, CT_S_FINISHED); return; } /* unless start of file this is right */ trans->tr_fl_node = ex_priv->fl_ex_node; switch ((ret = ctfile_parse(&ex_priv->xdr_ctx))) { case XS_RET_FILE: CNDBG(CT_LOG_CTFILE, "opening file"); if (ex_priv->xdr_ctx.xs_hdr.cmh_nr_shas == -1) CABORTX("can't extract file with -1 shas"); trans = ct_trans_realloc_local(state, trans); trans->tr_fl_node = ex_priv->fl_ex_node = ct_alloc_fnode(); /* Make it local directory, it won't be set up right. */ ex_priv->xdr_ctx.xs_hdr.cmh_parent_dir = -1; /* * Allfiles doesn't matter, only processing one file. * We have a full path to extract to so always strip * slash. */ ct_populate_fnode(state->extract_state, &ex_priv->xdr_ctx, trans->tr_fl_node, &trans->tr_state, 0, 1); if (trans->tr_state == TR_S_EX_SPECIAL) { trans->tr_complete = ct_extract_complete_special; } else { trans->tr_complete = ct_extract_complete_file_start; } trans->tr_cleanup = ct_extract_cleanup_fnode; e_free(&trans->tr_fl_node->fn_fullname); trans->tr_fl_node->fn_fullname = e_strdup(localfile); e_free(&trans->tr_fl_node->fn_name); trans->tr_fl_node->fn_name = e_strdup(localfile); /* Set name pointer to something else passed in */ CNDBG(CT_LOG_CTFILE, "file %s numshas %" PRId64, trans->tr_fl_node->fn_fullname, ex_priv->xdr_ctx.xs_hdr.cmh_nr_shas); /* * special files we give our refcount up * regular files we need a new one since we need to * keep ours. */ if (trans->tr_state != TR_S_EX_SPECIAL) { ct_ref_fnode(trans->tr_fl_node); } else { ex_priv->fl_ex_node = NULL; } break; case XS_RET_SHA: CNDBG(CT_LOG_SHA, "sha!"); if (ex_priv->xdr_ctx.xs_gh.cmg_flags & CT_MD_CRYPTO) { /* * yes csha and sha are reversed, we want * to download csha, but putting it in sha * simplifies the code */ bcopy(ex_priv->xdr_ctx.xs_sha, trans->tr_csha, sizeof(trans->tr_csha)); bcopy(ex_priv->xdr_ctx.xs_csha, trans->tr_sha, sizeof(trans->tr_sha)); bcopy(ex_priv->xdr_ctx.xs_iv, trans->tr_iv, sizeof(trans->tr_iv)); } else { bcopy(ex_priv->xdr_ctx.xs_sha, trans->tr_sha, sizeof(trans->tr_sha)); } if (clog_mask_is_set(CT_LOG_SHA)) { ct_sha1_encode(trans->tr_sha, shat); CNDBG(CT_LOG_SHA, "extracting sha %s", shat); } trans->tr_state = TR_S_EX_SHA; trans->tr_complete = ct_extract_complete_file_read; trans->tr_cleanup = ct_extract_cleanup_fnode; trans->tr_dataslot = 0; ct_ref_fnode(trans->tr_fl_node); break; case XS_RET_FILE_END: trans = ct_trans_realloc_local(state, trans); trans->tr_fl_node = ex_priv->fl_ex_node; /* reload */ CNDBG(CT_LOG_CTFILE, "file end!"); bcopy(ex_priv->xdr_ctx.xs_trl.cmt_sha, trans->tr_sha, sizeof(trans->tr_sha)); trans->tr_state = TR_S_EX_FILE_END; trans->tr_complete = ct_extract_complete_file_end; trans->tr_cleanup = ct_extract_cleanup_fnode; trans->tr_fl_node->fn_size = ex_priv->xdr_ctx.xs_trl.cmt_orig_size; /* Done now, don't parse further. */ ex_priv->done = 1; /* * no reference here since we give our reference to the * last transaction on that file. */ ex_priv->fl_ex_node = NULL; break; case XS_RET_FAIL: ct_fatal(state, "Failed to parse ctfile", ex_priv->xdr_ctx.xs_errno); goto dying; break; default: CABORTX("%s: invalid state %d", __func__, ret); } ct_queue_first(state, trans); } return; dying: if (ex_priv) { ctfile_parse_close(&ex_priv->xdr_ctx); if (ex_priv->fl_ex_node != NULL) { ct_free_fnode(ex_priv->fl_ex_node); } e_free(&ex_priv); /* will be cleaned up by trans if ex_priv already gone */ if (state->extract_state) ct_file_extract_cleanup(state->extract_state); } return; }
/* * So that we can provide correct statistics we have to go through all ctfiles * being extracted and sum the sizes to be extracted. This is kinda expensive, * but not really avoidable if we want to provide the statistics. * * Failure means we have called ct fatal. */ int ct_extract_calculate_total(struct ct_global_state *state, struct ct_extract_args *cea, struct ct_match *inc_match, struct ct_match *ex_match) { struct ct_extract_head extract_head; struct ctfile_parse_state xdr_ctx; struct ct_match *rb_match = NULL; struct fnode *fnode; int allfiles; int fillrb = 0, haverb = 0; int doextract = 0; int tr_state; int ret; int retval = 1; TAILQ_INIT(&extract_head); if ((ret = ct_extract_setup(&extract_head, &xdr_ctx, cea->cea_local_ctfile, cea->cea_ctfile_basedir, &allfiles)) != 0) { ct_fatal(state, "can't setup extract queue", ret); goto done; } if (allfiles) { char *nothing = NULL; if ((ret = ct_match_compile(&rb_match, CT_MATCH_RB, ¬hing)) != 0) { ct_fatal(state, "Couldn't create match tree", ret); goto done; } fillrb = 1; } while (1) { switch ((ret = ctfile_parse(&xdr_ctx))) { case XS_RET_FILE: if (fillrb == 0 && xdr_ctx.xs_hdr.cmh_nr_shas == -1) { continue; } fnode = ct_alloc_fnode(); /* XXX need the fnode for the correct paths */ ct_populate_fnode(state->extract_state, &xdr_ctx, fnode, &tr_state, allfiles, cea->cea_strip_slash); /* we don't care about individual shas */ if (C_ISREG(fnode->fn_type)) { ctfile_parse_seek(&xdr_ctx); } doextract = !ct_match(inc_match, fnode->fn_fullname); if (doextract && ex_match != NULL && !ct_match(ex_match, fnode->fn_fullname)) doextract = 0; /* * If we're on the first ctfile in an allfiles backup * put the matches with -1 on the rb tree so we'll * remember to extract it from older files. */ if (doextract == 1 && fillrb && xdr_ctx.xs_hdr.cmh_nr_shas == -1) { ct_match_insert_rb(rb_match, fnode->fn_fullname); doextract = 0; } ct_free_fnode(fnode); break; case XS_RET_FILE_END: if (doextract == 0) continue; /* update statistics */ state->ct_stats->st_bytes_tot += xdr_ctx.xs_trl.cmt_orig_size; break; case XS_RET_EOF: ctfile_parse_close(&xdr_ctx); /* if rb tree and rb is empty, goto end state */ if ((haverb && ct_match_rb_is_empty(inc_match)) || (fillrb && ct_match_rb_is_empty(rb_match))) { retval = 0; goto done; } if (!TAILQ_EMPTY(&extract_head)) { /* * if allfiles and this was the first pass. * free the current match lists * switch to rb tree mode */ if (fillrb) { ex_match = NULL; inc_match = rb_match; rb_match = NULL; haverb = 1; fillrb = 0; } /* reinits xdr_ctx */ if ((ret = ct_extract_open_next(&extract_head, &xdr_ctx)) != 0) { ct_fatal(state, "Can't open next ctfile", ret); goto done; } continue; } retval = 0; goto done; break; case XS_RET_FAIL: ct_fatal(state, "Failed to parse ctfile", xdr_ctx.xs_errno); goto done; break; } } done: /* empty unless we quit early */ ct_extract_cleanup_queue(&extract_head); /* only have control of the rb tree we made */ if (haverb) ct_match_unwind(inc_match); if (rb_match != NULL) ct_match_unwind(rb_match); return (retval); }
/* * Perform EXISTS checking on every sha in a ctfile chain. * * We don't do any filtering. It is assumed that the localdb has been * flushed/made good before this operation starts so that we can trust lookups. */ void ct_exists_file(struct ct_global_state *state, struct ct_op *op) { struct ct_exists_args *ce = op->op_args; struct ct_exists_priv *ex_priv = op->op_priv; struct ct_trans *trans; int ret, allfiles; /* if we were woken up due to fatal, just clean up local state */ if (state->ct_dying != 0) goto dying; CNDBG(CT_LOG_TRANS, "entry"); switch (ct_get_file_state(state)) { case CT_S_STARTING: if (ex_priv == NULL) { ex_priv = e_calloc(1, sizeof(*ex_priv)); TAILQ_INIT(&ex_priv->extract_head); op->op_priv = ex_priv; } if ((ret = ct_extract_setup(&ex_priv->extract_head, &ex_priv->xdr_ctx, ce->ce_ctfile, ce->ce_ctfile_basedir, &allfiles)) != 0) { ct_fatal(state, "can't setup extract queue", ret); goto dying; } break; case CT_S_FINISHED: return; default: break; } ct_set_file_state(state, CT_S_RUNNING); while (1) { if ((trans = ct_trans_alloc(state)) == NULL) { CNDBG(CT_LOG_TRANS, "ran out of transactions, waiting"); ct_set_file_state(state, CT_S_WAITING_TRANS); return; } trans->tr_statemachine = ct_state_exists; switch ((ret = ctfile_parse(&ex_priv->xdr_ctx))) { case XS_RET_FILE: case XS_RET_FILE_END: ct_trans_free(state, trans); break; case XS_RET_SHA: if (memcmp(zerosha, ex_priv->xdr_ctx.xs_sha, SHA_DIGEST_LENGTH) == 0) { if (ctfile_parse_seek(&ex_priv->xdr_ctx)) { ct_fatal(state, "Can't seek past " "truncation shas", ex_priv->xdr_ctx.xs_errno); goto dying; } ct_trans_free(state, trans); continue; } if (ex_priv->xdr_ctx.xs_gh.cmg_flags & CT_MD_CRYPTO) { /* * yes csha and sha are reversed, we want * to download csha, but putting it in sha * simplifies the code */ bcopy(ex_priv->xdr_ctx.xs_sha, trans->tr_sha, sizeof(trans->tr_csha)); bcopy(ex_priv->xdr_ctx.xs_csha, trans->tr_csha, sizeof(trans->tr_sha)); bcopy(ex_priv->xdr_ctx.xs_iv, trans->tr_iv, sizeof(trans->tr_iv)); trans->tr_state = TR_S_COMPSHA_ED; } else { trans->tr_state = TR_S_UNCOMPSHA_ED; bcopy(ex_priv->xdr_ctx.xs_sha, trans->tr_sha, sizeof(trans->tr_sha)); } if (clog_mask_is_set(CT_LOG_SHA)) { char shat[SHA_DIGEST_STRING_LENGTH]; ct_sha1_encode(trans->tr_sha, shat); CNDBG(CT_LOG_SHA, "EXISTSing sha %s", shat); } trans->tr_old_genid = -1; /* XXX */ if (ctdb_lookup_sha(state->ct_db_state, trans->tr_sha, trans->tr_csha, trans->tr_iv, &trans->tr_old_genid)) { CNDBG(CT_LOG_SHA, "sha already in localdb"); state->ct_stats->st_bytes_exists += trans->tr_chsize; ct_trans_free(state, trans); continue; } trans->tr_complete = ct_exists_complete; trans->tr_cleanup = NULL; trans->tr_dataslot = 0; ct_queue_first(state, trans); break; case XS_RET_EOF: CNDBG(CT_LOG_CTFILE, "Hit end of ctfile"); ctfile_parse_close(&ex_priv->xdr_ctx); if (!TAILQ_EMPTY(&ex_priv->extract_head)) { /* * if allfiles and this was the first pass. * free the current match lists * switch to rb tree mode */ ct_trans_free(state, trans); /* reinits ex_priv->xdr_ctx */ if ((ret = ct_extract_open_next(&ex_priv->extract_head, &ex_priv->xdr_ctx)) != 0) { ct_fatal(state, "Can't open next ctfile", ret); goto dying; } } else { e_free(&ex_priv); op->op_priv = NULL; trans->tr_state = TR_S_DONE; trans->tr_complete = ct_exists_complete_done; trans->tr_cleanup = NULL; /* * Technically this should be a local * transaction. However, since we are done * it doesn't really matter either way. */ ct_queue_first(state, trans); CNDBG(CT_LOG_TRANS, "extract finished"); ct_set_file_state(state, CT_S_FINISHED); } return; break; case XS_RET_FAIL: ct_fatal(state, "Failed to parse ctfile", ex_priv->xdr_ctx.xs_errno); goto dying; break; } } return; dying: /* only if we hadn't sent the final transaction yet */ if (ex_priv != NULL) { ct_extract_cleanup_queue(&ex_priv->extract_head); /* XXX what about ex_priv->xdr_ctx ? */ e_free(&ex_priv); op->op_priv = NULL; } return; }
/* * Main guts of ctd_build_version_tree. Factored out to avoid deep nesting. * Insert or update an entry in the tree with the information received from * the ctfile. */ static int ct_vertree_add(struct ct_vertree_dnode_cache *dnode_cache, struct ct_vertree_entry *head, struct ctfile_parse_state *parse_state, struct ct_vertree_ctfile *ctfile, off_t fileoffset, int allfiles) { struct ctfile_header *hdr = &parse_state->xs_hdr; struct ctfile_header *hdrlnk= &parse_state->xs_lnkhdr; struct dnode *dnode; struct ct_vertree_dnode *fb_dnode; struct ct_vertree_entry *parent = NULL, sentry, *entry; struct ct_vertree_ver *lastver, *ver; struct ct_vertree_file *file; struct ct_vertree_spec *spec; struct ct_vertree_link *linkver; size_t sz; bool root_dnode = false; entry = NULL; /* First find parent directory if any */ if (hdr->cmh_parent_dir != -1 && hdr->cmh_parent_dir != -2) { if ((dnode = ctfile_parse_finddir(parse_state, hdr->cmh_parent_dir)) == NULL) { CNDBG(CT_LOG_VERTREE, "can't find dir %" PRId64, hdr->cmh_parent_dir); return (CTE_CTFILE_CORRUPT); } fb_dnode = (struct ct_vertree_dnode *)dnode; if (fb_dnode == dnode_cache->root_dnode) { // If we have the root dnode, store in head. parent = head; } else { parent = fb_dnode->cvd_dir; } } else { parent = head; } if (parent == head && strcmp(hdr->cmh_filename, CT_PATHSEP_STR) == 0) { root_dnode = true; } /* * Have parent node, search children to see if we already exist. * Else make a new one and insert. */ sentry.cve_name = hdr->cmh_filename; if ((entry = RB_FIND(ct_vertree_entries, &parent->cve_children, &sentry)) == NULL) { /* new name, insert node */ entry = e_calloc(1, sizeof(*entry)); TAILQ_INIT(&entry->cve_versions); RB_INIT(&entry->cve_children); entry->cve_parent = parent; entry->cve_name = e_strdup(sentry.cve_name); /* don't insert root dnodes, just do dnode dance */ if (root_dnode) { goto rootdir; } if (RB_INSERT(ct_vertree_entries, &parent->cve_children, entry) != NULL) { CNDBG(CT_LOG_VERTREE, "entry %s already exists", sentry.cve_name); e_free(&sentry.cve_name); goto err; } } /* * then check version tags -> head/tail if mtime and type match, we're * good else prepare version entry. */ if (allfiles) { lastver = TAILQ_FIRST(&entry->cve_versions); } else { lastver = TAILQ_LAST(&entry->cve_versions, ct_vertree_vers); } /* Don't check atime, it doesn't matter */ if (lastver != NULL && lastver->cvv_type == hdr->cmh_type && lastver->cvv_mtime == hdr->cmh_mtime && lastver->cvv_uid == hdr->cmh_uid && lastver->cvv_gid == hdr->cmh_gid && lastver->cvv_mode == hdr->cmh_mode) { ver = lastver; } else { /* something changed. make a new one */ if (C_ISDIR(hdr->cmh_type)) { sz = sizeof(struct ct_vertree_dir); } else if (C_ISBLK(hdr->cmh_type) || C_ISCHR(hdr->cmh_type)) { sz = sizeof(struct ct_vertree_spec); } else if (C_ISLINK(hdr->cmh_type)) { sz = sizeof(struct ct_vertree_link); } else if (C_ISREG(hdr->cmh_type)) { sz = sizeof(struct ct_vertree_file); } else { CNDBG(CT_LOG_VERTREE, "invalid type %d", hdr->cmh_type); goto err; } ver = e_calloc(1, sz); ver->cvv_type = hdr->cmh_type; ver->cvv_mtime = hdr->cmh_mtime; ver->cvv_atime = hdr->cmh_atime; ver->cvv_uid = hdr->cmh_uid; ver->cvv_gid = hdr->cmh_gid; ver->cvv_mode = hdr->cmh_mode; /* dir handled below */ if (C_ISBLK(hdr->cmh_type) || C_ISCHR(hdr->cmh_type)) { spec = (struct ct_vertree_spec *)ver; spec->cvs_rdev = hdr->cmh_rdev; } else if (C_ISLINK(hdr->cmh_type)) { /* hardlink/symlink */ linkver = (struct ct_vertree_link *)ver; linkver->cvl_linkname = e_strdup(hdrlnk->cmh_filename); linkver->cvl_hardlink = !C_ISLINK(hdrlnk->cmh_type); } else if (C_ISREG(hdr->cmh_type)) { file = (struct ct_vertree_file *)ver; file->cvf_nr_shas = -1; } if (allfiles) { TAILQ_INSERT_HEAD(&entry->cve_versions, ver, cvv_link); } else { TAILQ_INSERT_TAIL(&entry->cve_versions, ver, cvv_link); } } /* * Each ctfile only has each directory referenced once, so put it * in the cache regardless of whether it was known of before, that * will be a previous run and the cache will have been wiped since * then. */ if (C_ISDIR(hdr->cmh_type)) { rootdir: fb_dnode = e_calloc(1, sizeof(*fb_dnode)); fb_dnode->cvd_dnode.d_name = e_strdup(entry->cve_name); /* * in the root_dnode case this will be a bad pointer but it * will never be derefed. */ fb_dnode->cvd_dir = entry; if ((dnode = ctfile_parse_insertdir(parse_state, &fb_dnode->cvd_dnode)) != NULL) CABORTX("duplicate dentry"); TAILQ_INSERT_TAIL(&dnode_cache->cache, fb_dnode, cvd_link); if (root_dnode) { dnode_cache->root_dnode = fb_dnode; } } else if (C_ISREG(hdr->cmh_type)) { /* * Allfiles ctfiles may have shas == -1, so in some cases we * may wish to update an existing file when we find the actual * shas. It is an error to have a file node with -1 for shas * after all metadata have been parsed. it means one was * missing. */ file = (struct ct_vertree_file *)ver; /* * bugs in previous editions with incremental selection and * off_t on linux mean that there are ctfiles in the wild which * provide a list of shas in a later level when the file is * defined in an earlier level file, also. For example for the * same filename and date we have level 0: 3 shas, level 1: -1 * shas (i.e. in a previous level), level 2: 3 shas (same as * level * 0). In that case we just assume that if we already * have sha data for a file * then it is correct and we skip * previous versions. */ if (file->cvf_nr_shas != -1) { goto out; } /* * previous linux off_t bugs with files over 2gb mean that there * are sign extended ctfiles in the wild, so we count those as * zero length for purposes of the version tree. */ if (hdr->cmh_nr_shas < -1) { hdr->cmh_nr_shas = 0; } if (hdr->cmh_nr_shas != -1) { file->cvf_nr_shas = hdr->cmh_nr_shas; file->cvf_sha_offs = fileoffset; file->cvf_file = ctfile; if (ctfile_parse_seek(parse_state)) { CNDBG(CT_LOG_VERTREE, "failed to skip shas in %s", ctfile->cvc_path); goto err; } } if (ctfile_parse(parse_state) != XS_RET_FILE_END) { CNDBG(CT_LOG_VERTREE, "no file trailer found"); goto err; } file->cvf_file_size = parse_state->xs_trl.cmt_orig_size; } out: /* * If we're an explicit "/" entry then we don't want to be added to * the tree. all our children will be added to the root entry. */ if (root_dnode) { e_free(&entry); } return (0); err: if (entry != NULL) e_free(&entry); return (CTE_CTFILE_CORRUPT); }
int ct_version_tree_build(const char *filename, const char *ctfile_basedir, struct ct_version_tree **version_tree) { struct ct_version_tree *tree = NULL; struct ct_extract_head extract_head; struct ctfile_parse_state parse_state; struct ct_vertree_dnode_cache dnode_cache; struct ct_vertree_dnode *dnode_entry; struct ct_vertree_ctfile *ctfile = NULL; struct ct_vertree_dir *root_dir; struct ct_vertree_ver *root_version; off_t offset; int allfiles; int rv = 0; TAILQ_INIT(&extract_head); TAILQ_INIT(&dnode_cache.cache); dnode_cache.root_dnode = NULL; if ((rv = ct_extract_setup(&extract_head, &parse_state, filename, ctfile_basedir, &allfiles))) { CNDBG(CT_LOG_VERTREE, "failed to setup extract for filename %s: %s", filename, ct_strerror(rv)); goto out; } /* Create and init ctfile cache */ tree = e_calloc(1, sizeof(*tree)); TAILQ_INIT(&tree->cvt_ctfiles); TAILQ_INIT(&tree->cvt_head.cve_versions); RB_INIT(&tree->cvt_head.cve_children); tree->cvt_head.cve_name = e_strdup("/"); nextfile: root_dir = e_calloc(1, sizeof(*root_dir)); root_version = &root_dir->cvd_base; root_version->cvv_type = C_TY_DIR; root_version->cvv_uid = 0; root_version->cvv_gid = 0; root_version->cvv_mode = 0777; root_version->cvv_atime = parse_state.xs_gh.cmg_created; root_version->cvv_mtime = parse_state.xs_gh.cmg_created; TAILQ_INSERT_HEAD(&tree->cvt_head.cve_versions, root_version, cvv_link); /* * Create only one struct for each ctfile. Each entry in the version * tree references the appropriate one. These are added to a cache list * so they can be freed during tree cleanup. */ ctfile = e_calloc(1, sizeof(*ctfile)); strlcpy(ctfile->cvc_path, parse_state.xs_filename, sizeof(ctfile->cvc_path)); offset = ctfile_parse_tell(&parse_state); TAILQ_INSERT_TAIL(&tree->cvt_ctfiles, ctfile, cvc_link); while (((rv = ctfile_parse(&parse_state)) != XS_RET_EOF) && (rv != XS_RET_FAIL)) { switch(rv) { case XS_RET_FILE: if ((rv = ct_vertree_add(&dnode_cache, &tree->cvt_head, &parse_state, ctfile, offset, allfiles)) != 0) { goto out; } break; case XS_RET_FILE_END: break; case XS_RET_SHA: if ((rv = ctfile_parse_seek(&parse_state))) { goto out; } break; default: rv = CTE_CTFILE_CORRUPT; goto out; } offset = ctfile_parse_tell(&parse_state); } if (rv == XS_RET_EOF) { ctfile_parse_close(&parse_state); if (!TAILQ_EMPTY(&extract_head)) { /* XXX do we need to zero root dnode? */ ct_extract_open_next(&extract_head, &parse_state); goto nextfile; } rv = 0; /* free state */ } else { rv = CTE_CTFILE_CORRUPT; goto out; } *version_tree = tree; out: /* Free dnode_cache entries. */ while ((dnode_entry = TAILQ_FIRST(&dnode_cache.cache)) != NULL) { TAILQ_REMOVE(&dnode_cache.cache, dnode_entry, cvd_link); if (dnode_entry->cvd_dnode.d_name != NULL) e_free(&dnode_entry->cvd_dnode.d_name); e_free(&dnode_entry); } return rv; }
int ct_list(const char *file, char **flist, char **excludelist, int match_mode, const char *ctfile_basedir, int strip_slash, int verbose) { struct ct_extract_state *ces; struct ctfile_parse_state xs_ctx; struct fnode fnodestore; uint64_t reduction; struct fnode *fnode = &fnodestore; struct ct_match *match, *ex_match = NULL; char *ct_next_filename; char *sign; int state; int doprint = 0; int ret; int s_errno = 0, ct_errno = 0; char shat[SHA_DIGEST_STRING_LENGTH]; char cshat[SHA_DIGEST_STRING_LENGTH]; char iv[CT_IV_LEN*2+1]; if ((ret = ct_file_extract_init(&ces, NULL, 1, 1, 0, NULL, NULL)) != 0) CFATALX("failed to initialise extract state: %s", ct_strerror(ret)); if ((ret = ct_match_compile(&match, match_mode, flist)) != 0) CFATALX("failed to compile match pattern: %s", ct_strerror(ret)); if (excludelist != NULL && (ret = ct_match_compile(&ex_match, match_mode, excludelist)) != 0) CFATALX("failed to compile exclude pattern: %s", ct_strerror(ret)); verbose++; /* by default print something. */ ct_next_filename = NULL; next_file: ret = ctfile_parse_init(&xs_ctx, file, ctfile_basedir); if (ret) CFATALX("failed to open %s: %s", file, ct_strerror(ret)); ct_print_ctfile_info(&verbose, file, &xs_ctx.xs_gh); if (ct_next_filename) e_free(&ct_next_filename); if (xs_ctx.xs_gh.cmg_prevlvl_filename) { CNDBG(CT_LOG_CTFILE, "previous backup file %s\n", xs_ctx.xs_gh.cmg_prevlvl_filename); ct_next_filename = e_strdup(xs_ctx.xs_gh.cmg_prevlvl_filename); } bzero(&fnodestore, sizeof(fnodestore)); do { ret = ctfile_parse(&xs_ctx); switch (ret) { case XS_RET_FILE: ct_populate_fnode(ces, &xs_ctx, fnode, &state, xs_ctx.xs_gh.cmg_flags & CT_MD_MLB_ALLFILES, strip_slash); doprint = !ct_match(match, fnode->fn_fullname); if (doprint && ex_match != NULL && !ct_match(ex_match, fnode->fn_fullname)) doprint = 0; if (doprint) { ct_pr_fmt_file(&verbose, fnode); if (!C_ISREG(xs_ctx.xs_hdr.cmh_type) || verbose > 2) printf("\n"); } if (fnode->fn_hlname) e_free(&fnode->fn_hlname); if (fnode->fn_fullname) e_free(&fnode->fn_fullname); break; case XS_RET_FILE_END: sign = " "; if (xs_ctx.xs_trl.cmt_comp_size == 0) reduction = 100; else { uint64_t orig, comp; orig = xs_ctx.xs_trl.cmt_orig_size; comp = xs_ctx.xs_trl.cmt_comp_size; if (comp <= orig) { reduction = 100 * (orig - comp) / orig; } else { reduction = 100 * (comp - orig) / orig; if (reduction != 0) sign = "-"; } } if (doprint && verbose > 1) printf(" sz: %" PRIu64 " shas: %" PRIu64 " reduction: %s%" PRIu64 "%%\n", xs_ctx.xs_trl.cmt_orig_size, xs_ctx.xs_hdr.cmh_nr_shas, sign, reduction); else if (doprint) printf("\n"); break; case XS_RET_SHA: if (!(doprint && verbose > 2)) { if (ctfile_parse_seek(&xs_ctx)) { CFATALX("seek failed"); } } else { int i; ct_sha1_encode(xs_ctx.xs_sha, shat); switch (xs_ctx.xs_gh.cmg_flags & CT_MD_CRYPTO) { case 0: printf(" sha %s\n", shat); break; case CT_MD_CRYPTO: ct_sha1_encode(xs_ctx.xs_csha, cshat); for (i = 0; i < CT_IV_LEN; i++) snprintf(&iv[i * 2], 3, "%02x", xs_ctx.xs_iv[i]); printf(" sha %s csha %s iv %s\n", shat, cshat, iv); } } break; case XS_RET_EOF: break; case XS_RET_FAIL: s_errno = errno; ct_errno = xs_ctx.xs_errno; ; } } while (ret != XS_RET_EOF && ret != XS_RET_FAIL); ctfile_parse_close(&xs_ctx); if (ret != XS_RET_EOF) { errno = s_errno; CWARNX("corrupt ctfile: %s", ct_strerror(ct_errno)); } else { if (ct_next_filename) { file = ct_next_filename; goto next_file; } } ct_match_unwind(match); ct_file_extract_cleanup(ces); return (0); }