/* Example no. 1 */
/* 0 */
/**
 * Handle tokens in "in head noscript" insertion mode
 *
 * \param treebuilder  The treebuilder instance
 * \param token        The token to process
 * \return HUBBUB_REPROCESS if the token is to be reprocessed (the current
 *         node has then been popped and the insertion mode switched to
 *         "in head"), otherwise HUBBUB_OK or whatever the delegated
 *         handler returned
 */
hubbub_error handle_in_head_noscript(hubbub_treebuilder *treebuilder,
		const hubbub_token *token)
{
	hubbub_error err = HUBBUB_OK;
	/* Set when a </noscript> end tag closes the current element */
	bool handled = false;

	switch (token->type) {
	case HUBBUB_TOKEN_CHARACTER:
		/* A HUBBUB_REPROCESS result here is picked up by the
		 * pop-and-switch step at the end of this function */
		err = process_characters_expect_whitespace(treebuilder,
				token, true);
		break;
	case HUBBUB_TOKEN_COMMENT:
		/* Process as "in head" */
		err = handle_in_head(treebuilder, token);
		break;
	case HUBBUB_TOKEN_DOCTYPE:
		/** \todo parse error */
		break;
	case HUBBUB_TOKEN_START_TAG:
	{
		element_type type = element_type_from_name(treebuilder,
				&token->data.tag.name);

		if (type == HTML) {
			/* Process as "in body" */
			err = handle_in_body(treebuilder, token);
		} else if (type == LINK || type == META || type == NOFRAMES ||
				type == STYLE) {
			/* Process as "in head" */
			err = handle_in_head(treebuilder, token);
		} else if (type == HEAD || type == NOSCRIPT) {
			/* A nested <head> or <noscript> start tag is ignored.
			 * In particular, <noscript> must not close the open
			 * element; only the </noscript> end tag does that. */
			/** \todo parse error */
		} else {
			/* Anything else: leave this mode and reprocess */
			/** \todo parse error */
			err = HUBBUB_REPROCESS;
		}
	}
		break;
	case HUBBUB_TOKEN_END_TAG:
	{
		element_type type = element_type_from_name(treebuilder,
				&token->data.tag.name);

		if (type == NOSCRIPT) {
			handled = true;
		} else if (type == BR) {
			/* </br> is treated like "anything else" */
			/** \todo parse error */
			err = HUBBUB_REPROCESS;
		} else {
			/* Any other end tag is ignored */
			/** \todo parse error */
		}
	}
		break;
	case HUBBUB_TOKEN_EOF:
		/** \todo parse error */
		err = HUBBUB_REPROCESS;
		break;
	}

	if (handled || err == HUBBUB_REPROCESS) {
		hubbub_ns ns;
		element_type otype;
		void *node;

		/* Pop the current node, release the reference returned with
		 * it, and continue in "in head" mode */
		element_stack_pop(treebuilder, &ns, &otype, &node);

		treebuilder->tree_handler->unref_node(
				treebuilder->tree_handler->ctx,
				node);

		treebuilder->context.mode = IN_HEAD;
	}

	return err;
}
/* Example no. 2 */
/* 0 */
/**
 * Process a token while in the "in table" insertion mode
 *
 * Tokens that have no table-specific handling are passed to
 * handle_in_body() with the context's in_table_foster flag set for the
 * duration of that call.
 *
 * \param treebuilder  The treebuilder instance
 * \param token        The token to handle
 * \return HUBBUB_REPROCESS when the token is to be reprocessed, otherwise
 *         HUBBUB_OK or an error code passed up from a callee
 */
hubbub_error handle_in_table(hubbub_treebuilder *treebuilder,
		const hubbub_token *token)
{
	hubbub_error err = HUBBUB_OK;
	/* Raised when the token must be handed to the "in body" rules */
	bool use_in_body = false;

	switch (token->type) {
	case HUBBUB_TOKEN_CHARACTER:
		if (!treebuilder->context.element_stack[
				current_table(treebuilder)].tainted) {
			err = process_characters_expect_whitespace(
					treebuilder, token, true);
			use_in_body = (err != HUBBUB_OK);
		} else {
			/* Current table is flagged as tainted */
			use_in_body = true;
		}
		break;
	case HUBBUB_TOKEN_COMMENT:
		/* Comments are appended to the current node */
		err = process_comment_append(treebuilder, token,
				treebuilder->context.element_stack[
				treebuilder->context.current_node].node);
		break;
	case HUBBUB_TOKEN_DOCTYPE:
		/** \todo parse error */
		break;
	case HUBBUB_TOKEN_START_TAG:
	{
		const element_type type = element_type_from_name(treebuilder,
				&token->data.tag.name);
		const bool tainted = treebuilder->context.element_stack[
				current_table(treebuilder)].tainted;

		if (type == CAPTION) {
			clear_stack_table_context(treebuilder);

			/* Take a reference on the current node for the
			 * formatting list entry appended below */
			treebuilder->tree_handler->ref_node(
				treebuilder->tree_handler->ctx,
				treebuilder->context.element_stack[
				treebuilder->context.current_node].node);

			err = formatting_list_append(treebuilder,
					token->data.tag.ns, type,
					treebuilder->context.element_stack[
					treebuilder->context.current_node].node,
					treebuilder->context.current_node);
			if (err != HUBBUB_OK) {
				/* Append failed: give the reference back */
				treebuilder->tree_handler->unref_node(
					treebuilder->tree_handler->ctx,
					treebuilder->context.element_stack[
					treebuilder->context.current_node].node);

				return err;
			}

			err = insert_element(treebuilder, &token->data.tag,
					true);
			if (err != HUBBUB_OK) {
				hubbub_ns dropped_ns;
				element_type dropped_type;
				void *dropped_node;
				uint32_t dropped_index;

				/* Insertion failed: undo the formatting list
				 * append and release its node reference */
				formatting_list_remove(treebuilder,
					treebuilder->context.formatting_list_end,
					&dropped_ns, &dropped_type,
					&dropped_node, &dropped_index);

				treebuilder->tree_handler->unref_node(
					treebuilder->tree_handler->ctx,
					dropped_node);

				return err;
			}

			treebuilder->context.mode = IN_CAPTION;
		} else if (type == COL || type == COLGROUP) {
			hubbub_tag colgroup = token->data.tag;
			hubbub_error status;

			if (type == COL) {
				/* Insert an attribute-less colgroup in place
				 * of the col and have the token reprocessed */
				err = HUBBUB_REPROCESS;

				colgroup.attributes = NULL;
				colgroup.n_attributes = 0;
				colgroup.name.len = SLEN("colgroup");
				colgroup.name.ptr = (const uint8_t *) "colgroup";
			}

			clear_stack_table_context(treebuilder);

			status = insert_element(treebuilder, &colgroup, true);
			if (status != HUBBUB_OK)
				return status;

			treebuilder->context.mode = IN_COLUMN_GROUP;
		} else if (type == TR || type == TD || type == TH ||
				type == TBODY || type == TFOOT ||
				type == THEAD) {
			hubbub_tag section = token->data.tag;
			hubbub_error status;

			if (type == TR || type == TD || type == TH) {
				/* Insert an attribute-less tbody in place of
				 * the row/cell and have the token reprocessed */
				err = HUBBUB_REPROCESS;

				section.attributes = NULL;
				section.n_attributes = 0;
				section.name.len = SLEN("tbody");
				section.name.ptr = (const uint8_t *) "tbody";
			}

			clear_stack_table_context(treebuilder);

			status = insert_element(treebuilder, &section, true);
			if (status != HUBBUB_OK)
				return status;

			treebuilder->context.mode = IN_TABLE_BODY;
		} else if (type == TABLE) {
			/** \todo parse error */

			/* Same steps as the "</table>" end tag, after which
			 * the start tag is reprocessed */
			element_stack_pop_until(treebuilder, TABLE);

			reset_insertion_mode(treebuilder);

			err = HUBBUB_REPROCESS;
		} else if (tainted) {
			/* No further special cases apply to a tainted table */
			use_in_body = true;
		} else if (type == SCRIPT || type == STYLE) {
			/* Process as "in head" */
			err = handle_in_head(treebuilder, token);
		} else if (type == INPUT) {
			err = process_input_in_table(treebuilder, token);
			use_in_body = (err != HUBBUB_OK);
		} else {
			use_in_body = true;
		}
	}
		break;
	case HUBBUB_TOKEN_END_TAG:
		switch (element_type_from_name(treebuilder,
				&token->data.tag.name)) {
		case TABLE:
			/** \todo fragment case */

			element_stack_pop_until(treebuilder, TABLE);

			reset_insertion_mode(treebuilder);
			break;
		case BODY:
		case CAPTION:
		case COL:
		case COLGROUP:
		case HTML:
		case TBODY:
		case TD:
		case TFOOT:
		case TH:
		case THEAD:
		case TR:
			/* These end tags are ignored */
			/** \todo parse error */
			break;
		default:
			use_in_body = true;
			break;
		}
		break;
	case HUBBUB_TOKEN_EOF:
		break;
	}

	if (use_in_body) {
		/* Run the "in body" rules with the in_table_foster flag set
		 * for the duration of the call */
		treebuilder->context.in_table_foster = true;

		/** \todo parse error */
		err = handle_in_body(treebuilder, token);

		treebuilder->context.in_table_foster = false;
	}

	return err;
}
/**
 * Handle tokeniser emitting a token
 *
 * The token is dispatched to the handler for the current insertion mode.
 * While a handler returns HUBBUB_REPROCESS, the token is dispatched again
 * using whatever insertion mode is then current.
 *
 * \param token  The emitted token
 * \param pw     Pointer to treebuilder instance
 * \return HUBBUB_OK if the treebuilder has no document node or no tree
 *         handler, or if the insertion mode is not recognised (which also
 *         trips an assertion in debug builds); otherwise the first result
 *         other than HUBBUB_REPROCESS returned by a mode handler
 */
hubbub_error hubbub_treebuilder_token_handler(const hubbub_token *token,
		void *pw)
{
	hubbub_treebuilder *treebuilder = (hubbub_treebuilder *) pw;
	/* Start at REPROCESS so the dispatch loop runs at least once */
	hubbub_error err = HUBBUB_REPROCESS;

	/* Do nothing if we have no document node or there's no tree handler */
	if (treebuilder->context.document == NULL ||
			treebuilder->tree_handler == NULL)
		return HUBBUB_OK;

	assert((signed) treebuilder->context.current_node >= 0);

/* A slightly nasty debugging hook, but very useful: unless NDEBUG is
 * defined, every dispatch prints the name of the insertion mode */
#ifdef NDEBUG
# define mode(x) \
		case x:
#else
# define mode(x) \
		case x: \
			printf( #x "\n");
#endif

	while (err == HUBBUB_REPROCESS) {
		switch (treebuilder->context.mode) {
		mode(INITIAL)
			err = handle_initial(treebuilder, token);
			break;
		mode(BEFORE_HTML)
			err = handle_before_html(treebuilder, token);
			break;
		mode(BEFORE_HEAD)
			err = handle_before_head(treebuilder, token);
			break;
		mode(IN_HEAD)
			err = handle_in_head(treebuilder, token);
			break;
		mode(IN_HEAD_NOSCRIPT)
			err = handle_in_head_noscript(treebuilder, token);
			break;
		mode(AFTER_HEAD)
			err = handle_after_head(treebuilder, token);
			break;
		mode(IN_BODY)
			err = handle_in_body(treebuilder, token);
			break;
		mode(IN_TABLE)
			err = handle_in_table(treebuilder, token);
			break;
		mode(IN_CAPTION)
			err = handle_in_caption(treebuilder, token);
			break;
		mode(IN_COLUMN_GROUP)
			err = handle_in_column_group(treebuilder, token);
			break;
		mode(IN_TABLE_BODY)
			err = handle_in_table_body(treebuilder, token);
			break;
		mode(IN_ROW)
			err = handle_in_row(treebuilder, token);
			break;
		mode(IN_CELL)
			err = handle_in_cell(treebuilder, token);
			break;
		mode(IN_SELECT)
			err = handle_in_select(treebuilder, token);
			break;
		mode(IN_SELECT_IN_TABLE)
			err = handle_in_select_in_table(treebuilder, token);
			break;
		mode(IN_FOREIGN_CONTENT)
			err = handle_in_foreign_content(treebuilder, token);
			break;
		mode(AFTER_BODY)
			err = handle_after_body(treebuilder, token);
			break;
		mode(IN_FRAMESET)
			err = handle_in_frameset(treebuilder, token);
			break;
		mode(AFTER_FRAMESET)
			err = handle_after_frameset(treebuilder, token);
			break;
		mode(AFTER_AFTER_BODY)
			err = handle_after_after_body(treebuilder, token);
			break;
		mode(AFTER_AFTER_FRAMESET)
			err = handle_after_after_frameset(treebuilder, token);
			break;
		mode(GENERIC_RCDATA)
			err = handle_generic_rcdata(treebuilder, token);
			break;
		default:
			/* No handler for this mode. err would otherwise stay
			 * HUBBUB_REPROCESS and the loop would never end, so
			 * flag it in debug builds and stop dispatching. */
			assert(0 && "unhandled insertion mode");
			err = HUBBUB_OK;
			break;
		}
	}

/* Keep the helper macro from leaking into the rest of the file */
#undef mode

	return err;
}