您的位置:首页 > 编程语言 > C语言/C++

[C/C++]_[字符串处理]_[过滤出HTML标签的属性值]

2012-11-12 11:03 344 查看
typedef struct ElementAttribute ElementAttribute;

struct ElementAttribute
{
	const char* name;
	const char* value;
	ElementAttribute* previous;
};

static const char* HtmlFindSpaceFromRecursion(const char* str, const char* start)
{
	const char* p = str;
	while (p >= start)
	{
		if (*p == 0x20)
		{
			return p;
		}
		--p;
	}
	return str;
}

/**
 * 1.注意,这个函数只适合标准的属性格式,也就是"是成对存在.
 */
static ElementAttribute* HtmlGetElementAttribute(char* str)
{
	ElementAttribute *attr = NULL;
	static char quote = '\"';
	char* p = strchr(str, quote);
	while (p)
	{
		char *start = p;
		//属性名
		char* a_name_start = (char*) HtmlFindSpaceFromRecursion(start, str);
		*(start - 1) = 0;

		//属性值
		p = strchr(start + 1, quote);
		*p = 0;

		ElementAttribute *next = (ElementAttribute*) malloc(
				sizeof(ElementAttribute));
		memset(next, 0, sizeof(ElementAttribute));
		next->name = a_name_start + 1;
		next->value = start + 1;
		next->previous = attr;
		attr = next;

		p = strchr(p + 1, quote);
	}
	return attr;
}

TEST(main,testElementAttribute)
{
	char* str = strdup("p height=\"1em\" width=\"0pt\" align=\"center\"");
	ElementAttribute* attr = HtmlGetElementAttribute(str);
	while(attr)
	{
		QXLOG("name: ",attr->name);
		QXLOG("value:",attr->value);
		attr = attr->previous;
	}
	free(str);
}
内容来自用户分享和网络整理,不保证内容的准确性,如有侵权内容,可联系管理员处理 点击这里给我发消息
标签: