% Chuang and Hsu (2004): conference paper in the WI 2004 proceedings introducing
% the Tree Template Automatic Generator (TTAG). The proceedings title is stored
% once, in booktitle; the note field carries only the conference dates.
@inproceedings{2d2e4ce1c1f64ecab9d7a3a400b895d5,
  author    = {Chuang, {Shui Lung} and Hsu, {Jane Yung Jen}},
  title     = {Tree-structured template generation for {Web} pages},
  editor    = {Zhong, N. and Tirri, H. and Yao, Y. and Zhou, L.},
  booktitle = {Proceedings - IEEE/WIC/ACM International Conference on Web Intelligence, WI 2004},
  pages     = {327--333},
  year      = {2004},
  isbn      = {0769521002},
  language  = {English},
  note      = {Conference date: 20-09-2004 Through 24-09-2004},
  abstract  = {As the web becomes an increasingly important source of information, tools for modeling, searching, and extracting information from Web pages are indispensable. By modeling the structure of a Web page defined by its markup tags, one can easily extract target information using structural templates. This paper introduces the Tree Template Automatic Generator (TTAG) that learns tree-structured templates from training Web pages. TTAG was applied to both query-based and frequently updated Web sites, and produced effective templates from a small number of examples. The experiments show that TTAG is a powerful extraction tool for semi-structured information sources.},
}