% Chen and Shen (2006), W4A workshop paper on PURE (HTML clean-up via reverse engineering).
% Cleaned from a repository export: author names normalised to "Last, First" without
% literal braces; series name kept only in the series field, not repeated in booktitle.
@inproceedings{6a14d10e5bde4c9b985841ac1035f85f,
  author    = {Chen, Benfeng and Shen, Vincent Y.},
  title     = {Transforming web pages to become standard-compliant through reverse engineering},
  booktitle = {Proceedings of the 2006 International Cross-disciplinary Workshop on Web Accessibility, {W4A} - Building the Mobile Web},
  series    = {{ACM} International Conference Proceeding Series},
  pages     = {14--22},
  year      = {2006},
  doi       = {10.1145/1133219.1133223},
  isbn      = {159593281X},
  language  = {English},
  keywords  = {Browser, Cascade style sheets, HTML, HTML tidy, Rendering engine, W3C recommendations, Web page},
  abstract  = {Developing Web pages following established standards can make the information more accessible, their rendering more efficient, and their processing by computer applications easier. Unfortunately, more than 95\% of the existing Web pages today are not ``valid'' in that they do not follow some of the recommendations (standards) of the World Wide Web Consortium (W3C). Fixing any Web page to make it standard-compliant is a major undertaking. There is now an open-source tool called HTML Tidy which will attempt to fix the invalid HTML code automatically. However, Tidy often changes the Web page's appearance after processing. It is not an effective tool to transform existing Web pages to make them standard-compliant. In this paper we report the design and implementation of PURE, a tool that cleans up an HTML document through reverse engineering. PURE starts with the rendering result of a given Web page and generates valid HTML code and CSS automatically to produce the same appearance. It is found to be effective for many existing Web pages. A prototype is now available for public testing and comments.},
  note      = {2006 International Cross-disciplinary Workshop on Web Accessibility, W4A - Building the Mobile Web: Rediscovering Accessibility; Conference date: 22-05-2006 Through 22-05-2006},
}