\begin{thebibliography}{} \bibitem[ric 2001]{rich-text-:2001} \ (2001). \newblock {\em Rich Text Format {(}RTF{)} Specification\/}. \newblock Microsoft. \newblock Version 1.7. \bibitem[{\sc Aho} \btxetalshort{.} 1989]{compiler-b:1989} {\sc Aho, Alfred~V.}, {\sc R.~Sethi} \btxandshort{.}\ {\sc J.~D. Ullman}\ (1989). \newblock {\em Compiler-Bau\/}. \newblock Teil 1. Addison-Wesley, Universit{\"a}t Bonn. \bibitem[{\sc Altamura} \btxetalshort{.} 2000]{transformi:2000} {\sc Altamura, Oronzo}, {\sc F.~Esposito} \btxandshort{.}\ {\sc D.~Malerba}\ (2000). \newblock {\em Transforming Paper Documents into XML Format with WISDOM++\/}. \newblock \Btxtechreplong{.}, Dipartimento di Informatica, Universit{\`a} degli Studi di Bari - Italy. \bibitem[{\sc Altamura} \btxetalshort{.} 2001]{transformi:2001} {\sc Altamura, Oronzo}, {\sc F.~Esposito} \btxandshort{.}\ {\sc D.~Malerba}\ (2001). \newblock {\em Transforming paper documents into XML format with WISDOM++\/}. \newblock International Journal on Document Analysis and Recognition. \bibitem[{\sc Behme} \btxandshort{.}\ {\sc Mintert} 2000]{xml-in-der:2000} {\sc Behme, Henning} \btxandshort{.}\ {\sc S.~Mintert}\ (2000). \newblock {\em XML in der Praxis\/}. \newblock Addison-Wesley. \bibitem[{\sc Born} 1995]{noch-mehr-:1995} {\sc Born, G{\"u}nter}\ (1995). \newblock {\em Noch mehr Dateiformate: Neue Dateiformate f{\"u}r Grafik, Text, Tabellenkalkulation und Sound\/}. \newblock Addison-Wesley, 1. \btxeditionshort{.} \bibitem[{\sc Born} 2001]{dateiforma:2001} {\sc Born, G{\"u}nter}\ (2001). \newblock {\em Dateiformate - Die Referenz\/}. \newblock Galileo Press GmbH, Bonn, 1. \btxeditionshort{.} \bibitem[{\sc Bryan} 1988]{sgml---an-:1988} {\sc Bryan, Martin}\ (1988). \newblock {\em SGML - an author's guide to the Standard Generalized Markup Language\/}. \newblock Addison-Wesley. \bibitem[{\sc Dahn} 2001a]{slicing-bo:2001} {\sc Dahn, Ingo}\ (2001a). \newblock {\em Slicing Book Technology - Providing Online Support for Textbooks\/}. 
\newblock \Btxinshort{.}\ {\em ICDE 2001\/}. \bibitem[{\sc Dahn} 2001b]{using-netw:2001} {\sc Dahn, Ingo}\ (2001b). \newblock {\em Using Networks for Advanced Personalization of Documents\/}. \newblock \Btxinshort{.}\ {\em SSGRR 2001 International Conference on Advances in Infrastructure for Electronic Business, Science and Education on the Internet\/}, L'Aquila. Scuola Superiore Guglielmo Reiss Romoli. \bibitem[{\sc Dahn} \btxetalshort{.}]{dahn-slicing} {\sc Dahn, Ingo}, {\sc M.~Armbruster}, {\sc U.~Furbach} \btxandshort{.}\ {\sc G.~Schwabe}. \newblock {\em Slicing Books - The Authors' Perspective\/}. \newblock \url{http://www.citeseer.nj.nec.com/487947.html}. \bibitem[{\sc Esposito} \btxetalshort{.} 2000]{machine-le:2000} {\sc Esposito, Floriana}, {\sc D.~Malerba} \btxandshort{.}\ {\sc F.~A. Lisi}\ (2000). \newblock {\em Machine Learning for Intelligent Processing of Printed Documents\/}. \newblock Journal of Intelligent Information Systems, 14(2/3):175--198. \bibitem[{\sc Esposito} \btxetalshort{.} 1995]{a-knowledg:1995} {\sc Esposito, Floriana}, {\sc D.~Malerba} \btxandshort{.}\ {\sc G.~Semeraro}\ (1995). \newblock {\em A Knowledge-Based Approach to the Layout Analysis\/}. \newblock Proc. of the 3rd Int. Conf. on the Practical Application of Prolog, \btxpagesshort{.}\ 429--443. \bibitem[{\sc Goldfarb} 1996]{the-roots-:1996} {\sc Goldfarb, Charles~F.}\ (1996). \newblock {\em The Roots of SGML -- A Personal Recollection\/}. \bibitem[{\sc Goossens} \btxetalshort{.} 2000]{der-latex-:2000} {\sc Goossens, Michel}, {\sc F.~Mittelbach} \btxandshort{.}\ {\sc A.~Samarin}\ (2000). \newblock {\em Der \LaTeX\ Begleiter\/}. \newblock Addison-Wesley. \bibitem[{\sc Hyafil} \btxandshort{.}\ {\sc Rivest} 1976]{constructi:1976} {\sc Hyafil, Laurent} \btxandshort{.}\ {\sc R.~L. Rivest}\ (1976). \newblock {\em Constructing optimal binary decision trees is NP-complete\/}. 
\newblock \Btxinshort{.}\ {\sc Glushkov, V.M.}, {\sc D.~Gries}, {\sc D.~Knuth}, {\sc M.~Paul}, {\sc W.~Turski} \btxandshort{.}\ {\sc W.~{Van der Poel}}, \btxeditorsshort{.}: {\em Information Processing Letters\/}, \btxvolumeshort{.}~5, \btxpagesshort{.}\ 15--17. North-Holland Publishing Company. \bibitem[{\sc Knappen} \btxetalshort{.} 1995]{latex-kur:1995} {\sc Knappen, J{\"o}rg}, {\sc H.~Partl}, {\sc E.~Schlegl} \btxandshort{.}\ {\sc I.~Hyna}\ (1995). \newblock {\em \LaTeXe-Kurzbeschreibung\/}. \newblock Zentrum f{\"u}r Datenverarbeitung, Johannes Gutenberg-Universit{\"a}t Mainz. \bibitem[{\sc Kobert} 1999]{xml:1999} {\sc Kobert, Thomas}\ (1999). \newblock {\em XML\/}. \newblock bhv Verlags GmbH. \bibitem[{\sc Lobin} 2001]{informatio:2001} {\sc Lobin, Henning}\ (2001). \newblock {\em Informationsmodellierung in XML und SGML\/}. \newblock Springer-Verlag. \bibitem[{\sc Mintert} 1999]{automatisi:1999} {\sc Mintert, Stefan}\ (1999). \newblock {\em Automatisierte WWW-Ver{\"o}ffentlichung auf der Basis formaler Auszeichnungssprachen\/}. \newblock \btxmastthesis{.}, Universit{\"a}t Dortmund, Lehrstuhl f{\"u}r K{\"u}nstliche Intelligenz. \bibitem[{\sc Mintert} 2002]{xmlCo:2002} {\sc Mintert, Stefan}\ (2002). \newblock {\em XML \& Co\/}. \newblock Addison-Wesley. \bibitem[{\sc Mitchell} 1997]{machine-le:1997} {\sc Mitchell, Tom~M.}\ (1997). \newblock {\em Machine Learning\/}. \newblock The McGraw-Hill Companies, Inc. \bibitem[{\sc Morik} 1995]{katharina-:1} {\sc Morik, Katharina}\ (1995). \newblock {\em Einf{\"u}hrung in die K{\"u}nstliche Intelligenz\/}, \btxchaptershort{.}~3, \btxpagesshort{.}\ 243--297. \newblock Addison-Wesley, 2. \btxeditionshort{.} \bibitem[{\sc Morik} 1997]{einfueh:1997} {\sc Morik, Katharina}\ (1997). \newblock {\em Einf{\"u}hrung in die K{\"u}nstliche Intelligenz\/}. \newblock Vorlesungsskript. \newblock \url{http://www-ai.cs.uni-dortmund.de/LEHRE/VORLESUNGEN/KI/SKRIPT/skript97_0.pdf}. 
\bibitem[{\sc Morik} 1998]{programmie:1998} {\sc Morik, Katharina}\ (1998). \newblock {\em Programmierung I: JAVA Skript zur Vorlesung WS 98/99\/}. \newblock Vorlesungsskript. \newblock \url{http://www-ai.cs.uni-dortmund.de/DOKUMENTE/morik_2000b.ps.gz}. \bibitem[{\sc Morik} 2002]{maschinell:2002} {\sc Morik, Katharina}\ (2002). \newblock {\em Maschinelles Lernen und Data Mining\/}. \newblock Begleitfolien zur Vorlesung. \newblock \url{http://www-ai.cs.uni-dortmund.de/LEHRE/VORLESUNGEN/MLRN/FOLIEN/FolienSuche.pdf}. \bibitem[{\sc Quinlan} 1983]{learning-e:1983} {\sc Quinlan, John~Ross}\ (1983). \newblock {\em Learning Efficient Classification Procedures And Their Application To Chess End Games\/}. \newblock \Btxinshort{.}\ {\sc Michalski, Ryszard~S.}, {\sc J.~G. Carbonell} \btxandshort{.}\ {\sc T.~M. Mitchell}, \btxeditorsshort{.}: {\em Machine Learning - An Artificial Intelligence Approach\/}, \btxpagesshort{.}\ 463--482. Tioga Publishing Company. \bibitem[{\sc Quinlan} 1993]{c4.5-progr:1993} {\sc Quinlan, John~Ross}\ (1993). \newblock {\em C4.5 programs for machine learning\/}. \newblock Morgan Kaufmann Publishers, Inc. \bibitem[{\sc Valerius} \btxetalshort{.} 2001]{adaptive-b:2001} {\sc Valerius, Marianne}, {\sc I.~Dahn} \btxandshort{.}\ {\sc G.~Schwabe}\ (2001). \newblock {\em Adaptive B{\"u}cher f{\"u}r das kooperative Lernen: Anwendungen - Konzepte - Erfahrungen\/}. \newblock \Btxinshort{.}\ {\sc M.~Engelien, J.~Homann}, \btxeditorshort{.}: {\em Virtuelle Organisation und Neue Medien 2001\/}, \btxpagesshort{.}\ 391--413. Josef Eul Verlag. \bibitem[{\sc Wang} \btxetalshort{.} 1999]{from-image:1999} {\sc Wang, Y.}, {\sc T.~Phillips} \btxandshort{.}\ {\sc R.~Haralick}\ (1999). \newblock {\em From Image to SGML/XML Representation: One Method\/}. \newblock Proc. of the Int. Workshop on Document Layout Interpretation and its Applications. 
\bibitem[{\sc Witten} \btxandshort{.}\ {\sc Frank} 2000]{data-minin:2000} {\sc Witten, Ian~H.} \btxandshort{.}\ {\sc E.~Frank}\ (2000). \newblock {\em Data Mining - Practical Machine Learning Tools and Techniques with Java Implementations\/}. \newblock Morgan Kaufmann Publishers, San Francisco. \bibitem[{\sc Wong} \btxetalshort{.} 1982]{document-a:1982} {\sc Wong, Kwan~Y.}, {\sc R.~G. Casey} \btxandshort{.}\ {\sc F.~M. Wahl}\ (1982). \newblock {\em Document analysis system\/}. \newblock IBM Journal of Research and Development, 26(6):647--656. \end{thebibliography}