% Pekar, Evans and Mitkov (2004), paper in the LREC'04 proceedings (Lisbon).
% The url field uses the permanent ACL Anthology address for record L04-1328
% instead of a branch-specific preview host, which is not a stable citation target.
% NOTE(review): address holds the conference venue as exported; confirm whether
% the target style expects the publisher's city here instead.
@inproceedings{pekar-etal-2004-categorizing,
  title     = {Categorizing Web Pages as a Preprocessing Step for Information Extraction},
  author    = {Pekar, Viktor and Evans, Richard and Mitkov, Ruslan},
  editor    = {Lino, Maria Teresa and Xavier, Maria Francisca and Ferreira, F{\'a}tima and Costa, Rute and Silva, Raquel},
  booktitle = {Proceedings of the Fourth International Conference on Language Resources and Evaluation ({LREC}{'}04)},
  month     = may,
  year      = {2004},
  address   = {Lisbon, Portugal},
  publisher = {European Language Resources Association (ELRA)},
  url       = {https://aclanthology.org/L04-1328/},
}