% TreeForm workshop paper (LAW-XVIII, 2024); the `url` field points to its ACL Anthology page.
% NOTE(review): `address` appears to hold the workshop venue rather than the publisher's city -- confirm against the target style.
@inproceedings{zmigrod-etal-2024-treeform,
  title     = "{TreeForm}: End-to-end Annotation and Evaluation for Form Document Parsing",
  author    = "Zmigrod, Ran and
               Ma, Zhiqiang and
               Nourbakhsh, Armineh and
               Shah, Sameena",
  editor    = "Henning, Sophie and
               Stede, Manfred",
  booktitle = "Proceedings of The 18th Linguistic Annotation Workshop (LAW-XVIII)",
  month     = mar,
  year      = "2024",
  address   = "St. Julians, Malta",
  publisher = "Association for Computational Linguistics",
  url       = "https://aclanthology.org/2024.law-1.1",
  pages     = "1--11",
  abstract  = "Visually Rich Form Understanding (VRFU) poses a complex research problem due to the documents{'} highly structured nature and yet highly variable style and content. Current annotation schemes decompose form understanding and omit key hierarchical structure, making development and evaluation of end-to-end models difficult. In this paper, we propose a novel F1 metric to evaluate form parsers and describe a new content-agnostic, tree-based annotation scheme for VRFU: TreeForm. We provide methods to convert previous annotation schemes into TreeForm structures and evaluate TreeForm predictions using a modified version of the normalized tree-edit distance. We present initial baselines for our end-to-end performance metric and the TreeForm edit distance, averaged over the FUNSD and XFUND datasets, of 61.5 and 26.4 respectively. We hope that TreeForm encourages deeper research in annotating, modeling, and evaluating the complexities of form-like documents.",
}
Markdown (Informal)
[TreeForm: End-to-end Annotation and Evaluation for Form Document Parsing](https://aclanthology.org/2024.law-1.1) (Zmigrod et al., LAW-WS 2024)
ACL