% Metadata
% Conference paper from the 31st Conference on Graphics, Patterns and Images
% (SIBGRAPI), 2018.
%
% Notes for maintainers (text outside an entry is ignored by BibTeX):
%   - The entry carries exactly one `url` field. The publisher link is given
%     by `doi` alone; `url` points at the repository copy that `ibi`
%     identifies.
%   - `affiliation`, `conference-location`, `conference-year`, `ibi`,
%     `targetfile` and `urlaccessdate` are not standard BibTeX fields;
%     standard styles are expected to ignore them (verify against the style
%     in use).
%   - `booktitle` is built from the conference name and ordinal recorded in
%     `organization` -- NOTE(review): confirm against the official
%     proceedings title.
@InProceedings{MaiaJulcHira:2018:MaLeAp,
               author = "Maia, Ana Lucia Lima Marreiros and Julca-Aguilar, Frank Dennis and 
                         Hirata, Nina Sumiko Tomita",
          affiliation = "{University of S{\~a}o Paulo/State University of Feira de 
                         Santana} and {University of S{\~a}o Paulo} and {University of 
                         S{\~a}o Paulo}",
                title = "A Machine Learning approach for Graph-based Page Segmentation",
            booktitle = "Proceedings of the 31st Conference on Graphics, Patterns and 
                         Images (SIBGRAPI)",
                 year = "2018",
               editor = "Ross, Arun and Gastal, Eduardo S. L. and Jorge, Joaquim A. and 
                         Queiroz, Ricardo L. de and Minetto, Rodrigo and Sarkar, Sudeep and 
                         Papa, Jo{\~a}o Paulo and Oliveira, Manuel M. and Arbel{\'a}ez, 
                         Pablo and Mery, Domingo and Oliveira, Maria Cristina Ferreira de 
                         and Spina, Thiago Vallin and Mendes, Caroline Mazetto and Costa, 
                         Henrique S{\'e}rgio Gutierrez and Mejail, Marta Estela and Geus, 
                         Klaus de and Scheer, Sergio",
         organization = "Conference on Graphics, Patterns and Images, 31. (SIBGRAPI)",
            publisher = "IEEE Computer Society",
              address = "Los Alamitos",
             keywords = "Page segmentation, document image, machine learning, graph, 
                         connected components classification, convolutional neural 
                         network",
             abstract = "We propose a new approach for segmenting a document image into its 
                         page components (e.g. text, graphics and tables). Our approach 
                         consists of two main steps. In the first step, a set of scores 
                         corresponding to the output of a convolutional neural network, one 
                         for each of the possible page component categories, is assigned to 
                         each connected component in the document. The labeled connected 
                         components define a fuzzy over-segmentation of the page. In the 
                         second step, spatially close connected components that are likely 
                         to belong to a same page component are grouped together. This is 
                         done by building an attributed region adjacency graph of the 
                         connected components and modeling the problem as an edge removal 
                         problem. Edges are then kept or removed based on a pre-trained 
                         classifier. The resulting groups, defined by the connected 
                         subgraphs, correspond to the detected page components. We evaluate 
                         our method on the ICDAR2009 dataset. Results show that our method 
                         effectively segments pages, being able to detect the nine types of 
                         page components. Furthermore, as our approach is based on simple 
                         machine learning models and graph-based techniques, it should be 
                         easily adapted to the segmentation of a variety of document 
                         types.",
  conference-location = "Foz do Igua{\c{c}}u, PR, Brazil",
      conference-year = "29 Oct.-1 Nov. 2018",
                  doi = "10.1109/SIBGRAPI.2018.00061",
             language = "en",
                  ibi = "8JMKD3MGPAW/3RP2P48",
                  url = "http://urlib.net/ibi/8JMKD3MGPAW/3RP2P48",
           targetfile = "Final_PaperID_50.pdf",
        urlaccessdate = "2025, July 05"
}