@inproceedings{bb344400,
        AUTHOR = "Hamza, H. and Belaid, Y. and Belaid, A. and Chaudhuri, B. B.",
        TITLE = "Incremental classification of invoice documents",
        BOOKTITLE = ICPR08,
        YEAR = "2008",
        PAGES = "1--4",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338680"}

@inproceedings{bb344401,
        AUTHOR = "Jha, P. and Nagy, G.",
        TITLE = "{Wang Notation Tool}: Layout independent representation of tables",
        BOOKTITLE = ICPR08,
        YEAR = "2008",
        PAGES = "1--4",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338681"}

@inproceedings{bb344402,
        AUTHOR = "Minagawa, A. and Fujii, Y. and Takebe, H. and Fujimoto, K.",
        TITLE = "Logical Structure Analysis for Form Images with Arbitrary Layout by Belief Propagation",
        BOOKTITLE = ICDAR07,
        YEAR = "2007",
        PAGES = "714--718",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338682"}

@inproceedings{bb344403,
        AUTHOR = "Huang, W. and Tan, C. L.",
        TITLE = "Locating Charts from Scanned Document Pages",
        BOOKTITLE = ICDAR07,
        YEAR = "2007",
        PAGES = "307--311",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338683"}

@inproceedings{bb344404,
        AUTHOR = "Liu, Y. and Bai, K. and Mitra, P. and Giles, C. L.",
        TITLE = "Searching for Tables in Digital Documents",
        BOOKTITLE = ICDAR07,
        YEAR = "2007",
        PAGES = "934--938",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338684"}

@inproceedings{bb344405,
        AUTHOR = "Hassan, T. and Baumgartner, R.",
        TITLE = "Table Recognition and Understanding from {PDF} Files",
        BOOKTITLE = ICDAR07,
        YEAR = "2007",
        PAGES = "1143--1147",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338685"}

% Single-page item: the source gave the degenerate range 27-27.
@inproceedings{bb344406,
        AUTHOR = "Huang, W. H. and Zong, S. Q. and Tan, C. L.",
        TITLE = "Chart Image Classification Using Multiple-Instance Learning",
        BOOKTITLE = WACV07,
        YEAR = "2007",
        PAGES = "27",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338686"}

@inproceedings{bb344407,
        AUTHOR = "Hua, G. and Liu, Z. C. and Zhang, Z. Y. and Wu, Y.",
        TITLE = "Automatic Business Card Scanning with a Camera",
        BOOKTITLE = ICIP06,
        YEAR = "2006",
        PAGES = "373--376",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338687"}

@inproceedings{bb344408,
        AUTHOR = "Alrashed, S. A.",
        TITLE = "Finding Hidden Semantics of Text Tables",
        BOOKTITLE = DAS06,
        YEAR = "2006",
        PAGES = "449--461",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338688"}

@inproceedings{bb344409,
        AUTHOR = "Alrashed, S. A. and Gray, W. A.",
        TITLE = "Detection Approaches for Table Semantics in Text",
        BOOKTITLE = DAS02,
        YEAR = "2002",
        PAGES = "287 ff.",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338689"}

@inproceedings{bb344410,
        AUTHOR = "Pereira Neves, L. A. and de Carvalho, J. M. and Facon, J. and Bortolozzi, F. and Ignacio, S. A.",
        TITLE = "Handwritten Artefact Identification Method for Table Interpretation with Little Use of Previous Knowledge",
        BOOKTITLE = DAS06,
        YEAR = "2006",
        PAGES = "176--185",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338690"}

@inproceedings{bb344411,
        AUTHOR = "Embley, D. W. and Lopresti, D. P. and Nagy, G.",
        TITLE = "Notes on Contemporary Table Recognition",
        BOOKTITLE = DAS06,
        YEAR = "2006",
        PAGES = "164--175",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338691"}

@inproceedings{bb344412,
        AUTHOR = "Kieninger, T. and Dengel, A. R.",
        TITLE = "An approach towards benchmarking of table structure recognition results",
        BOOKTITLE = ICDAR05,
        YEAR = "2005",
        PAGES = "II: 1232--1236",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338692"}

@inproceedings{bb344413,
        AUTHOR = "Kieninger, T. and Dengel, A. R.",
        TITLE = "Applying the {T-Recs} table recognition system to the business letter domain",
        BOOKTITLE = ICDAR01,
        YEAR = "2001",
        PAGES = "518--522",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338693"}

@inproceedings{bb344414,
        AUTHOR = "Klein, B. and Gokkus, S. and Kieninger, T. and Dengel, A. R.",
        TITLE = "Three approaches to `industrial' table spotting",
        BOOKTITLE = ICDAR01,
        YEAR = "2001",
        PAGES = "513--517",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338694"}

@inproceedings{bb344415,
        AUTHOR = "Ishitani, Y. and Fume, K. and Sumita, K.",
        TITLE = "Table structure analysis based on cell classification and cell modification for {XML} document transformation",
        BOOKTITLE = ICDAR05,
        YEAR = "2005",
        PAGES = "II: 1247--1252",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338695"}

@inproceedings{bb344416,
        AUTHOR = "Long, V. and Dale, R. and Cassidy, S.",
        TITLE = "A model for detecting and merging vertically spanned table cells in plain text documents",
        BOOKTITLE = ICDAR05,
        YEAR = "2005",
        PAGES = "II: 1242--1246",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338696"}

@inproceedings{bb344417,
        AUTHOR = "Kboubi, F. and Chabi, A. H. and Ahmed, M. B.",
        TITLE = "Table recognition evaluation and combination methods",
        BOOKTITLE = ICDAR05,
        YEAR = "2005",
        PAGES = "II: 1237--1241",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338697"}

@inproceedings{bb344418,
        AUTHOR = "Kim, Y. S. and Lee, K. H.",
        TITLE = "Extracting Table Information from the Web",
        BOOKTITLE = DAS04,
        YEAR = "2004",
        PAGES = "438--441",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338698"}

@inproceedings{bb344419,
        AUTHOR = "Ohtera, R. and Horiuchi, T.",
        TITLE = "Faxed form identification using histogram of the {Hough}-space",
        BOOKTITLE = ICPR04,
        YEAR = "2004",
        PAGES = "II: 566--569",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338699"}

@inproceedings{bb344420,
        AUTHOR = "Ramel, J. Y. and Crucianu, M. and Vincent, N. and Faure, C.",
        TITLE = "Detection, extraction and representation of tables",
        BOOKTITLE = ICDAR03,
        YEAR = "2003",
        PAGES = "374--378",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338700"}

@inproceedings{bb344421,
        AUTHOR = "Wasserman, H. and Yukawa, K. and Sy, B. and Kwok, K. L. and Phillips, I. T.",
        TITLE = "A Theoretical Foundation and a Method for Document Table Structure Extraction and Decomposition",
        BOOKTITLE = DAS02,
        YEAR = "2002",
        PAGES = "291 ff.",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338701"}

@inproceedings{bb344422,
        AUTHOR = "Cesarini, F. and Marinai, S. and Sarti, L. and Soda, G.",
        TITLE = "Trainable table location in document images",
        BOOKTITLE = ICPR02,
        YEAR = "2002",
        PAGES = "III: 236--240",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338702"}

@inproceedings{bb344423,
        AUTHOR = "Tsuruoka, S. and Takao, K. and Tanaka, T. and Yoshikawa, T. and Shinogi, T.",
        TITLE = "Region segmentation for table image with unknown complex structure",
        BOOKTITLE = ICDAR01,
        YEAR = "2001",
        PAGES = "709--713",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338703"}

@inproceedings{bb344424,
        AUTHOR = "Zuyev, K.",
        TITLE = "Table Image Segmentation",
        BOOKTITLE = ICDAR97,
        YEAR = "1997",
        PAGES = "705--708",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338704"}

@inproceedings{bb344425,
        AUTHOR = "Chen, J. S. and Tseng, D. C.",
        TITLE = "Overlapped-Character Separation and Reconstruction for Table-Form Documents",
        BOOKTITLE = ICIP96,
        YEAR = "1996",
        PAGES = "II: 233--236",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338705"}

@inproceedings{bb344426,
        AUTHOR = "Arias, J. F. and Chhabra, A. and Misra, V.",
        TITLE = "Interpreting and Representing Tabular Documents",
        BOOKTITLE = CVPR96,
        YEAR = "1996",
        PAGES = "600--605",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338706"}

@inproceedings{bb344427,
        AUTHOR = "Arias, J. F. and Chhabra, A. and Misra, V.",
        TITLE = "Efficient Interpretation of Tabular Documents",
        BOOKTITLE = ICPR96,
        YEAR = "1996",
        PAGES = "III: 681--685",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338707"}

@inproceedings{bb344428,
        AUTHOR = "Watanabe, T. and Huang, X.",
        TITLE = "Automatic Acquisition of Layout Knowledge for Understanding Business Cards",
        BOOKTITLE = ICDAR97,
        YEAR = "1997",
        PAGES = "216--220",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338708"}

@inproceedings{bb344429,
        AUTHOR = "Saiga, H. and Kitamura, Y. and Ida, S.",
        TITLE = "High-speed recognition of tabulated data",
        BOOKTITLE = ICPR94,
        YEAR = "1994",
        PAGES = "B: 577--579",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338709"}

@inproceedings{bb344430,
        AUTHOR = "Laurentini, A. and Viada, P.",
        TITLE = "Identifying and understanding tabular material in compound documents",
        BOOKTITLE = ICPR92,
        YEAR = "1992",
        PAGES = "II: 405--409",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338710"}

@inproceedings{bb344431,
        AUTHOR = "Kreich, J. and Luhn, A. and Maderlechner, G.",
        TITLE = "An Experimental Environment for Model Based Document Analysis",
        BOOKTITLE = ICDAR91,
        YEAR = "1991",
        PAGES = "50--58",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char969.html#TT338711"}

@article{bb344432,
        AUTHOR = "Karatzas, D. and Antonacopoulos, A.",
        TITLE = "Colour text segmentation in web images based on human perception",
        JOURNAL = IVC,
        VOLUME = "25",
        YEAR = "2007",
        NUMBER = "5",
        MONTH = may,
        PAGES = "564--577",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338713"}

@inproceedings{bb344433,
        AUTHOR = "Karatzas, D. and Antonacopoulos, A.",
        TITLE = "Text extraction from web images based on a split-and-merge segmentation method using colour perception",
        BOOKTITLE = ICPR04,
        YEAR = "2004",
        PAGES = "II: 634--637",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338714"}

@inproceedings{bb344434,
        AUTHOR = "Karatzas, D. and Antonacopoulos, A.",
        TITLE = "Two approaches for text segmentation in web images",
        BOOKTITLE = ICDAR03,
        YEAR = "2003",
        PAGES = "131--137",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338715"}

@inproceedings{bb344435,
        AUTHOR = "Antonacopoulos, A. and Karatzas, D.",
        TITLE = "Fuzzy Segmentation of Characters in Web Images Based on Human Colour Perception",
        BOOKTITLE = DAS02,
        YEAR = "2002",
        PAGES = "295 ff.",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338716"}

@article{bb344436,
        AUTHOR = "Ashraf, F. and Ozyer, T. and Alhajj, R.",
        TITLE = "Employing Clustering Techniques for Automatic Information Extraction From {HTML} Documents",
        JOURNAL = SMC-C,
        VOLUME = "38",
        YEAR = "2008",
        NUMBER = "5",
        MONTH = sep,
        PAGES = "660--673",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338717"}

@article{bb344437,
        AUTHOR = "Carullo, M. and Binaghi, E. and Gallo, I.",
        TITLE = "An online document clustering technique for short web contents",
        JOURNAL = PRL,
        VOLUME = "30",
        YEAR = "2009",
        NUMBER = "10",
        MONTH = jul,
        PAGES = "870--876",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338718"}

@inproceedings{bb344438,
        AUTHOR = "Carullo, M. and Binaghi, E. and Gallo, I. and Lamberti, N.",
        TITLE = "Clustering of short commercial documents for the web",
        BOOKTITLE = ICPR08,
        YEAR = "2008",
        PAGES = "1--4",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338719"}

@article{bb344439,
        AUTHOR = "Borges, K. A. V. and Davis, C. A. and Laender, A. H. F. and Medeiros, C. B.",
        TITLE = "Ontology-driven discovery of geospatial evidence in web pages",
        JOURNAL = GeoInfo,
        VOLUME = "15",
        YEAR = "2011",
        NUMBER = "4",
        MONTH = oct,
        PAGES = "609--631",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338720"}

@article{bb344440,
        AUTHOR = "Lu, W. T. and Li, J. X. and Li, T. and Guo, W. D. and Zhang, H. G. and Guo, J.",
        TITLE = "Web Multimedia Object Classification Using Cross-Domain Correlation Knowledge",
        JOURNAL = MultMed,
        VOLUME = "15",
        YEAR = "2013",
        NUMBER = "8",
        MONTH = dec,
        PAGES = "1920--1929",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338721"}

@inproceedings{bb344441,
        AUTHOR = "Lu, W. T. and Li, L. and Li, T. and Zhang, H. G. and Guo, J.",
        TITLE = "Web Multimedia Object Clustering via Information Fusion",
        BOOKTITLE = ICDAR11,
        YEAR = "2011",
        PAGES = "319--323",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338722"}

@article{bb344442,
        AUTHOR = "Embley, D. W. and Krishnamoorthy, M. S. and Nagy, G. and Seth, S.",
        TITLE = "Converting heterogeneous statistical tables on the web to searchable databases",
        JOURNAL = IJDAR,
        VOLUME = "19",
        YEAR = "2016",
        NUMBER = "2",
        MONTH = jun,
        PAGES = "119--138",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338723"}

@inproceedings{bb344443,
        AUTHOR = "Nagy, G. and Seth, S.",
        TITLE = "Table headers: An entrance to the data mine",
        BOOKTITLE = ICPR16,
        YEAR = "2016",
        PAGES = "4065--4070",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338724"}

@article{bb344444,
        AUTHOR = "Wu, O. and Zuo, H. and Hu, W. and Li, B.",
        TITLE = "Multimodal Web Aesthetics Assessment Based on Structural {SVM} and Multitask Fusion Learning",
        JOURNAL = MultMed,
        VOLUME = "18",
        YEAR = "2016",
        NUMBER = "6",
        MONTH = jun,
        PAGES = "1062--1076",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338725"}

@article{bb344445,
        AUTHOR = "Cormier, M. and Moffatt, K. and Cohen, R. and Mann, R.",
        TITLE = "Purely vision-based segmentation of web pages for assistive technology",
        JOURNAL = CVIU,
        VOLUME = "148",
        YEAR = "2016",
        NUMBER = "1",
        PAGES = "46--66",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338726"}

@inproceedings{bb344446,
        AUTHOR = "Cormier, M. and Mann, R. and Moffatt, K. and Cohen, R.",
        TITLE = "Towards an Improved Vision-Based Web Page Segmentation Algorithm",
        BOOKTITLE = CRV17,
        YEAR = "2017",
        PAGES = "345--352",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338727"}

@article{bb344447,
        AUTHOR = "Mei, T. and Li, L. and Tian, X. and Tao, D. and Ngo, C. W.",
        TITLE = "{PageSense}: Toward Stylewise Contextual Advertising via Visual Analysis of Web Pages",
        JOURNAL = CirSysVideo,
        VOLUME = "28",
        YEAR = "2018",
        NUMBER = "1",
        MONTH = jan,
        PAGES = "254--266",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338728"}

@article{bb344448,
        AUTHOR = "Kim, N.",
        TITLE = "Extracting and searching news articles in web portal news pages",
        JOURNAL = IJCVR,
        VOLUME = "10",
        YEAR = "2020",
        NUMBER = "3",
        PAGES = "202--212",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338729"}

% NOTE(review): the source listed issue 1 / January, which does not fit a page
% range starting at 3035 within one volume; issue and month are set to
% 11 / November to match the page range -- confirm against the publisher record.
@article{bb344449,
        AUTHOR = "Huang, X. and Chong, K. F. E.",
        TITLE = "{GenKL}: An Iterative Framework for Resolving Label Ambiguity and Label Non-conformity in Web Images Via a New Generalized {KL} Divergence",
        JOURNAL = IJCV,
        VOLUME = "131",
        YEAR = "2023",
        NUMBER = "11",
        MONTH = nov,
        PAGES = "3035--3059",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338730"}

@inproceedings{bb344450,
        AUTHOR = "Shao, Z. R. and Gao, F. Y. and Xing, H. D. and Zhu, Z. P. and Yu, Z. and Bu, J. J. and Zheng, Q. and Yao, C.",
        TITLE = "{WEBRPG}: Automatic Web Rendering Parameters Generation for Visual Presentation",
        BOOKTITLE = ECCV24,
        YEAR = "2024",
        PAGES = "VIII: 56--74",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338731"}

@inproceedings{bb344451,
        AUTHOR = "Sadeghi, Z. and Homayounvala, E. and Borhani, M.",
        TITLE = "{HCI} for Elderly, Measuring Visual Complexity of Webpages Based on Machine Learning",
        BOOKTITLE = DICTA20,
        YEAR = "2020",
        PAGES = "1--6",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338732"}

@inproceedings{bb344452,
        AUTHOR = "Zheng, Q. L. and Jiao, J. B. and Cao, Y. and Lau, R. W. H.",
        TITLE = "Task-Driven Webpage Saliency",
        BOOKTITLE = ECCV18,
        YEAR = "2018",
        PAGES = "XIV: 300--316",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338733"}

@inproceedings{bb344453,
        AUTHOR = "Li, J. and Su, L. and Wu, B. and Pang, J. and Wang, C. and Wu, Z. and Huang, Q.",
        TITLE = "Webpage saliency prediction with multi-features fusion",
        BOOKTITLE = ICIP16,
        YEAR = "2016",
        PAGES = "674--678",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338734"}

@inproceedings{bb344454,
        AUTHOR = "Baharum, A. and Jaafar, A.",
        TITLE = "Identifying the Importance of Web Objects: A Study of {ASEAN} Perspectives",
        BOOKTITLE = IVIC15,
        YEAR = "2015",
        PAGES = "464--475",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338735"}

@inproceedings{bb344455,
        AUTHOR = "Goyal, A. and Jadon, M. K. and Pujari, A. K.",
        TITLE = "Spectral approach to find number of clusters of short-text documents",
        BOOKTITLE = NCVPRIPG13,
        YEAR = "2013",
        PAGES = "1--4",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338736"}

@inproceedings{bb344456,
        AUTHOR = "Marinai, S. and Marino, E. and Soda, G.",
        TITLE = "Conversion of {PDF} Books in {ePub} Format",
        BOOKTITLE = ICDAR11,
        YEAR = "2011",
        PAGES = "478--482",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338737"}

@inproceedings{bb344457,
        AUTHOR = "Karatzas, D. and Mestre, S. R. and Mas, J. and Nourbakhsh, F. and Roy, P. P.",
        TITLE = "{ICDAR} 2011 Robust Reading Competition - Challenge 1: Reading Text in Born-Digital Images (Web and Email)",
        BOOKTITLE = ICDAR11,
        YEAR = "2011",
        PAGES = "1485--1490",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338738"}

@inproceedings{bb344458,
        AUTHOR = "Liu, G. and Qiu, B. and Liu, W. Y.",
        TITLE = "Automatic Detection of Phishing Target from Phishing Webpage",
        BOOKTITLE = ICPR10,
        YEAR = "2010",
        PAGES = "4153--4156",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338739"}

@inproceedings{bb344459,
        AUTHOR = "Hassan, T.",
        TITLE = "User-Guided Wrapping of {PDF} Documents Using Graph Matching Techniques",
        BOOKTITLE = ICDAR09,
        YEAR = "2009",
        PAGES = "631--635",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338740"}

@inproceedings{bb344460,
        AUTHOR = "Ghosh, S. and Mitra, P.",
        TITLE = "Combining content and structure similarity for {XML} document classification using composite {SVM} kernels",
        BOOKTITLE = ICPR08,
        YEAR = "2008",
        PAGES = "1--4",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338741"}

@inproceedings{bb344461,
        AUTHOR = "Hirano, T. and Okano, Y. and Okada, Y. and Yoda, F.",
        TITLE = "Text and Layout Information Extraction from Document Files of Various Formats Based on the Analysis of Page Description Language",
        BOOKTITLE = ICDAR07,
        YEAR = "2007",
        PAGES = "262--266",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338742"}

@inproceedings{bb344462,
        AUTHOR = "Burget, R.",
        TITLE = "Layout Based Information Extraction from {HTML} Documents",
        BOOKTITLE = ICDAR07,
        YEAR = "2007",
        PAGES = "624--628",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338743"}

@inproceedings{bb344463,
        AUTHOR = "Guo, H. and Mahmud, J. and Borodin, Y. and Stent, A. and Ramakrishnan, I.",
        TITLE = "A General Approach for Partitioning Web Page Content Based on Geometric and Style Information",
        BOOKTITLE = ICDAR07,
        YEAR = "2007",
        PAGES = "929--933",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338744"}

@inproceedings{bb344464,
        AUTHOR = "Yoshida, M. and Nakagawa, H.",
        TITLE = "Web Document Parsing: A New Approach to Modeling Layout-Language Relations",
        BOOKTITLE = ICDAR07,
        YEAR = "2007",
        PAGES = "203--207",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338745"}

@inproceedings{bb344465,
        AUTHOR = "Ferilli, S. and Biba, M. and Basile, T. M. A. and Esposito, F.",
        TITLE = "Incremental machine learning techniques for document layout understanding",
        BOOKTITLE = ICPR08,
        YEAR = "2008",
        PAGES = "1--4",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338746"}

@inproceedings{bb344466,
        AUTHOR = "Esposito, F. and Ferilli, S. and di Mauro, N. and Basile, T. M. A.",
        TITLE = "Incremental Learning of First Order Logic Theories for the Automatic Annotations of Web Documents",
        BOOKTITLE = ICDAR07,
        YEAR = "2007",
        PAGES = "1093--1097",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338747"}

@inproceedings{bb344467,
        AUTHOR = "Esposito, F. and Ferilli, S. and Basile, T. M. A. and di Mauro, N.",
        TITLE = "Automatic Content-based Indexing of Digital Documents through Intelligent Processing Techniques",
        BOOKTITLE = DIAL06,
        YEAR = "2006",
        PAGES = "204--219",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338748"}

@inproceedings{bb344468,
        AUTHOR = "Esposito, F. and Ferilli, S. and Basile, T. M. A. and di Mauro, N.",
        TITLE = "Intelligent document processing",
        BOOKTITLE = ICDAR05,
        YEAR = "2005",
        PAGES = "II: 1100--1104",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338749"}

@inproceedings{bb344469,
        AUTHOR = "Watai, Y. and Yamasaki, T. and Aizawa, K.",
        TITLE = "View-Based Web Page Retrieval using Interactive Sketch Query",
        BOOKTITLE = ICIP07,
        YEAR = "2007",
        PAGES = "VI: 357--360",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338750"}

@inproceedings{bb344470,
        AUTHOR = "Ma, J. C. and Gu, Z. M.",
        TITLE = "A Shared Fragments Analysis System for Large Collections of Web Pages",
        BOOKTITLE = DAS06,
        YEAR = "2006",
        PAGES = "390--401",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338751"}

@inproceedings{bb344471,
        AUTHOR = "Liu, W. Y. and Huang, G. L. and Liu, X. Y. and Deng, X. T. and Min, Z.",
        TITLE = "Phishing {Web} page detection",
        BOOKTITLE = ICDAR05,
        YEAR = "2005",
        PAGES = "II: 560--564",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338752"}

@inproceedings{bb344472,
        AUTHOR = "Feng, J. and Haffner, P. and Gilbert, M.",
        TITLE = "A learning approach to discovering {Web} page semantic structures",
        BOOKTITLE = ICDAR05,
        YEAR = "2005",
        PAGES = "II: 1055--1059",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338753"}

@inproceedings{bb344473,
        AUTHOR = "Chao, H. and Lin, X. F.",
        TITLE = "Capturing the layout of electronic documents for reuse in variable data printing",
        BOOKTITLE = ICDAR05,
        YEAR = "2005",
        PAGES = "II: 940--944",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338754"}

@inproceedings{bb344474,
        AUTHOR = "Chao, H. and Fan, J.",
        TITLE = "Layout and Content Extraction for {PDF} Documents",
        BOOKTITLE = DAS04,
        YEAR = "2004",
        PAGES = "213--224",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338755"}

@inproceedings{bb344475,
        AUTHOR = "Behera, A. and Lalanne, D. and Ingold, R.",
        TITLE = "Enhancement of layout-based identification of low-resolution documents using geometrical color distribution",
        BOOKTITLE = ICDAR05,
        YEAR = "2005",
        PAGES = "I: 468--472",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338756"}

@inproceedings{bb344476,
        AUTHOR = "Mekhaldi, D. and Lalanne, D. and Ingold, R.",
        TITLE = "From searching to browsing through multimodal documents linking",
        BOOKTITLE = ICDAR05,
        YEAR = "2005",
        PAGES = "II: 924--928",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338757"}

@inproceedings{bb344477,
        AUTHOR = "Mekhaldi, D. and Lalanne, D. and Ingold, R.",
        TITLE = "Unity Is Strength: Coupling Media for Thematic Segmentation",
        BOOKTITLE = DAS04,
        YEAR = "2004",
        PAGES = "559--562",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338758"}

@inproceedings{bb344478,
        AUTHOR = "Rigamonti, M. and Bloechle, J. L. and Hadjar, K. and Lalanne, D. and Ingold, R.",
        TITLE = "Towards a canonical and structured representation of {PDF} documents through reverse engineering",
        BOOKTITLE = ICDAR05,
        YEAR = "2005",
        PAGES = "II: 1050--1054",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338759"}

@inproceedings{bb344479,
        AUTHOR = "Hadjar, K. and Rigamonti, M. and Lalanne, D. and Ingold, R.",
        TITLE = "Xed: a new tool for extracting hidden structures from electronic documents",
        BOOKTITLE = DIAL04,
        YEAR = "2004",
        PAGES = "212--224",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338760"}

@inproceedings{bb344480,
        AUTHOR = "Hadjar, K. and Ingold, R.",
        TITLE = "Logical labeling of {Arabic} newspapers using artificial neural nets",
        BOOKTITLE = ICDAR05,
        YEAR = "2005",
        PAGES = "I: 426--430",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338761"}

@inproceedings{bb344481,
        AUTHOR = "Schenker, A. and Bunke, H. and Last, M. and Kandel, A.",
        TITLE = "A Graph-Based Framework for Web Document Mining",
        BOOKTITLE = DAS04,
        YEAR = "2004",
        PAGES = "401--412",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338762"}

@inproceedings{bb344482,
        AUTHOR = "Schenker, A. and Last, M. and Bunke, H. and Kandel, A.",
        TITLE = "Classification of web documents using a graph model",
        BOOKTITLE = ICDAR03,
        YEAR = "2003",
        PAGES = "240--244",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338763"}

@inproceedings{bb344483,
        AUTHOR = "Vitali, F. and di Iorio, A. and Campori, E. V.",
        TITLE = "Rule-Based Structural Analysis of Web Pages",
        BOOKTITLE = DAS04,
        YEAR = "2004",
        PAGES = "425--437",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338764"}

@inproceedings{bb344484,
        AUTHOR = "Hu, J. Y. and Bagga, A.",
        TITLE = "Identifying story and preview images in news web pages",
        BOOKTITLE = ICDAR03,
        YEAR = "2003",
        PAGES = "640--644",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338765"}

@inproceedings{bb344485,
        AUTHOR = "Ramachandran, S. and Kashi, R.",
        TITLE = "An architecture for ink annotations on web documents",
        BOOKTITLE = ICDAR03,
        YEAR = "2003",
        PAGES = "256--260",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338766"}

@inproceedings{bb344486,
        AUTHOR = "Gagneux, A. and Emptoz, H.",
        TITLE = "Web site: a structured document",
        BOOKTITLE = ICDAR03,
        YEAR = "2003",
        PAGES = "1158--1162",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338767"}

@inproceedings{bb344487,
        AUTHOR = "Mukherjee, S. and Yang, G. Z. and Tan, W. F. and Ramakrishnan, I. V.",
        TITLE = "Automatic discovery of semantic structures in {HTML} documents",
        BOOKTITLE = ICDAR03,
        YEAR = "2003",
        PAGES = "245--249",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338768"}

@inproceedings{bb344488,
        AUTHOR = "Alam, H. and Kumar, A. and Nakamura, M. and Rahman, F. and Tarnikova, Y. and Wilcox, C.",
        TITLE = "Structured and unstructured document summarization: Design of a commercial summarizer using Lexical chains",
        BOOKTITLE = ICDAR03,
        YEAR = "2003",
        PAGES = "1147--1152",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338769"}

@inproceedings{bb344489,
        AUTHOR = "Rahman, F. and Alam, H.",
        TITLE = "A commercial {Web} based digital library for sharing and distributing documents",
        BOOKTITLE = DIAL04,
        YEAR = "2004",
        PAGES = "93--103",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338770"}

@inproceedings{bb344490,
        AUTHOR = "Alam, H. and Hartono, R. and Kumar, A. and Rahman, F. and Tarnikova, Y. and Wilcox, C.",
        TITLE = "Web page summarization for handheld devices: a natural language approach",
        BOOKTITLE = ICDAR03,
        YEAR = "2003",
        PAGES = "1153--1158",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338771"}

@inproceedings{bb344491,
        AUTHOR = "Rahman, A. F. R. and Alam, H. and Hartono, R. and Ariyoshi, K.",
        TITLE = "Automatic summarization of {Web} content to smaller display devices",
        BOOKTITLE = ICDAR01,
        YEAR = "2001",
        PAGES = "1064--1068",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338772"}

@inproceedings{bb344492,
        AUTHOR = "Serradura, L. and Slimane, M. and Vincent, N.",
        TITLE = "Web sites thematic classification using hidden {Markov} models",
        BOOKTITLE = ICDAR01,
        YEAR = "2001",
        PAGES = "1094--1098",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338773"}

@inproceedings{bb344493,
        AUTHOR = "Penn, G. and Hu, J. Y. and Luo, H. B. and McDonald, R.",
        TITLE = "Flexible {Web} document analysis for delivery to narrow-bandwidth devices",
        BOOKTITLE = ICDAR01,
        YEAR = "2001",
        PAGES = "1074--1078",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338774"}

@inproceedings{bb344494,
        AUTHOR = "Anjewierden, A.",
        TITLE = "{AIDAS}: incremental logical structure discovery in {PDF} documents",
        BOOKTITLE = ICDAR01,
        YEAR = "2001",
        PAGES = "374--378",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338775"}

@inproceedings{bb344495,
        AUTHOR = "Athitsos, V. and Swain, M. J. and Frankel, C.",
        TITLE = "Distinguishing photographs and graphics on the {World Wide Web}",
        BOOKTITLE = CBAIVL97,
        YEAR = "1997",
        PAGES = "10",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char970.html#TT338776"}

@article{bb344496,
        AUTHOR = "Nagy, G. and Seth, S. C. and Viswanathan, M.",
        TITLE = "A Prototype Document Image Analysis System for Technical Journals",
        JOURNAL = Computer,
        VOLUME = "25",
        YEAR = "1992",
        NUMBER = "7",
        MONTH = jul,
        PAGES = "10--22",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char971.html#TT338777"}

% NOTE(review): the source data gave the page range as the literal placeholder
% "xx-yy"; the real pages are not known here, so PAGES is omitted (it is
% optional for this entry type) until the range has been verified.
@inproceedings{bb344497,
        AUTHOR = "Nagy, G.",
        TITLE = "Towards a Structured Document Image Utility",
        BOOKTITLE = SDIA92,
        YEAR = "1992",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char971.html#TT338778"}

@article{bb344498,
        AUTHOR = "Viswanathan, M. and Nagy, G.",
        TITLE = "Characteristics of Digitized Images of Technical Articles",
        JOURNAL = SPIE,
        VOLUME = "1661",
        YEAR = "1992",
        PAGES = "6--17",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char971.html#TT338779"}

@article{bb344499,
        AUTHOR = "Marukawa, K. and Hu, T. and Fujisawa, H. and Shima, Y.",
        TITLE = "Document-Retrieval Tolerating Character-Recognition Errors: Evaluation and Application",
        JOURNAL = PR,
        VOLUME = "30",
        YEAR = "1997",
        NUMBER = "8",
        MONTH = aug,
        PAGES = "1361--1371",
        BIBSOURCE = "http://www.visionbib.com/bibliography/char971.html#TT338780"}

Last update: Jul 7, 2025 at 14:35:55