% Short paper (2 pages) from the JCDL 2016 proceedings; entry cleaned up from an automated export.
% NOTE(review): `address` holds a country, not a publisher city -- confirm or move to a venue field.
% NOTE(review): DOI prefix 10.1145 is normally ACM's, yet `publisher` names IEEE -- confirm against the DOI landing page.
@inproceedings{9f602a27812f4842a11b3cdc5868ee3b,
  author    = {Choudhury, Sagnik Ray and Wang, Shuting and Giles, C. Lee},
  title     = {Curve separation for line graphs in scholarly documents},
  booktitle = {JCDL 2016 - Proceedings of the 16th ACM/IEEE-CS Joint Conference on Digital Libraries},
  series    = {Proceedings of the ACM/IEEE Joint Conference on Digital Libraries},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  address   = {United States},
  pages     = {277--278},
  year      = {2016},
  month     = sep,
  day       = {1},
  doi       = {10.1145/2910896.2925469},
  language  = {English (US)},
  note      = {16th ACM/IEEE-CS Joint Conference on Digital Libraries, JCDL 2016 ; Conference date: 19-06-2016 Through 23-06-2016},
  abstract  = {Line graphs are abundant in scholarly papers. They are usually generated from a data table and that data can not be accessed. One important step in an automated data extraction pipeline is the curve separation problem: segmenting the pixels into separate curves. Previous work in this domain has focused on raster graphics extracted from scholarly PDFs, whereas most scholarly plots are embedded as vector graphics. We report a system to extract these plots as SVG images and show how that can improve both the accuracy (90\%) and the scalability (5-8 seconds) of the curve separation problem.},
}