Article Instance
API Endpoint for journals.
GET /api/articles/57200/?format=api
{ "pk": 57200, "title": "[Tool] Automatically Extracting Hardware Descriptions from PDF Technical Documentation", "subtitle": null, "abstract": "The ever-increasing variety of microcontrollers aggravates the challenge of porting embedded software to new devices through much manual work, whereas code generators can be used only in special cases. Moreover, only little technical documentation for these devices is available in machine-readable formats that could facilitate automating porting efforts. Instead, the bulk of documentation comes as print-oriented PDFs. We hence identify a strong need for a processor to access the PDFs and extract their data with a high quality to improve the code generation for embedded software.\nIn this paper, we design and implement a modular processor for extracting detailed datasets from PDF files containing technical documentation using deterministic table processing for thousands of microcontrollers. Namely, we systematically extract device identifiers, interrupt tables, package and pinouts, pin functions, and register maps. In our evaluation, we compare the documentation from STMicro against existing machine-readable sources. Our results show that our processor matches 96.5 % of almost 6 million reference data points, and we further discuss identified issues in both sources. Hence, our tool yields very accurate data with only limited manual effort and can enable and enhance a significant amount of existing and new code generation use cases in the embedded software domain that are currently limited by a lack of machine-readable data sources.", "language": "en", "license": { "name": "Creative Commons Attribution-NonCommercial 4.0", "short_name": "CC BY-NC 4.0", "text": "Attribution — You must give appropriate credit, provide a link to the license, and indicate if changes were made. 
You may do so in any reasonable manner, but not in any way that suggests the licensor endorses you or your use.\n\nNonCommercial — You may not use the material for commercial purposes.\n\nNo additional restrictions — You may not apply legal terms or technological measures that legally restrict others from doing anything the license permits.", "url": "https://creativecommons.org/licenses/by-nc/4.0" }, "keywords": [], "section": "Articles", "is_remote": true, "remote_url": "https://escholarship.org/uc/item/32z0068j", "frozenauthors": [ { "first_name": "Niklas", "middle_name": "", "last_name": "Hauser", "name_suffix": "", "institution": "", "department": "" }, { "first_name": "Jan", "middle_name": "", "last_name": "Pennekamp", "name_suffix": "", "institution": "", "department": "" } ], "date_submitted": "2023-10-31T08:09:47Z", "date_accepted": "2023-10-31T08:09:47Z", "date_published": "2023-01-01T00:00:00Z", "render_galley": null, "galleys": [ { "label": "", "type": "pdf", "path": "https://journalpub.escholarship.org/jsys/article/57200/galley/43397/download/" } ] }