<resource xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:dcterms="http://purl.org/dc/terms/" xmlns:datacite="http://datacite.org/schema/kernel-4" xmlns:oaire="http://namespace.openaire.eu/schema/oaire/" xsi:schemaLocation="http://namespace.openaire.eu/schema/oaire/ https://www.openaire.eu/schema/repo-lit/4.0/openaire.xsd"><datacite:identifier identifierType="DOI">10.4000/proceedings.elpub.2018.19</datacite:identifier><datacite:alternateIdentifiers><datacite:alternateIdentifier alternateIdentifierType="URL">http://elpub.episciences.org/4607</datacite:alternateIdentifier></datacite:alternateIdentifiers><datacite:creators><datacite:creator><datacite:creatorName>Pokorny, Jan</datacite:creatorName><datacite:givenName>Jan</datacite:givenName><datacite:familyName>Pokorny</datacite:familyName><datacite:affiliation>ENKI, o.p.s.</datacite:affiliation></datacite:creator></datacite:creators><datacite:titles><datacite:title xml:lang="en">Automatic Subject Indexing and Classification Using Text Recognition and Computer-Based Analysis of Tables of Contents</datacite:title></datacite:titles><dc:description xml:lang="en">This paper will describe a method for machine-based creation of high quality subject indexing and classification for both electronic and print documents using tables of contents (ToCs). The technology described here is primarily focused on electronic and print documents for which, because of technical or licensing reasons, it is not possible to index full text. However, the technology would also be useful for full text documents, because it could significantly enhance the accuracy and relevance of subject description by analyzing the structure of ToCs.</dc:description><datacite:subjects><datacite:subject subjectScheme="author">machine learning system</datacite:subject><datacite:subject subjectScheme="author">computer-generated keywords</datacite:subject><datacite:subject subjectScheme="author">library automatization</datacite:subject><datacite:subject subjectScheme="author">text mining</datacite:subject><datacite:subject subjectScheme="author">computer-generated subject headings</datacite:subject><datacite:subject subjectScheme="author">[SHS.INFO]Humanities and Social Sciences/Library and information sciences</datacite:subject></datacite:subjects><oaire:licenseCondition startDate="2018-06-20 21:57:28" uri="https://creativecommons.org/licenses/by/4.0">Attribution 4.0 International (CC BY 4.0)</oaire:licenseCondition><datacite:dates><datacite:date dateType="Accepted">2018-06-20</datacite:date><datacite:date dateType="Issued">2018-06-20</datacite:date><datacite:date dateType="Available">2018-06-20</datacite:date></datacite:dates><dc:language>eng</dc:language><oaire:resourceType resourceTypeGeneral="literature" uri="http://purl.org/coar/resource_type/c_6501">journal        article    </oaire:resourceType><datacite:relatedIdentifiers><datacite:relatedIdentifier relatedIdentifierType="URL" relationType="IsIdenticalTo">https://hal.science/hal-01816705v1</datacite:relatedIdentifier></datacite:relatedIdentifiers><datacite:rights rightsURI="http://purl.org/coar/access_right/c_abf2">open access</datacite:rights><oaire:file accessRightsURI="http://purl.org/coar/access_right/c_abf2" mimeType="application/pdf" objectType="fulltext">http://elpub.episciences.org/4607/pdf</oaire:file><oaire:version uri="http://purl.org/coar/version/c_970fb48d4fbd8a85">VoR</oaire:version><dc:format>application/pdf</dc:format><oaire:citationTitle>ElPub - ELectronic PUBlishing</oaire:citationTitle><oaire:citationVolume>Connecting the Knowledge Commons: From Projects to Sustainable Infrastructure</oaire:citationVolume><oaire:citationIssue>Long Papers</oaire:citationIssue><dcterms:audience>Researchers</dcterms:audience><dcterms:audience>Students</dcterms:audience></resource>