{"journal": {"journal_issue": {"issue": "Short Papers", "journal_volume": {"volume": "Charting The Futures(s) of..."}, "publication_date": {"day": "18", "year": "2020", "month": "04", "@media_type": "online"}}, "journal_article": {"titles": {"title": "Open science-based framework to reveal open data publishing: an experience from using Common Crawl"}, "program": {"related_item": {"intra_work_relation": {"value": "https://hal.science/hal-02544245v1", "@identifier-type": "uri", "@relationship-type": "isSameAs"}}}, "abstract": {"value": {"value": "The publishing of open data is considered a key element for civic participation paving the way to the ‘public value’, a term which underpins the social contribution. A result of that can be seen through the popularity of data portals published all around the world by governments, public and private organizations. However, the diffusion of data portals raises concerns about discoverability and validity of these data sources, especially to what extent they contribute to open data and open science. The purpose of this work is to develop a framework to reveal open data publishing with the use of a freely available open science project called Common Crawl. The idea is to identify open data-related initiatives and to gather information about their availability, having in the framework’s essence an iterative and differential process. 
The main outcome is shown through a proposed model for the historical data repository which involves both use and creation of open science to branch new sort of research possibilities based on publishing of derived data.", "@xml:lang": "en"}}, "doi_data": {"doi": "10.4000/proceedings.elpub.2020.1", "resource": "http://elpub.episciences.org/6307", "collection": [{"item": {"@crawler": "iParadigms", "resource": "https://hal.science/hal-02544245v1/document"}, "@property": "crawler-based"}, {"item": {"resource": {"value": "https://hal.science/hal-02544245v1/document", "@mime_type": "application/pdf"}}, "@property": "text-mining"}]}, "keywords": {"0": "[SHS.INFO]Humanities and Social Sciences/Library and information sciences", "en": ["open data", "open science", "common crawl", "data portals"]}, "@language": "en", "contributors": {"person_name": [{"surname": "Correa", "@sequence": "first", "given_name": "Andreiwid", "affiliations": {"institution": {"institution_id": {"@type": "ror", "value": "https://ror.org/005pn5z34"}, "institution_name": "Federal Institute of São Paulo"}}, "@contributor_role": "author"}, {"surname": "Fernandes", "@sequence": "additional", "given_name": "Israel", "affiliations": {"institution": {"institution_id": {"@type": "ror", "value": "https://ror.org/005pn5z34"}, "institution_name": "Federal Institute of São Paulo"}}, "@contributor_role": "author"}]}, "publisher_item": {"item_number": {"value": "6307", "@item_number_type": "article_number"}}, "acceptance_date": {"day": "18", "year": "2020", "month": "04", "@media_type": "online"}, "publication_date": {"day": "18", "year": "2020", "month": "04", "@media_type": "online"}, "@publication_type": "full_text"}, "journal_metadata": {"@language": "en", "full_title": "ElPub - ELectronic PUBlishing"}}, "database": {"current": {"url": "http://elpub.episciences.org/6307", "flag": "imported", "type": {"title": "conferenceobject"}, "dates": {"posted_date": "2020-04-18 10:18:36", "publication_date": "2020-04-18 
10:34:33", "modification_date": "2025-04-01 00:11:49", "first_submission_date": "2020-04-18 10:18:35"}, "files": {"link": "http://elpub.episciences.org/6307/pdf"}, "isTmp": false, "status": {"id": 16, "label": {"en": "published", "fr": "publié"}}, "volume": {"id": 402, "year": "2020", "number": 3, "titles": {"en": "Charting The Futures(s) of Digital Publishing"}, "position": "3", "settings": {"is_open": true, "is_current_issue": true, "is_special_issue": false}, "descriptions": {"en": "The 24th edition of the International Conference on Electronic Publishing is hosted by UCL Qatar"}, "has_proceedings": false, "bibliographical_references": ""}, "journal": {"id": 16, "url": "http://elpub.episciences.org", "code": "elpub", "name": "ElPub - ELectronic PUBlishing"}, "metrics": {"file_count": "262", "page_count": "620"}, "section": {"id": 89, "titles": {"en": "Short Papers"}, "position": 2, "settings": {"is_open": true}, "descriptions": null}, "version": 1, "cited_by": null, "mainPdfUrl": "https://hal.science/hal-02544245v1/document", "repository": {"id": "1", "name": "HAL", "type": "repository", "status": "1", "api_url": "https://api.archives-ouvertes.fr", "doc_url": "https://hal.science/hal-02544245v1", "base_url": "https://api.archives-ouvertes.fr/oai/hal/", "paper_url": "https://hal.science/hal-02544245v1/document", "doi_prefix": "", "identifier": "oai:HAL:hal-02544245v1"}, "identifiers": {"concept_identifier": null, "document_item_number": 6307, "permanent_item_number": 6307, "repository_identifier": "hal-02544245"}, "classifications": [], "original_language": "en", "position_in_volume": 19, "graphical_abstract_file": ""}, "previous_versions": null, "first_version_item_number": 6307, "latest_version_item_number": 6307}}