From e461fb63be7ce2c5706fe007d473f588657882b6 Mon Sep 17 00:00:00 2001 From: johannesknuechel <163017392+johannesknuechel@users.noreply.github.com> Date: Fri, 18 Oct 2024 16:02:02 +0200 Subject: [PATCH] Update die-bombe_metadata-readme.md (formatting and exemplary data instance) --- die-bombe_metadata-readme.md | 48 +++++++++++++++++++----------------- 1 file changed, 25 insertions(+), 23 deletions(-) diff --git a/die-bombe_metadata-readme.md b/die-bombe_metadata-readme.md index 6c3d35a..7f2f67d 100644 --- a/die-bombe_metadata-readme.md +++ b/die-bombe_metadata-readme.md @@ -1,25 +1,27 @@ -This Readme offers explanations for all attributes of the metadata csv table to the dataset "Die Bombe". +# Die Bombe Metadata Readme + +This Readme offers explanations for all attributes of the metadata ``.csv`` table to the dataset “Die Bombe.” The frequency attribute can have the value "all", "most", "some" or "none". It gives you an overview of how often a value is to be expected for the attribute explained in relation to the whole dataset. -The CSV is an export of keys and values of the Relational Database (MySQL) used for ANNO. +The CSV is an export of keys and values of the Relational Database (MySQL) used for ANNO (AustriaN Newspapers Online). The exemplary data instance was taken from the full metadata ``.csv`` table. 
-| attribute | explanation | frequency | datatype | -| ---- | ---- | ---- | ---- | -| manifest_id | ID for the IIIF manifest in the form of \{aidaaaammdd} | all | string | -| aid | ID for issues contained in the ANNO database, usually an abbreviation for the title | all | string | -| year | year of publication | all | integer | -| day | date of publication | all | string | -| dc_title | title of the newspaper | all | string | -| dc_title_additional | subtitle or any other additional title of the resource | none | string | -| subjects | subject terms (German), not linked to authority file; multiple values are separated by a hyphen | all | string | -| place_of_publications | placename (German) of publication place, not linked to authority file | all | string | -| languages | language of the document in the form of ISO-639-1 | all | string | -| dc_type | type of the document (English); default is "newspaper" | all | string | -| meta_type | type of document (German); default is "zeitungen" | all | string | -| ini_type | value for database; default is "anno" | all | string | -| modification_datetime | timestamp for date of last modification of the database entry | all | datetime | -| longer_page_id | value is either "O" or "1" | all | integer | -| dc_date | date of publication in ISO-form "aaaa-mm-dd"| all | date | -| link_pdf | URL to PDF download of issue | all | string | -| link_old | URL to issue in the ANNO interface | all | string | -| has_ocr | value is "1" if the document has OCR, else value is "0" | all | integer | -| page_count | number of pages for each issue | all | integer | +| attribute | explanation | frequency | datatype | exemplary data instance | +| ---- | ---- | ---- | ---- | ---- | +| manifest_id | ID for the IIIF manifest in the form of \{aidaaaammdd\} | all | string |bom18720915| +| aid | ID for issues contained in the ANNO database, usually an abbreviation for the title | all | string |bom| +| year | year of publication | all | integer |1872| +| 
day | date of publication in the form of \{aaaammdd\} | all | string |18720915| +| dc_title | title of the newspaper | all | string |Die Bombe| +| dc_title_additional | subtitle or any other additional title of the resource | none | string || +| subjects | subject terms (German), not linked to authority file; multiple values are separated by a semicolon | all | string |Humor; Satire| +| place_of_publications | placename (German) of publication place, not linked to authority file | all | string |Wien| +| languages | language of the document in the form of ISO 639-1 | all | string |de| +| dc_type | type of the document (English); default is "newspaper" | all | string |newspaper| +| meta_type | type of document (German); default is "zeitungen" | all | string |zeitungen| +| ini_type | value for database; default is "anno" | all | string |anno| +| modification_datetime | timestamp for date of last modification of the database entry | all | datetime |26.09.2011 10:38:48| +| longer_page_id | value is either "0" or "1" | all | integer |0| +| dc_date | date of publication in ISO-form "aaaa-mm-dd"| all | date |1872-09-15| +| link_pdf | URL to PDF download of issue | all | string |http://anno.onb.ac.at/cgi-content/anno_pdf.pl?aid=bom&datum=18720915| +| link_old | URL to issue in the ANNO interface | all | string |http://anno.onb.ac.at/cgi-content/anno?aid=bom&datum=18720915| +| has_ocr | value is "1" if the document has OCR, else value is "0" | all | integer |1| +| page_count | number of pages for each issue | all | integer |12| -- GitLab