diff --git a/LOC Colors - Data Management.ipynb b/LOC Colors - Data Management.ipynb new file mode 100644 index 0000000000000000000000000000000000000000..c4ba0673c0cdf5c071a3a5358481cbb4bb91a11d --- /dev/null +++ b/LOC Colors - Data Management.ipynb @@ -0,0 +1,1509 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# LOC Colors - Data Management" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "*Export data as minimal JSON files - only the essentials to create the swatches in the browser*" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "To use the created swatches for [https://labs.onb.ac.at/en/topic/akon-swatches/](https://labs.onb.ac.at/en/topic/akon-swatches/), I have to create a JSON file looking like this:\n", + "\n", + "```json\n", + "[[\"AK111_461\", [\"#f4e6cd\", \"#cac4b2\", \"#7e8077\", \"#3e4139\", \"#2f3431\", \"#000304\"], \"Nonza\", \"gelaufen 1903\"],\n", + "[\"AK111_072\", [\"#e2d7c1\", \"#a19c8f\", \"#504e42\", \"#494a44\", \"#010500\", \"#393c39\"], \"Kirchberg am Walde\", \"gelaufen 1914\"],\n", + "[\"AK111_077\", [\"#454234\", \"#3e3b1f\", \"#7f7e77\", \"#a9b8be\", \"#3b4347\", \"#425a6b\"], \"Kirchberg am Wechsel\", \"gelaufen 1913\"]]\n", + "```" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "The first part (the id and the colors) comes from the created swatches; the second part (a name and an approximate date) comes from the metadata, which can be downloaded here: [https://labs.onb.ac.at/gitlab/labs-team/raw-metadata/raw/master/akon_postcards_public_domain.csv.bz2?inline=false](https://labs.onb.ac.at/gitlab/labs-team/raw-metadata/raw/master/akon_postcards_public_domain.csv.bz2?inline=false)." 
+ ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Read created swatches" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [], + "source": [ + "import pandas as pd" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [], + "source": [ + "df = pd.read_csv('historic_postcards_color_swatches.csv.bz2', compression='bz2')" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + " | Unnamed: 0 | \n", + "akon_id | \n", + "image_link | \n", + "hex_colors | \n", + "html | \n", + "
---|---|---|---|---|---|
21914 | \n", + "21914 | \n", + "AK036_405 | \n", + "https://iiif.onb.ac.at/images/AKON/AK036_405/4... | \n", + "['#f2e3c1', '#e6dec6', '#8e8a7a', '#7b7864', '... | \n", + "<a href=\"https://iiif.onb.ac.at/images/AKON/AK... | \n", + "
\n", + " | akon_id | \n", + "hex_colors | \n", + "
---|---|---|
14980 | \n", + "AK010_595 | \n", + "['#cfbfa4', '#62583b', '#c8c7b6', '#4f5144', '... | \n", + "
7474 | \n", + "AK084_243 | \n", + "['#aca693', '#414028', '#444537', '#5c5f57', '... | \n", + "
23730 | \n", + "AK043_578 | \n", + "['#4e502c', '#444735', '#51554a', '#dae1d1', '... | \n", + "
30352 | \n", + "AK085_096 | \n", + "['#b5aa9d', '#f3e7d7', '#756d62', '#211a0f', '... | \n", + "
22389 | \n", + "AK038_067 | \n", + "['#f2e9cb', '#989384', '#545245', '#fcf7db', '... | \n", + "
\n", + " | akon_id | \n", + "hex_colors | \n", + "colors | \n", + "
---|---|---|---|
1291 | \n", + "AK116_455 | \n", + "['#f4ece0', '#d4d2ce', '#716d5c', '#65665e', '... | \n", + "[#f4ece0, #d4d2ce, #716d5c, #65665e, #b2b4bb, ... | \n", + "
\n", + " | akon_id | \n", + "name | \n", + "date | \n", + "
---|---|---|---|
16251 | \n", + "AK016_087 | \n", + "Neulengbach | \n", + "vor 1907 | \n", + "
23864 | \n", + "AK044_401 | \n", + "Gloriette | \n", + "1907 | \n", + "
33292 | \n", + "AK085_517 | \n", + "Milano | \n", + "vor 1905 | \n", + "
13875 | \n", + "AK008_070 | \n", + "Schloß Schönbrunn | \n", + "1906 | \n", + "
12223 | \n", + "AK004_040 | \n", + "Pürgg | \n", + "1909 | \n", + "
4129 | \n", + "AK125_097 | \n", + "Altaussee | \n", + "gelaufen 1901 | \n", + "
23756 | \n", + "AK044_080 | \n", + "Radstädter Tauern | \n", + "1907 | \n", + "
26479 | \n", + "AK069_067 | \n", + "Attersee | \n", + "1906 | \n", + "
14251 | \n", + "AK109_329 | \n", + "Josefsthal | \n", + "vor 1907 | \n", + "
28518 | \n", + "AK063_083 | \n", + "Gaußig | \n", + "1908 | \n", + "
\n", + " | akon_id | \n", + "name | \n", + "date | \n", + "
---|---|---|---|
24871 | \n", + "AK048_377 | \n", + "Reichenau an der Rax | \n", + "1925 | \n", + "
4191 | \n", + "AK054_543 | \n", + "Aflenz Kurort | \n", + "vor 1905 | \n", + "
\n", + " | akon_id | \n", + "colors | \n", + "name | \n", + "date | \n", + "
---|---|---|---|---|
16356 | \n", + "AK016_310 | \n", + "[#5f5a57, #9c938c, #4d453f, #cabbab, #3c3b39, ... | \n", + "Kapellen | \n", + "1908 | \n", + "
1117 | \n", + "AK116_129 | \n", + "[#dcc9ab, #cec0a7, #a8a290, #48473a, #6c6c62, ... | \n", + "Garsten | \n", + "gelaufen 1902 | \n", + "
\n", + " | akon_id | \n", + "colors | \n", + "name | \n", + "date | \n", + "
---|---|---|---|---|
99 | \n", + "AK111_207 | \n", + "[#403e2c, #f9f8eb, #7e7f6b, #35362d, #32342f, ... | \n", + "Klosterneuburg | \n", + "gelaufen 1908 | \n", + "
34 | \n", + "AK111_293 | \n", + "[#e6d8bf, #c7c1b1, #4a4c3c, #aeafa5, #464740, ... | \n", + "Komotau | \n", + "vor 1905 | \n", + "
86 | \n", + "AK111_184 | \n", + "[#f7edd6, #d1cbb8, #f6f0db, #2d2a1b, #9e9f93, ... | \n", + "Klausenburg | \n", + "gelaufen 1904 | \n", + "
3 | \n", + "AK111_026 | \n", + "[#e2cba6, #9e8e73, #574c39, #3c311a, #4c473b, ... | \n", + "Kierling | \n", + "1922 | \n", + "
39 | \n", + "AK111_072 | \n", + "[#e5d9c2, #c0baac, #928e81, #4c493e, #484943, ... | \n", + "Kirchberg am Walde | \n", + "gelaufen 1914 | \n", + "
\n", + " | Unnamed: 0 | \n", + "akon_id | \n", + "image_link | \n", + "hex_colors | \n", + "html | \n", + "
---|---|---|---|---|---|
11914 | \n", + "11914 | \n", + "AK003_285 | \n", + "https://iiif.onb.ac.at/images/AKON/AK003_285/2... | \n", + "['#050300', '#eee2c9', '#b6af9e', '#fdf7da', '... | \n", + "<a href=\"https://iiif.onb.ac.at/images/AKON/AK... | \n", + "
\n", + " | Unnamed: 0 | \n", + "akon_id | \n", + "id | \n", + "altitude | \n", + "building | \n", + "city | \n", + "color | \n", + "comment | \n", + "mountain | \n", + "other | \n", + "... | \n", + "feature_class | \n", + "feature_code | \n", + "geoname_id | \n", + "latitude | \n", + "longitude | \n", + "name | \n", + "country_id | \n", + "admin_name_1 | \n", + "admin_code_1 | \n", + "geo | \n", + "
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
23435 | \n", + "23435 | \n", + "AK042_533 | \n", + "25265 | \n", + "434.0 | \n", + "NaN | \n", + "Frohnleiten | \n", + "False | \n", + "NaN | \n", + "NaN | \n", + "NaN | \n", + "... | \n", + "P | \n", + "PPLA3 | \n", + "2779202.0 | \n", + "47.26667 | \n", + "15.31667 | \n", + "Frohnleiten | \n", + "AT | \n", + "NaN | \n", + "NaN | \n", + "47.26667, 15.31667 | \n", + "
1 rows × 30 columns
\n", + "" + ], + "text/plain": [ + " Unnamed: 0 akon_id id altitude building city color \\\n", + "23435 23435 AK042_533 25265 434.0 NaN Frohnleiten False \n", + "\n", + " comment mountain other ... feature_class feature_code \\\n", + "23435 NaN NaN NaN ... P PPLA3 \n", + "\n", + " geoname_id latitude longitude name country_id admin_name_1 \\\n", + "23435 2779202.0 47.26667 15.31667 Frohnleiten AT NaN \n", + "\n", + " admin_code_1 geo \n", + "23435 NaN 47.26667, 15.31667 \n", + "\n", + "[1 rows x 30 columns]" + ] + }, + "execution_count": 67, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "raw_data.sample()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Combine Data" + ] + }, + { + "cell_type": "code", + "execution_count": 68, + "metadata": {}, + "outputs": [], + "source": [ + "combined_data = pd.merge(colors_hsv_clip[['akon_id', 'hex_colors', 'image_link']],\n", + " raw_data[['akon_id', 'name', 'date']],\n", + " on='akon_id')" + ] + }, + { + "cell_type": "code", + "execution_count": 69, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "\n", + " | akon_id | \n", + "hex_colors | \n", + "image_link | \n", + "name | \n", + "date | \n", + "
---|---|---|---|---|---|
23217 | \n", + "AK041_595 | \n", + "['#ada896', '#fcf6d5', '#767467', '#484739', '... | \n", + "https://iiif.onb.ac.at/images/AKON/AK041_595/5... | \n", + "Ötscher | \n", + "1909 | \n", + "
\n", + " | akon_id | \n", + "hex_colors | \n", + "image_link | \n", + "name | \n", + "date | \n", + "hex_colors_list | \n", + "
---|---|---|---|---|---|---|
15996 | \n", + "AK014_589 | \n", + "['#020100', '#fbfae8', '#88887e', '#64645a', '... | \n", + "https://iiif.onb.ac.at/images/AKON/AK014_589/5... | \n", + "Maria Taferl | \n", + "1909 | \n", + "[#020100, #fbfae8, #88887e, #64645a, #4d4f49, ... | \n", + "
\n", + " | akon_id | \n", + "image_link | \n", + "name | \n", + "date | \n", + "hex_colors_list | \n", + "
---|---|---|---|---|---|
19590 | \n", + "AK028_177 | \n", + "https://iiif.onb.ac.at/images/AKON/AK028_177/1... | \n", + "Frohnleiten | \n", + "1906 | \n", + "[#020100, #a8a599, #7b7a6f, #fbf9e5, #4b4b40, ... | \n", + "
\n", + " | akon_id | \n", + "image_link | \n", + "name | \n", + "date | \n", + "hex_colors | \n", + "
---|---|---|---|---|---|
33304 | \n", + "AK087_042 | \n", + "https://iiif.onb.ac.at/images/AKON/AK087_042/0... | \n", + "Abcoude | \n", + "vor 1905 | \n", + "[#f8eacd, #aca391, #5b5747, #6e6a5e, #525148, ... | \n", + "
\n", + " | akon_id | \n", + "hex_colors | \n", + "image_link | \n", + "name | \n", + "date | \n", + "
---|---|---|---|---|---|
25575 | \n", + "AK031_287 | \n", + "[#444626, #caccbc, #4a4d41, #48504f, #5b7073, ... | \n", + "https://iiif.onb.ac.at/images/AKON/AK031_287/2... | \n", + "Ebensee | \n", + "1907 | \n", + "