diff --git a/ANNO-Sprachen Plotly Dynamic.ipynb b/ANNO-Sprachen Plotly Dynamic.ipynb new file mode 100644 index 0000000000000000000000000000000000000000..932716ddb4a2775431ee85299e74bf7742b9dac2 --- /dev/null +++ b/ANNO-Sprachen Plotly Dynamic.ipynb @@ -0,0 +1,1051 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "# Dynamic Plots" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "* Filter: Issue size\n", + "* Filter: Language\n", + "* Filter: Time" + ] + }, + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [], + "source": [ + "import pandas as pd\n", + "import ipywidgets as widgets" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": {}, + "outputs": [], + "source": [ + "dd = pd.read_csv('../issue-based-data.csv.gz', compression='gzip')" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Unnamed: 0titleaisyearpageslanguagesplacein_labs
00Der Telegrapha4418364deWien0
11Der Telegrapha4418364deWien0
22Der Telegrapha4418364deWien0
33Der Telegrapha4418364deWien0
44Der Telegrapha4418364deWien0
\n", + "
" + ], + "text/plain": [ + " Unnamed: 0 title ais year pages languages place in_labs\n", + "0 0 Der Telegraph a44 1836 4 de Wien 0\n", + "1 1 Der Telegraph a44 1836 4 de Wien 0\n", + "2 2 Der Telegraph a44 1836 4 de Wien 0\n", + "3 3 Der Telegraph a44 1836 4 de Wien 0\n", + "4 4 Der Telegraph a44 1836 4 de Wien 0" + ] + }, + "execution_count": 3, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "dd.head()" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Unnamed: 0yearpagesin_labs
count1.461409e+061.461409e+061.461409e+061.461409e+06
mean7.307040e+051.872292e+031.367011e+011.582233e-01
std4.218726e+051.360414e+023.744340e+013.649504e-01
min0.000000e+001.000000e+000.000000e+000.000000e+00
25%3.653520e+051.849000e+034.000000e+000.000000e+00
50%7.307040e+051.891000e+038.000000e+000.000000e+00
75%1.096056e+061.915000e+031.600000e+010.000000e+00
max1.461408e+062.017000e+034.012000e+031.000000e+00
\n", + "
" + ], + "text/plain": [ + " Unnamed: 0 year pages in_labs\n", + "count 1.461409e+06 1.461409e+06 1.461409e+06 1.461409e+06\n", + "mean 7.307040e+05 1.872292e+03 1.367011e+01 1.582233e-01\n", + "std 4.218726e+05 1.360414e+02 3.744340e+01 3.649504e-01\n", + "min 0.000000e+00 1.000000e+00 0.000000e+00 0.000000e+00\n", + "25% 3.653520e+05 1.849000e+03 4.000000e+00 0.000000e+00\n", + "50% 7.307040e+05 1.891000e+03 8.000000e+00 0.000000e+00\n", + "75% 1.096056e+06 1.915000e+03 1.600000e+01 0.000000e+00\n", + "max 1.461408e+06 2.017000e+03 4.012000e+03 1.000000e+00" + ] + }, + "execution_count": 6, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "dd.describe()" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Prepare Data" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [], + "source": [ + "dd = dd[dd['year'] >= 1500]" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": {}, + "outputs": [], + "source": [ + "dd['in_labs'] = dd['in_labs'].astype(bool)" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Unnamed: 0titleaisyearpageslanguagesplacein_labs
00Der Telegrapha4418364deWienFalse
11Der Telegrapha4418364deWienFalse
22Der Telegrapha4418364deWienFalse
33Der Telegrapha4418364deWienFalse
44Der Telegrapha4418364deWienFalse
\n", + "
" + ], + "text/plain": [ + " Unnamed: 0 title ais year pages languages place in_labs\n", + "0 0 Der Telegraph a44 1836 4 de Wien False\n", + "1 1 Der Telegraph a44 1836 4 de Wien False\n", + "2 2 Der Telegraph a44 1836 4 de Wien False\n", + "3 3 Der Telegraph a44 1836 4 de Wien False\n", + "4 4 Der Telegraph a44 1836 4 de Wien False" + ] + }, + "execution_count": 7, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "dd.head()" + ] + }, + { + "cell_type": "code", + "execution_count": 8, + "metadata": {}, + "outputs": [], + "source": [ + "dd.loc[dd['languages'].str.len() > 2, 'languages'] = 'multi'" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "metadata": {}, + "outputs": [], + "source": [ + "dd.loc[dd['languages'].isnull(), 'languages'] = 'unknown'" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "array(['de', 'it', 'hu', 'ro', 'unknown', 'en', 'pt', 'multi', 'sk', 'cs',\n", + " 'eo', 'el', 'hr', 'he', 'pl', 'fr', 'ru', 'sl', 'sr', 'uk'],\n", + " dtype=object)" + ] + }, + "execution_count": 10, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "dd.languages.unique()" + ] + }, + { + "cell_type": "code", + "execution_count": 11, + "metadata": {}, + "outputs": [], + "source": [ + "dd.loc[dd['place'].isnull(), 'place'] = 'unknown'" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Filter" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "### Widget inputs\n", + "\n", + "* Year and page-count bounds for the range sliders\n", + "* Distinct page counts and languages offered as widget options" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "metadata": {}, + "outputs": [], + "source": [ + "year_min, year_max = dd.year.min(), dd.year.max()\n", + "pages_min, pages_max = dd.pages.min(), dd.pages.max()\n", + "pages_unique = sorted(dd.pages.unique())\n", + "all_languages = dd.languages.unique()" + ] + }, + { + "cell_type": "code", +
"execution_count": 13, + "metadata": {}, + "outputs": [], + "source": [ + "language_options = sorted(all_languages)" + ] + }, + { + "cell_type": "code", + "execution_count": 14, + "metadata": {}, + "outputs": [ + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "549383bbad4a4bf7b9866d0c051b3227", + "version_major": 2, + "version_minor": 0 + }, + "text/html": [ + "

Failed to display Jupyter Widget of type VBox.

\n", + "

\n", + " If you're reading this message in the Jupyter Notebook or JupyterLab Notebook, it may mean\n", + " that the widgets JavaScript is still loading. If this message persists, it\n", + " likely means that the widgets JavaScript library is either not installed or\n", + " not enabled. See the Jupyter\n", + " Widgets Documentation for setup instructions.\n", + "

\n", + "

\n", + " If you're reading this message in another frontend (for example, a static\n", + " rendering on GitHub or NBViewer),\n", + " it may mean that your frontend doesn't currently support widgets.\n", + "

\n" + ], + "text/plain": [ + "VBox(children=(IntRangeSlider(value=(1505, 2017), continuous_update=False, description='Years', layout=Layout(width='90%'), max=2017, min=1505), SelectionRangeSlider(continuous_update=False, description='Pages', index=(0, 1128), layout=Layout(width='90%'), options=(0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 37, 38, 39, 40, 41, 42, 43, 44, 45, 46, 47, 48, 49, 50, 51, 52, 53, 54, 55, 56, 57, 58, 59, 60, 61, 62, 63, 64, 65, 66, 67, 68, 69, 70, 71, 72, 73, 74, 75, 76, 77, 78, 79, 80, 81, 82, 83, 84, 85, 86, 87, 88, 89, 90, 91, 92, 93, 94, 95, 96, 97, 98, 99, 100, 101, 102, 103, 104, 105, 106, 107, 108, 109, 110, 111, 112, 113, 114, 115, 116, 117, 118, 119, 120, 121, 122, 123, 124, 125, 126, 127, 128, 129, 130, 131, 132, 133, 134, 135, 136, 137, 138, 139, 140, 141, 142, 143, 144, 145, 146, 147, 148, 149, 150, 151, 152, 153, 154, 155, 156, 157, 158, 159, 160, 161, 162, 163, 164, 165, 166, 167, 168, 169, 170, 171, 172, 173, 174, 175, 176, 177, 178, 179, 180, 181, 182, 183, 184, 185, 186, 187, 188, 189, 190, 191, 192, 193, 194, 195, 196, 197, 198, 199, 200, 201, 202, 203, 204, 205, 206, 207, 208, 209, 210, 211, 212, 213, 214, 215, 216, 217, 218, 219, 220, 221, 222, 223, 224, 225, 226, 227, 228, 229, 230, 231, 232, 233, 234, 235, 236, 237, 238, 239, 240, 241, 242, 243, 244, 245, 246, 247, 248, 249, 250, 251, 252, 253, 254, 255, 256, 257, 258, 259, 260, 261, 262, 263, 264, 265, 266, 267, 268, 269, 270, 271, 272, 273, 274, 275, 276, 277, 278, 279, 280, 281, 282, 283, 284, 285, 286, 287, 288, 289, 290, 291, 292, 293, 294, 295, 296, 297, 298, 299, 300, 301, 302, 303, 304, 305, 306, 307, 308, 309, 310, 311, 312, 313, 314, 315, 316, 317, 318, 319, 320, 321, 322, 323, 324, 325, 326, 327, 328, 329, 330, 331, 332, 333, 334, 335, 336, 337, 338, 339, 340, 341, 342, 343, 344, 345, 346, 347, 348, 349, 350, 351, 352, 353, 354, 355, 356, 357, 358, 359, 360, 361, 
362, 363, 364, 365, 366, 367, 368, 369, 370, 371, 372, 373, 374, 375, 376, 377, 378, 379, 380, 381, 382, 383, 384, 385, 386, 387, 388, 389, 390, 391, 392, 393, 394, 395, 396, 397, 398, 399, 400, 401, 402, 403, 404, 405, 406, 407, 408, 409, 410, 411, 412, 413, 414, 415, 416, 417, 418, 419, 420, 421, 422, 423, 424, 425, 426, 427, 428, 429, 430, 431, 432, 433, 434, 435, 436, 437, 438, 440, 441, 442, 443, 444, 445, 446, 447, 448, 450, 451, 452, 453, 454, 455, 456, 457, 458, 459, 460, 461, 462, 464, 465, 466, 467, 468, 469, 470, 471, 472, 473, 474, 475, 476, 477, 478, 479, 480, 481, 482, 483, 484, 485, 486, 487, 488, 489, 490, 491, 492, 493, 494, 495, 496, 497, 498, 499, 500, 501, 502, 503, 504, 505, 506, 507, 508, 509, 510, 511, 512, 513, 514, 515, 516, 517, 518, 519, 520, 521, 522, 523, 524, 525, 526, 527, 528, 529, 530, 531, 532, 533, 534, 535, 536, 537, 538, 539, 540, 541, 542, 543, 544, 545, 546, 547, 548, 549, 550, 551, 552, 553, 554, 555, 556, 557, 558, 560, 561, 562, 563, 564, 565, 566, 567, 568, 569, 570, 571, 572, 573, 574, 575, 576, 577, 578, 579, 580, 581, 582, 583, 584, 585, 586, 587, 588, 589, 590, 591, 592, 593, 594, 595, 596, 597, 598, 599, 600, 601, 602, 603, 604, 605, 606, 607, 608, 609, 610, 611, 612, 613, 614, 615, 616, 617, 618, 619, 620, 622, 623, 624, 625, 626, 627, 628, 629, 630, 631, 632, 633, 634, 635, 636, 638, 639, 640, 641, 642, 644, 645, 646, 647, 648, 649, 650, 651, 652, 653, 654, 655, 656, 657, 658, 659, 660, 661, 662, 663, 664, 665, 666, 667, 668, 669, 670, 671, 672, 673, 674, 675, 676, 677, 678, 679, 680, 681, 682, 683, 684, 685, 686, 687, 688, 689, 690, 691, 692, 694, 695, 696, 697, 698, 699, 700, 701, 702, 703, 704, 705, 707, 708, 709, 710, 711, 712, 713, 714, 715, 716, 717, 718, 719, 720, 721, 722, 723, 724, 725, 726, 727, 728, 730, 731, 732, 733, 734, 735, 736, 737, 738, 740, 741, 742, 743, 744, 745, 746, 747, 748, 750, 751, 752, 753, 754, 755, 756, 757, 758, 759, 760, 762, 764, 765, 766, 767, 768, 769, 770, 771, 772, 774, 775, 776, 
777, 778, 780, 781, 782, 783, 784, 785, 786, 787, 788, 789, 790, 792, 793, 794, 795, 797, 798, 799, 800, 801, 802, 803, 804, 805, 807, 808, 809, 810, 812, 813, 814, 816, 817, 818, 819, 820, 821, 822, 824, 825, 826, 828, 829, 832, 834, 835, 836, 837, 838, 839, 840, 841, 842, 844, 846, 848, 850, 852, 853, 854, 855, 856, 858, 859, 860, 863, 864, 865, 867, 868, 870, 872, 874, 876, 877, 878, 880, 882, 884, 888, 892, 893, 894, 896, 898, 899, 900, 902, 904, 905, 907, 910, 917, 918, 919, 926, 928, 932, 934, 936, 940, 941, 942, 944, 948, 950, 954, 956, 958, 960, 962, 963, 964, 966, 968, 969, 970, 972, 973, 974, 976, 977, 978, 982, 984, 986, 988, 990, 992, 993, 996, 998, 1002, 1004, 1005, 1006, 1008, 1010, 1012, 1018, 1020, 1022, 1024, 1026, 1028, 1030, 1036, 1037, 1040, 1042, 1044, 1045, 1046, 1048, 1052, 1056, 1058, 1060, 1070, 1074, 1078, 1084, 1087, 1088, 1093, 1096, 1098, 1100, 1102, 1104, 1106, 1109, 1110, 1112, 1114, 1116, 1118, 1128, 1130, 1132, 1133, 1134, 1135, 1136, 1138, 1140, 1141, 1142, 1144, 1146, 1147, 1152, 1153, 1155, 1156, 1157, 1160, 1164, 1182, 1183, 1192, 1194, 1196, 1197, 1198, 1199, 1202, 1205, 1206, 1207, 1208, 1214, 1216, 1217, 1220, 1224, 1226, 1228, 1230, 1231, 1232, 1234, 1235, 1236, 1237, 1238, 1240, 1242, 1244, 1248, 1252, 1256, 1258, 1264, 1269, 1273, 1274, 1275, 1277, 1281, 1284, 1288, 1292, 1293, 1294, 1296, 1301, 1305, 1306, 1318, 1320, 1321, 1322, 1326, 1328, 1336, 1348, 1354, 1356, 1362, 1375, 1380, 1398, 1402, 1408, 1412, 1416, 1419, 1420, 1428, 1431, 1432, 1433, 1434, 1438, 1440, 1444, 1456, 1462, 1464, 1466, 1474, 1478, 1480, 1489, 1494, 1498, 1500, 1506, 1507, 1508, 1509, 1510, 1511, 1512, 1513, 1514, 1516, 1517, 1518, 1520, 1522, 1527, 1528, 1532, 1539, 1540, 1542, 1546, 1550, 1552, 1553, 1564, 1574, 1576, 1585, 1586, 1588, 1592, 1594, 1602, 1604, 1605, 1610, 1614, 1615, 1617, 1623, 1624, 1632, 1639, 1642, 1644, 1651, 1659, 1666, 1668, 1701, 1704, 1706, 1708, 1712, 1713, 1716, 1717, 1722, 1738, 1750, 1755, 1768, 1774, 1886, 1890, 
1894, 1905, 2049, 2060, 2162, 2271, 2367, 2421, 2604, 2699, 2876, 4012), value=(0, 4012)), SelectMultiple(description='Languages', index=(0, 1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16, 17, 18, 19), layout=Layout(width='90%'), options=('cs', 'de', 'el', 'en', 'eo', 'fr', 'he', 'hr', 'hu', 'it', 'multi', 'pl', 'pt', 'ro', 'ru', 'sk', 'sl', 'sr', 'uk', 'unknown'), rows=20, value=('cs', 'de', 'el', 'en', 'eo', 'fr', 'he', 'hr', 'hu', 'it', 'multi', 'pl', 'pt', 'ro', 'ru', 'sk', 'sl', 'sr', 'uk', 'unknown')), Checkbox(value=False, description='Limit to Lab content', layout=Layout(width='90%')), Output()))" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "wide_layout = widgets.Layout(width='90%')\n", + "\n", + "years = widgets.IntRangeSlider(value=(year_min, year_max), min=year_min, max=year_max, step=1,\n", + " continuous_update=False, description='Years', layout=wide_layout)\n", + "pages = widgets.SelectionRangeSlider(value=(pages_min, pages_max), options=pages_unique,\n", + " continuous_update=False, description='Pages', layout=wide_layout)\n", + "lang = widgets.SelectMultiple(options=language_options, value=language_options[:], rows=len(language_options),\n", + " description='Languages', layout=wide_layout)\n", + "labs = widgets.Checkbox(value=False,\n", + " description='Limit to Lab content', layout=wide_layout)\n", + "out = widgets.Output()\n", + "\n", + "\n", + "def get_filtered_dataframe():\n", + " ymin, ymax = years.value\n", + " pmin, pmax = pages.value\n", + " selected_languages = lang.value\n", + " filtered = dd[\n", + " (dd['year'] >= ymin) &\n", + " (dd['year'] <= ymax) &\n", + " (dd['pages'] >= pmin) &\n", + " (dd['pages'] <= pmax) &\n", + " (dd['languages'].isin(selected_languages))\n", + " ]\n", + " if labs.value:\n", + " filtered = filtered[filtered['in_labs']]\n", + " return filtered\n", + "\n", + "def update_filtered_plotly_output(*args):\n", + " filtered_data = get_filtered_dataframe()\n", + " 
out.clear_output()\n", + " with out:\n", + " print('Data length: {}'.format(len(filtered_data)))\n", + "\n", + " \n", + "years.observe(update_filtered_plotly_output, names=['value'])\n", + "pages.observe(update_filtered_plotly_output, names=['value'])\n", + "lang.observe(update_filtered_plotly_output, names=['value'])\n", + "labs.observe(update_filtered_plotly_output, names=['value'])\n", + "\n", + "\n", + "update_filtered_plotly_output()\n", + " \n", + "widgets.VBox([\n", + " years,\n", + " pages,\n", + " lang,\n", + " labs,\n", + " out\n", + "])" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Plotly" + ] + }, + { + "cell_type": "code", + "execution_count": 15, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "" + ], + "text/vnd.plotly.v1+html": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "import plotly.offline as py\n", + "import plotly.graph_objs as go\n", + "\n", + "py.init_notebook_mode()" + ] + }, + { + "cell_type": "code", + "execution_count": 16, + "metadata": {}, + "outputs": [ + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "bbcd0b1ac1c549b9bfd133721543f0ec", + "version_major": 2, + "version_minor": 0 + }, + "text/html": [ + "

Failed to display Jupyter Widget of type VBox.

\n", + "

\n", + " If you're reading this message in the Jupyter Notebook or JupyterLab Notebook, it may mean\n", + " that the widgets JavaScript is still loading. If this message persists, it\n", + " likely means that the widgets JavaScript library is either not installed or\n", + " not enabled. See the Jupyter\n", + " Widgets Documentation for setup instructions.\n", + "

\n", + "

\n", + " If you're reading this message in another frontend (for example, a static\n", + " rendering on GitHub or NBViewer),\n", + " it may mean that your frontend doesn't currently support widgets.\n", + "

\n" + ], + "text/plain": [ + "VBox(children=(Button(description='Plot!', style=ButtonStyle()), Output()))" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "create_plot = widgets.Button(description='Plot!')\n", + "plot_out = widgets.Output()\n", + "\n", + "\n", + "def plot(*args):\n", + " with plot_out:\n", + " per_year = get_filtered_dataframe()[['year', 'pages']].groupby('year').sum()\n", + " ppy = go.Bar(x=per_year.index,\n", + " y=per_year.pages,\n", + " name='PPY'\n", + " )\n", + " ppy_data = go.Data([ppy])\n", + " ppy_layout = go.Layout(title='Pages per Year',\n", + " xaxis={'title': 'Years'},\n", + " yaxis={'title': 'Pages'})\n", + " ppy_figure = go.Figure(data=ppy_data, layout=ppy_layout)\n", + " py.iplot(ppy_figure)\n", + " \n", + "create_plot.on_click(plot)\n", + "\n", + "\n", + "widgets.VBox([\n", + " create_plot,\n", + " plot_out\n", + "])" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## Widgets + Plotly" + ] + }, + { + "cell_type": "code", + "execution_count": 17, + "metadata": {}, + "outputs": [ + { + "ename": "NameError", + "evalue": "name 'plot_clear' is not defined", + "output_type": "error", + "traceback": [ + "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", + "\u001b[0;31mNameError\u001b[0m Traceback (most recent call last)", + "\u001b[0;32m\u001b[0m in \u001b[0;36m\u001b[0;34m()\u001b[0m\n\u001b[1;32m 110\u001b[0m \u001b[0mlang\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mobserve\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mupdate_filtered_plotly_output\u001b[0m\u001b[0;34m,\u001b[0m \u001b[0mnames\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m'value'\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 111\u001b[0m \u001b[0mlabs\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mobserve\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mupdate_filtered_plotly_output\u001b[0m\u001b[0;34m,\u001b[0m 
\u001b[0mnames\u001b[0m\u001b[0;34m=\u001b[0m\u001b[0;34m[\u001b[0m\u001b[0;34m'value'\u001b[0m\u001b[0;34m]\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0;32m--> 112\u001b[0;31m \u001b[0mclear_plot\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mon_click\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mplot_clear\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[0m\u001b[1;32m 113\u001b[0m \u001b[0mcreate_plot\u001b[0m\u001b[0;34m.\u001b[0m\u001b[0mon_click\u001b[0m\u001b[0;34m(\u001b[0m\u001b[0mplot\u001b[0m\u001b[0;34m)\u001b[0m\u001b[0;34m\u001b[0m\u001b[0m\n\u001b[1;32m 114\u001b[0m \u001b[0;34m\u001b[0m\u001b[0m\n", + "\u001b[0;31mNameError\u001b[0m: name 'plot_clear' is not defined" + ] + } + ], + "source": [ + "wide_layout = widgets.Layout(width='90%')\n", + "\n", + "years = widgets.IntRangeSlider(value=(year_min, year_max), min=year_min, max=year_max, step=1,\n", + " continuous_update=False, description='Years', layout=wide_layout)\n", + "pages = widgets.SelectionRangeSlider(value=(pages_min, pages_max), options=pages_unique,\n", + " continuous_update=False, description='Pages', layout=wide_layout)\n", + "lang = widgets.SelectMultiple(options=language_options, value=language_options[:], rows=len(language_options),\n", + " description='Languages', layout=wide_layout)\n", + "labs = widgets.Checkbox(value=False,\n", + " description='Limit to Lab content', layout=wide_layout)\n", + "clear_plot = widgets.Button(description='Clear!', layout=wide_layout)\n", + "create_plot = widgets.Button(description='Plot!', layout=wide_layout)\n", + "text_out = widgets.Output(layout=wide_layout)\n", + "plot_out = widgets.Output(layout=wide_layout)\n", + "\n", + "\n", + "def get_filtered_dataframe():\n", + " ymin, ymax = years.value\n", + " pmin, pmax = pages.value\n", + " selected_languages = lang.value\n", + " filtered = dd[\n", + " (dd['year'] >= ymin) &\n", + " (dd['year'] <= ymax) &\n", + " (dd['pages'] >= pmin) &\n", + " (dd['pages'] <= pmax) &\n", 
+ " (dd['languages'].isin(selected_languages))\n", + " ]\n", + " if labs.value:\n", + " filtered = filtered[filtered['in_labs']]\n", + " return filtered\n", + "\n", + "\n", + "def plot_issues():\n", + " with plot_out:\n", + " per_year_and_language = get_filtered_dataframe()[['languages', 'year']] \\\n", + " .groupby(['languages', 'year']).size().to_frame() \\\n", + " .rename(index=str, columns={0: 'issues'})\n", + " \n", + " # issues per language - all languages\n", + " idx = per_year_and_language.index\n", + "\n", + " iper_language = {}\n", + " for lang in idx.get_level_values(0):\n", + " data = per_year_and_language[idx.get_level_values(0) == lang]\n", + " graph_obj = go.Bar(\n", + " x = data.index.get_level_values(1),\n", + " y = data.issues,\n", + " name = lang.upper()\n", + " )\n", + " iper_language[lang] = {\n", + " 'data_obj': data,\n", + " 'graph_obj': graph_obj\n", + " }\n", + "\n", + " ipl_all_data = [iper_language[lang]['graph_obj'] for lang in sorted(iper_language.keys(), reverse=True)]\n", + " ipl_all_layout = go.Layout(\n", + " title='Issues per Language per Year',\n", + " barmode='stack',\n", + " xaxis={'title': 'Year'},\n", + " yaxis={'title': 'Issues'},\n", + " height=500\n", + " )\n", + " ipl_all_fig = go.Figure(data=ipl_all_data, layout=ipl_all_layout)\n", + " py.iplot(ipl_all_fig) \n", + "\n", + " \n", + "def plot_pages():\n", + " with plot_out:\n", + " per_year_and_language = get_filtered_dataframe()[['languages', 'year', 'pages']].groupby(['languages', 'year']).sum()\n", + " \n", + " # pages per language - all languages\n", + " idx = per_year_and_language.index\n", + "\n", + " pper_language = {}\n", + " for lang in idx.get_level_values(0):\n", + " data = per_year_and_language[idx.get_level_values(0) == lang]\n", + " graph_obj = go.Bar(\n", + " x = data.index.get_level_values(1),\n", + " y = data.pages,\n", + " name = lang.upper()\n", + " )\n", + " pper_language[lang] = {\n", + " 'data_obj': data,\n", + " 'graph_obj': graph_obj\n", + " }\n", + 
"\n", + " ppl_all_data = [pper_language[lang]['graph_obj'] for lang in sorted(pper_language.keys(), reverse=True)]\n", + " ppl_all_layout = go.Layout(\n", + " title='Pages per Language per Year',\n", + " barmode='stack',\n", + " xaxis={'title': 'Year'},\n", + " yaxis={'title': 'Pages'},\n", + " height=500\n", + " )\n", + " ppl_all_fig = go.Figure(data=ppl_all_data, layout=ppl_all_layout)\n", + " py.iplot(ppl_all_fig) \n", + " \n", + "def plot(*args):\n", + " plot_out.clear_output()\n", + " plot_pages()\n", + " plot_issues()\n", + "\n", + "def update_filtered_plotly_output(*args):\n", + " filtered_data = get_filtered_dataframe()\n", + " text_out.clear_output()\n", + " with text_out:\n", + " print('Selected Issues: {}'.format(len(filtered_data)))\n", + "\n", + " \n", + "years.observe(update_filtered_plotly_output, names=['value'])\n", + "pages.observe(update_filtered_plotly_output, names=['value'])\n", + "lang.observe(update_filtered_plotly_output, names=['value'])\n", + "labs.observe(update_filtered_plotly_output, names=['value'])\n", + "clear_plot.on_click(plot_clear)\n", + "create_plot.on_click(plot)\n", + "\n", + "update_filtered_plotly_output()\n", + " \n", + "dyn_view = widgets.VBox([\n", + " years,\n", + " pages,\n", + " lang,\n", + " labs,\n", + " text_out,\n", + " # widgets.HBox([create_plot, clear_plot]),\n", + " create_plot,\n", + " plot_out\n", + "])\n", + "dyn_view" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "import ipywidgets.embed as embed" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "embed.embed_minimal_html('export.html', views=dyn_view, title='Widgets export')" + ] + }, + { + "cell_type": "markdown", + "metadata": {}, + "source": [ + "## IPyWidgets Walker" + ] + }, + { + "cell_type": "code", + "execution_count": 257, + "metadata": {}, + "outputs": [], + "source": [ + "data = embed.embed_data(dyn_view)\n", + 
"state, view = data['manager_state']['state'], data['view_specs']" + ] + }, + { + "cell_type": "code", + "execution_count": 262, + "metadata": {}, + "outputs": [], + "source": [ + "def get_model(model_id):\n", + " return state[model_id]\n", + "\n", + "def model_to_html(model_id):\n", + " model = get_model(model_id)\n", + " name = model['model_name']\n", + " state = model.get('state', {})\n", + " if name == 'VBoxModel':\n", + " children = state['children']\n", + " child_ids = [e.replace('IPY_MODEL_', '') for e in children if e.startswith('IPY_MODEL_')]\n", + " return '
{children}
', child_ids\n", + " #elif name == 'CheckboxModel':\n", + " # descr, value = state['description'], state['value']\n", + " # return ''.format(\n", + " # checked='checked' if value else '',\n", + " # id=model_id,\n", + " # descr=descr)\n", + " elif name == 'IntRangeSliderModel':\n", + " # TODO: Labels to show current values\n", + " # TODO: Text input to set current values - connect to slider position\n", + " descr, min_, max_, low, high = state['description'], state['min'], state['max'], *state['value']\n", + " return ('\\n'\n", + " '\\n'\n", + " '').format(\n", + " id=model_id, descr=descr, min=min_, max=max_, low=low, high=high)\n", + " # TODO: SelectionRangeSliderModel\n", + " # TODO: SelectMultipleModel\n", + " # TODO: ButtonModel\n", + " else:\n", + " return ''.format(model_id)\n", + "\n", + "def walk_view(view):\n", + " html_widgets = []\n", + " for view_obj in view:\n", + " model_id = view_obj['model_id']\n", + " html_string, children = model_to_html(model_id)\n", + " if children:\n", + " children_html = [model_to_html(child) for child in children]\n", + " html_widgets.append(html_string.format(children='\\n'.join(children_html)))\n", + " else:\n", + " html_widgets.append(html_string)\n", + " return html_widgets" + ] + }, + { + "cell_type": "code", + "execution_count": 263, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "('
{children}
',\n", + " ['e3d17a73234248318d14a1f28814a565',\n", + " 'f5229546363143b685d9750d555e5a73',\n", + " '11218b97f7d84062b89abda12a395a23',\n", + " 'da995b665fd047faadad9a32303622d9',\n", + " 'f4ac1c6f5d5b4da299ecf558a9954c94',\n", + " 'edb7713a2fb641e6a2cba5be524fe76c',\n", + " '2f65bc25d8d241939f8eebd72172181f'])" + ] + }, + "execution_count": 263, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "model_to_html('13f4f856169d45f1915e2b89864048b5')" + ] + }, + { + "cell_type": "code", + "execution_count": 270, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "\n", + "
" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + } + ], + "source": [ + "from IPython.display import HTML\n", + "display(HTML(walk_view(view)[0]))\n", + "# len(walk_view(view))" + ] + }, + { + "cell_type": "code", + "execution_count": 265, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "{'model_module': '@jupyter-widgets/controls',\n", + " 'model_module_version': '1.1.0',\n", + " 'model_name': 'ButtonModel',\n", + " 'state': {'_dom_classes': (),\n", + " 'description': 'Plot!',\n", + " 'layout': 'IPY_MODEL_bb74d1dd994244ce9914f73e86a15bc0',\n", + " 'style': 'IPY_MODEL_2acd0a3ca0ee412590f1e1186183383e'}}" + ] + }, + "execution_count": 265, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "get_model('edb7713a2fb641e6a2cba5be524fe76c')" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 User Default", + "language": "python", + "name": "python_3_user_default" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.6.5" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +} diff --git a/Metadata Overview.ipynb b/Metadata Overview.ipynb new file mode 100644 index 0000000000000000000000000000000000000000..5b0b4eac3fece412554502f56209fc9c37424303 --- /dev/null +++ b/Metadata Overview.ipynb @@ -0,0 +1,1674 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": 1, + "metadata": {}, + "outputs": [], + "source": [ + "import pandas as pd" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + 
"df = pd.read_csv('data_manifests_2018-04-17.csv.gz', compression='gzip')" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Unnamed: 0manifest_idaidyeardaydc_titledc_title_additionalsubjectsplace_of_publicationslanguagesdc_typefrom_abometa_typeini_typelonger_page_iddc_datelink_pdflink_oldhas_ocrmeta_id
00dwr19111001dwr191119111001Der WeckrufNaNWochenzeitung, Landwirtschaft, Kunst, Kultur, ...Innsbruckdenewspaper0brzanno01911-10-01http://anno.onb.ac.at/cgi-content/anno_pdf.pl?...http://anno.onb.ac.at/cgi-content/anno?aid=dwr...01045416
11dwr19111008dwr191119111008Der WeckrufNaNWochenzeitung, Landwirtschaft, Kunst, Kultur, ...Innsbruckdenewspaper0brzanno01911-10-08http://anno.onb.ac.at/cgi-content/anno_pdf.pl?...http://anno.onb.ac.at/cgi-content/anno?aid=dwr...01045417
22dwr19111015dwr191119111015Der WeckrufNaNWochenzeitung, Landwirtschaft, Kunst, Kultur, ...Innsbruckdenewspaper0brzanno01911-10-15http://anno.onb.ac.at/cgi-content/anno_pdf.pl?...http://anno.onb.ac.at/cgi-content/anno?aid=dwr...01045418
33dwr19111022dwr191119111022Der WeckrufNaNWochenzeitung, Landwirtschaft, Kunst, Kultur, ...Innsbruckdenewspaper0brzanno01911-10-22http://anno.onb.ac.at/cgi-content/anno_pdf.pl?...http://anno.onb.ac.at/cgi-content/anno?aid=dwr...01045419
44dwr19111029dwr191119111029Der WeckrufNaNWochenzeitung, Landwirtschaft, Kunst, Kultur, ...Innsbruckdenewspaper0brzanno01911-10-29http://anno.onb.ac.at/cgi-content/anno_pdf.pl?...http://anno.onb.ac.at/cgi-content/anno?aid=dwr...01045420
\n", + "
" + ], + "text/plain": [ + " Unnamed: 0 manifest_id aid year day dc_title \\\n", + "0 0 dwr19111001 dwr 1911 19111001 Der Weckruf \n", + "1 1 dwr19111008 dwr 1911 19111008 Der Weckruf \n", + "2 2 dwr19111015 dwr 1911 19111015 Der Weckruf \n", + "3 3 dwr19111022 dwr 1911 19111022 Der Weckruf \n", + "4 4 dwr19111029 dwr 1911 19111029 Der Weckruf \n", + "\n", + " dc_title_additional subjects \\\n", + "0 NaN Wochenzeitung, Landwirtschaft, Kunst, Kultur, ... \n", + "1 NaN Wochenzeitung, Landwirtschaft, Kunst, Kultur, ... \n", + "2 NaN Wochenzeitung, Landwirtschaft, Kunst, Kultur, ... \n", + "3 NaN Wochenzeitung, Landwirtschaft, Kunst, Kultur, ... \n", + "4 NaN Wochenzeitung, Landwirtschaft, Kunst, Kultur, ... \n", + "\n", + " place_of_publications languages dc_type from_abo meta_type ini_type \\\n", + "0 Innsbruck de newspaper 0 brz anno \n", + "1 Innsbruck de newspaper 0 brz anno \n", + "2 Innsbruck de newspaper 0 brz anno \n", + "3 Innsbruck de newspaper 0 brz anno \n", + "4 Innsbruck de newspaper 0 brz anno \n", + "\n", + " longer_page_id dc_date \\\n", + "0 0 1911-10-01 \n", + "1 0 1911-10-08 \n", + "2 0 1911-10-15 \n", + "3 0 1911-10-22 \n", + "4 0 1911-10-29 \n", + "\n", + " link_pdf \\\n", + "0 http://anno.onb.ac.at/cgi-content/anno_pdf.pl?... \n", + "1 http://anno.onb.ac.at/cgi-content/anno_pdf.pl?... \n", + "2 http://anno.onb.ac.at/cgi-content/anno_pdf.pl?... \n", + "3 http://anno.onb.ac.at/cgi-content/anno_pdf.pl?... \n", + "4 http://anno.onb.ac.at/cgi-content/anno_pdf.pl?... \n", + "\n", + " link_old has_ocr meta_id \n", + "0 http://anno.onb.ac.at/cgi-content/anno?aid=dwr... 0 1045416 \n", + "1 http://anno.onb.ac.at/cgi-content/anno?aid=dwr... 0 1045417 \n", + "2 http://anno.onb.ac.at/cgi-content/anno?aid=dwr... 0 1045418 \n", + "3 http://anno.onb.ac.at/cgi-content/anno?aid=dwr... 0 1045419 \n", + "4 http://anno.onb.ac.at/cgi-content/anno?aid=dwr... 
0 1045420 " + ] + }, + "execution_count": 3, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.head()" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "['(Linzer) Tages-Post',\n", + " '(Neue) Freie Lehrer-Zeitung',\n", + " '(Neue) Wiener Schachzeitung',\n", + " '(Neuigkeits) Welt Blatt',\n", + " '(Salzburger) Fremden-Zeitung',\n", + " '(Wiener) Sporttagblatt',\n", + " '(Österreichische) Volks-Zeitung',\n", + " '12 Uhr Blatt',\n", + " '84er Zeitung',\n", + " 'Acht Uhr Blatt',\n", + " 'Agramer Zeitung',\n", + " 'Agrarische Post',\n", + " 'Akademische Frauenblätter',\n", + " 'Allgemeine Automobil-Zeitung',\n", + " 'Allgemeine Bauzeitung',\n", + " 'Allgemeine Eisenbahn-Zeitung',\n", + " 'Allgemeine Feuerwehr-Zeitung',\n", + " 'Allgemeine Frauen-Zeitung',\n", + " 'Allgemeine Frauen-Zeitung. Vereins-Zeitung der österreichisch-ungarischen Frauen-Vereine',\n", + " 'Allgemeine Radio-Zeitung',\n", + " 'Allgemeine Schutzhütten-Zeitung',\n", + " 'Allgemeine Sport-Zeitung',\n", + " 'Allgemeine Zeitschrift für Lehrerinnen',\n", + " 'Allgemeine land- und forstwirthschaftliche Zeitung',\n", + " 'Allgemeine musikalische Zeitung',\n", + " 'Allgemeine photographische Zeitung',\n", + " 'Allgemeine Österreichische Gerichtszeitung',\n", + " 'Allgemeiner Tiroler Anzeiger',\n", + " 'Almanach der k. k. österreichischen Staatsbahnen',\n", + " 'Almanach des Oberösterreichischen Künstlerbundes \"März\"',\n", + " 'Alpenländische Morgen Zeitung',\n", + " 'Alpenländische Rundschau',\n", + " 'Alphabetisches Namens-Verzeichniss der k. u. k. österr.-ungar. Consularfunctionäre sowie der k. u. k. österr.-ungar. Consularämter',\n", + " 'Amtliche Linzer Zeitung',\n", + " 'Amtliche Nachrichten des k. k. 
Ministeriums des Innern',\n", + " 'Amtliches Cursblatt der Wiener Börse',\n", + " 'Amtliches Veterinärblatt',\n", + " 'Amtsblatt der Bezirkshauptmannschaft Hollabrunn',\n", + " 'An der Schönen Blauen Donau',\n", + " 'Arbeiter Schachzeitung',\n", + " 'Arbeiter Zeitung',\n", + " 'Arbeiterinnen Zeitung',\n", + " 'Arbeiterinnen-Zeitung/Die Frau',\n", + " 'Arbeiterinnenblatt',\n", + " 'Arbeiterinnenzeitung',\n", + " 'Arbeitersturm',\n", + " 'Arbeiterwille',\n", + " 'Architektonische Rundschau',\n", + " 'Armeeblatt: militär-wiss. Wochens. ...unserer Land- u. Seemacht',\n", + " 'Austria',\n", + " 'Austria. Vereinigte Emaillierwerke, Lampen- und Metallwaren-Fabriken',\n", + " 'Austrian Centre',\n", + " 'Austrian Labor Information',\n", + " 'Austrian News',\n", + " 'Auszug aus der Tagespresse',\n", + " 'Az Ember',\n", + " 'Bade- und Reise-Journal',\n", + " 'Badener Bezirks-Blatt',\n", + " 'Badener Zeitung',\n", + " 'Banater Deutsche Zeitung',\n", + " 'Bastler-Zeitung',\n", + " 'Bau- und Werkkunst',\n", + " 'Beaux Arts de Modes',\n", + " 'Becsi Magyar Ujsag (Wiener Ungarische Zeitung)',\n", + " 'Belehrendes und Unterhaltendes',\n", + " 'Belvedere',\n", + " 'Bericht der Auskunftsstelle für Wohlfahrtseinrichtungen',\n", + " 'Bericht der Oesterreichischen Liga zur Bekämpfung des Mädchenhandels',\n", + " 'Bericht des Ausschusses für die ordentliche General-Versammlung des Deutschen Prager Frauen-Erwerb-Vereins',\n", + " 'Bericht des Vereins für Abhaltung von wissenschaftlichen Lehrkursen für Frauen und Mädchen ATHENÄUM in Wien',\n", + " 'Bericht über die Thötigkeit des (...) patriotischen Frauen-Hilfsvereines vom Rothen Kreuze in Mähren',\n", + " 'Bericht über die Vermögens-Gebarung ... des Zweigvereines Freiwalden des Frauenhilfsvereines vom rothen Kreuze für Schlesien ',\n", + " 'Bericht über die Wirksamkeit des (...) Frauenvereines für Arbeitsschulen',\n", + " 'Bericht über die k.k. 
Lehrerinnen-Bildungsanstalt in Wien (I.)',\n", + " 'Berichte der AK Wien',\n", + " 'Berichte und Informationen des österreichischen Forschungsinstituts für Wirtschaft und Politik',\n", + " 'Betrieb und Front',\n", + " 'Betriebsnachrichten für die Gefolgschaft der Firma Herrburger u. Rhomberg, Dornbirn, Innsbruck, Wien',\n", + " 'Bildungsarbeit. Blätter für sozialistisches Bildungswesen',\n", + " 'Bludenzer Anzeiger',\n", + " 'Blätter für Musik, Theater und Kunst',\n", + " 'Brand Aus',\n", + " 'Bregenzer Wochenblatt',\n", + " 'Bregenzer/Vorarlberger Tagblatt',\n", + " 'Brioni Insel-Zeitung',\n", + " 'Brixner Diözesanblatt',\n", + " 'Brünner Hebammen-Zeitung',\n", + " 'Buchdrucker-Zeitung',\n", + " 'Bukowina',\n", + " 'Bukowinaer Fortuna',\n", + " 'Bukowinaer Landwirtschaftliche Blätter',\n", + " 'Bukowinaer Nachrichten',\n", + " 'Bukowinaer Post',\n", + " 'Bukowinaer Rundschau',\n", + " 'Bukowinaer-Volks-Zeitung',\n", + " 'Bukowiner Bote',\n", + " 'Bukowiner Genossenschafts- und Vereins-Zeitung (Handel und Gewerbe).',\n", + " 'Bukowiner Pädagogische Blätter',\n", + " 'Bukowiner Schule',\n", + " 'Bukowiner Volksblatt',\n", + " 'Bukowiner Zeitung',\n", + " 'Böhmerwald Volksbote',\n", + " 'Böse Buben Journal',\n", + " 'Carinthia I',\n", + " 'Carinthia II',\n", + " 'Carinthia. Zeitschrift für Vaterlandskunde, Belehrung und Unterhaltung',\n", + " 'Cech. 
Der Böhme',\n", + " 'Cetinjer Zeitung',\n", + " 'Champagne-Kriegs-Zeitung',\n", + " 'Christliche Kunstblätter',\n", + " 'Club-Organ des Oesterreichischen Touring-Club',\n", + " \"Cook's Welt-Reise-Zeitung\",\n", + " 'Cur-Liste von Teplic-Schönau',\n", + " 'Curliste von Abbazia',\n", + " 'Curlisten Bad Ischl',\n", + " 'Czernowitzer Allgemeine Zeitung',\n", + " 'Czernowitzer Gemeinde-Bote',\n", + " 'Czernowitzer Presse',\n", + " 'Danzers Armee-Zeitung',\n", + " 'Das Deutsche Echo',\n", + " 'Das Kino-Journal',\n", + " 'Das Kleine Blatt',\n", + " 'Das Motorrad',\n", + " 'Das Mädchen-Unterstützungs-Komitee',\n", + " 'Das Rote Kreuz',\n", + " 'Das Vaterland',\n", + " 'Das Wort',\n", + " 'Das Wort der Frau',\n", + " 'Das Ziel',\n", + " 'Das interessante Blatt',\n", + " 'Das kleine Volksblatt',\n", + " 'Der Alpenfreund',\n", + " 'Der Architekt',\n", + " 'Der Architekt - Supplemente',\n", + " 'Der Bauernbündler',\n", + " 'Der Bautechniker',\n", + " 'Der Bote aus dem Waldviertel',\n", + " 'Der Bund. Zentralblatt des Bundes österreichischer Frauenvereine',\n", + " 'Der Böhmische Bierbrauer',\n", + " 'Der Eishockeysport',\n", + " 'Der Filmbote. Zeitschrift für alle Zweige der Kinematographie.',\n", + " 'Der Floh',\n", + " 'Der Fremdenverkehr',\n", + " 'Der Friseur',\n", + " 'Der Front-Kamerad',\n", + " 'Der Gebirgsfreund',\n", + " 'Der Hausbesitzer/Hausherren Zeitung',\n", + " 'Der Heimatgruß',\n", + " 'Der Humorist',\n", + " 'Der Jud. A Zeitung for\"n jüdischen Volk. (sic!) \"Zyd\", gazeta dla ludu zydowskiego',\n", + " 'Der Jude',\n", + " 'Der Kampf',\n", + " 'Der Kinobesitzer',\n", + " 'Der Krüppel',\n", + " 'Der Kuckuck',\n", + " 'Der Kyffhäuser',\n", + " 'Der Landbote',\n", + " 'Der Lehrerinnen-Wart',\n", + " 'Der Militärarzt',\n", + " 'Der Montag',\n", + " 'Der Morgen. 
Wiener Montagblatt',\n", + " 'Der Naturfreund',\n", + " 'Der Neue Mahnruf',\n", + " 'Der Obdachlose und Wohnungssuchende',\n", + " 'Der Romanleser',\n", + " 'Der Schlankel',\n", + " 'Der Schnee',\n", + " 'Der Schützengraben',\n", + " 'Der Straßenbahner',\n", + " 'Der Sturm',\n", + " 'Der Tiroler',\n", + " 'Der Tresor',\n", + " 'Der Volksfreund',\n", + " 'Der Vorarlberger',\n", + " 'Der Weckruf',\n", + " 'Der Wiener Film',\n", + " 'Der Wähler',\n", + " 'Der Zeitungs-Verlag',\n", + " 'Der Zweigverein Olmütz des patriotischen Landes- und Frauenhilfsvereines vom Roten Kreuze für Mähren. Tätigkeitsbericht',\n", + " 'Der Zwischen-Akt',\n", + " 'Der deutsch-österreichische Photograph',\n", + " 'Der deutsche Straßenbahner',\n", + " 'Der große Krieg',\n", + " 'Der gute Film',\n", + " 'Der jüdische Arbeiter',\n", + " 'Der wahre Jude',\n", + " 'Der Österreichische Schulbote',\n", + " 'Der österreichische Volkswirt',\n", + " 'Deutsch-Englischer-Reise-Courier',\n", + " 'Deutsch-Österreichische tierärztliche Wochenschrift',\n", + " 'Deutsche Kriegszeitung von Baranowitschi',\n", + " 'Deutsche Musik-Zeitung',\n", + " 'Deutsche Presse',\n", + " 'Deutsche Volkszeitung',\n", + " 'Deutsche Zeitung',\n", + " 'Deutsche Zeitung. Vereinigt mit der \"Heimat\"',\n", + " 'Deutsches Nordmährerblatt',\n", + " 'Deutsches Südmährerblatt',\n", + " 'Deutsches Volksblatt',\n", + " 'Die Arbeit',\n", + " 'Die Arbeit. Sozialdemokratisches Organ der Arbeiter Österreichs.',\n", + " 'Die Arbeiterin: Organ für die Interessen der werktätigen Frauen in Österreich',\n", + " 'Die Bombe',\n", + " 'Die Bühne',\n", + " 'Die Debatte',\n", + " 'Die Emancipation. 
Zeitschrift für Frauen',\n", + " 'Die Feuerwehr',\n", + " 'Die Filmwelt',\n", + " 'Die Frau und Mutter',\n", + " 'Die Frau und ihre Interessen',\n", + " 'Die Gartenlaube für Österreich',\n", + " 'Die Gewerkschaft',\n", + " 'Die Glühlichter',\n", + " 'Die Hausfrau: Blätter für Haus und Wirthschaft',\n", + " 'Die Hausfrau: Offizielles Organ der Reichsorganisation der Hausfrauen Österreichs',\n", + " 'Die Hausgehilfin: Zeitschrift des Verbandes der Christlichen Hausgehilfinnen Österreichs',\n", + " 'Die Kindes-Seele',\n", + " 'Die Kinowoche',\n", + " 'Die Leuchtrakete',\n", + " 'Die Lokomotive',\n", + " 'Die Lyra',\n", + " 'Die Mode der eleganten Frau',\n", + " 'Die Moderne Welt',\n", + " 'Die Muskete',\n", + " 'Die Mutter. Halbmonatsschrift für alle Fragen der Schwangerschaft',\n", + " 'Die Mädchenschule. Ein Organ für die gesammten Interessen der weiblichen Erziehung',\n", + " 'Die Neue Zeitung',\n", + " 'Die Neuzeit',\n", + " 'Die Postanstaltsbeamtin',\n", + " 'Die Presse',\n", + " 'Die Rechtsprechung',\n", + " 'Die Rote Fahne',\n", + " 'Die Sonne',\n", + " 'Die Spruchpraxis',\n", + " 'Die Stimme',\n", + " 'Die Unzufriedene',\n", + " 'Die Vedette',\n", + " 'Die Waffen nieder!',\n", + " 'Die Wahrheit',\n", + " 'Die Weltpresse',\n", + " 'Die Wählerin. Sozialdemokratisches Frauen-Wochenblatt',\n", + " 'Die Zeit',\n", + " 'Die bildenden Künste',\n", + " 'Die kluge Frau',\n", + " 'Die moderne Frau',\n", + " 'Die nationale Frau',\n", + " 'Die Österreicherin',\n", + " \"Dillinger's Reisezeitung\",\n", + " 'Diogenes',\n", + " 'Dokumente der Frauen',\n", + " 'Domov (Die Heimat)',\n", + " 'Donauland. 
Illustrierte Monatsschrift',\n", + " 'Dornaer Curblatt',\n", + " 'Drogisten Zeitung',\n", + " 'Dělnické listy',\n", + " 'Echo aus Pilsen und Westböhmen',\n", + " 'Eggenburger Zeitung',\n", + " 'Eideseis dia ta anatolika mere',\n", + " 'Elektrotechnik und Maschinenbau',\n", + " 'Elisabeth-Blatt',\n", + " 'Ephemeris',\n", + " 'Epoche',\n", + " 'Erste Allgemeine Nachrichten',\n", + " 'Erste allgemeine österr(eichische) Hebammen-Zeitung',\n", + " 'Eva',\n", + " 'Evangelische Kirchen-Zeitung für Österreich',\n", + " 'Evangelisches Gemeindeblatt für Galizien und die Bukowina',\n", + " 'Extraausgaben des 1. Weltkrieges',\n", + " 'Extract-Schreiben (Europaeische Zeitung)',\n", + " 'Fachblatt für Raseur-, Friseur- und Perückenmacher-Genossenschaft',\n", + " 'Feldblatt',\n", + " 'Feldkircher Anzeiger',\n", + " 'Feldkircher Wochenblatt',\n", + " 'Feldkircher Zeitung',\n", + " 'Feldpostbrief Niederdonau',\n", + " 'Feldpostbrief der 56er',\n", + " 'Feldpostbrief der Gefolgschaft des Postamtes Waidhofen an der Thaya',\n", + " 'Feuerwehr-Signale',\n", + " 'Figaro',\n", + " 'Floridsdorfer Zeitung',\n", + " 'Franzensbader Curliste',\n", + " 'Frau und Volk',\n", + " 'Frauen-Briefe/Österreichische Frauenzeitung/Katholische Frauenzeitung',\n", + " 'Frauen-Kalender',\n", + " 'Frauen-Kalender/Frauen-Jahrbuch',\n", + " 'Frauen-Werke',\n", + " 'Frauen-Wohltätigkeits-Verein für Wien und Umgebung',\n", + " 'Frauenarbeit und Frauenrecht: Zeitung für die erwerbenden christlichen Frauen und Mädchen',\n", + " 'Frauenblätter',\n", + " 'Frauenbote',\n", + " 'Frauentag',\n", + " 'Free Austria',\n", + " 'Freie Pädagogische Blätter',\n", + " 'Freies Blatt',\n", + " 'Freies Österreich',\n", + " 'Freiheit!',\n", + " 'Fremden-Blatt',\n", + " 'Fremdenblatt - Organ für die böhmischen Kurorte',\n", + " 'Friseur und Fortschritt',\n", + " 'Frisierkunst der Mode',\n", + " \"Fromme's Österreichischer Feuerwehr-Kalender\",\n", + " 'Front und Heimat',\n", + " 'Frontbriefe des N[ational-]S[ozialistischen] 
L[ehrer-]B[undes], Kreiswaltung W[iene]r Neustadt',\n", + " 'Frontzeitung. Kreiswaltung Nikolsburg des N.S.-Lehrerbundes',\n", + " 'Frühneuzeit-Info',\n", + " 'Fugger - Zeitungen',\n", + " 'Fußball-Sonntag',\n", + " \"Für's Jagdschloß (Organ der Jagdherren Österreich-Ungarns)\",\n", + " 'G. K. B.-Zeitung (Graz-Köflacher-Bergbaugesellschafts-Zeitung) für Eisenbahn und Bergbau',\n", + " 'Gambrinus, Brauerei- und Hopfen-Zeitung',\n", + " 'Genossenschafts- und Vereins-Zeitung',\n", + " 'Gerechtigkeit',\n", + " 'Gerichts-Zeitung',\n", + " 'Gerichtshalle',\n", + " 'Glück Auf!',\n", + " 'Gotscheer Zeitung',\n", + " 'Gottscheer Bote',\n", + " 'Grazer Kunst',\n", + " 'Grazer Mittags-Zeitung',\n", + " 'Grazer Tagblatt',\n", + " 'Grazer Volksblatt',\n", + " 'Grazer Vorortezeitung: Organ f. d. Umgebungsgemeinden v. Graz',\n", + " 'Götz von Berlichingen',\n", + " 'Halleiner Bothe',\n", + " 'Hebammen-Zeitung',\n", + " 'Hebammenzeitschrift',\n", + " 'Heimat',\n", + " 'Hellenikos telegraphos',\n", + " 'Hermes ho logios',\n", + " 'Heroldo de Cinio',\n", + " 'Humor. Beilage des \"Neuen Wiener Journal\"',\n", + " 'Il Giornaletto di Pola',\n", + " 'Il Popolo Istriano',\n", + " 'Il Proletario',\n", + " 'Ill. Fremden-Zeitung/Ill. österr. Alpenzeitung für Tirol, ...',\n", + " 'Illustrierte Flora',\n", + " 'Illustrierte Kronen Zeitung',\n", + " 'Illustrierte Mädchenzeitung',\n", + " 'Illustrierte Sport-Zeitung',\n", + " 'Illustrierte Wochenpost',\n", + " 'Illustrierter Film-Kurier',\n", + " 'Illustrierter Wegweiser durch die österreichischen Kurorte, Sommerfrischen und Winterstationen',\n", + " 'Illustriertes (Österreichisches) Sportblatt',\n", + " 'Illustriertes Familienblatt. 
Häuslicher Ratgeber für Österreichs Frauen',\n", + " 'Illustriertes Österreichisches Journal',\n", + " 'Illustrirte Sport Zeitung',\n", + " 'Illustrirtes Wiener Extrablatt',\n", + " 'Innsbrucker Nachrichten',\n", + " 'Innviertler Heimatblatt',\n", + " 'Internationale Ausstellungs-Zeitung',\n", + " 'Internationale Reisezeitung',\n", + " 'Internationale klinische Rundschau',\n", + " 'Ischler Fremden-Salon',\n", + " 'Israelitischer Frauenwohltätigkeits-Verein in Ung. -Brod. Jahresbericht über das abgelaufene Vereinsjahr',\n", + " 'Jahrbuch der Gesellschaft für die Geschichte des Protestantismus in Österreich',\n", + " 'Jahrbuch des Bundes österreichischer Frauenvereine mit Kalender',\n", + " 'Jahrbuch des Voralberger Landesmuseumsvereins',\n", + " 'Jahrbuch des k.u.k. auswärtigen Dienstes',\n", + " 'Jahres-Ausweis des israel. Frauenvereins in Brünn',\n", + " 'Jahres-Bericht des Frauen-Erwerb-Vereines in Klagenfurt',\n", + " 'Jahres-Bericht des Vereines der Schriftstellerinnen und Künstlerinnen in Wien',\n", + " 'Jahres-Bericht des Öffentlichen Mädchen-Lyzeums Liste',\n", + " 'Jahresbericht Akademisches Gymnasium Wien',\n", + " 'Jahresbericht Josefstädter Obergymnasium',\n", + " 'Jahresbericht Schottengymnasium Wien',\n", + " 'Jahresbericht Staats-Unterrealschule Margareten',\n", + " 'Jahresbericht Verein Kunstschule für Frauen und Mädchen',\n", + " 'Jahresbericht der Frauenvereinigung für soziale Hilfstätigkeit',\n", + " 'Jahresbericht der Schulen des Frauenerwerb-Vereins',\n", + " 'Jahresbericht der städtischen Volksschule für Mädchen',\n", + " 'Jahresbericht des \"Neuen Frauenklub\"',\n", + " 'Jahresbericht des Allgemeinen Frauenvereines der evangelischen Landeskirche A.B. 
in den siebenbürgischen Landesteilen Ungarns',\n", + " 'Jahresbericht des Ersten Frauen-Industrie-Vereines fiür das Königreich Böhmen / Vyrocni Zprava Proniho zenskeho',\n", + " 'Jahresbericht des Ersten Frauen-Industrie-Vereines für das Königreich Böhmen',\n", + " 'Jahresbericht des Evangelischen Frauen-Vereines in Wien',\n", + " 'Jahresbericht des Frauen-Vereines zur Unterstützung der Armen in Bregenz',\n", + " 'Jahresbericht des Frauen-Vereines zur Unterstützung der evangelischen Mädchenschule in Hermannstadt',\n", + " 'Jahresbericht des Frauen-Wohlthätigkeits-Vereines für Wien und Umgebung',\n", + " 'Jahresbericht des Frauen-Wohltiätigkeits-Vereines Franz Josef-Kinderhort Wien',\n", + " 'Jahresbericht des Frauenhilfsvereines des Roten Kreuzes',\n", + " 'Jahresbericht des Frauenhort israelitischer Frauen-Wohlthätigkeits-Verein im Bezirke Alsergrund in Wien',\n", + " 'Jahresbericht des Frauenvereines der Gustav Adolf-Stiftung in Wien',\n", + " 'Jahresbericht des Gustav-Adolf-Frauenvereines in Prag',\n", + " 'Jahresbericht des Immaculata-Vereines ',\n", + " 'Jahresbericht des Isr(aelitischen) Frauen-Wohlthätigkeits-Vereines für Wieden und Margarethen',\n", + " 'Jahresbericht des Kaiser Franz Josef-Mädchen-Lyzeums der Stadt Znaim',\n", + " 'Jahresbericht des Mädchen-Lyzeums am Kohlmarkt',\n", + " 'Jahresbericht des Mädchen-Lyzeums der Frauen Ursulinen in Innsbruck',\n", + " 'Jahresbericht des Mädchen-Unterstützungs-Vereines in Wien',\n", + " 'Jahresbericht des Männergesangsvereines in Wien',\n", + " 'Jahresbericht des Privat-Mädchen-Lyzeums Luithlen Wien I',\n", + " 'Jahresbericht des Vereines \"Wiener Frauenheim\"',\n", + " 'Jahresbericht des Vereines für erweiterte Frauenbildung in Wien',\n", + " 'Jahresbericht des christlichen Frauenvereines zu Baumgarten',\n", + " 'Jahresbericht des deutschen Mädchenlyzeums in Budweis',\n", + " 'Jahresbericht des deutschen Prager Frauen-Erwerb-Vereins',\n", + " 'Jahresbericht des evangelischen Frauen-Vereins in Mödling',\n", + 
" 'Jahresbericht des israelitischen Frauen-Vereines im XVIII. Bezirke (Währing) von Wien',\n", + " 'Jahresbericht des israelitischen Frauen-Wohlthätigkeits-Vereins des VIII Bezirkes',\n", + " 'Jahresbericht des k.k. Maximiliangymnasium in Wien',\n", + " 'Jahresbericht des unter dem Protectorate der Frau Gräfin Marie Bamberg stehenden Hilfsvereines für Privat-Lehrerinnen, Erzieherinnen und Bonnen in Graz',\n", + " 'Jahresbericht des öffentlichen Wiedner Mädchen-Lyzeums und der Reform-Realgymnasialen Oberklassen',\n", + " 'Jahresbericht Öffentliche Handelsschule für Mädchen des Frauenerwerb-Vereines in Brünn',\n", + " 'Jahresbericht Öffentliches Reformrealgymnasium für Mädchen, Öffentliches Mädchenlyzeum',\n", + " 'Jahresbericht über die Tätigkeit des Frauen-Vereines für die Mädchen-Arbeitsschule (...) in Klagenfurt',\n", + " 'Jahresbericht über die israelitische Kinderbewahr-Anstalt zu Wien, Leopoldstadt, Schiffamtsgasse No 77',\n", + " 'Jahresrechenschaft des Görzer Frauenvereines zur Unterstützung der Armen',\n", + " 'Janus',\n", + " 'Journal für Freymaurer: Als Manuskript gedruckt für Brüder und Meister des Ordens',\n", + " 'Jubiläumsnummer der Wiener Zeitung 1703-1903',\n", + " 'Juristische Blätter',\n", + " 'Jörgel Briefe',\n", + " 'Jüd. Frauen-Wohltätigkeits- und Freitisch-Verein für Ungi. 
Hradisch und Umgebung',\n", + " 'Jüdische Korrespondenz',\n", + " 'Jüdische Mittagszeitung',\n", + " 'Jüdische Presse',\n", + " 'Jüdische Volksstimme',\n", + " 'Jüdisches Gefühl',\n", + " 'KFO-Arbeit',\n", + " 'Kamera Kunst',\n", + " 'Karnisch-Julische Kriegszeitung',\n", + " 'Kartographische und Schulgeographische Zeitschrift',\n", + " 'Kaufmännische Zeitschrift',\n", + " 'Kikeriki',\n", + " 'Kindergarderobe',\n", + " 'Kinematographische Rundschau',\n", + " 'Kirchliches Verordnungs-Blatt für die Seckauer Diözese',\n", + " 'Kirchliches Verordnungsblatt für die Diözese Gurk',\n", + " 'Klagenfurter Zeitung',\n", + " 'Kleine Volks-Zeitung',\n", + " 'Kleine Wiener Kriegszeitung',\n", + " 'Kleiner Missionsbote',\n", + " 'Krakauer Tagblatt',\n", + " 'Krasso-Szörenyi lapok',\n", + " 'Kremser Feuerwehr-Zeitung',\n", + " 'Kriegsblatt der Palatina',\n", + " 'Kriegssammler-Zeitung',\n", + " 'Kriegszeitung der 4. Armee',\n", + " 'Kriegszeitung des A.T.V. Graz',\n", + " 'Kurjer Stanislawowski',\n", + " 'Kuryer Lwowski (Lemberger Courier)',\n", + " 'Kärntner Volkszeitung und Heimatblatt',\n", + " \"L'Eco dell'Adriatico\",\n", + " \"L'Eco di Pola\",\n", + " \"L'Esperanto Itala Esperanto Revuo\",\n", + " \"L'Istria\",\n", + " 'La Fiamma',\n", + " 'La Progreso',\n", + " 'La nova epoko',\n", + " 'Lagerzeitung für Wagna',\n", + " 'Laibacher Diöcesanblatt',\n", + " 'Landesamtsblatt für das Burgenland',\n", + " 'Landpost',\n", + " 'Lavanttaler Bote',\n", + " 'Le Grand Tailleur',\n", + " 'Leitmeritzer Zeitung',\n", + " 'Linzer Diözesanblatt',\n", + " 'Linzer Volksblatt',\n", + " 'Liste der Curgäste und Fremden in Wildbad-Gastein',\n", + " 'Lombardo-Venetien',\n", + " 'London Information of the Austrian Socialists in Great Britain',\n", + " 'MA',\n", + " 'Marburger Zeitung',\n", + " 'Marchfeldbote',\n", + " 'Marienbader Curliste',\n", + " 'Matador-Zeitung',\n", + " 'Medzunarodnyj Jazyk',\n", + " 'Mein Eigenheim: Mitteilungen des Österr. 
Bauhilfe-Vereins Kufstein',\n", + " 'Mein Film',\n", + " 'Meine erste Zeitung',\n", + " 'Mitteilung des Zentral-Vereines der staatlichen Vertragsbeamtinnen',\n", + " 'Mitteilungen (Mittheilungen) des Vereines der Schrebergärtner \"Wasserwiese\"',\n", + " 'Mitteilungen der Gesellschaft für Salzburger Landeskunde',\n", + " 'Mitteilungen des Deutschtirolischen Feuerwehr-Landes-Verbandes',\n", + " 'Mitteilungen des Frauenvereins \"Diskutierklub\"',\n", + " 'Mitteilungen des Reichsvereines der Post- und Telegraphenmanipulantinnen',\n", + " 'Mitteilungen des Vereines der deutschen Lehrerinnen in Mähren',\n", + " 'Mitteilungen des k. k. Ministeriums des Innern über Fürsorge für Kriegsgeschädigte',\n", + " 'Mitteilungen des n.-öst. Landes-Feuerwehr-Verbandes',\n", + " 'Mitteilungen des Österr. Bundes für Mutterschutz',\n", + " 'Mitteilungsblatt der Stadtwerke Graz an die eingerückten Kameraden',\n", + " 'Mittheilungen der kaiserl. königl. Central-Commission zur Erforschung und Erhaltung der Baudenkmale',\n", + " 'Mittheilungen der kaiserlich-königlichen Geographischen Gesellschaft',\n", + " 'Mittheilungen des Vereines der Lehrerinnen und Erzieherinnen in Österreich',\n", + " 'Mittheilungen des kais. königl. Militär-Geographischen Institutes',\n", + " 'Mocca',\n", + " 'Moderne illustrierte Zeitung für Reise und Sport',\n", + " 'Monatsschrift für den Orient',\n", + " 'Montags Zeitung',\n", + " 'Montags-Revue aus Böhmen',\n", + " 'Montfort',\n", + " 'Morgen-Post',\n", + " 'Musikalisch-literarischer Monatsbericht über neue Musikalien, musikalische Schriften und Abbildungen',\n", + " 'Musikalisches Wochenblatt',\n", + " 'Mädchenhort',\n", + " 'Mährisch-Schlesische Presse',\n", + " 'Mährisches Tagblatt',\n", + " 'Mödlinger Zeitung',\n", + " 'N.-Oe. Landpresse Stockerauer Zeitung',\n", + " 'N.-Oe. Landpresse Vöslauer Zeitung',\n", + " 'NS Telegraf',\n", + " 'NU - Jüdisches Magazin für Politik und Kultur',\n", + " 'Nachr. d. Verb. d. Spar- u. 
Darlehenskassenvereine in Vorarlberg',\n", + " 'Nachrichten der Sektion \"Austria\" des Dt. u. Österr. Alpenvereins',\n", + " 'Nachrichten der Sektion \"Donauland\" des Dt. u. Österr. Alpenvereins',\n", + " 'Nachrichten über Verwundete und Verletzte',\n", + " 'Narod. Das Volk',\n", + " 'Nasa Sloga',\n", + " 'Nasa dolja. Zbirnyk prac riznych avtoria',\n", + " 'Neue Freie Presse',\n", + " 'Neue Illustrirte Zeitung',\n", + " 'Neue Kino-Rundschau',\n", + " 'Neue Klosterneuburger Zeitung',\n", + " 'Neue Schlesische Zeitung',\n", + " 'Neue Warte am Inn',\n", + " 'Neue Wiener Friseur-Zeitung',\n", + " 'Neue Wiener Musik-Zeitung',\n", + " 'Neue Zeit- Organ der Kommunistischen Partei Oberösterreichs',\n", + " 'Neue Zeitschrift für Musik',\n", + " 'Neues 8 Uhr Blatt',\n", + " 'Neues Frauenleben',\n", + " 'Neues Fremden-Blatt',\n", + " 'Neues Wiener Journal',\n", + " 'Neues Wiener Tagblatt (Tages-Ausgabe)',\n", + " 'Neues Wiener Tagblatt (Wochen-Ausgabe)',\n", + " 'Neues Zentral-Organ der Hotel-, Gast- und Kaffeehaus-Angestellten',\n", + " 'Neues Österreich',\n", + " 'Neueste Bürser Funken-Zeitung',\n", + " 'Niederösterreichischer Almanach',\n", + " 'Niederösterreichischer Grenzbote',\n", + " 'Niederösterreichsiche Volks- und Vereinszeitung',\n", + " 'Nordböhmisches Volksblatt',\n", + " 'Nordmährische Rundschau',\n", + " \"Nouvelles d'Autriche. 
Österreichische Nachrichten.\",\n", + " 'Novitäten-Anzeiger für den Colportage Buchhandel',\n", + " 'Oberwarther Sonntags-Zeitung',\n", + " 'Oberösterreichische Nachrichten',\n", + " 'Oesterreichische Buchhändler-Correspondenz',\n", + " 'Oesterreichische Gartenlaube',\n", + " 'Oesterreichische Morgenzeitung und Handelsblatt',\n", + " 'Oesterreichischer Soldatenfreund',\n", + " 'Oesterreichisches Journal',\n", + " 'Oficiala Gazeto Esperantista',\n", + " 'Ordinariats-Blatt der Budweiser Diöcese',\n", + " 'Ordinariatsblatt der Königgrätzer Diözese',\n", + " 'Ordinariatsblatt der Leitmeritzer Diözese',\n", + " 'Panzer voran',\n", + " 'Parlamentarische Chronik. Beilage zur politischen Chronik',\n", + " 'Perfekte Mode',\n", + " 'Pester Lloyd',\n", + " 'Pettauer Anzeiger',\n", + " 'Pettauer Localanzeiger',\n", + " 'Pettauer Wochenblatt',\n", + " 'Pettauer Zeitung',\n", + " 'Philologikos telegraphos',\n", + " 'Photo Sport',\n", + " 'Photo-Börse',\n", + " 'Photographische Chronik',\n", + " 'Photographische Correspondenz',\n", + " 'Photographische Revue',\n", + " 'Pilsner Abendpost',\n", + " 'Pilsner Fremdenblatt',\n", + " 'Pilsner Tagblatt',\n", + " 'Polen - Wochenschrift für polnische Interessen',\n", + " 'Politische Chronik',\n", + " 'Politische Frauen-Zeitung',\n", + " 'Populäre österreichische Gesundheits-Zeitung',\n", + " 'Prager Abendblatt',\n", + " 'Prager Tagblatt',\n", + " 'Praktischer Ratgeber',\n", + " 'Radfahr-Sport',\n", + " 'Radio Wien',\n", + " 'Ragusäer Diöcesanblatt',\n", + " 'Ramingsteiner Heimatbrief',\n", + " 'Rechenschaftsbericht der Missionsvereinigung katholischer Frauen und Jungfrauen Oesterreichs',\n", + " 'Rechenschaftsbericht der Ortsgruppe Landstrasse des \"Christlichen Wiener Frauenbundes\"',\n", + " 'Rechenschaftsbericht des Brünner Frauenerwerb-Vereines',\n", + " 'Rechenschaftsbericht des Bundes Oesterreichischer Frauenvereine',\n", + " 'Rechenschaftsbericht des Ersten Wiener Kneipp-Vereines christlicher Frauen',\n", + " 'Rechenschaftsbericht 
des deutschen Frauenvereines in Brünn',\n", + " 'Reichenhaller Badeblatt',\n", + " 'Reichs-Organ der Arbeiter-Radfahrer',\n", + " 'Reichspost',\n", + " 'Revolution 1848',\n", + " 'Richtliniensammlung',\n", + " 'Rohö-Frauen-/Flugblatt',\n", + " 'Rote Frauenpost',\n", + " 'Rundschreiben Werkluftschutz-Bereichsstelle Donau-Alpenland',\n", + " 'Russische Rundschau',\n", + " 'Russische Rundschau (russische Ausgabe)',\n", + " 'SA in Feldgrau',\n", + " 'SRD',\n", + " 'Sa Rodinu (Für die Heimat)',\n", + " 'Salzburger Bote',\n", + " 'Salzburger Chronik für Stadt und Land',\n", + " 'Salzburger Montags-Zeitung',\n", + " 'Salzburger Nachrichten',\n", + " 'Salzburger Sportblatt',\n", + " 'Salzburger Tagblatt',\n", + " 'Salzburger Volksblatt: unabh. Tageszeitung f. Stadt u. Land Salzburg',\n", + " 'Salzburger Wacht',\n", + " 'Sankt Fidelis Blatt',\n", + " 'Schuhmacher Fachblatt',\n", + " 'Seidels Reklame',\n", + " 'Sennaciulo',\n", + " 'Siebenbürgisch-Deutsches Wochenblatt',\n", + " 'Signale für die musikalische Welt',\n", + " 'Slovenka (Die Slovenin. Das Organ der slovenischen Frauenwelt)',\n", + " 'Slovenska Zena (Die slowenische Frau)',\n", + " 'Social-politische Frauen-Zeitung. Organ für die Gesammt-Interessen des Frauenlebens. ',\n", + " 'Sonder-Abdruck Amtsblatt Wien',\n", + " 'Sonntagsblätter',\n", + " 'Soziale Sicherheit',\n", + " 'Sport im Bild',\n", + " 'Sport und Salon',\n", + " 'St. 
Pöltner Diözesanblatt',\n", + " 'Stajerc',\n", + " 'Start (Film-Start)',\n", + " 'Statistische Monatsschrift',\n", + " 'Statistisches Jahrbuch der Stadt Wien',\n", + " 'Steirerland',\n", + " 'Steirische Grenzwacht',\n", + " 'Sterne und Blumen',\n", + " 'Steyrer Zeitung',\n", + " 'Streffleur katonai lapja: Tábori ujság',\n", + " \"Streffleur's Militärblatt\",\n", + " 'Streffleurovy vojenské listy: Plní noviny',\n", + " 'Südsteirische Post',\n", + " 'Tagblatt',\n", + " 'Teplitz-Schönauer Anzeiger',\n", + " 'The Voice of Austria',\n", + " 'Theater an der Wien - Theaterzettel',\n", + " 'Theaterzettel (Oper und Burgtheater in Wien)',\n", + " 'Tiroler Bauern-Zeitung',\n", + " 'Tiroler Soldaten-Zeitung',\n", + " 'Triestingtaler u. Piestingtaler Wochen-Blatt',\n", + " 'Tätigkeitsbericht der Section Mutterfürsorge des Vereines der deutschen Lehrerinnen in Miähren.',\n", + " 'Tätigkeitsbericht des Allgem. Österr. Frauenvereines',\n", + " 'Union. Zeitschrift für Versicherungswesen und Volkswirtschaft',\n", + " 'Unione nazionale',\n", + " 'Unterhaltungs-Blatt zum Alzeyer Anzeigeblatt',\n", + " 'Unteroffiziers-Zeitung',\n", + " 'Vaterländische Blätter',\n", + " 'Veinsblatt - Organ des Vereines der Heim- und Hausarbeiterinnen',\n", + " 'Ver Sacrum',\n", + " 'Verein der Österreichischen Richter',\n", + " 'Verlustliste',\n", + " 'Verlustliste Alphabetisches Verzeichnis',\n", + " 'Videnskjkyi iljustravonyi Kalendar (Wiener Illustrierter Kalender)',\n", + " 'Vistnyk Sojuza Vyzvolennja Ukraïny',\n", + " 'Volksblatt für Stadt und Land',\n", + " 'Volksblätter aus Salzburg',\n", + " 'Volksbote',\n", + " 'Volksfreund',\n", + " 'Volkspost',\n", + " 'Volkswille',\n", + " 'Volkswirtschaftliche Chronik',\n", + " 'Volkswirtschaftliche Wochenschrift',\n", + " 'Vom Nordkap bis nach Afrika',\n", + " 'Vorarlberger Landes-Zeitung',\n", + " 'Vorarlberger Landstimme',\n", + " 'Vorarlberger Nachrichten',\n", + " 'Vorarlberger Volksblatt',\n", + " 'Vorarlberger Volksbote',\n", + " 'Vorarlberger 
Volksfreund',\n", + " 'Vorarlberger Wacht',\n", + " 'Vorarlberger Zeitung',\n", + " 'Vídenské Noviny',\n", + " 'Warnsdorfer Volkszeitung',\n", + " 'Wasser und Sonne',\n", + " 'Werkszeitung der Österreichisch-Alpinen Montangesellschaft',\n", + " 'Werkzeitung Wien Staatsdruckerei',\n", + " 'Werkzeitung der Gebrüder Böhler & Co. A.G.',\n", + " 'Werkzeitung der Hammerbrotwerke',\n", + " 'Wiener Abendzeitung',\n", + " 'Wiener Allgemeine Zeitung',\n", + " 'Wiener Bauindustrie-Zeitung',\n", + " 'Wiener Bilder',\n", + " 'Wiener Blusenmodelle',\n", + " 'Wiener Caricaturen',\n", + " 'Wiener Diözesanblatt',\n", + " 'Wiener Feldpost',\n", + " 'Wiener Feuerwehrzeitung',\n", + " 'Wiener Freie Photographische Zeitung',\n", + " 'Wiener Hausfrauen-Verein',\n", + " 'Wiener Hausfrauen-Zeitung',\n", + " 'Wiener Illustrierte Zeitung',\n", + " 'Wiener Kommunal-Kalender und städtisches Jahrbuch',\n", + " 'Wiener Landwirtschaftliche Zeitung',\n", + " 'Wiener Magazin',\n", + " 'Wiener Medizinische Wochenschrift',\n", + " 'Wiener Mittagsblatt',\n", + " 'Wiener Moden Zeitung',\n", + " 'Wiener Moden- und Hauswesen-Zeitung',\n", + " 'Wiener Modenzeitung',\n", + " 'Wiener Montagblatt',\n", + " 'Wiener Montags-Journal',\n", + " 'Wiener Montags-Post',\n", + " 'Wiener Neueste Nachrichten',\n", + " 'Wiener Photographische Blätter',\n", + " 'Wiener Presse',\n", + " 'Wiener Revue',\n", + " 'Wiener Salonblatt',\n", + " 'Wiener Sonn- und Montags-Zeitung',\n", + " 'Wiener Theater-Zeitung (Bäuerles Theaterzeitung)',\n", + " 'Wiener Theaterzeitung',\n", + " 'Wiener Tierärztliche Monatsschrift',\n", + " 'Wiener Vororte-Zeitung',\n", + " 'Wiener Vorstadt-Presse',\n", + " 'Wiener Woche',\n", + " 'Wiener Zeitung',\n", + " 'Wiener neueste Nachrichten',\n", + " 'Wiener sozialdemokratische Bücherei',\n", + " 'Wienerische Kirchenzeitung',\n", + " 'Wienerwald-Bote',\n", + " 'Wir Leben',\n", + " 'Wochenblatt der Bauernschaft für Salzburg',\n", + " 'Wochenzeitschrift des ö. 
Ingenieur- und Architektenvereins',\n", + " 'Wr. Weltaustellungs-Zeitung / Int. Austellungs-Zeitung',\n", + " 'Ybbser Zeitung',\n", + " 'Zeitgeschichte',\n", + " 'Zeitschrift d. Österr. Reichs-Verbandes f. Feuerwehr- und Rettungswesen',\n", + " 'Zeitschrift der oberösterreichischen Feuerwehren',\n", + " 'Zeitschrift des deutschen und österreichischen Alpenvereins',\n", + " 'Zeitschrift für Frauen-Stimmrecht. Organ für die politischen Interessen der Frau',\n", + " 'Zeitschrift für Musikwissenschaft',\n", + " 'Zeitschrift für Notariat und freiwillige Gerichtsbarkeit in Österreich',\n", + " 'Zeitschrift für Schul-Geographie',\n", + " 'Zeitschrift für Volkswirtschaft, Sozialpolitik und Verwaltung',\n", + " 'Zeitschrift für das Privat- und Öffentliche Recht der Gegenwart',\n", + " 'Zeitschrift für ungarisches öffentliches- und Privatrecht',\n", + " 'Zeitung für Landwirtschaft',\n", + " 'Zentralvereinigung österreichischer Emigranten',\n", + " 'Znaimer Tagblatt',\n", + " 'Znaimer Wochenblatt',\n", + " 'Zollämter- und Finanzwach-Zeitung',\n", + " 'Österr. 
Wäschezeitung',\n", + " 'Österreichisch-kaiserlicher Hofkalender',\n", + " 'Österreichisch-ungarische Revue',\n", + " 'Österreichische Allgemeine Friseur-Zeitung',\n", + " 'Österreichische Alpen-Zeitung',\n", + " 'Österreichische Alpenpost',\n", + " 'Österreichische Alpine, Volks- und Gebirgs-Trachten-Zeitung',\n", + " 'Österreichische Anwalts-Zeitung',\n", + " 'Österreichische Badezeitung',\n", + " 'Österreichische Feuerwehrzeitung',\n", + " 'Österreichische Film-Zeitung',\n", + " 'Österreichische Forst-Zeitung',\n", + " 'Österreichische Frauenrundschau/Mitteilungen der Vereinigung der arbeitenden Frauen',\n", + " 'Österreichische Frauenwelt',\n", + " 'Österreichische Illustrierte Zeitung',\n", + " 'Österreichische Kunst-Chronik',\n", + " 'Österreichische Land-Zeitung',\n", + " 'Österreichische Lehrerinnen-Zeitung',\n", + " 'Österreichische Musik- und Theaterzeitung',\n", + " 'Österreichische Nähmaschinen- und Fahrrad-Zeitung',\n", + " 'Österreichische Photographen-Zeitung',\n", + " 'Österreichische Revue',\n", + " 'Österreichische Schachrundschau',\n", + " 'Österreichische Schachzeitung',\n", + " 'Österreichische Statistik, 1880-',\n", + " 'Österreichische Statistik, Neue Folge, 1910-1915',\n", + " 'Österreichische Straßenbahner-Zeitung',\n", + " 'Österreichische Straßenbahnerzeitung',\n", + " 'Österreichische Touristenzeitung',\n", + " 'Österreichische Verbands-Feuerwehr-Zeitung',\n", + " 'Österreichische Volksstimme',\n", + " 'Österreichische Volkszeitung',\n", + " 'Österreichische Wochenschrift für Wissenschaft und Kunst',\n", + " 'Österreichische Zeitschrift für Gesetzgebung und Rechtsprechung',\n", + " 'Österreichische Zeitschrift für Strafrecht',\n", + " 'Österreichische Zeitschrift für Verwaltung',\n", + " 'Österreichischer Beobachter',\n", + " 'Österreichischer Straßenbahner',\n", + " 'Österreichischer/Europa Motor',\n", + " 'Österreichisches Abendblatt',\n", + " 'Österreichisches Kriegs-Echo',\n", + " 'Österreichisches Zentralblatt für die juristische 
Praxis',\n", + " 'Österreichs Ill. Zeitung - Kaiser-Huldigungs-Nummer 1917',\n", + " 'Österreichs Illustrierte Zeitung - Kaiser-Festnummer 1908',\n", + " 'Ženský svět']" + ] + }, + "execution_count": 7, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "sorted(df.dc_title.unique())" + ] + }, + { + "cell_type": "code", + "execution_count": 4, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "1032995" + ] + }, + "execution_count": 4, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "len(df)" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Unnamed: 0yearfrom_abolonger_page_idhas_ocrmeta_id
count1.032995e+061.032995e+061032995.01.032995e+061.032995e+061.032995e+06
mean5.164970e+051.893724e+030.04.366914e-039.100712e-015.174625e+05
std2.982001e+057.603773e+010.06.593821e-022.860799e-012.997619e+05
min0.000000e+001.000000e+000.00.000000e+000.000000e+001.000000e+00
25%2.582485e+051.883000e+030.00.000000e+001.000000e+002.582965e+05
50%5.164970e+051.904000e+030.00.000000e+001.000000e+005.165540e+05
75%7.747455e+051.919000e+030.00.000000e+001.000000e+007.748225e+05
max1.032994e+062.016000e+030.01.000000e+001.000000e+001.063239e+06
\n", + "
" + ], + "text/plain": [ + " Unnamed: 0 year from_abo longer_page_id has_ocr \\\n", + "count 1.032995e+06 1.032995e+06 1032995.0 1.032995e+06 1.032995e+06 \n", + "mean 5.164970e+05 1.893724e+03 0.0 4.366914e-03 9.100712e-01 \n", + "std 2.982001e+05 7.603773e+01 0.0 6.593821e-02 2.860799e-01 \n", + "min 0.000000e+00 1.000000e+00 0.0 0.000000e+00 0.000000e+00 \n", + "25% 2.582485e+05 1.883000e+03 0.0 0.000000e+00 1.000000e+00 \n", + "50% 5.164970e+05 1.904000e+03 0.0 0.000000e+00 1.000000e+00 \n", + "75% 7.747455e+05 1.919000e+03 0.0 0.000000e+00 1.000000e+00 \n", + "max 1.032994e+06 2.016000e+03 0.0 1.000000e+00 1.000000e+00 \n", + "\n", + " meta_id \n", + "count 1.032995e+06 \n", + "mean 5.174625e+05 \n", + "std 2.997619e+05 \n", + "min 1.000000e+00 \n", + "25% 2.582965e+05 \n", + "50% 5.165540e+05 \n", + "75% 7.748225e+05 \n", + "max 1.063239e+06 " + ] + }, + "execution_count": 5, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df.describe()" + ] + }, + { + "cell_type": "code", + "execution_count": 15, + "metadata": {}, + "outputs": [], + "source": [ + "older = df[(df['year'] < 1878) & (df['year'] > 1500)]" + ] + }, + { + "cell_type": "code", + "execution_count": 16, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "218107" + ] + }, + "execution_count": 16, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "len(older)" + ] + }, + { + "cell_type": "code", + "execution_count": 13, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "array([0])" + ] + }, + "execution_count": 13, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "df['from_abo'].unique()" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [ + "pages = pd.read_csv('data_pages.csv.gz', compression='gzip')" + ] + }, + { + "cell_type": "code", + "execution_count": 18, + "metadata": {}, + "outputs": [ + { + "data": { + 
"text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Unnamed: 0manifest_idpage_idstructure_infodateipfaddateiname
00dwr1911100100000006NaN/mnt/brz/dico03/m00/z02/h00/d00020076/z1883294...00000006.jpg
11dwr1911100100000007NaN/mnt/brz/dico03/m00/z02/h00/d00020076/z1883294...00000007.jpg
22dwr1911100100000008NaN/mnt/brz/dico03/m00/z02/h00/d00020076/z1883294...00000008.jpg
33dwr1911100100000009NaN/mnt/brz/dico03/m00/z02/h00/d00020076/z1883294...00000009.jpg
44dwr1911100100000010NaN/mnt/brz/dico03/m00/z02/h00/d00020076/z1883294...00000010.jpg
\n", + "
" + ], + "text/plain": [ + " Unnamed: 0 manifest_id page_id structure_info \\\n", + "0 0 dwr19111001 00000006 NaN \n", + "1 1 dwr19111001 00000007 NaN \n", + "2 2 dwr19111001 00000008 NaN \n", + "3 3 dwr19111001 00000009 NaN \n", + "4 4 dwr19111001 00000010 NaN \n", + "\n", + " dateipfad dateiname \n", + "0 /mnt/brz/dico03/m00/z02/h00/d00020076/z1883294... 00000006.jpg \n", + "1 /mnt/brz/dico03/m00/z02/h00/d00020076/z1883294... 00000007.jpg \n", + "2 /mnt/brz/dico03/m00/z02/h00/d00020076/z1883294... 00000008.jpg \n", + "3 /mnt/brz/dico03/m00/z02/h00/d00020076/z1883294... 00000009.jpg \n", + "4 /mnt/brz/dico03/m00/z02/h00/d00020076/z1883294... 00000010.jpg " + ] + }, + "execution_count": 18, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "pages.head()" + ] + }, + { + "cell_type": "code", + "execution_count": 19, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
Unnamed: 0manifest_idaidyeardaydc_titledc_title_additionalsubjectsplace_of_publicationslanguagesdc_typefrom_abometa_typeini_typelonger_page_iddc_datelink_pdflink_oldhas_ocrmeta_id
920920fug15050701fug150515050701Fugger - ZeitungenNaNTageszeitungo.O.denewspaper0brzanno01505-07-01http://anno.onb.ac.at/cgi-content/anno_pdf.pl?...http://anno.onb.ac.at/cgi-content/anno?aid=fug...01045922
921921fug15050725fug150515050725Fugger - ZeitungenNaNTageszeitungo.O.denewspaper0brzanno01505-07-25http://anno.onb.ac.at/cgi-content/anno_pdf.pl?...http://anno.onb.ac.at/cgi-content/anno?aid=fug...01045923
922922fug15070622fug150715070622Fugger - ZeitungenNaNTageszeitungo.O.denewspaper0brzanno01507-06-22http://anno.onb.ac.at/cgi-content/anno_pdf.pl?...http://anno.onb.ac.at/cgi-content/anno?aid=fug...01045924
923923fug15680120fug156815680120Fugger - ZeitungenNaNTageszeitungo.O.denewspaper0brzanno01568-01-20http://anno.onb.ac.at/cgi-content/anno_pdf.pl?...http://anno.onb.ac.at/cgi-content/anno?aid=fug...01045925
924924fug15680124fug156815680124Fugger - ZeitungenNaNTageszeitungo.O.denewspaper0brzanno01568-01-24http://anno.onb.ac.at/cgi-content/anno_pdf.pl?...http://anno.onb.ac.at/cgi-content/anno?aid=fug...01045926
\n", + "
" + ], + "text/plain": [ + " Unnamed: 0 manifest_id aid year day dc_title \\\n", + "920 920 fug15050701 fug 1505 15050701 Fugger - Zeitungen \n", + "921 921 fug15050725 fug 1505 15050725 Fugger - Zeitungen \n", + "922 922 fug15070622 fug 1507 15070622 Fugger - Zeitungen \n", + "923 923 fug15680120 fug 1568 15680120 Fugger - Zeitungen \n", + "924 924 fug15680124 fug 1568 15680124 Fugger - Zeitungen \n", + "\n", + " dc_title_additional subjects place_of_publications languages \\\n", + "920 NaN Tageszeitung o.O. de \n", + "921 NaN Tageszeitung o.O. de \n", + "922 NaN Tageszeitung o.O. de \n", + "923 NaN Tageszeitung o.O. de \n", + "924 NaN Tageszeitung o.O. de \n", + "\n", + " dc_type from_abo meta_type ini_type longer_page_id dc_date \\\n", + "920 newspaper 0 brz anno 0 1505-07-01 \n", + "921 newspaper 0 brz anno 0 1505-07-25 \n", + "922 newspaper 0 brz anno 0 1507-06-22 \n", + "923 newspaper 0 brz anno 0 1568-01-20 \n", + "924 newspaper 0 brz anno 0 1568-01-24 \n", + "\n", + " link_pdf \\\n", + "920 http://anno.onb.ac.at/cgi-content/anno_pdf.pl?... \n", + "921 http://anno.onb.ac.at/cgi-content/anno_pdf.pl?... \n", + "922 http://anno.onb.ac.at/cgi-content/anno_pdf.pl?... \n", + "923 http://anno.onb.ac.at/cgi-content/anno_pdf.pl?... \n", + "924 http://anno.onb.ac.at/cgi-content/anno_pdf.pl?... \n", + "\n", + " link_old has_ocr meta_id \n", + "920 http://anno.onb.ac.at/cgi-content/anno?aid=fug... 0 1045922 \n", + "921 http://anno.onb.ac.at/cgi-content/anno?aid=fug... 0 1045923 \n", + "922 http://anno.onb.ac.at/cgi-content/anno?aid=fug... 0 1045924 \n", + "923 http://anno.onb.ac.at/cgi-content/anno?aid=fug... 0 1045925 \n", + "924 http://anno.onb.ac.at/cgi-content/anno?aid=fug... 
0 1045926 " + ] + }, + "execution_count": 19, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "older.head()" + ] + }, + { + "cell_type": "code", + "execution_count": 20, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "1505" + ] + }, + "execution_count": 20, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "min(older['year'])" + ] + }, + { + "cell_type": "code", + "execution_count": 22, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "2102287" + ] + }, + "execution_count": 22, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "len(pages[pages['manifest_id'].isin(older['manifest_id'])])" + ] + }, + { + "cell_type": "code", + "execution_count": 23, + "metadata": {}, + "outputs": [ + { + "data": { + "text/plain": [ + "13928766" + ] + }, + "execution_count": 23, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "len(pages)" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": {}, + "outputs": [], + "source": [] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3 User Default", + "language": "python", + "name": "python_3_user_default" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.6.5" + } + }, + "nbformat": 4, + "nbformat_minor": 2 +}