Skip to content
Snippets Groups Projects
Commit 3b0e0926 authored by philip.roeggla
Browse files

Widmender

parent 3b5ec6d5
No related branches found
No related tags found
No related merge requests found
<?xml version="1.0" encoding="UTF-8"?>
<project version="4">
<component name="VcsDirectoryMappings">
<mapping directory="$PROJECT_DIR$" vcs="Git" />
</component>
</project>
\ No newline at end of file
import httpx import httpx
import pandas as pd import pandas as pd
import pytest import pytest
import typing
from travelogues_extraction.getrecords.session import RecordRetriever from travelogues_extraction.getrecords.session import RecordRetriever
from travelogues_extraction.getrecords.acnumber_extractor import extract_ac_from_series from travelogues_extraction.getrecords.acnumber_extractor import extract_ac_from_series
...@@ -83,7 +84,7 @@ async def test_multiple_classes(): ...@@ -83,7 +84,7 @@ async def test_multiple_classes():
await herausgeberGNDID.write(record) await herausgeberGNDID.write(record)
await übersetzerGNDID.write(record) await übersetzerGNDID.write(record)
await illustratorenGNDID.write(record) await illustratorenGNDID.write(record)
await widmenderGNDID.write(record_retriever) await widmenderGNDID.write(record)
assert target_dataframe.shape[0] == index + 1 assert target_dataframe.shape[0] == index + 1
if record.ac_number == 'AC09682453': if record.ac_number == 'AC09682453':
...@@ -208,11 +209,9 @@ async def test_multiple_classes(): ...@@ -208,11 +209,9 @@ async def test_multiple_classes():
assert übersetzerGNDID_list[0][0] == correct_übersetzer assert übersetzerGNDID_list[0][0] == correct_übersetzer
assert übersetzerGNDID_list[0][1].startswith('http://d-nb.info/gnd/') assert übersetzerGNDID_list[0][1].startswith('http://d-nb.info/gnd/')
print(index, record.ac_number, target_dataframe.at[record.ac_number, illustratorenGNDID.column])
if index == 0: if index == 0:
illval: str = target_dataframe.at[record.ac_number, illustratorenGNDID.column] illval: str = target_dataframe.at[record.ac_number, illustratorenGNDID.column]
illlist = [i.split(illustratorenGNDID.join_string_secondary_level) for i in illval.split(illustratorenGNDID.join_string_primary_level)] illlist = [i.split(illustratorenGNDID.join_string_secondary_level) for i in illval.split(illustratorenGNDID.join_string_primary_level)]
print(index, record.ac_number, illlist)
assert len(illlist) == 2 assert len(illlist) == 2
assert len(illlist[0]) == 2 assert len(illlist[0]) == 2
assert illlist[0][0][0].isalpha() assert illlist[0][0][0].isalpha()
...@@ -220,6 +219,22 @@ async def test_multiple_classes(): ...@@ -220,6 +219,22 @@ async def test_multiple_classes():
elif index == 1: elif index == 1:
assert target_dataframe.at[record.ac_number, illustratorenGNDID.column].__repr__() == 'nan' assert target_dataframe.at[record.ac_number, illustratorenGNDID.column].__repr__() == 'nan'
widmenderGNDID_val: typing.Union[str, float] = target_dataframe.at[record.ac_number, widmenderGNDID.column]
if index == 0:
assert widmenderGNDID_val.__class__ == str
widmenderGNDID_list = [
w.split(widmenderGNDID.join_string_secondary_level)
for w in widmenderGNDID_val.split(widmenderGNDID.join_string_primary_level)
]
assert widmenderGNDID_list.__len__() == 1
assert widmenderGNDID_list[0].__len__() == 2
assert widmenderGNDID_list[0][0][0].isalpha()
assert widmenderGNDID_list[0][1].startswith('http://d-nb.info/gnd/'
)
elif index == 1:
assert widmenderGNDID_val.__repr__() == 'nan'
index += 1 index += 1
if index == stop: if index == stop:
break break
......
0% Loading. Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Please register or sign in to comment