diff --git a/.idea/vcs.xml b/.idea/vcs.xml new file mode 100644 index 0000000000000000000000000000000000000000..94a25f7f4cb416c083d265558da75d457237d671 --- /dev/null +++ b/.idea/vcs.xml @@ -0,0 +1,6 @@ + + + + + + \ No newline at end of file diff --git a/test/dataextractors/test_multiple.py b/test/dataextractors/test_multiple.py index 28d1825ce129e92aa428e46e69f37e88bad895da..7e18e132db5ca3d6e489be5221682c4c3a521975 100644 --- a/test/dataextractors/test_multiple.py +++ b/test/dataextractors/test_multiple.py @@ -1,6 +1,7 @@ import httpx import pandas as pd import pytest +import typing from travelogues_extraction.getrecords.session import RecordRetriever from travelogues_extraction.getrecords.acnumber_extractor import extract_ac_from_series @@ -83,7 +84,7 @@ async def test_multiple_classes(): await herausgeberGNDID.write(record) await übersetzerGNDID.write(record) await illustratorenGNDID.write(record) - await widmenderGNDID.write(record_retriever) + await widmenderGNDID.write(record) assert target_dataframe.shape[0] == index + 1 if record.ac_number == 'AC09682453': @@ -208,11 +209,9 @@ async def test_multiple_classes(): assert übersetzerGNDID_list[0][0] == correct_übersetzer assert übersetzerGNDID_list[0][1].startswith('http://d-nb.info/gnd/') - print(index, record.ac_number, target_dataframe.at[record.ac_number, illustratorenGNDID.column]) if index == 0: illval: str = target_dataframe.at[record.ac_number, illustratorenGNDID.column] illlist = [i.split(illustratorenGNDID.join_string_secondary_level) for i in illval.split(illustratorenGNDID.join_string_primary_level)] - print(index, record.ac_number, illlist) assert len(illlist) == 2 assert len(illlist[0]) == 2 assert illlist[0][0][0].isalpha() @@ -220,6 +219,22 @@ async def test_multiple_classes(): elif index == 1: assert target_dataframe.at[record.ac_number, illustratorenGNDID.column].__repr__() == 'nan' + widmenderGNDID_val: typing.Union[str, float] = target_dataframe.at[record.ac_number, widmenderGNDID.column] + + if index == 0: + assert widmenderGNDID_val.__class__ == str + widmenderGNDID_list = [ + w.split(widmenderGNDID.join_string_secondary_level) + for w in widmenderGNDID_val.split(widmenderGNDID.join_string_primary_level) + ] + assert widmenderGNDID_list.__len__() == 1 + assert widmenderGNDID_list[0].__len__() == 2 + assert widmenderGNDID_list[0][0][0].isalpha() + assert widmenderGNDID_list[0][1].startswith('http://d-nb.info/gnd/' + ) + elif index == 1: + assert widmenderGNDID_val.__repr__() == 'nan' + index += 1 if index == stop: break