Skip to content
GitLab
Explore
Sign in
Primary navigation
Search or go to…
Project
T
Travelogues Extraction
Manage
Activity
Members
Labels
Plan
Issues
Issue boards
Milestones
Wiki
Code
Merge requests
Repository
Branches
Commits
Tags
Repository graph
Compare revisions
Snippets
Build
Pipelines
Jobs
Pipeline schedules
Artifacts
Deploy
Releases
Package registry
Model registry
Operate
Environments
Terraform modules
Monitor
Incidents
Analyze
Value stream analytics
Contributor analytics
CI/CD analytics
Repository analytics
Model experiments
Help
Help
Support
GitLab documentation
Compare GitLab plans
Community forum
Contribute to GitLab
Provide feedback
Keyboard shortcuts
?
Snippets
Groups
Projects
Show more breadcrumbs
labs-team
Travelogues Extraction
Commits
3b0e0926
Commit
3b0e0926
authored
5 years ago
by
philip.roeggla
Browse files
Options
Downloads
Patches
Plain Diff
Widmender
parent
3b5ec6d5
No related branches found
No related tags found
No related merge requests found
Changes
2
Show whitespace changes
Inline
Side-by-side
Showing
2 changed files
.idea/vcs.xml
+6
-0
6 additions, 0 deletions
.idea/vcs.xml
test/dataextractors/test_multiple.py
+18
-3
18 additions, 3 deletions
test/dataextractors/test_multiple.py
with
24 additions
and
3 deletions
.idea/vcs.xml
0 → 100644
+
6
−
0
View file @
3b0e0926
<?xml version="1.0" encoding="UTF-8"?>
<project
version=
"4"
>
<component
name=
"VcsDirectoryMappings"
>
<mapping
directory=
"$PROJECT_DIR$"
vcs=
"Git"
/>
</component>
</project>
\ No newline at end of file
This diff is collapsed.
Click to expand it.
test/dataextractors/test_multiple.py
+
18
−
3
View file @
3b0e0926
import
httpx
import
httpx
import
pandas
as
pd
import
pandas
as
pd
import
pytest
import
pytest
import
typing
from
travelogues_extraction.getrecords.session
import
RecordRetriever
from
travelogues_extraction.getrecords.session
import
RecordRetriever
from
travelogues_extraction.getrecords.acnumber_extractor
import
extract_ac_from_series
from
travelogues_extraction.getrecords.acnumber_extractor
import
extract_ac_from_series
...
@@ -83,7 +84,7 @@ async def test_multiple_classes():
...
@@ -83,7 +84,7 @@ async def test_multiple_classes():
await
herausgeberGNDID
.
write
(
record
)
await
herausgeberGNDID
.
write
(
record
)
await
übersetzerGNDID
.
write
(
record
)
await
übersetzerGNDID
.
write
(
record
)
await
illustratorenGNDID
.
write
(
record
)
await
illustratorenGNDID
.
write
(
record
)
await
widmenderGNDID
.
write
(
record
_retriever
)
await
widmenderGNDID
.
write
(
record
)
assert
target_dataframe
.
shape
[
0
]
==
index
+
1
assert
target_dataframe
.
shape
[
0
]
==
index
+
1
if
record
.
ac_number
==
'
AC09682453
'
:
if
record
.
ac_number
==
'
AC09682453
'
:
...
@@ -208,11 +209,9 @@ async def test_multiple_classes():
...
@@ -208,11 +209,9 @@ async def test_multiple_classes():
assert
übersetzerGNDID_list
[
0
][
0
]
==
correct_übersetzer
assert
übersetzerGNDID_list
[
0
][
0
]
==
correct_übersetzer
assert
übersetzerGNDID_list
[
0
][
1
].
startswith
(
'
http://d-nb.info/gnd/
'
)
assert
übersetzerGNDID_list
[
0
][
1
].
startswith
(
'
http://d-nb.info/gnd/
'
)
print
(
index
,
record
.
ac_number
,
target_dataframe
.
at
[
record
.
ac_number
,
illustratorenGNDID
.
column
])
if
index
==
0
:
if
index
==
0
:
illval
:
str
=
target_dataframe
.
at
[
record
.
ac_number
,
illustratorenGNDID
.
column
]
illval
:
str
=
target_dataframe
.
at
[
record
.
ac_number
,
illustratorenGNDID
.
column
]
illlist
=
[
i
.
split
(
illustratorenGNDID
.
join_string_secondary_level
)
for
i
in
illval
.
split
(
illustratorenGNDID
.
join_string_primary_level
)]
illlist
=
[
i
.
split
(
illustratorenGNDID
.
join_string_secondary_level
)
for
i
in
illval
.
split
(
illustratorenGNDID
.
join_string_primary_level
)]
print
(
index
,
record
.
ac_number
,
illlist
)
assert
len
(
illlist
)
==
2
assert
len
(
illlist
)
==
2
assert
len
(
illlist
[
0
])
==
2
assert
len
(
illlist
[
0
])
==
2
assert
illlist
[
0
][
0
][
0
].
isalpha
()
assert
illlist
[
0
][
0
][
0
].
isalpha
()
...
@@ -220,6 +219,22 @@ async def test_multiple_classes():
...
@@ -220,6 +219,22 @@ async def test_multiple_classes():
elif
index
==
1
:
elif
index
==
1
:
assert
target_dataframe
.
at
[
record
.
ac_number
,
illustratorenGNDID
.
column
].
__repr__
()
==
'
nan
'
assert
target_dataframe
.
at
[
record
.
ac_number
,
illustratorenGNDID
.
column
].
__repr__
()
==
'
nan
'
widmenderGNDID_val
:
typing
.
Union
[
str
,
float
]
=
target_dataframe
.
at
[
record
.
ac_number
,
widmenderGNDID
.
column
]
if
index
==
0
:
assert
widmenderGNDID_val
.
__class__
==
str
widmenderGNDID_list
=
[
w
.
split
(
widmenderGNDID
.
join_string_secondary_level
)
for
w
in
widmenderGNDID_val
.
split
(
widmenderGNDID
.
join_string_primary_level
)
]
assert
widmenderGNDID_list
.
__len__
()
==
1
assert
widmenderGNDID_list
[
0
].
__len__
()
==
2
assert
widmenderGNDID_list
[
0
][
0
][
0
].
isalpha
()
assert
widmenderGNDID_list
[
0
][
1
].
startswith
(
'
http://d-nb.info/gnd/
'
)
elif
index
==
1
:
assert
widmenderGNDID_val
.
__repr__
()
==
'
nan
'
index
+=
1
index
+=
1
if
index
==
stop
:
if
index
==
stop
:
break
break
...
...
This diff is collapsed.
Click to expand it.
Preview
0%
Loading
Try again
or
attach a new file
.
Cancel
You are about to add
0
people
to the discussion. Proceed with caution.
Finish editing this message first!
Save comment
Cancel
Please
register
or
sign in
to comment