Skip to content

Commit

Permalink
More metadata to model mapping
Browse files Browse the repository at this point in the history
  • Loading branch information
jwodder committed Aug 31, 2020
1 parent 54d1448 commit 3f2fe15
Show file tree
Hide file tree
Showing 2 changed files with 73 additions and 9 deletions.
51 changes: 42 additions & 9 deletions dandi/metadata.py
Original file line number Diff line number Diff line change
@@ -1,4 +1,7 @@
from functools import partial
import os.path as op
import re
from .models import AssetMeta, Biosample, PropertyValue
from .pynwb_utils import (
_get_pynwb_metadata,
get_neurodata_types,
Expand Down Expand Up @@ -85,14 +88,44 @@ def get_metadata(path):
return meta


def nwb2asset(nwb_path):
from .models import AssetMeta
def parse_age(age):
m = re.fullmatch(r"(\d+)\s*(y(ear)?|m(onth)?|w(eek)?|d(ay)?)s?", age, flags=re.I)
if m:
qty = int(m.group(1))
unit = m.group(2)[0].upper()
return f"P{qty}{unit}"
else:
raise ValueError(age)


def extract_age(metadata):
try:
duration = parse_age(metadata["age"])
except (KeyError, ValueError):
return None
return PropertyValue(value=duration)


def extract_model(modelcls, metadata):
m = modelcls.unvalidated()
for field in m.__fields__.keys():
setattr(m, field, extract_field(field, metadata))
return modelcls(**m)


FIELD_EXTRACTORS = {
"age": extract_age,
"wasDerivedFrom": partial(extract_model, Biosample),
}


def extract_field(field, metadata):
if field in FIELD_EXTRACTORS:
return FIELD_EXTRACTORS[field](metadata)
else:
return metadata.get(field)


def nwb2asset(nwb_path):
metadata = get_metadata(nwb_path)
asset = AssetMeta.unvalidated()
for field in asset.__fields__.keys():
try:
setattr(asset, field, metadata[field])
except KeyError:
pass
return asset
return extract_model(AssetMeta, metadata)
31 changes: 31 additions & 0 deletions dandi/tests/test_metadata.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,31 @@
import pytest
from ..metadata import parse_age


@pytest.mark.parametrize(
"age,duration",
[
("5y", "P5Y"),
("5Y", "P5Y"),
("5 years", "P5Y"),
("1year", "P1Y"),
("0y", "P0Y"),
("2 months", "P2M"),
("2 M", "P2M"),
("2 m", "P2M"),
("2M", "P2M"),
("2m", "P2M"),
("3 weeks", "P3W"),
("3 w", "P3W"),
("3 W", "P3W"),
("3w", "P3W"),
("3W", "P3W"),
("0 days", "P0D"),
("7 d", "P7D"),
("7 D", "P7D"),
("7d", "P7D"),
("7D", "P7D"),
],
)
def test_parse_age(age, duration):
assert parse_age(age) == duration

0 comments on commit 3f2fe15

Please sign in to comment.