Skip to content

Commit

Permalink
test: add reference to test data
Browse files Browse the repository at this point in the history
  • Loading branch information
cmdoret committed Jan 17, 2024
1 parent b05494d commit 78495c6
Show file tree
Hide file tree
Showing 17 changed files with 180 additions and 84 deletions.
70 changes: 33 additions & 37 deletions data/ex/data.zarr/.zmetadata
Original file line number Diff line number Diff line change
Expand Up @@ -5,66 +5,62 @@
},
"ex/.zattrs": {
"@type": "MODO",
"creation_date": "2024-01-03T00:00:00",
"has_assay": [
"demo-assay"
],
"last_update_date": "2024-01-04T00:00:00"
"creation_date": "2024-01-17T00:00:00",
"description": "Example modo for tests",
"last_update_date": "2024-01-17T00:00:00",
"name": "Example"
},
"ex/.zgroup": {
"zarr_format": 2
},
"ex/demo-assay/.zattrs": {
"ex/assay1/.zattrs": {
"@type": "Assay",
"description": "Fake dataset used for tests.",
"description": "Example assay for tests",
"has_data": [
"demo1",
"demo1",
"demo2"
"ex/assay1/demo1"
],
"has_sample": [
"ex/assay1/sample1"
],
"name": "E. coli dummy WGS",
"name": "Assay 1",
"omics_type": [
"GENOMICS"
]
},
"ex/demo-assay/.zgroup": {
"ex/assay1/.zgroup": {
"zarr_format": 2
},
"ex/demo-assay/demo1/.zattrs": {
"@type": "AlignmentSet",
"ex/assay1/demo1/.zattrs": {
"@type": "DataEntity",
"data_format": "CRAM",
"data_path": "demo1.cram",
"description": "E. coli wgs",
"has_sample": [
"bac1"
"description": "Demo CRAM file for tests.",
"has_reference": [
"ex/assay1/demo1/reference1"
],
"name": "demo 1"
"name": "Demo 1"
},
"ex/demo-assay/demo1/.zgroup": {
"ex/assay1/demo1/.zgroup": {
"zarr_format": 2
},
"ex/demo-assay/demo1/bac1/.zattrs": {
"@type": "Sample",
"collector": [
"SDSC"
],
"description": "A bacterial sample",
"name": "bac 1",
"taxon_id": [
562
]
"ex/assay1/demo1/reference1/.zattrs": {
"@type": "ReferenceGenome",
"data_path": "reference.fa",
"name": "reference 1"
},
"ex/demo-assay/demo1/bac1/.zgroup": {
"ex/assay1/demo1/reference1/.zgroup": {
"zarr_format": 2
},
"ex/demo-assay/demo2/.zattrs": {
"@type": "AlignmentSet",
"data_format": "CRAM",
"data_path": "demo2.cram",
"description": "E. coli wgs resequencing",
"name": "demo 2"
"ex/assay1/sample1/.zattrs": {
"@type": "Sample",
"collector": [
"Foo university"
],
"description": "A dummy sample for tests.",
"name": "Sample 1",
"sex": "Male"
},
"ex/demo-assay/demo2/.zgroup": {
"ex/assay1/sample1/.zgroup": {
"zarr_format": 2
}
},
Expand Down
9 changes: 4 additions & 5 deletions data/ex/data.zarr/ex/.zattrs
Original file line number Diff line number Diff line change
@@ -1,8 +1,7 @@
{
"@type": "MODO",
"has_assay": [
"demo-assay"
],
"creation_date": "2024-01-03T00:00:00",
"last_update_date": "2024-01-04T00:00:00"
"creation_date": "2024-01-17T00:00:00",
"description": "Example modo for tests",
"last_update_date": "2024-01-17T00:00:00",
"name": "Example"
}
14 changes: 14 additions & 0 deletions data/ex/data.zarr/ex/assay1/.zattrs
Original file line number Diff line number Diff line change
@@ -0,0 +1,14 @@
{
"@type": "Assay",
"description": "Example assay for tests",
"has_data": [
"ex/assay1/demo1"
],
"has_sample": [
"ex/assay1/sample1"
],
"name": "Assay 1",
"omics_type": [
"GENOMICS"
]
}
File renamed without changes.
10 changes: 10 additions & 0 deletions data/ex/data.zarr/ex/assay1/demo1/.zattrs
Original file line number Diff line number Diff line change
@@ -0,0 +1,10 @@
{
"@type": "DataEntity",
"data_format": "CRAM",
"data_path": "demo1.cram",
"description": "Demo CRAM file for tests.",
"has_reference": [
"ex/assay1/demo1/reference1"
],
"name": "Demo 1"
}
File renamed without changes.
5 changes: 5 additions & 0 deletions data/ex/data.zarr/ex/assay1/demo1/reference1/.zattrs
Original file line number Diff line number Diff line change
@@ -0,0 +1,5 @@
{
"@type": "ReferenceGenome",
"data_path": "reference.fa",
"name": "reference 1"
}
9 changes: 9 additions & 0 deletions data/ex/data.zarr/ex/assay1/sample1/.zattrs
Original file line number Diff line number Diff line change
@@ -0,0 +1,9 @@
{
"@type": "Sample",
"collector": [
"Foo university"
],
"description": "A dummy sample for tests.",
"name": "Sample 1",
"sex": "Male"
}
File renamed without changes.
13 changes: 0 additions & 13 deletions data/ex/data.zarr/ex/demo-assay/.zattrs

This file was deleted.

10 changes: 0 additions & 10 deletions data/ex/data.zarr/ex/demo-assay/demo1/.zattrs

This file was deleted.

11 changes: 0 additions & 11 deletions data/ex/data.zarr/ex/demo-assay/demo1/bac1/.zattrs

This file was deleted.

7 changes: 0 additions & 7 deletions data/ex/data.zarr/ex/demo-assay/demo2/.zattrs

This file was deleted.

Binary file removed data/ex/demo2.cram
Binary file not shown.
100 changes: 100 additions & 0 deletions data/ex/reference.fa
Original file line number Diff line number Diff line change
@@ -0,0 +1,100 @@
>BA000007.3 Escherichia coli O157:H7 str. Sakai DNA, part of genome
AGCTTTTCATTCTGACTGCAACGGGCAATATGTCTCTGTGTGGATTAAAAAAAGAGTCTCTGACAGCAGCTTCTGAACTG
GTTACCTGCCGTGAGTAAATTAAAATTTTATTGACTTAGGTCACTAAATACTTTAACCAATATAGGCATAGCGCACAGAC
AGATAAAAATTACAGAGTACACAACATCCATGAAACGCATTAGCACCACCATTACCACCACCATCACCACCACCATCACC
ATTACCATTACCACAGGTAACGGTGCGGGCTGACGCGTACAGGAAACACAGAAAAAAGCCCGCACCTGACAGTGCGGGCT
TTTTTTTCGACCAAAGGTAACGAGGTAACAACCATGCGAGTGTTGAAGTTCGGCGGTACATCAGTGGCAAATGCAGAACG
TTTTCTGCGGGTTGCCGATATTCTGGAAAGCAATGCCAGGCAGGGGCAGGTGGCCACCGTCCTCTCTGCCCCCGCCAAAA
TCACCAACCACCTGGTGGCGATGATTGAAAAAACCATTAGCGGCCAGGATGCTTTACCCAATATCAGCGATGCCGAACGT
ATTTTTGCCGAACTTCTGACGGGACTCGCCGCCGCCCAGCCGGGATTCCCGCTGGCGCAATTGAAAACTTTCGTCGACCA
GGAATTTGCCCAAATAAAACATGTCCTGCATGGCATTAGTTTGTTAGGGCAGTGCCCGGATAGCATTAACGCTGCGCTGA
TTTGCCGTGGCGAGAAAATGTCGATCGCCATTATGGCCGGCGTATTAGAAGCGCGCGGTCACAACGTTACCGTTATCGAT
CCGGTCGAAAAACTGCTGGCAGTGGGGCATTACCTCGAATCTACTGTCGATATTGCAGAGTCCACCCGCCGTATTGCGGC
AAGTCGTATTCCGGCTGATCACATGGTGCTGATGGCAGGTTTCACCGCCGGTAATGAAAAAGGCGAACTGGTGGTACTTG
GACGCAACGGTTCCGACTACTCCGCGGCGGTGCTGGCTGCCTGTTTACGCGCCGATTGTTGCGAGATTTGGACGGACGTT
GACGGGGTATATACCTGCGACCCGCGTCAGGTGCCCGATGCGAGGTTGTTGAAATCGATGTCCTACCAGGAAGCGATGGA
GCTTTCCTACTTCGGCGCTAAAGTTCTTCACCCCCGCACCATTACCCCCATCGCCCAGTTCCAGATCCCTTGCCTGATTA
AAAATACCGGAAATCCTCAAGCTCCAGGTACGCTCATTGGTGCCAGTCGTGATGAAGACGAATTACCGGTCAAGGGCATT
TCCAATCTGAATAATATGGCAATGTTCAGCGTTTCCGGCCCGGGGATGAAAGGAATGGTCGGCATGGCGGCGCGCGTCTT
TGCTGCAATGTCACGCGCCCGTATTTCCGTGGTGCTGATTACGCAATCATCTTCCGAATACAGTATCAGTTTCTGCGTTC
CGCAAAGCGACTGTGTGCGAGCTGAACGGGCAATGCAGGAAGAGTTCTACCTGGAACTGAAAGAAGGCTTACTGGAGCCG
CTGGCGGTGACGGAACGGCTGGCCATTATCTCGGTGGTAGGTGATGGTATGCGCACCTTGCGTGGGATCTCGGCGAAATT
CTTTGCCGCGCTGGCCCGCGCCAATATCAACATTGTCGCTATTGCTCAGGGATCTTCTGAACGCTCAATCTCTGTCGTGG
TAAATAACGATGATGCGACCACTGGCGTGCGCGTTACTCATCAGATGCTGTTCAATACCGATCAGGTTATCGAAGTGTTT
GTGATTGGCGTCGGTGGCGTTGGCGGTGCGCTGCTGGAGCAACTGAAGCGTCAGCAAAGCTGGTTGAAGAATAAACATAT
CGACTTACGTGTCTGCGGTGTTGCTAACTCGAAGGCTCTGCTCACCAATGTGCATGGCCTAAATCTGGAAAACTGGCAGG
AAGAACTGGCGCAAGCCAAAGAGCCGTTTAATCTCGGGCGCTTAATTCGCCTCGTGAAAGAATATCATCTGCTGAACCCG
GTCATTGTTGACTGCACCTCCAGCCAGGCAGTGGCGGATCAATATGCCGACTTCCTGCGCGAAGGTTTCCACGTTGTCAC
GCCGAACAAAAAGGCCAACACCTCGTCGATGGATTACTACCATCTGTTGCGTCATGCGGCTGAAAAATCGCGGCGTAAAT
TCCTCTATGACACCAACGTTGGGGCTGGATTACCGGTTATTGAGAACCTGCAAAATCTGCTCAATGCTGGTGATGAATTG
ATGAAGTTCTCCGGCATTCTTTCAGGTTCGCTTTCTTATATCTTCGGCAAGTTAGACGAAGGCATGAGTTTCTCCGAGGC
GACTACGCTGGCGCGGGAAATGGGTTATACCGAACCGGATCCGCGAGATGATCTTTCTGGTATGGATGTAGCGCGTAAAC
TATTAATTCTCGCTCGTGAAACGGGACGTGAACTGGAGCTGGCGGATATTGAAATTGAACCTGTGCTGCCCGCAGAGTTT
AACGCTGAGGGTGATGTTGCCGCTTTTATGGCGAATCTGTCACAGCTCGACGATCTCTTTGCCGCGCGCGTGGCGAAGGC
CCGTGATGAAGGAAAAGTTTTGCGCTATGTTGGCAATATTGATGAAGATGGCGTCTGCCGCGTGAAGATTGCCGAAGTGG
ATGGTAATGATCCGCTGTTCAAAGTGAAAAATGGCGAAAACGCCCTGGCCTTTTATAGCCACTATTATCAGCCGCTGCCG
TTGGTGCTGCGCGGATATGGTGCGGGCAATGACGTTACCGCTGCCGGTGTCTTTGCCGATCTGCTACGTACCCTCTCATG
GAAGTTAGGAGTCTGACATGGTTAAAGTTTATGCCCCGGCTTCCAGTGCCAATATGAGCGTCGGGTTTGATGTGCTCGGG
GCGGCGGTGACACCCGTTGATGGTGCATTGCTCGGAGATGTAGTCACGGTTGAGTCGGCAGAGACATTCAGTCTCAACAA
CCTCGGACGCTTTGCCGATAAGCTGCCGTCAGAACCACGGGAAAATATCGTTTATCAGTGCTGGGAGCGTTTTTGCCAGG
AGCTGGGCAAGCAAATTCCAGTGGCGATGACTCTGGAAAAGAATATGCCGATCGGTTCGGGCTTAGGCTCCAGCGCCTGT
TCGGTGGTCGCGGCTCTGATGGCGATGAATGAACACTGCGGCAAGCCGCTTAATGACACCCGTTTGCTGGCTTTGATGGG
CGAGCTGGAAGGACGAATCTCCGGCAGCATTCATTACGACAACGTGGCACCGTGTTTTCTTGGTGGTATGCAGTTGATGA
TCGAAGAAAACGACATCATCAGCCAGCAAGTGCCAGGGTTTGATGAGTGGCTGTGGGTGCTGGCGTATCCGGGGATTAAA
GTCTCGACGGCAGAAGCCCGGGCTATTTTACCGGCGCAGTATCGCCGCCAGGATTGCATTGCGCACGGGCGACACTTGGC
AGGCTTCATTCACGCCTGCTATTCCCGTCAGCCTGAGCTTGCCGCGAAGCTGATGAAAGATGTTATCGCAGAACCCTACC
GTGAACGGTTACTGCCTGGCTTCCGGCAGGCGCGGCAGGCGGTCGCGGAAATCGGCGCGGTAGCGAGCGGTATCTCCGGC
TCCGGCCCGACCTTGTTTGCTCTGTGTGACAAGCCGGATACCGCCCAGCGCGTTGCCGACTGGTTGGGTAAGAACTACCT
GCAAAATCAGGAAGGTTTTGTTCATATTTGCCGGCTGGATACGGCGGGCGCACGAGTACTGGAAAACTAAATGAAACTCT
ACAATCTTAAAGATCACAATGAGCAGGTCAGCTTTGCGCAAGCCGTAACCCAGGGGTTGGGCAAAAATCAGGGGCTGTTT
TTTCCGCACGACCTGCCGGAATTCAGCCTGACTGAAATTGATGAGATGCTGAAGCTGGATTTTGTCACCCGCAGTGCGAA
GATCCTCTCGGCGTTTATTGGTGATGAAATCCCGCAGGAAATCCTGGAAGAGCGCGTGCGCGCGGCGTTTGCCTTCCCGG
CTCCGGTCGCCAATGTTGAAAGCGATGTCGGTTGTCTGGAATTGTTCCACGGGCCAACGCTGGCATTTAAAGATTTCGGC
GGTCGCTTTATGGCACAAATGCTGACCCATATTGCGGGCGATAAGCCAGTGACCATTCTGACCGCGACCTCCGGTGATAC
CGGAGCGGCAGTGGCTCATGCTTTCTACGGTTTACCGAATGTGAAAGTGGTTATCCTTTATCCACGAGGCAAAATCAGTC
CACTGCAAGAAAAACTGTTCTGTACATTGGGCGGCAATATCGAAACTGTTGCCATCGACGGCGATTTCGATGCCTGTCAG
GCGCTGGTGAAGCAGGCGTTTGATGATGAAGAGCTGAAAGTGGCGCTGGGGTTAAACTCAGCTAACTCGATTAACATTAG
CCGGTTGCTGGCGCAGATTTGCTACTACTTTGAAGCAGTTGCGCAGCTGCCGCAGGAAGCGCGCAACCAGCTGGTTGTCT
CGGTGCCAAGCGGAAACTTCGGCGATTTGACGGCGGGTCTGCTGGCGAAGTCACTCGGTCTGCCGGTGAAACGTTTTATT
GCTGCGACCAACGTGAACGATACCGTGCCACGTTTCCTGCATGACGGTCAGTGGTCACCCAAAGCGACTCAGGCGACGTT
ATCCAACGCGATGGACGTGAGTCAGCCGAACAACTGGCCGCGTGTGGAAGAGTTGTTCCGCCGCAAAATCTGGCAACTGA
AAGAGCTGGGTTATGCCGCCGTGGATGATGAAACCACGCAACAGACAATGCGTGAGTTAAAAGAACTGGGCTACACTTCG
GAGCCGCACGCTGCCGTAGCGTATCGTGCGCTGCGTGACCAGTTGAATCCAGGCGAATATGGCTTGTTCCTCGGCACCGC
GCATCCGGCGAAATTTAAAGAGAGCGTGGAAGCGATTCTCGGTGAAACGTTGGATCTGCCAAAAGAGCTGGCAGAACGTG
CCGATTTACCCTTGCTTTCGCATAATCTGCCCGCCGATTTTGCTGCGTTGCGTAAATTGATGATGAATCATCAGTAACAT
CTATTCATTATCTCAATCAGGCCGGGTTTGCTTTTATGCAGCCCGGCTTTTTTGTGAAGAAAATATGGAGAGAAACGACA
GGGAAAAAGGAGAAATTCTCAATAAATGCGGTAACTTAGAGATTAGGATTGCGGAGAATAACAACCGCCGCTCTCATCGC
GTAATCTCCGGATATCGACCCATAACGGGCAATGATAAAAGGAGTAACCTGTGAAAAAGATGCAATCTATCGTACTCGCA
CTTTCCCTGGTTCTGGTCGCTCCCATGGCAACGCAGGCTGCGGAAATTACGTTAGTCCCGTCAGTAAAATTACAGATAGG
CGATCGTGATAATCGCGGTTATTACTGGGATGGCGGTCACTGGCGCGACCACGGCTGGTGGAAACAACATTATGAATGGC
GAGGCAATCGCTGGCACCCACACGGACCGCCGCCACCGCCGCGTCACCATAAGAAAGCTCATCATGATCATCACGGCGGT
CATGGTCCAGGCAAACATCACCGCTAAATGACAAATGCCGGGTAACAATCCGGCATTCAGCGCCTGATGCGACGCTGGCG
CGTCTTATCAGGCCTACGTGAATTCTGCAATATATTGAATCTGCATGCTTTTGTAGGCCGGATAAGGCGTTCACGCCGCA
TCCGGCATTGACTACAAACTTAACGCTGCTCGTAGCGTTTAAACACCAGTTCGCCATTGCTGGAGGAAGCTTCATCAAAG
AAGTAACCTTCGCTATTAAAACCAGTCAGTTGCTCTGGTTTGGTCAGCCGATTTTCAATAATGAAACGACTCATCAGACC
GCGTGCTTTCTTAGCGTAGAAGCTGATTATCTTAAATTTGCCGTTCTTCTCATCGAGGAACACCGGCTTGATAATCTCGG
CATTCAATTTCTTCGGCTTCACCGATTTAAAATACTCATCTGACGCCAGATTAATCACCACATTATCGCCTTGTGCTGCG
AGCGCCTCGTTCAGCTTGTTGGTGATGATATCTCCCCAGAATTGATACAGATCTTTCCCTCGGGCATTCTCAAGACGGAT
CCCCATTTCCAGACGATAAGGCTGCATTAAATCGAGCGGGCGGAGTACGCCATACAAGCCGGAAAGCATTCGCAAATGCT
GTTGGGCAAAATCGAAATCGTCTTCGCTGAAGGTTTCGGCCTGCAAGCCGGTGTAGACATCACCTTTAAACGCCAGAATC
GCCTGGCGGGCATTCTCCGGCGTGAAATCTGGCTGCCAGTCATGAAAGCGAGCGGCGTTGATACCTGCCAGTTTGTCGCT
GATACGCATCAGCGTGCTAATCTGCGGAGGCGTCAGTTTCCGCGCTTCATGGATCAACTGCTGGGAATTGTCTAACAGCT
CCGGCAGTGTATATCGCGTGGTGGTCAACGGGCTTTGGTAATCAAGCGTTTTCGCAGGTGAAATAAGAATCAGCATATCC
AGTCCTTGCAGGAAATTTATGCCGACTTTAGCAAAAAAAGAGAATGAGTTGATCGATAGTTGTGATTACTCCTGCGAAAC
ATCATCCCACGCGTCCCGAGAAAGCTGGCGACCGATATCCGGATAACGCAACGGATCAAACACCGGGCGCACGCCGAGTT
TACGCTGGCGTAGATAATCACTGGCAATGGTATGAACCACAGGCGAGAGCAGTAATATGGCAGTCAAATTGGTAATAGCC
ATGCAGGCCATTATGATATCTGCCAGTTGCCACATCAGCGGAAGACTTAGCAAGGTGCCGCCGATGACCGTTGCGAAGGT
GCAGATCCGCAAACACCAGATCGCTTTAGGGTTGTTCAGGCGTAAAAAGAAGAGATTGTTTTCGGCATAAATGTAGTTGG
CAACGATGGAGCTGAAGGCAAACAGAATAACCACGAGGGTAACAAATTCAGCACCCCAGGAACCCATTAGCACCCGCATC
GCCTTCTGGATAAGCTGAATACCTTCCAGCGGCATGTAGGTTGTGCCGTTACCCGCCAGTAATATCAGCATGGCGCTTGC
CGTACAGATGACCAGGGTGTCGATAAAAATGCCAATCATCTGGACAATTCCTTGCGCTGCCGGATGCGGAGGCCAGGACG
CCGCTGCCGCTGCCGCGTTTGGCGTCGACCCCATTCCCGCCTCATTGGAAAACATACTGCGCTGAAAACCGTTAGTAATC
GCCTGGCTTAAGGTATATCCCGCCGCGCCGCCTGCCGCTTCCTGCCAGCCAAAAGCACTCTCAAAAATAGACCAAATGAC
GTGGGGAAGTTGCCCGATATTTATTACGCAAATCACCAGGCTGGTCAGTACCCAGATTATCGCCATCAACGGGACAAACC
CCTGCATGAGCCGGGCGACGCCATGAAGACCGCGAATGATTGCCAGCAGAGCAAAGACAGCAAGAATAATGCCTGTCACC
AGCGGGGGAAAATCAAAAGAAAAACTCAGAGCTCGGGCAACAGCGTTTGCCTGAACTCCGCTGAAAATTATGCCGTAGGC
GATGAGCAAAAAGACGGCGAACAGAACGCCCATCCAGCGCATCCCCAGCCCGCGCGCCATATACCATGCCGGTCCGCCAC
GAAACTGCCCATTGACGTCACGTTCTTTATAAAGTTGTGCAAGGGAACATTCGGCAAACGAGGTCGCCATGCCGATAAAC
GCGGCAACCCACATCCAAAAGACGGCTCCAGGTCCACCGGCGGTAATAGCCAGCGCAACGCCGGCCAGGTTGCCGCTACC
CACGCGCGCCGCAAGACTGGTACACAATGACTGAAATGAGGTTAAACCGCCTGGCTGTGGATGAATGCTATTTTTAAGAC
TTTTGCCAAACTGGCGGATGTAGCGAAACTGCACAAATCCGGTGCGAAAAGTGAACCAACAACCTGCGCCGAAGAGCAGG
6 changes: 5 additions & 1 deletion modo/api.py
Original file line number Diff line number Diff line change
Expand Up @@ -174,6 +174,10 @@ def add_element(
parent_path = next(self.archive.groups())[0]
else:
parent_path = part_of

element_path = parent_path + "/" + element.id

if part_of is not None:
parent_type = getattr(
model,
self.metadata[parent_path]["@type"],
Expand All @@ -187,7 +191,7 @@ def add_element(
# has_part is multivalued
if has_prop not in self.archive[part_of].attrs:
self.archive[part_of].attrs[has_prop] = []
self.archive[part_of].attrs[has_prop] += [element.id]
self.archive[part_of].attrs[has_prop] += [element_path]

# Add element to metadata
parent_group = self.archive[parent_path]
Expand Down

0 comments on commit 78495c6

Please sign in to comment.