diff --git a/src/data/valid/Database-data_objects_genomad.yaml b/src/data/valid/Database-data_objects_genomad.yaml new file mode 100644 index 0000000000..029c63ab43 --- /dev/null +++ b/src/data/valid/Database-data_objects_genomad.yaml @@ -0,0 +1,18 @@ +data_object_set: +- id: nmdc:dobj-11-dtTMNa + type: nmdc:DataObject + description: "Virus summary nmdc:ann0vx38" + name: nmdc_wfmgan-11-abc123_virus_summary.tsv + data_object_type: Virus Summary + file_size_bytes: 1234 +- id: nmdc:dobj-11-dtTMNc + type: nmdc:DataObject + description: "Plasmid summary nmdc:ann0vx38" + name: nmdc_wfmgan-11-abc123_plasmid_summary.tsv + data_object_type: Plasmid Summary + file_size_bytes: 1234 +- id: nmdc:dobj-11-dtTMNd + type: nmdc:DataObject + description: "agg results nmdc:ann0vx38" + name: nmdc_wfmgan-11-abc12_aggregated_classification.tsv + data_object_type: GeNomad Aggregated Classification diff --git a/src/schema/basic_slots.yaml b/src/schema/basic_slots.yaml index 6198d8fca3..de7089c236 100644 --- a/src/schema/basic_slots.yaml +++ b/src/schema/basic_slots.yaml @@ -607,6 +607,29 @@ enums: FileTypeEnum: permissible_values: + Virus Summary: + description: Tab separated file listing the viruses found by geNomad. + see_also: + - https://portal.nersc.gov/genomad/ + annotations: + file_name_pattern: '^.*_virus_summary\.tsv$' + + Plasmid Summary: + description: Tab separated file listing the plasmids found by geNomad. + see_also: + - https://portal.nersc.gov/genomad/ + annotations: + file_name_pattern: '^.*_plasmid_summary\.tsv$' + + GeNomad Aggregated Classification: + description: >- + Tab separated file which combines the results from neural network-based classification + and marker-based classification for virus and plasmid detection with geNomad. 
+ see_also: + - https://portal.nersc.gov/genomad/ + annotations: + file_name_pattern: '^.*_aggregated_classification\.tsv$' + Reference Calibration File: description: A file that contains data used to calibrate a natural organic matter or metabalomics analysis.