"""Field names, controlled vocabularies and spreadsheet sheet names for strain records.

Everything in this module is a plain constant. Several names are assigned
more than once; the last assignment is the value importers see. Those
places are flagged with ``NOTE(review)`` comments and deliberately left
unchanged so the module's importable values stay the same.
"""
from pathlib import Path

# Directory named "data" located next to this module.
DATA_DIR = Path(__file__).parent / "data"

ACCESSION_NUMBER = "accession_number"
MIRRI_ACCESSION_NUMBER = "mirri_accession_number"
RESTRICTION_ON_USE = "restriction_on_use"
NAGOYA_PROTOCOL = "nagoya_protocol"
ABS_RELATED_FILES = "abs_related_files"
# NOTE(review): singular "mta_file" here, while MIRRI_FIELDS below uses the
# literal "mta_files" -- confirm which spelling consumers expect.
MTA_FILES = "mta_file"
OTHER_CULTURE_NUMBERS = "other_culture_collection_numbers"
STRAIN_FROM_REGISTERED_COLLECTION = "strain_from_a_registered_collection"
RISK_GROUP = "risk_group"
DUAL_USE = "dual_use"
QUARANTINE = "quarantine"
ORGANISM_TYPE = "organism_type"
TAXON_NAME = "taxon_name"
TYPE = "type"
INFRASUBSPECIFIC_NAME = "infrasubspecific_names"
COMMENTS_ON_TAXONOMY = "comments_on_taxonomy"
STATUS = "status"
HISTORY_OF_DEPOSIT = "history_of_deposit"
DEPOSITOR = "depositor"
DATE_OF_DEPOSIT = "date_of_deposit"
COLLECTED_BY = "collected_by"
DATE_OF_COLLECTION = "date_of_collection"
ISOLATED_BY = "isolated_by"
DATE_OF_ISOLATION = "date_of_isolation"
DATE_OF_INCLUSION = "date_of_inclusion_on_catalog"
TESTED_TEMPERATURE_GROWTH_RANGE = "tested_temperature_growth_range"
RECOMMENDED_GROWTH_TEMP = "recommended_growth_temperature"
RECOMMENDED_GROWTH_MEDIUM = "recommended_media_for_growth"
FORM_OF_SUPPLY = "form_of_supply"
GEO_COORDS = "coordinates_of_geographic_origin"
ACCESSION_NAME = "other_denomination"
# NOTE(review): ALTITUDE is rebound to "altitude" in the Location section
# below, so this first value is never visible to importers.
ALTITUDE = "altitude_of_geographic_origin"
GEOGRAPHIC_ORIGIN = "geographic_origin"
GMO = "gmo"
GMO_CONSTRUCTION_INFO = "gmo_construction_information"
MUTANT_INFORMATION = "mutant_information"
GENOTYPE = "genotype"
LITERATURE = "literature"
SEXUAL_STATE = "sexual_state"
PLOIDY = "ploidy"
INTERSPECIFIC_HYBRID = "interspecific_hybrid"
HYBRIDS = "hybrids"
PLANT_PATHOGENICITY_CODE = "plant_pathogenicity_code"
PATHOGENICITY = "pathogenicity"
ENZYME_PRODUCTION = "enzyme_production"
PRODUCTION_OF_METABOLITES = "production_of_metabolites"
APPLICATIONS = "applications"
REMARKS = "remarks"
PLASMIDS = "plasmids"
PLASMIDS_COLLECTION_FIELDS = "plasmids_collections_fields"
SUBSTRATE_HOST_OF_ISOLATION = "substrate_host_of_isolation"
ISOLATION_HABITAT = "isolation_habitat"
ONTOBIOTOPE_ISOLATION_HABITAT = "ontobiotope_term_for_the_isolation_habitat"
LITERATURE_LINKED_TO_SEQ_GENOME = "literature_linked_to_the_sequence_genome"
AXENIC_CULTURE = "axenic_culture"
QPS = "qps"
SITE_LINK = "site_links"

# StrainId
STRAIN_ID = "id"
COLLECTION_CODE = "collection_code"
STRAIN_PUI = "strain_pui"
STRAIN_URL = "strain_url"
ID_SYNONYMS = "id_synonyms"

# Taxonomy
GENUS = "genus"
SPECIES = "species"

# Location
# NOTE(review): COUNTRY is rebound to "Country" in the country-codes section
# further down. ALLOWED_COLLECTING_SITE_KEYS captures the value assigned here,
# but code importing COUNTRY from this module receives "Country".
COUNTRY = "countryOfOriginCode"
SITE = "site"
STATE = "state"
PROVINCE = "province"
MUNICIPALITY = "municipality"
ISLAND = "island"
OTHER = "other"
LATITUDE = "latitude"
LONGITUDE = "longitude"
ALTITUDE = "altitude"
GEOREF_METHOD = "georeferencingMethod"
COORDUNCERTAINTY = "coordUncertainty"
COORD_SPATIAL_REFERENCE = "coordenatesSpatialReference"
LOCATION = "location"

ALLOWED_COLLECTING_SITE_KEYS = [
    COUNTRY,
    STATE,
    PROVINCE,
    ISLAND,
    MUNICIPALITY,
    OTHER,
    SITE,
    LATITUDE,
    LONGITUDE,
    ALTITUDE,
    GEOREF_METHOD,
    COORDUNCERTAINTY,
    COORD_SPATIAL_REFERENCE,
]

# Ordered attribute-path / label pairs.
MIRRI_FIELDS = [
    {"attribute": "id", "label": "accessionNumber"},
    {"attribute": "mirri_accession_number", "label": "mirriAccessionNumber"},
    {"attribute": "qps", "label": "qps"},
    {"attribute": "axenic_culture", "label": "axenicCulture"},
    {"attribute": "restriction_on_use", "label": "useRestrictions"},
    {"attribute": "nagoya_protocol", "label": "nagoyaConditions"},
    {"attribute": ABS_RELATED_FILES, "label": "absFile"},
    {"attribute": "mta_files", "label": "mtaFile"},
    {"attribute": "other_numbers", "label": "otherCollectionNumbers"},
    {"attribute": "is_from_registered_collection", "label": "registeredCollection"},
    {"attribute": "risk_group", "label": "riskGroup"},
    {"attribute": "is_potentially_harmful", "label": "dualUse"},
    {"attribute": "is_subject_to_quarantine", "label": "euQuarantine"},
    {"attribute": "taxonomy.organism_type", "label": "organismType"},
    {"attribute": "taxonomy.taxon_name", "label": "speciesName"},
    {"attribute": "taxonomy.infrasubspecific_name", "label": "infrasubspecificNames"},
    {"attribute": "taxonomy.comments", "label": "taxonomyComments"},
    {"attribute": "taxonomy.interspecific_hybrid", "label": "hybrid"},
    {"attribute": "status", "label": "status"},
    {"attribute": "history", "label": "depositHistory"},
    {"attribute": "deposit.who", "label": "depositor"},
    {"attribute": "deposit.date", "label": "depositDate"},
    {"attribute": "catalog_inclusion_date", "label": "accessionDate"},
    {"attribute": "collect.who", "label": "collector"},
    {"attribute": "collect.date", "label": "collectionDate"},
    {"attribute": "isolation.who", "label": "isolator"},
    {"attribute": "isolation.date", "label": "isolationDate"},
    {"attribute": "isolation.substrate_host_of_isolation", "label": "substrate"},
    {"attribute": "growth.tested_temp_range", "label": "temperatureGrowthRange"},
    {"attribute": "growth.recommended_temp", "label": "recommendedTemperature"},
    {"attribute": "growth.recommended_media", "label": "recommendedMedium"},
    {"attribute": "form_of_supply", "label": "supplyForms"},
    {"attribute": "other_denominations", "label": "otherDenomination"},
    {"attribute": "collect.location.coords", "label": "geographicCoordinates"},
    {"attribute": "collect.site.links", "label": "siteLinks"},
    # NOTE(review): an altitude attribute paired with the "country" label looks
    # like a mismatch -- confirm against the consumer before changing.
    {"attribute": "collect.location.altitude", "label": "country"},
    {"attribute": "collect.location", "label": "geographicOrigin"},
    {"attribute": "collect.habitat", "label": "isolationHabitat"},
    {"attribute": "collect.habitat_ontobiotope", "label": "ontobiotopeTerms"},
    {"attribute": "genetics.gmo", "label": "gmo"},
    {"attribute": "genetics.gmo_construction", "label": "gmoConstruction"},
    {"attribute": "genetics.mutant_info", "label": "mutant"},
    {"attribute": "genetics.genotype", "label": "genotype"},
    {"attribute": "genetics.sexual_state", "label": "sexualState"},
    {"attribute": "genetics.ploidy", "label": "ploidy"},
    {"attribute": "genetics.plasmids", "label": "plasmids"},
    {"attribute": "genetics.plasmids_in_collections", "label": "plasmidCollections"},
    {"attribute": "publications", "label": "identificationLiterature"},
    {"attribute": PLANT_PATHOGENICITY_CODE, "label": "Plant pathogenicity code"},
    {"attribute": "pathogenicity", "label": "pathogenicity"},
    {"attribute": "enzyme_production", "label": "enzymes"},
    {"attribute": "production_of_metabolites", "label": "metabolites"},
    {"attribute": "type", "label": "type"},
    {"attribute": "applications", "label": "applications"},
    {"attribute": "remarks", "label": "remarks"},
    {"attribute": LITERATURE_LINKED_TO_SEQ_GENOME, "label": "sequenceLiterature"},
]

ALLOWED_SUBTAXA = [
    "subspecies",
    "variety",
    "convarietas",
    "group",
    "forma",
    "forma.specialis",
]
ALLOWED_TAXONOMIC_RANKS = ["family", "genus", "species"] + ALLOWED_SUBTAXA

# Nagoya
NAGOYA_NO_RESTRICTIONS = "no_known_restrictions_under_the_Nagoya_protocol"
NAGOYA_DOCS_AVAILABLE = "documents_providing_proof_of_legal_access_and_terms_of_use_available_at_the_collection"
NAGOYA_PROBABLY_SCOPE = "strain_probably_in_scope,_please_contact_the_culture_collection"
ALLOWED_NAGOYA_OPTIONS = [
    NAGOYA_NO_RESTRICTIONS,
    NAGOYA_DOCS_AVAILABLE,
    NAGOYA_PROBABLY_SCOPE,
]

# Use restriction
NO_RESTRICTION = "no_restriction"
ONLY_RESEARCH = "only_research"
COMMERCIAL_USE_WITH_AGREEMENT = "commercial_use_with_agreement"
ALLOWED_RESTRICTION_USE_OPTIONS = [
    NO_RESTRICTION,
    ONLY_RESEARCH,
    COMMERCIAL_USE_WITH_AGREEMENT,
]

ALLOWED_RISK_GROUPS = ["1", "2", "3", "4"]

# Forms of supply
AGAR = "Agar"
CRYO = "Cryo"
DRY_ICE = "Dry Ice"
LIQUID_CULTURE_MEDIUM = "Liquid Culture Medium"
LYO = "Lyo"
OIL = "Oil"
WATER = "Water"
ALLOWED_FORMS_OF_SUPPLY = [
    AGAR,
    CRYO,
    DRY_ICE,
    LIQUID_CULTURE_MEDIUM,
    LYO,
    OIL,
    WATER,
]

# Top-level prefixes used by the dotted attribute paths in MIRRI_FIELDS.
DEPOSIT = "deposit"
ISOLATION = "isolation"
COLLECT = "collect"
GROWTH = "growth"
GENETICS = "genetics"
TAXONOMY = "taxonomy"

# Markers
# NOTE(review): MARKERS is rebound to the sheet name "Markers" at the end of
# this module, so importers never see "markers".
MARKERS = "markers"
MARKER_TYPE = "marker_type"
MARKER_INSDC = "INSDC"
MARKER_SEQ = "marker_seq"
ALLOWED_MARKER_TYPES = [
    {"acronym": "16S rRNA", "marker": "16S rRNA"},
    {"acronym": "ACT", "marker": "Actin"},
    {"acronym": "CaM", "marker": "Calmodulin"},
    {"acronym": "EF-1α", "marker": "elongation factor 1-alpha (EF-1α)"},
    {"acronym": "ITS", "marker": "nuclear ribosomal Internal Transcribed Spacer (ITS)"},
    {"acronym": "LSU", "marker": "nuclear ribosomal Large SubUnit (LSU)"},
    {"acronym": "RPB1", "marker": "Ribosomal RNA-coding genes RPB1"},
    {"acronym": "RPB2", "marker": "Ribosomal RNA-coding genes RPB2"},
    {"acronym": "TUBB", "marker": "β-Tubulin"},
]

# Publications
PUBLICATIONS = "publications"
PUB_ID = "pub_id"
PUB_DOI = "pub_doi"
PUB_PMID = "pub_pmid"
# NOTE(review): empty string in the original; kept as-is -- confirm whether a
# real key was intended.
PUB_PUBMED_ID = ""
PUB_FULL_REFERENCE = "full_reference"
PUB_TITLE = "title"
PUB_AUTHORS = "authors"
PUB_JOURNAL = "journal"
PUB_YEAR = "year"
PUB_VOLUME = "volume"
PUB_ISSUE = "issue"
PUB_FIRST_PAGE = "first_page"
PUB_LAST_PAGE = "last_page"
BOOK_TITLE = "book_title"
BOOK_EDITOR = "book_editor"
BOOK_PUBLISHER = "book_publisher"

PUBLICATION_FIELDS = [
    {"label": "ID", "attribute": PUB_ID},
    {"label": "PMID", "attribute": PUB_PMID},
    {"label": "DOI", "attribute": PUB_DOI},
    {"label": "Full reference", "attribute": PUB_FULL_REFERENCE},
    {"label": "Authors", "attribute": PUB_AUTHORS},
    {"label": "Title", "attribute": PUB_TITLE},
    {"label": "Journal", "attribute": PUB_JOURNAL},
    {"label": "Year", "attribute": PUB_YEAR},
    {"label": "Volume", "attribute": PUB_VOLUME},
    {"label": "Issue", "attribute": PUB_ISSUE},
    {"label": "First page", "attribute": PUB_FIRST_PAGE},
    # Fixed: this entry previously pointed at PUB_FIRST_PAGE (copy-paste slip),
    # which mapped both page labels to the same "first_page" attribute.
    {"label": "Last page", "attribute": PUB_LAST_PAGE},
    {"label": "Book title", "attribute": BOOK_TITLE},
    {"label": "Editors", "attribute": BOOK_EDITOR},
    {"label": "Publisher", "attribute": BOOK_PUBLISHER},
]

# Ploidy
ANEUPLOID = 0
HAPLOID = 1
DIPLOID = 2
TRIPLOID = 3
TETRAPLOID = 4
POLYPLOID = 9

ALLOWED_PLOIDIES = [ANEUPLOID, HAPLOID, DIPLOID, TRIPLOID, TETRAPLOID, POLYPLOID]

# Abbreviated subtaxon rank -> entry in ALLOWED_SUBTAXA.
SUBTAXAS = {
    "subsp.": "subspecies",
    "var.": "variety",
    "convar.": "convarietas",
    "group.": "group",
    "f.": "forma",
    "f.sp.": "forma.specialis",
}

# Control
VERSION = "Version"
DATE = "Date"

# Country codes
# Rebinds COUNTRY (previously "countryOfOriginCode", see the Location section).
COUNTRY = "Country"
CODE = "Code"
ADDITIONAL_INFORMATION_ON_THE_COUNTRY_OR_CODE = "Additional information on the country or code"

# Country codes file fields
# NOTE(review): this list is overwritten by the sheet-name string
# "Country codes" at the end of the module, so it is unreachable to importers.
COUNTRY_CODES_SHEET = [
    {"label": "Country", "attribute": COUNTRY},
    {"label": "Code", "attribute": CODE},
    {
        "label": "Additional information on the country or code",
        "attribute": ADDITIONAL_INFORMATION_ON_THE_COUNTRY_OR_CODE,
    },
]

# Control file fields
CONTROL_FIELDS = [
    {"label": "Version", "attribute": VERSION},
    {"label": "Date", "attribute": DATE},
]

# Excel sheet names
LOCATIONS = "Geographic origin"  # 'Locations'
GROWTH_MEDIA = "Growth media"
GENOMIC_INFO = "Genomic information"
STRAINS = "Strains"
LITERATURE_SHEET = "Literature"
SEXUAL_STATE_SHEET = "Sexual state"
RESOURCE_TYPES_VALUES = "Resource types values"
FORM_OF_SUPPLY_SHEET = "Forms of supply"
PLOIDY_SHEET = "Ploidy"
ONTOBIOTOPE = "Ontobiotope"
MARKERS = "Markers"  # rebinds the "markers" key defined in the Markers section
CONTROL_SHEET = "Version"
COUNTRY_CODES_SHEET = "Country codes"  # rebinds the field list defined above
RESOURCE_SHEET = "Resource types values"  # same value as RESOURCE_TYPES_VALUES