Skip to content

Commit

Permalink
🔀 Merge pull request #119 from cnr-ibba/issue-117
Browse files Browse the repository at this point in the history
✨ add data for Guisandesa goats
  • Loading branch information
bunop authored May 22, 2024
2 parents 1ecc054 + 71d1c61 commit 9e682bd
Show file tree
Hide file tree
Showing 10 changed files with 384 additions and 8 deletions.
4 changes: 4 additions & 0 deletions .vscode/settings.json
Original file line number Diff line number Diff line change
Expand Up @@ -12,15 +12,19 @@
"Ensembl",
"Frizarta",
"INITDB",
"mapdata",
"mongodump",
"mongoexpress",
"mongorestore",
"pardir",
"pedfile",
"plinkio",
"probeset",
"SGID",
"smarterdb",
"SNPCHIMP",
"tabix",
"tqdm",
"vcftools"
]
}
9 changes: 8 additions & 1 deletion HISTORY.rst
Original file line number Diff line number Diff line change
Expand Up @@ -13,7 +13,14 @@ TODO
* Map affymetrix snps in *OARV3* coordinates
* Check if ``rs_id`` is still valid or not (with EVA)
* Manage python packages with `poetry <https://python-poetry.org/>`__

0.4.10.dev0
-----------

* Add data for Guisandesa goats (`#117 <https://github.com/cnr-ibba/SMARTER-database/issues/117>`)
* Rename ``manifacturer`` into ``manufacturer``
* Convert genotypes from *top* to *forward* (`#111 <https://github.com/cnr-ibba/SMARTER-database/issues/111>`__)
* Update dependencies

0.4.9 (2023-09-27)
------------------
Expand All @@ -22,7 +29,7 @@ TODO
* Add sex for *Fosses, Provencale* goat breeds
* Add *sex* while importing metadata
* Load multiple phenotypes for *Boutsko foreground* sheeps
* Add multiple phenotypes as a list (`103 <https://github.com/cnr-ibba/SMARTER-database/issues/103>`__)
* Add multiple phenotypes as a list (`#103 <https://github.com/cnr-ibba/SMARTER-database/issues/103>`__)
* Update *datasets* metadata
* Update dependencies

Expand Down
12 changes: 12 additions & 0 deletions Makefile
Original file line number Diff line number Diff line change
Expand Up @@ -72,6 +72,8 @@ initialize: requirements
$(PYTHON_INTERPRETER) src/data/import_iggc.py --datafile data/external/GOA/CONSORTIUM/capri4dbsnp-base-CHI-ARS-OAR-UMD.csv.gz \
--version CHI1.0 --date "06 Mar 2018" --chrom_column chi_1_0_chr --pos_column chi_1_0_pos --strand_column chi_1_0_strand
$(PYTHON_INTERPRETER) src/data/import_dbsnp.py --input_dir data/external/GOA/dbSNP --species_class Goat --sender IGGC --version CHI1.0
$(PYTHON_INTERPRETER) src/data/import_affymetrix.py --species_class goat --manifest data/external/GOA/AFFYMETRIX/Axiom_Goat_v2.r1.a1.annot.csv.gz \
--chip_name AffymetrixAxiomGoatv2 --version ARS1

## TODO: donwload data from EVA and EnsEMBL

Expand Down Expand Up @@ -141,6 +143,7 @@ data: requirements
$(PYTHON_INTERPRETER) src/data/add_breed.py --species_class sheep --name Texel --code TEX --alias TEX --dataset "OP925-969 1046-1085 1010-1020_20220323_texel_SMARTER.zip"
$(PYTHON_INTERPRETER) src/data/add_breed.py --species_class sheep --name Texel --code TEX --alias TEX --dataset "OP1586-1666 OP1087-1106 Placa6 Corr_Tex_Genotyping_20220810_SMARTER.zip"
$(PYTHON_INTERPRETER) src/data/add_breed.py --species_class sheep --name Corriedale --code CRR --alias CRR --dataset "OP1586-1666 OP1087-1106 Placa6 Corr_Tex_Genotyping_20220810_SMARTER.zip"
$(PYTHON_INTERPRETER) src/data/add_breed.py --species_class Goat --name Guisandesa --code GUI --alias Goat --dataset Guisandesa.zip

## load breeds into database relying on dataset
$(PYTHON_INTERPRETER) src/data/import_breeds.py --species_class Sheep --src_dataset="High density genotypes of French Sheep populations.zip" \
Expand Down Expand Up @@ -423,6 +426,9 @@ data: requirements
$(PYTHON_INTERPRETER) src/data/import_samples.py --src_dataset cortellari_et_al_2021.zip \
--datafile s41598-021-89900-2/cortellari_samples_fix.xlsx --code_column fid --id_column original_id \
--chip_name IlluminaGoatSNP50 --country_all Italy --species_all Goat
$(PYTHON_INTERPRETER) src/data/import_samples.py --src_dataset Guisandesa.zip \
--datafile Guisandesa/Guisandesa.xlsx --code_all GUI --id_column original_id \
--chip_name AffymetrixAxiomGoatv2 --country_all Spain --species_all Goat

## convert genotypes without creating samples in database (GOAT)
$(foreach ASSEMBLY, $(GOAT_ASSEMBLIES), $(PYTHON_INTERPRETER) src/data/import_from_plink.py --bfile ADAPTmap_genotypeTOP_20161201/binary_fileset/ADAPTmap_genotypeTOP_20161201 \
Expand All @@ -434,6 +440,9 @@ data: requirements
--dataset burren_et_al_2016.zip --chip_name IlluminaGoatSNP50 --assembly $(ASSEMBLY) --sample_field alias;)
$(foreach ASSEMBLY, $(GOAT_ASSEMBLIES), $(PYTHON_INTERPRETER) src/data/import_from_plink.py --bfile s41598-021-89900-2/Cortellari2021 \
--dataset cortellari_et_al_2021.zip --chip_name IlluminaGoatSNP50 --assembly $(ASSEMBLY);)
$(foreach ASSEMBLY, $(GOAT_ASSEMBLIES), $(PYTHON_INTERPRETER) src/data/import_from_plink.py --file "Guisandesa/Guisandesa Goat" \
--dataset Guisandesa.zip --src_coding affymetrix --chip_name AffymetrixAxiomGoatv2 --assembly $(ASSEMBLY) \
--search_field probeset_id --src_version ARS1 --src_imported_from affymetrix;)

## add additional metadata to samples
$(PYTHON_INTERPRETER) src/data/import_metadata.py --src_dataset "High density genotypes of French Sheep populations.zip" \
Expand Down Expand Up @@ -603,6 +612,9 @@ data: requirements
--dst_dataset SMARTER_CHFR.zip --datafile SMARTER_CHFR_phenotypes/pierre_animals.xlsx \
--id_column original_id --metadata_column animal_id --metadata_column lab_id \
--metadata_column owner --metadata_column milk_recording --sex_column sex
$(PYTHON_INTERPRETER) src/data/import_metadata.py --src_dataset Guisandesa.zip \
--datafile Guisandesa/Guisandesa.xlsx --id_column original_id \
--latitude_column latitude --longitude_column longitude

## add phenotypes to samples
$(PYTHON_INTERPRETER) src/data/import_phenotypes.py --src_dataset ADAPTmap_phenotype_20161201.zip \
Expand Down
2 changes: 1 addition & 1 deletion docs/initialize.rst
Original file line number Diff line number Diff line change
Expand Up @@ -83,7 +83,7 @@ such JSON file:
{
"name": "IlluminaOvineSNP50",
"species": "Sheep",
"manifacturer": "illumina",
"manufacturer": "illumina",
"n_of_snps": 0
},
{
Expand Down
Loading

0 comments on commit 9e682bd

Please sign in to comment.