From 1a51f7c5db2d163b392a743bf27eea8f90f6e1bb Mon Sep 17 00:00:00 2001 From: THIBERT-RIPOSO Anais <t20006223@V-PJ-47-048.salsa.univ-amu.fr> Date: Wed, 23 Oct 2024 14:01:57 +0200 Subject: [PATCH] =?UTF-8?q?scripts=20R=20des=20tp1=20=C3=A0=204?= MIME-Version: 1.0 Content-Type: text/plain; charset=UTF-8 Content-Transfer-Encoding: 8bit --- src/.Rhistory | 0 src/tp1.R | 45 +++++++++++++++++++++++++++++++++++++++++++++ src/tp2.R | 24 ++++++++++-------------- src/tp3.R | 25 +++++++++++++++++++++++++ src/tp4.R | 20 ++++++++++++++++++++ 5 files changed, 100 insertions(+), 14 deletions(-) create mode 100644 src/.Rhistory create mode 100644 src/tp1.R create mode 100644 src/tp3.R create mode 100644 src/tp4.R diff --git a/src/.Rhistory b/src/.Rhistory new file mode 100644 index 0000000..e69de29 diff --git a/src/tp1.R b/src/tp1.R new file mode 100644 index 0000000..44b14f3 --- /dev/null +++ b/src/tp1.R @@ -0,0 +1,45 @@ +options(repos = c(CRAN = "https://cloud.r-project.org")) +output_dir = "results/tp1" +dir.create(output_dir, showWarnings = F, recursive = T) + +# if (!require("BiocManager", quietly = TRUE)) +# install.packages("BiocManager") + +#if (!require("snpStats", quietly = TRUE)) +# BiocManager::install("snpStats") + +#if (!require("SNPRelate", quietly = TRUE)) +#BiocManager::install("SNPRelate") + +# Charger les bibliothèques +#library(snpStats) +#library(SNPRelate) +#library(devtools) +#library(plyr) + +# Les données analysées nécessitant beaucoup de RAM, nous allons sélectionner aléatoirement 250000 SNPs et réecrire des fichiers bed, bim, fam +penncath_bed_path = "results/data/penncath.bed" +penncath_bim_path = "results/data/penncath.bim" +penncath_fam_path = "results/data/penncath.fam" + +geno <- snpStats::read.plink(penncath_bed_path, penncath_bim_path, penncath_fam_path, select.snps=sample(1:861473, 25000, replace = FALSE ), na.strings = ("-9")) + +plink_base=file.path(output_dir, "plink_base") +snpStats::write.plink(plink_base, snps=geno$genotypes, pedigree=geno$fam[,1], id=geno$fam[,1], mother=geno$fam[,4], sex=geno$fam[,5], phenotype=geno$fam[,6], chromosome = geno$map[,1], genetic.distance = geno$map[,3], position = geno$map[,4], allele.1 = geno$map[,5], allele.2 = geno$map[,6], na.code = ("-9")) + +genoBim<-geno$map +colnames(genoBim)<-c("chr", "SNP", "gen.dist", "position", "A1", "A2") +#head(genoBim) + +genotype<-geno$genotype +#print(genotype) + +genoFam<-geno$fam +#head(genoFam) + +# On commence par libérer de l'espace +rm(geno) + +rdata_path = file.path(output_dir, "TP1_asbvg.RData") +save.image(rdata_path) + diff --git a/src/tp2.R b/src/tp2.R index 4977de1..1ab01b5 100644 --- a/src/tp2.R +++ b/src/tp2.R @@ -1,24 +1,20 @@ -wdir="/amuhome/t20006223/m2bsgreprod/src" -dir.create(wdir) -setwd(wdir) +#load data +load("results/tp1/TP1_asbvg.RData") -library(devtools) +#fichier de sortie +output_dir = "results/tp2" +dir.create(output_dir, showWarnings = F, recursive = T) + +#on installe et ouvre les packages/librairies nécessaires if (!require("BiocManager", quietly=TRUE)) install.packages("BiocManager") -if (!require("snpStats", quietly=TRUE)) - BiocManager::install("snpStats") - if (!require("SNPRelate", quietly=TRUE)) BiocManager::install("SNPRelate") -library(snpStats) +#on enregistre le fichier de sortie -library(SNPRelate) +rdata_path = file.path(output_dir, "TP2_asbvg.RData") +save.image(rdata_path) -# Les données analysées nécessitant beaucoup de RAM, nous allons sélectionner aléatoirement 250000 SNPs et réecrire des fichiers bed, bim, fam -penncath_bed_path = "/amuhome/t20006223/m2bsgreprod/results/data/penncath.bed" -penncath_bim_path = "/amuhome/t20006223/m2bsgreprod/results/data/penncath.bim" -penncath_fam_path = "/amuhome/t20006223/m2bsgreprod/results/data/penncath.fam" -geno <- snpStats::read.plink(penncath_bed_path, penncath_bim_path, penncath_fam_path, select.snps=sample(1:861473, 25000, replace = FALSE ), na.strings = ("-9")) diff --git a/src/tp3.R b/src/tp3.R new file mode 100644 index 0000000..94f2f04 --- /dev/null +++ b/src/tp3.R @@ -0,0 +1,25 @@ +#load data +load("results/tp2/TP2_asbvg.RData") + +#fichier de sortie +output_dir = "results/tp3" +dir.create(output_dir, showWarnings = F, recursive = T) + +#library +if (!require("BiocManager", quietly = TRUE)) + install.packages("BiocManager") + +if (!require("snpStats", quietly = TRUE)) + BiocManager::install("snpStats") + +#if (!require("doParallel", quietly = TRUE)) + # BiocManager::install("doParallel") + +library(snpStats) +library(plyr) +library(GenABEL) +#library(doParallel) + +rdata_path = file.path(output_dir,"TP3_asbvg.RData") +save.image(rdata_path) + diff --git a/src/tp4.R b/src/tp4.R new file mode 100644 index 0000000..8934080 --- /dev/null +++ b/src/tp4.R @@ -0,0 +1,20 @@ +#load data +load("results/tp3/TP3_asbvg.RData") + +#fichier de sortie +output_dir = "results/tp4" +dir.create(output_dir, showWarnings = F, recursive = T) + +#Library +if(!require("dplyr",quietly = T)) + install.packages("dplyr") + +if(!require("plyr",quietly = T)) + install.packages("plyr") + +if(!require("GenABEL",quietly = T)) + install.packages("GenABEL") + +rdata_path = file.path(output_dir,"TP4_asbvg.RData") +save.image(rdata_path) + -- GitLab