Commit 498d25a3e5245d2cbaa767c0d74807a65fd4c521

Authored by Efrain Gonzalez
1 parent 2bf073a859
Exists in master

For matching genes between two consolidated data files (UNTESTED)

Showing 1 changed file with 62 additions and 0 deletions   Show diff stats
... ... @@ -0,0 +1,62 @@
  1 +#Match the genes (rows) shared by two data sets and write the matched subset of each
  2 +
  3 +#Required libraries
  4 +library(MASS)
  5 +library(readr)
  6 +library(dplyr)
  7 +
  8 +Check2Match <- function(){
  9 +#Bring in the two files
  10 +##Number of rows with clinical data for first file
  11 +numrow1 <- "How many rows of clinical data are their in the first data set?: " %>%
  12 + readline(prompt = .) %>%
  13 + as.integer(.)
  14 +
  15 +##Number of rows with clinical data for second file
  16 +numrow2 <- "How many rows of clinical data are their in the second data set?: " %>%
  17 + readline(prompt = .) %>%
  18 + as.integer(.)
  19 +
  20 +edfile <- file.choose()
  21 +ed <- edfile %>%
  22 + read_delim(.,delim = "\t")
  23 +
  24 +ednocd <- ed[-(1:numrow1),]
  25 +eddfile <- file.choose()
  26 +edd <- eddfile %>%
  27 + read_delim(.,delim = "\t")
  28 +
  29 +eddnocd <- edd[-(1:numrow2),]
  30 +
  31 +##Number of columns that belong to the first data file
  32 +numbcol1 <- dim(ednocd)[2]
  33 +##Number of columns that belong to the second data file
  34 +numbcol2 <- dim(eddnocd)[2]
  35 +
  36 +##Fully matched both data sets
  37 +eddy <- inner_join(ednocd,eddnocd)
  38 +#Matched ed
  39 +eddy[,1:numbcol1]
  40 +Finedm <- rbind(ed[1:numrow1,],eddy[,1:numbcol1])
  41 +nam_fil_ed <- strsplit(edfile,"[\\|/]") %>%
  42 + .[[1]] %>%
  43 + .[length(.)] %>%
  44 + gsub("\\D","",.) %>%
  45 + c("GSE",.,"matched.txt") %>%
  46 + paste(collapse = "")
  47 +write.table(Finedm,file = nam_fil_ed,sep = "\t",row.names = FALSE)
  48 +#Matched edd
  49 +eddy[,(numbcol1 + 1):dim(eddy)[2]]
  50 +fineddm <- cbind(eddy[,1],eddy[,(numbcol1 + 1):dim(eddy)[2]])
  51 +Fineddm <- rbind(edd[1:numrow2,],fineddm)
  52 +nam_fil_edd <- strsplit(eddfile,"[\\|/]") %>%
  53 + .[[1]] %>%
  54 + .[length(.)] %>%
  55 + gsub("\\D","",.) %>%
  56 + c("GSE",.,"matched.txt") %>%
  57 + paste(collapse = "")
  58 +write.table(Fineddm,file = nam_fil_edd,sep = "\t",row.names = FALSE)
  59 +
  60 +}
  61 +
  62 +Check2Match()