Commit 679b62805671e900eb8f790c2866f091b576180d
1 parent
6b8f81e7b3
Exists in
master
completed code for path finding (TESTING)
Showing
1 changed file
with
44 additions
and
12 deletions
 
Show diff stats
RMarkovBlanket.r
| 1 | #Efrain Gonzalez | 1 | #Efrain Gonzalez | 
| 2 | #8/28/2017 | 2 | #8/25/2017 | 
| 3 | #Code for Markov Blanket | 3 | #Code for Markov Blanket | 
| 4 | 4 | ||
| 5 | 5 | ||
| 6 | #The required libraries | 6 | #The required libraries | 
| 7 | library(pryr) | 7 | library(pryr) | 
| 8 | library(MASS) | 8 | library(MASS) | 
| 9 | library(dplyr) | 9 | library(dplyr) | 
| 10 | library(tidyr) | 10 | library(tidyr) | 
| 11 | library(readr) | 11 | library(readr) | 
| 12 | library(stringr) | 12 | library(stringr) | 
| 13 | 13 | ||
| 14 | 14 | ||
| 15 | #Have the user choose an original Dot file that they want to use | 15 | #Have the user choose an original Dot file that they want to use | 
| 16 | DotFile <- file.choose() | 16 | DotFile <- file.choose() | 
| 17 | TheDotP1 <- read_delim(DotFile,delim = "\t",col_names = FALSE) %>% | 17 | TheDotP1 <- read_delim(DotFile,delim = "\t",col_names = FALSE) %>% | 
| 18 | dplyr::filter(!grepl("->|[{}]",X1)) %>% | 18 | dplyr::filter(!grepl("->|[{}]",X1)) %>% | 
| 19 | dplyr::filter(!grepl("Banjo",X1)) %>% | 19 | dplyr::filter(!grepl("Banjo",X1)) %>% | 
| 20 | dplyr::filter(!grepl("labeljust",X1)) | 20 | dplyr::filter(!grepl("labeljust",X1)) | 
| 21 | counterP1 <- 1 | 21 | counterP1 <- 1 | 
| 22 | sizeDotP1 <- dim(TheDotP1)[1] | 22 | sizeDotP1 <- dim(TheDotP1)[1] | 
| 23 | NewDotP1 <- matrix("0",ncol = 2, nrow = sizeDotP1) | 23 | NewDotP1 <- matrix("0",ncol = 2, nrow = sizeDotP1) | 
| 24 | for(counterP1 in 1:sizeDotP1){ | 24 | for(counterP1 in 1:sizeDotP1){ | 
| 25 | coldataP1 <- str_trim(TheDotP1[counterP1,1]) %>% | 25 | coldataP1 <- str_trim(TheDotP1[counterP1,1]) %>% | 
| 26 | as.character(.,stringsAsFactors = FALSE) | 26 | as.character(.,stringsAsFactors = FALSE) | 
| 27 | if(grepl("Banjo|labeljust|>",coldataP1)==FALSE){ | 27 | if(grepl("Banjo|labeljust|>",coldataP1)==FALSE){ | 
| 28 | NumberP1 <- strsplit(coldataP1," ") %>% | 28 | NumberP1 <- strsplit(coldataP1," ") %>% | 
| 29 | .[[1]]%>% | 29 | .[[1]]%>% | 
| 30 | .[1] | 30 | .[1] | 
| 31 | VarNameP1 <- strsplit(coldataP1," ") %>% | 31 | VarNameP1 <- strsplit(coldataP1," ") %>% | 
| 32 | .[[1]] %>% | 32 | .[[1]] %>% | 
| 33 | .[2] %>% | 33 | .[2] %>% | 
| 34 | strsplit(.,"\"") %>% | 34 | strsplit(.,"\"") %>% | 
| 35 | .[[1]] %>% | 35 | .[[1]] %>% | 
| 36 | .[grep("^\\w|^\\d",.)] | 36 | .[grep("^\\w|^\\d",.)] | 
| 37 | NewDotP1[counterP1,1] <- VarNameP1 | 37 | NewDotP1[counterP1,1] <- VarNameP1 | 
| 38 | NewDotP1[counterP1,2] <- NumberP1 | 38 | NewDotP1[counterP1,2] <- NumberP1 | 
| 39 | } | 39 | } | 
| 40 | if(grepl("->",coldataP1) == TRUE){ | 40 | if(grepl("->",coldataP1) == TRUE){ | 
| 41 | break | 41 | break | 
| 42 | } | 42 | } | 
| 43 | } | 43 | } | 
| 44 | 44 | ||
| 45 | 45 | ||
| 46 | TheDotP2 <- read_delim(DotFile,delim = "\t",col_names = FALSE) %>% | 46 | TheDotP2 <- read_delim(DotFile,delim = "\t",col_names = FALSE) %>% | 
| 47 | dplyr::filter(grepl("->",X1)) | 47 | dplyr::filter(grepl("->",X1)) | 
| 48 | counterP2 <- 1 | 48 | counterP2 <- 1 | 
| 49 | sizeDotP2 <- dim(TheDotP2)[1] | 49 | sizeDotP2 <- dim(TheDotP2)[1] | 
| 50 | NewDotP2 <- matrix("0",ncol = 2, nrow = sizeDotP2) | 50 | NewDotP2 <- matrix("0",ncol = 2, nrow = sizeDotP2) | 
| 51 | for(counterP2 in 1:sizeDotP2){ | 51 | for(counterP2 in 1:sizeDotP2){ | 
| 52 | coldataP2 <- str_trim(TheDotP2[counterP2,1]) %>% | 52 | coldataP2 <- str_trim(TheDotP2[counterP2,1]) %>% | 
| 53 | as.character(.,stringsAsFactors = FALSE) | 53 | as.character(.,stringsAsFactors = FALSE) | 
| 54 | ParentNumP2 <- strsplit(coldataP2,"->") %>% | 54 | ParentNumP2 <- strsplit(coldataP2,"->") %>% | 
| 55 | .[[1]]%>% | 55 | .[[1]]%>% | 
| 56 | .[1] | 56 | .[1] | 
| 57 | ChildNumP2 <- strsplit(coldataP2,"->") %>% | 57 | ChildNumP2 <- strsplit(coldataP2,"->") %>% | 
| 58 | .[[1]] %>% | 58 | .[[1]] %>% | 
| 59 | .[2] %>% | 59 | .[2] %>% | 
| 60 | strsplit(.,";") %>% | 60 | strsplit(.,";") %>% | 
| 61 | .[[1]] %>% | 61 | .[[1]] %>% | 
| 62 | .[1] | 62 | .[1] | 
| 63 | NewDotP2[counterP2,1] <- ParentNumP2 | 63 | NewDotP2[counterP2,1] <- ParentNumP2 | 
| 64 | NewDotP2[counterP2,2] <- ChildNumP2 | 64 | NewDotP2[counterP2,2] <- ChildNumP2 | 
| 65 | } | 65 | } | 
| 66 | 66 | ||
| 67 | colnames(NewDotP2) <- c("Parents","Children") | 67 | colnames(NewDotP2) <- c("Parents","Children") | 
| 68 | 68 | ||
| 69 | #Matching numbers to variable names | 69 | #Matching numbers to variable names | 
| 70 | NewDotP2_2 <- NewDotP2 | 70 | NewDotP2_2 <- NewDotP2 | 
| 71 | for(i in 1:sizeDotP1){ | 71 | for(i in 1:sizeDotP1){ | 
| 72 | #Where is the variable located within NewDotP2 (column one only)? | 72 | #Where is the variable located within NewDotP2 (column one only)? | 
| 73 | chngreq <- grep(paste0("^",NewDotP1[i,2],"$"),NewDotP2_2[,1]) | 73 | chngreq <- grep(paste0("^",NewDotP1[i,2],"$"),NewDotP2_2[,1]) | 
| 74 | if(is.na(sum(chngreq)) == FALSE){ | 74 | if(is.na(sum(chngreq)) == FALSE){ | 
| 75 | if(sum(chngreq) > 0){ | 75 | if(sum(chngreq) > 0){ | 
| 76 | NewDotP2_2[chngreq,1] <- gsub(paste0("^",NewDotP1[i,2],"$"),NewDotP1[i,1],NewDotP2_2[chngreq,1]) | 76 | NewDotP2_2[chngreq,1] <- gsub(paste0("^",NewDotP1[i,2],"$"),NewDotP1[i,1],NewDotP2_2[chngreq,1]) | 
| 77 | } | 77 | } | 
| 78 | } | 78 | } | 
| 79 | #i <- i + 1 | 79 | #i <- i + 1 | 
| 80 | } | 80 | } | 
| 81 | NewDotP2_2 | 81 | NewDotP2_2 | 
| 82 | for(j in 1:sizeDotP1){ | 82 | for(j in 1:sizeDotP1){ | 
| 83 | #Where is the variable located within NewDotP2 (column two only)? | 83 | #Where is the variable located within NewDotP2 (column two only)? | 
| 84 | chngreq <- grep(paste0("^",NewDotP1[j,2],"$"),NewDotP2_2[,2]) | 84 | chngreq <- grep(paste0("^",NewDotP1[j,2],"$"),NewDotP2_2[,2]) | 
| 85 | if(is.na(sum(chngreq)) == FALSE){ | 85 | if(is.na(sum(chngreq)) == FALSE){ | 
| 86 | if(sum(chngreq) > 0){ | 86 | if(sum(chngreq) > 0){ | 
| 87 | NewDotP2_2[chngreq,2] <- gsub(paste0("^",NewDotP1[j,2],"$"),NewDotP1[j,1],NewDotP2_2[chngreq,2]) | 87 | NewDotP2_2[chngreq,2] <- gsub(paste0("^",NewDotP1[j,2],"$"),NewDotP1[j,1],NewDotP2_2[chngreq,2]) | 
| 88 | } | 88 | } | 
| 89 | } | 89 | } | 
| 90 | #j <- j + 1 | 90 | #j <- j + 1 | 
| 91 | } | 91 | } | 
| 92 | 92 | ||
| 93 | lrgMarkov <- dim(NewDotP2_2)[1] | 93 | lrgMarkov <- dim(NewDotP2_2)[1] | 
| 94 | Blanky <- function(MarkovDegree = 20, VariableStartName = "Alzheimer", VariableEndName = "GRIN2A"){ | 94 | Blanky <- function(MarkovDegree = 20, VariableStartName = "Alzheimer", VariableEndName = "GRIN2A"){ | 
| 95 | #Finding the Parents and Children | 95 | #Finding the Parents and Children | 
| 96 | d <- 1 | 96 | d <- 1 | 
| 97 | AllNamList1 <- vector("list",length = 3) | 97 | AllNamList1 <- vector("list",length = 3) | 
| 98 | #AllNamList <- vector("list", length = 3) | 98 | #AllNamList <- vector("list", length = 3) | 
| 99 | ##Finding the Parents of the Parents | 99 | ##Finding the Parents of the Parents | 
| 100 | ##A list of lists | 100 | ##A list of lists | 
| 101 | ##outer set by the degree of the Markov blanket | 101 | ##outer set by the degree of the Markov blanket | 
| 102 | AllVarList <- vector("list",length = 3) | 102 | AllVarList <- vector("list",length = 3) | 
| 103 | varfound <- 0 | 103 | varfound <- 0 | 
| 104 | for(d in 1:MarkovDegree){ | 104 | for(d in 1:MarkovDegree){ | 
| 105 | colnames(NewDotP2_2) <- NULL | 105 | colnames(NewDotP2_2) <- NULL | 
| 106 | ##Which variable are you looking for? | 106 | ##Which variable are you looking for? | 
| 107 | ##This is the VariableEndName | 107 | ##This is the VariableEndName | 
| 108 | if(d == 1){ | 108 | if(d == 1){ | 
| 109 | ##Finding the Parents for the variable | 109 | ##Finding the Parents for the variable | 
| 110 | LocPofVar <- grep(paste0("^",VariableStartName,"$"),NewDotP2_2[,2]) | 110 | LocPofVar <- grep(paste0("^",VariableStartName,"$"),NewDotP2_2[,2]) | 
| 111 | PofVar <- NewDotP2_2[LocPofVar,1] | 111 | PofVar <- NewDotP2_2[LocPofVar,1] | 
| 112 | AllNamList1[[1]] <- PofVar | 112 | AllNamList1[[1]] <- PofVar | 
| 113 | AllNamList1[[1]] <- AllNamList1[[1]][!duplicated(AllNamList1[[1]])] | 113 | AllNamList1[[1]] <- AllNamList1[[1]][!duplicated(AllNamList1[[1]])] | 
| 114 | varfound <- varfound + sum(grepl(paste0("^",VariableEndName,"$"),AllNamList1[[1]])) | 114 | varfound <- varfound + sum(grepl(paste0("^",VariableEndName,"$"),AllNamList1[[1]])) | 
| 115 | 115 | ||
| 116 | ##Finding the Children for the variable | 116 | ##Finding the Children for the variable | 
| 117 | LocCofVar <- grep(paste0("^",VariableStartName,"$"),NewDotP2_2[,1]) | 117 | LocCofVar <- grep(paste0("^",VariableStartName,"$"),NewDotP2_2[,1]) | 
| 118 | CofVar <- NewDotP2_2[LocCofVar,2] | 118 | CofVar <- NewDotP2_2[LocCofVar,2] | 
| 119 | AllNamList1[[2]] <- CofVar | 119 | AllNamList1[[2]] <- CofVar | 
| 120 | AllNamList1[[2]] <- AllNamList1[[2]][!duplicated(AllNamList1[[2]])] | 120 | AllNamList1[[2]] <- AllNamList1[[2]][!duplicated(AllNamList1[[2]])] | 
| 121 | varfound <- varfound + sum(grepl(paste0("^",VariableEndName,"$"),AllNamList1[[2]])) | 121 | varfound <- varfound + sum(grepl(paste0("^",VariableEndName,"$"),AllNamList1[[2]])) | 
| 122 | 122 | ||
| 123 | ##Finding the Co-Parents of the Children for the variable | 123 | ##Finding the Co-Parents of the Children for the variable | 
| 124 | NumofChild <- length(CofVar) | 124 | NumofChild <- length(CofVar) | 
| 125 | if(NumofChild > 0){ | 125 | if(NumofChild > 0){ | 
| 126 | ##Creating a list of the Co-Parents for each of the children | 126 | ##Creating a list of the Co-Parents for each of the children | 
| 127 | ##list size is based on the amount of Children | 127 | ##list size is based on the amount of Children | 
| 128 | COPlist <- vector("character", length = 0) | 128 | COPlist <- vector("character", length = 0) | 
| 129 | nc <- 1 | 129 | nc <- 1 | 
| 130 | for(nc in 1:NumofChild){ | 130 | for(nc in 1:NumofChild){ | 
| 131 | LocCOPofVar <- grep(paste0("^",CofVar[nc],"$"),NewDotP2_2[,2]) | 131 | LocCOPofVar <- grep(paste0("^",CofVar[nc],"$"),NewDotP2_2[,2]) | 
| 132 | COPofVar <- NewDotP2_2[LocCOPofVar,1] | 132 | COPofVar <- NewDotP2_2[LocCOPofVar,1] | 
| 133 | if(sum(grepl(VariableStartName,COPofVar)) >= 1){ | 133 | if(sum(grepl(VariableStartName,COPofVar)) >= 1){ | 
| 134 | #positions of variable start name within the vector of co parents | 134 | #positions of variable start name within the vector of co parents | 
| 135 | posoforig <- grep(paste0("^",VariableStartName,"$"),COPofVar) | 135 | posoforig <- grep(paste0("^",VariableStartName,"$"),COPofVar) | 
| 136 | COPofVar <- COPofVar[-posoforig] | 136 | COPofVar <- COPofVar[-posoforig] | 
| 137 | COPlist <- append(COPlist,COPofVar) | 137 | COPlist <- append(COPlist,COPofVar) | 
| 138 | } else{ | 138 | } else{ | 
| 139 | #COPlist[[nc]] <- COPofVar[COPofVar!=VariableStartName] | 139 | #COPlist[[nc]] <- COPofVar[COPofVar!=VariableStartName] | 
| 140 | COPlist <- append(COPlist,COPofVar) | 140 | COPlist <- append(COPlist,COPofVar) | 
| 141 | } | 141 | } | 
| 142 | #nc <- nc + 1 | 142 | #nc <- nc + 1 | 
| 143 | } | 143 | } | 
| 144 | } else { | 144 | } else { | 
| 145 | ##Making COPlist empty | 145 | ##Making COPlist empty | 
| 146 | COPlist <- vector("character",length = 0) | 146 | COPlist <- vector("character",length = 0) | 
| 147 | } | 147 | } | 
| 148 | AllNamList1[[3]] <- COPlist | 148 | AllNamList1[[3]] <- COPlist | 
| 149 | AllNamList1[[3]] <- AllNamList1[[3]][!duplicated(AllNamList1[[3]])] | 149 | AllNamList1[[3]] <- AllNamList1[[3]][!duplicated(AllNamList1[[3]])] | 
| 150 | varfound <- varfound + sum(grepl(paste0("^",VariableEndName,"$"),AllNamList1[[3]])) | 150 | varfound <- varfound + sum(grepl(paste0("^",VariableEndName,"$"),AllNamList1[[3]])) | 
| 151 | 151 | ||
| 152 | AllVarList[[1]] <- AllNamList1 | 152 | AllVarList[[1]] <- AllNamList1 | 
| 153 | 153 | ||
| 154 | } else if(d > 1){ | 154 | } else if(d > 1){ | 
| 155 | ##inner set by the length of the previous AllVarlist we are working on | 155 | ##inner set by the length of the previous AllVarlist we are working on | 
| 156 | lPreVList <- length(AllVarList[[d-1]]) | 156 | lPreVList <- length(AllVarList[[d-1]]) | 
| 157 | ef <- 1 | 157 | ef <- 1 | 
| 158 | ##PCCP will eventually equal the total size that we expect for the iteration (#d) | 158 | ##PCCP will eventually equal the total size that we expect for the iteration (#d) | 
| 159 | ## which is just lPreVList * 3 | 159 | ## which is just lPreVList * 3 | 
| 160 | PCCP <- 1 | 160 | PCCP <- 1 | 
| 161 | newsize <- (lPreVList * 3) | 161 | newsize <- (lPreVList * 3) | 
| 162 | if(d > 3){ | 162 | if(d > 3){ | 
| 163 | AllVarList[[d]] <- vector("list") | 163 | AllVarList[[d]] <- vector("list") | 
| 164 | } | 164 | } | 
| 165 | for(ef in 1:lPreVList){ | 165 | for(ef in 1:lPreVList){ | 
| 166 | ##Finding the Parents | 166 | ##Finding the Parents | 
| 167 | NumofVars <- length(AllVarList[[d-1]][[ef]]) | 167 | NumofVars <- length(AllVarList[[d-1]][[ef]]) | 
| 168 | if(NumofVars > 0){ | 168 | if(NumofVars > 0){ | 
| 169 | ##Creating a list of the Parents for each of the Variables | 169 | ##Creating a list of the Parents for each of the Variables | 
| 170 | ##list size is based on the amount of Previous Variables | 170 | ##list size is based on the amount of Previous Variables | 
| 171 | PofVlist <- vector("character", length = 0) | 171 | PofVlist <- vector("character", length = 0) | 
| 172 | np <- 1 | 172 | np <- 1 | 
| 173 | for(np in 1:NumofVars){ | 173 | for(np in 1:NumofVars){ | 
| 174 | LocPofVar <- grep(paste0("^",AllVarList[[d-1]][[ef]][np],"$"),NewDotP2_2[,2]) | 174 | LocPofVar <- grep(paste0("^",AllVarList[[d-1]][[ef]][np],"$"),NewDotP2_2[,2]) | 
| 175 | PofVar <- NewDotP2_2[LocPofVar,1] | 175 | PofVar <- NewDotP2_2[LocPofVar,1] | 
| 176 | PofVlist <- append(PofVlist,PofVar) | 176 | PofVlist <- append(PofVlist,PofVar) | 
| 177 | #np <- np + 1 | 177 | #np <- np + 1 | 
| 178 | } | 178 | } | 
| 179 | } else { | 179 | } else { | 
| 180 | ##Making PofVlist empty | 180 | ##Making PofVlist empty | 
| 181 | PofVlist <- vector("character",length = 0) | 181 | PofVlist <- vector("character",length = 0) | 
| 182 | } | 182 | } | 
| 183 | AllVarList[[d]][[PCCP]] <- PofVlist | 183 | AllVarList[[d]][[PCCP]] <- PofVlist | 
| 184 | AllVarList[[d]][[PCCP]] <- AllVarList[[d]][[PCCP]][!duplicated(AllVarList[[d]][[PCCP]])] | 184 | AllVarList[[d]][[PCCP]] <- AllVarList[[d]][[PCCP]][!duplicated(AllVarList[[d]][[PCCP]])] | 
| 185 | ##Have you found the VariableEndName? | 185 | ##Have you found the VariableEndName? | 
| 186 | varfound <- varfound + sum(grepl(paste0("^",VariableEndName,"$"),AllVarList[[d]][[PCCP]])) | 186 | varfound <- varfound + sum(grepl(paste0("^",VariableEndName,"$"),AllVarList[[d]][[PCCP]])) | 
| 187 | PCCP <- PCCP + 1 | 187 | PCCP <- PCCP + 1 | 
| 188 | 188 | ||
| 189 | ##Finding the Children | 189 | ##Finding the Children | 
| 190 | if(NumofVars > 0){ | 190 | if(NumofVars > 0){ | 
| 191 | ##Creating a list of the Children for each of the Previous Parents | 191 | ##Creating a list of the Children for each of the Previous Parents | 
| 192 | ##list size is based on the amount of Previous Parents | 192 | ##list size is based on the amount of Previous Parents | 
| 193 | CofVlist <- vector("character", length = 0) | 193 | CofVlist <- vector("character", length = 0) | 
| 194 | np <- 1 | 194 | np <- 1 | 
| 195 | for(np in 1:NumofVars){ | 195 | for(np in 1:NumofVars){ | 
| 196 | LocCofVar <- grep(paste0("^",AllVarList[[d-1]][[ef]][np],"$"),NewDotP2_2[,1]) | 196 | LocCofVar <- grep(paste0("^",AllVarList[[d-1]][[ef]][np],"$"),NewDotP2_2[,1]) | 
| 197 | CofVar <- NewDotP2_2[LocCofVar,2] | 197 | CofVar <- NewDotP2_2[LocCofVar,2] | 
| 198 | #if(sum(grepl(VariableStartName,CofVar)) >= 1){ | 198 | #if(sum(grepl(VariableStartName,CofVar)) >= 1){ | 
| 199 | # #positions of variable start name within the vector of co parents | 199 | # #positions of variable start name within the vector of co parents | 
| 200 | # posoforig <- grep(VariableStartName,COPofVar) | 200 | # posoforig <- grep(VariableStartName,COPofVar) | 
| 201 | # COPofVar <- COPofVar[-posoforig] | 201 | # COPofVar <- COPofVar[-posoforig] | 
| 202 | # COPlist <- append(COPlist,COPofVar) | 202 | # COPlist <- append(COPlist,COPofVar) | 
| 203 | #} else{ | 203 | #} else{ | 
| 204 | CofVlist <- append(CofVlist,CofVar) | 204 | CofVlist <- append(CofVlist,CofVar) | 
| 205 | #} | 205 | #} | 
| 206 | #np <- np + 1 | 206 | #np <- np + 1 | 
| 207 | } | 207 | } | 
| 208 | } else { | 208 | } else { | 
| 209 | ##Making CofVlist empty | 209 | ##Making CofVlist empty | 
| 210 | CofVlist <- vector("character",length = 0) | 210 | CofVlist <- vector("character",length = 0) | 
| 211 | } | 211 | } | 
| 212 | AllVarList[[d]][[PCCP]] <- CofVlist | 212 | AllVarList[[d]][[PCCP]] <- CofVlist | 
| 213 | AllVarList[[d]][[PCCP]] <- AllVarList[[d]][[PCCP]][!duplicated(AllVarList[[d]][[PCCP]])] | 213 | AllVarList[[d]][[PCCP]] <- AllVarList[[d]][[PCCP]][!duplicated(AllVarList[[d]][[PCCP]])] | 
| 214 | ##Have you found the VariableEndName yet? | 214 | ##Have you found the VariableEndName yet? | 
| 215 | varfound <- varfound + sum(grepl(paste0("^",VariableEndName,"$"),AllVarList[[d]][[PCCP]])) | 215 | varfound <- varfound + sum(grepl(paste0("^",VariableEndName,"$"),AllVarList[[d]][[PCCP]])) | 
| 216 | PCCP <- PCCP + 1 | 216 | PCCP <- PCCP + 1 | 
| 217 | 217 | ||
| 218 | ##Finding the Co-Parents | 218 | ##Finding the Co-Parents | 
| 219 | NumofCVars <- length(CofVlist) | 219 | NumofCVars <- length(CofVlist) | 
| 220 | if(NumofCVars > 0){ | 220 | if(NumofCVars > 0){ | 
| 221 | ncp <- 1 | 221 | ncp <- 1 | 
| 222 | CPofClist <- vector("character",length = 0) | 222 | CPofClist <- vector("character",length = 0) | 
| 223 | for(ncp in 1:NumofCVars){ | 223 | for(ncp in 1:NumofCVars){ | 
| 224 | LocCPofCVar <- grep(paste0("^",CofVlist[ncp],"$"),NewDotP2_2[,2]) | 224 | LocCPofCVar <- grep(paste0("^",CofVlist[ncp],"$"),NewDotP2_2[,2]) | 
| 225 | CPofCVar <- NewDotP2_2[LocCPofCVar,1] | 225 | CPofCVar <- NewDotP2_2[LocCPofCVar,1] | 
| 226 | #if(sum(grepl(,CPofCVar)) >= 1){ | 226 | #if(sum(grepl(,CPofCVar)) >= 1){ | 
| 227 | # #positions of variable start name within the vector of co parents | 227 | # #positions of variable start name within the vector of co parents | 
| 228 | # posoforig <- grep(VariableStartName,COPofVar) | 228 | # posoforig <- grep(VariableStartName,COPofVar) | 
| 229 | # COPofVar <- COPofVar[-posoforig] | 229 | # COPofVar <- COPofVar[-posoforig] | 
| 230 | # COPlist <- append(COPlist,COPofVar) | 230 | # COPlist <- append(COPlist,COPofVar) | 
| 231 | #} else{ | 231 | #} else{ | 
| 232 | CPofClist <- append(CPofClist,CPofCVar) | 232 | CPofClist <- append(CPofClist,CPofCVar) | 
| 233 | #} | 233 | #} | 
| 234 | #ncp <- ncp + 1 | 234 | #ncp <- ncp + 1 | 
| 235 | } | 235 | } | 
| 236 | 236 | ||
| 237 | } else { | 237 | } else { | 
| 238 | ##Making CPofClist empty | 238 | ##Making CPofClist empty | 
| 239 | CPofClist <- vector("character",length = 0) | 239 | CPofClist <- vector("character",length = 0) | 
| 240 | } | 240 | } | 
| 241 | AllVarList[[d]][[PCCP]] <- CPofClist | 241 | AllVarList[[d]][[PCCP]] <- CPofClist | 
| 242 | AllVarList[[d]][[PCCP]] <- AllVarList[[d]][[PCCP]][!duplicated(AllVarList[[d]][[PCCP]])] | 242 | AllVarList[[d]][[PCCP]] <- AllVarList[[d]][[PCCP]][!duplicated(AllVarList[[d]][[PCCP]])] | 
| 243 | ##Have you found VariableEndName now? | 243 | ##Have you found VariableEndName now? | 
| 244 | varfound <- varfound + sum(grepl(paste0("^",VariableEndName,"$"),AllVarList[[d]][[PCCP]])) | 244 | varfound <- varfound + sum(grepl(paste0("^",VariableEndName,"$"),AllVarList[[d]][[PCCP]])) | 
| 245 | PCCP <- PCCP + 1 | 245 | PCCP <- PCCP + 1 | 
| 246 | #ef <- ef + 1 | 246 | #ef <- ef + 1 | 
| 247 | } | 247 | } | 
| 248 | } | 248 | } | 
| 249 | 249 | ||
| 250 | ##Stop if you have found the VariableEndName value | 250 | ##Stop if you have found the VariableEndName value | 
| 251 | if(varfound > 0){ | 251 | if(varfound > 0){ | 
| 252 | break | 252 | break | 
| 253 | } | 253 | } | 
| 254 | #d <- d + 1 | 254 | #d <- d + 1 | 
| 255 | } | 255 | } | 
| 256 | ##The Markov Degree is that found below | 256 | ##The Markov Degree is that found below | 
| 257 | d | 257 | d | 
| 258 | } | 258 | } | 
| 259 | 259 | ||
| 260 | 260 | ||
| 261 | 261 | ||
| 262 | #############Methods for finding paths############# | 262 | #############Methods for finding paths############# | 
| 263 | ###Beyond Here Everything is still experimental### | 263 | ###Beyond Here Everything is still experimental### | 
| 264 | #Find the path to the variable in question | 264 | #Find the path to the variable in question | 
| 265 | RshipList <- vector("list",length = d) | 265 | RshipList <- vector("list",length = d) | 
| 266 | l = d | 266 | l = d | 
| 267 | for(l in d:1){ | 267 | for(l in d:1){ | 
| 268 | if(l == d){ | 268 | if(l == d){ | 
| 269 | RshipList[[l]] <- VariableEndName | 269 | RshipList[[l]] <- VariableEndName | 
| 270 | for(ship in 1:length(AllVarList[[d]])){ | 270 | for(ship in 1:length(AllVarList[[d]])){ | 
| 271 | if(sum(grepl(paste0("^",VariableEndName,"$"),AllVarList[[d]][[ship]])) > 0){ | 271 | if(sum(grepl(paste0("^",VariableEndName,"$"),AllVarList[[d]][[ship]])) > 0){ | 
| 272 | break | 272 | break | 
| 273 | } | 273 | } | 
| 274 | } | 274 | } | 
| 275 | 275 | ||
| 276 | } else { | 276 | } else { | 
| 277 | modship <- ship %% 3 | 277 | modship <- ship %% 3 | 
| 278 | intship <- as.integer(ship/3) | 278 | intship <- as.integer(ship/3) | 
| 279 | if(modship > 0){ | 279 | if(modship > 0){ | 
| 280 | intship <- intship + 1 | 280 | intship <- intship + 1 | 
| 281 | } | 281 | } | 
| 282 | RshipList[[l]] <- AllVarList[[l]][[intship]] | 282 | RshipList[[l]] <- AllVarList[[l]][[intship]] | 
| 283 | ship <- intship | 283 | ship <- intship | 
| 284 | } | 284 | } | 
| 285 | #l <- l - 1 | 285 | #l <- l - 1 | 
| 286 | } | 286 | } | 
| 287 | #Full actual path | 287 | #Full actual path | 
| 288 | k = d | 288 | k = d | 
| 289 | prevar <- VariableEndName | 289 | prevar <- VariableEndName | 
| 290 | Pathlisting <- vector("list",length = d) | 290 | Pathlisting <- vector("list",length = d) | 
| 291 | Pathlisting[[d]] <- prevar | 291 | Pathlisting[[d]] <- prevar | 
| 292 | for(k in d:1){ | 292 | for(k in d:2){ | 
| 293 | if(k == d){ | 293 | if(k == d){ | 
| 294 | for(ship in 1:length(AllVarList[[d]])){ | 294 | for(ship in 1:length(AllVarList[[d]])){ | 
| 295 | if(sum(grepl(paste0("^",VariableEndName,"$"),AllVarList[[d]][[ship]])) > 0){ | 295 | if(sum(grepl(paste0("^",VariableEndName,"$"),AllVarList[[d]][[ship]])) > 0){ | 
| 296 | break | 296 | break | 
| 297 | } | 297 | } | 
| 298 | } | 298 | } | 
| 299 | 299 | ||
| 300 | } | 300 | } | 
| 301 | modship <- ship %% 3 | 301 | modship <- ship %% 3 | 
| 302 | intship <- as.integer(ship/3) | 302 | intship <- as.integer(ship/3) | 
| 303 | if(modship > 0){ | 303 | if(modship > 0){ | 
| 304 | intship <- intship + 1 | 304 | intship <- intship + 1 | 
| 305 | } | 305 | } | 
| 306 | if(modship == 0){ | 306 | if(modship == 0){ | 
| 307 | ##When modship == 0 then we are referring to a CoParent | 307 | ##When modship == 0 then we are referring to a CoParent | 
| 308 | ##Gives how many children the full set of CoParents has | 308 | ##Gives how many children the full set of CoParents has | 
| 309 | lenCoP <- length(AllVarList[[k]][[(ship - 1)]]) | 309 | lenCoP <- length(AllVarList[[k]][[(ship - 1)]]) | 
| 310 | ##variables that are actually children of the coparent | 310 | ##variables that are actually children of the coparent | 
| 311 | actvar <- vector("character",length = 0) | 311 | actvar <- vector("character",length = 0) | 
| 312 | ##Parents of actvar | 312 | ##Parents of actvar | 
| 313 | Pactvar <- vector("character",length =0) | 313 | Pactvar <- vector("character",length =0) | 
| 314 | ##variables that could have led to the previous set of variables | 314 | ##variables that could have led to the previous set of variables | 
| 315 | Wanvar <- vector("character",length = 0) | 315 | Wanvar <- vector("character",length = 0) | 
| 316 | m <- 1 | 316 | m <- 1 | 
| 317 | for(m in 1:lenCoP){ | 317 | for(m in 1:lenCoP){ | 
| 318 | LCPoVar <- grep(paste0("^",AllVarList[[k]][[(ship - 1)]][m],"$"),NewDotP2_2[,2]) | 318 | LCPoVar <- grep(paste0("^",AllVarList[[k]][[(ship - 1)]][m],"$"),NewDotP2_2[,2]) | 
| 319 | CPoVar <- NewDotP2_2[LCPoVar,1] | 319 | CPoVar <- NewDotP2_2[LCPoVar,1] | 
| 320 | lenprevar <- length(prevar) | 320 | lenprevar <- length(prevar) | 
| 321 | y <- 1 | 321 | y <- 1 | 
| 322 | for(y in 1:lenprevar){ | 322 | for(y in 1:lenprevar){ | 
| 323 | 323 | ||
| 324 | if(sum(grepl(prevar[y],CPoVar)) >= 1){ | 324 | if(sum(grepl(prevar[y],CPoVar)) >= 1){ | 
| 325 | actvar <- append(actvar,AllVarList[[k]][[(ship - 1)]][m]) | 325 | actvar <- append(actvar,AllVarList[[k]][[(ship - 1)]][m]) | 
| 326 | Pactvar <- append(Pactvar,CPoVar) | 326 | Pactvar <- append(Pactvar,CPoVar) | 
| 327 | } | 327 | } | 
| 328 | #y <- y + 1 | 328 | #y <- y + 1 | 
| 329 | } | 329 | } | 
| 330 | #m <- m + 1 | 330 | #m <- m + 1 | 
| 331 | 331 | ||
| 332 | } | 332 | } | 
| 333 | Pactvar <- Pactvar[!duplicated(Pactvar)] | 333 | Pactvar <- Pactvar[!duplicated(Pactvar)] | 
| 334 | ##Searching to see if any of the parents are in the previous degree | 334 | ##Searching to see if any of the parents are in the previous degree | 
| 335 | ##The right children will have both the current variable and a previous degree's variable as parents | 335 | ##The right children will have both the current variable and a previous degree's variable as parents | 
| 336 | o <- 1 | 336 | o <- 1 | 
| 337 | for(o in 1:length(Pactvar)){ | 337 | for(o in 1:length(Pactvar)){ | 
| 338 | if(sum(grepl(Pactvar[o],AllVarList[[(k - 1)]][[intship]])) >= 1){ | 338 | if(sum(grepl(Pactvar[o],AllVarList[[(k - 1)]][[intship]])) >= 1){ | 
| 339 | Wanvar <- append(Wanvar,Pactvar[o]) | 339 | Wanvar <- append(Wanvar,Pactvar[o]) | 
| 340 | } | 340 | } | 
| 341 | #o <- o + 1 | 341 | #o <- o + 1 | 
| 342 | } | 342 | } | 
| 343 | Wanvar <- Wanvar[!duplicated(Wanvar)] | 343 | Wanvar <- Wanvar[!duplicated(Wanvar)] | 
| 344 | prevar <- Wanvar | 344 | prevar <- Wanvar | 
| 345 | 345 | ||
| 346 | } else if(modship == 1){ | 346 | } else if(modship == 1){ | 
| 347 | #When modship == 1 then we are referring to a Parent | 347 | #When modship == 1 then we are referring to a Parent | 
| 348 | LCofVar <- grep(paste0("^",prevar,"$"),NewDotP2_2[,1]) | 348 | lengprevar <- length(prevar) | 
| 349 | CoVar <- NewDotP2_2[LCofVar,1] | 349 | t <- 1 | 
| 350 | lenC <- length(CoVar) | 350 | ##All children of these parents | 
| 351 | for(o in 1:lenC){ | 351 | TCoVar <- vector("character",length = 0) | 
| 352 | if(grepl(CoVar[o],AllVarList[[k]][[intship]]) == TRUE){ | 352 | ##variables that could have led to these parents | 
| 353 | 353 | leadVar <- vector("character",length = 0) | |
| 354 | 354 | for(t in 1: lengprevar){ | |
| 355 | LCofVar <- grep(paste0("^",prevar[t],"$"),NewDotP2_2[,1]) | ||
| 356 | CoVar <- NewDotP2_2[LCofVar,2] | ||
| 357 | TCoVar <- append(TCoVar,CoVar) | ||
| 358 | } | ||
| 359 | TCoVar <- TCoVar[!duplicated(TCoVar)] | ||
| 360 | s <- 1 | ||
| 361 | ##Searching for the children that are also in the previous degree | ||
| 362 | for(s in 1:length(TCoVar)){ | ||
| 363 | if(sum(grepl(TCoVar[s],AllVarList[[(k - 1)]][[intship]])) >= 1){ | ||
| 364 | leadVar <- append(leadVar,TCoVar[s]) | ||
| 355 | } | 365 | } | 
| 356 | |||
| 357 | } | 366 | } | 
| 358 | 367 | leadVar <- leadVar[!duplicated(leadVar)] | |
| 368 | prevar <- leadVar | ||
| 359 | 369 | ||
| 360 | } else if(modship == 2){ | 370 | } else if(modship == 2){ | 
| 361 | #When modship == 0 then we are referring to a Child | 371 | #When modship == 2 then we are referring to a Child | 
| 372 | lenprevar <- length(prevar) | ||
| 373 | x <- 1 | ||
| 374 | ##All parents of these children | ||
| 375 | TPoVar <- vector("character",length = 0) | ||
| 376 | ##variables that could have led to these children based on the previous degree | ||
| 377 | drctVar <- vector("character",length = 0) | ||
| 378 | for(x in 1:lenprevar){ | ||
| 379 | LPoVar <- grep(paste0("^",prevar[x],"$"),NewDotP2_2[,2]) | ||
| 380 | PoVar <- NewDotP2_2[LPoVar,1] | ||
| 381 | TPoVar <- append(TPoVar,PoVar) | ||
| 382 | } | ||
| 383 | TPoVar <- TPoVar[!duplicated(TPoVar)] | ||
| 384 | y <- 1 | ||
| 385 | ##Searching for the parents that are also in the previous degree | ||
| 386 | for(y in 1:length(TPoVar)){ | ||
| 387 | if(sum(grepl(TPoVar[y],AllVarList[[(k - 1)]][[intship]])) >= 1){ | ||
| 388 | drctVar <- append(drctVar,TPoVar[y]) | ||
| 389 | } | ||
| 390 | } | ||
| 391 | drctVar <- drctVar[!duplicated(drctVar)] | ||
| 392 | prevar <- drctVar | ||
| 393 | |||
| 362 | 394 | ||
| 363 | } | 395 | } | 
| 364 | 396 | ||
| 365 | ship <- intship | 397 | ship <- intship | 
| 366 | 398 | ||
| 367 | Pathlisting[[(k - 1)]] <- prevar | 399 | Pathlisting[[(k - 1)]] <- prevar | 
| 368 | } | 400 | } |