| 
									
										
										
										
											2021-10-19 13:39:55 +02:00
										 |  |  | #' Rank the results by computing a score. | 
					
						
							|  |  |  | #' | 
					
						
							| 
									
										
										
										
											2021-11-05 14:47:33 +01:00
										 |  |  | #' This function takes the result of [analyze()] and creates a score by | 
					
						
							| 
									
										
										
										
											2021-10-19 13:39:55 +02:00
										 |  |  | #' computing a weighted mean across the different methods' results. | 
					
						
							|  |  |  | #' | 
					
						
							| 
									
										
										
										
											2021-11-05 14:47:33 +01:00
										 |  |  | #' @param analysis Analysis object resulting from [analyze()]. | 
					
						
							|  |  |  | #' @param weights Named list pairing method names with weighting factors. Only | 
					
						
							|  |  |  | #'   methods that are contained within this list will be included. | 
					
						
							| 
									
										
										
										
											2021-10-19 13:39:55 +02:00
										 |  |  | #' | 
					
						
							| 
									
										
										
										
											2021-11-05 14:47:33 +01:00
										 |  |  | #' @returns A ranking object. The object extends the analysis with additional | 
					
						
							|  |  |  | #'   columns containing the `score` and the `rank` of each gene. It will be | 
					
						
							|  |  |  | #'   ordered by rank. | 
					
						
							| 
									
										
										
										
											2021-10-19 13:39:55 +02:00
										 |  |  | #' | 
					
						
							|  |  |  | #' @export | 
					
						
							| 
									
										
										
										
											2021-11-05 14:47:33 +01:00
										 |  |  | ranking <- function(analysis, weights) { | 
					
						
							|  |  |  |     if (!"geposan_analysis" %chin% class(analysis)) { | 
					
						
							|  |  |  |         stop("Invalid analyis. Use geposan::analyze().") | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     ranking <- copy(analysis) | 
					
						
							|  |  |  |     ranking[, score := 0.0] | 
					
						
							| 
									
										
										
										
											2021-10-19 13:39:55 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  |     for (method in names(weights)) { | 
					
						
							| 
									
										
										
										
											2021-11-05 14:47:33 +01:00
										 |  |  |         weighted <- weights[[method]] * ranking[, ..method] | 
					
						
							|  |  |  |         ranking[, score := score + weighted] | 
					
						
							| 
									
										
										
										
											2021-10-19 13:39:55 +02:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     # Normalize scores to be between 0.0 and 1.0. | 
					
						
							| 
									
										
										
										
											2021-11-05 14:47:33 +01:00
										 |  |  |     ranking[, score := score / sum(unlist(weights))] | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     setorder(ranking, -score) | 
					
						
							|  |  |  |     ranking[, rank := .I] | 
					
						
							| 
									
										
										
										
											2021-10-19 13:39:55 +02:00
										 |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-11-05 14:47:33 +01:00
										 |  |  |     structure( | 
					
						
							|  |  |  |         ranking, | 
					
						
							|  |  |  |         class = c("geposan_ranking", "geposan_analysis", class(ranking)) | 
					
						
							|  |  |  |     ) | 
					
						
							| 
									
										
										
										
											2021-10-19 13:39:55 +02:00
										 |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-11-05 23:05:40 +01:00
										 |  |  | #' S3 method for plotting a ranking. | 
					
						
							|  |  |  | #' | 
					
						
							|  |  |  | #' @param gene_sets A list of gene sets (containing vectors of gene IDs) that | 
					
						
							|  |  |  | #'   will be highlighted in the plot. | 
					
						
							|  |  |  | #' @param labels Labels for the gene sets. | 
					
						
							|  |  |  | #' | 
					
						
							|  |  |  | #' @seealso ranking() | 
					
						
							|  |  |  | #' | 
					
						
							|  |  |  | #' @export | 
					
						
							|  |  |  | plot.geposan_ranking <- function(ranking, gene_sets = NULL, labels = NULL) { | 
					
						
							|  |  |  |     if (!requireNamespace("plotly", quietly = TRUE)) { | 
					
						
							|  |  |  |         stop("Please install \"plotly\" to use this function.") | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     plot <- plotly::plot_ly() |> | 
					
						
							|  |  |  |         plotly::add_trace( | 
					
						
							|  |  |  |             data = ranking, | 
					
						
							|  |  |  |             x = ~rank, | 
					
						
							|  |  |  |             y = ~score, | 
					
						
							|  |  |  |             color = "All genes", | 
					
						
							|  |  |  |             type = "scatter", | 
					
						
							|  |  |  |             mode = "markers", | 
					
						
							|  |  |  |             hoverinfo = "skip" | 
					
						
							|  |  |  |         ) |> | 
					
						
							|  |  |  |         plotly::layout( | 
					
						
							|  |  |  |             xaxis = list(title = "Rank"), | 
					
						
							|  |  |  |             yaxis = list(title = "Score") | 
					
						
							|  |  |  |         ) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     if (length(gene_sets) > 0) { | 
					
						
							|  |  |  |         # Take out the genes to be highlighted. | 
					
						
							|  |  |  |         gene_set_data <- ranking[gene %chin% unlist(gene_sets)] | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         # Add labels for each gene set. | 
					
						
							|  |  |  |         for (i in seq_along(gene_sets)) { | 
					
						
							|  |  |  |             gene_set_data[gene %chin% gene_sets[[i]], label := labels[i]] | 
					
						
							|  |  |  |         } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         # Include gene information which will be used for laebling | 
					
						
							|  |  |  |         gene_set_data <- merge(gene_set_data, genes, by.x = "gene", by.y = "id") | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         plot <- plot |> plotly::add_trace( | 
					
						
							|  |  |  |             data = gene_set_data, | 
					
						
							|  |  |  |             x = ~rank, | 
					
						
							|  |  |  |             y = ~score, | 
					
						
							|  |  |  |             color = ~label, | 
					
						
							|  |  |  |             text = ~name, | 
					
						
							|  |  |  |             type = "scatter", | 
					
						
							|  |  |  |             mode = "markers", | 
					
						
							|  |  |  |             marker = list(size = 20) | 
					
						
							|  |  |  |         ) | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     plot | 
					
						
							|  |  |  | } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-10-19 13:39:55 +02:00
										 |  |  | #' Find the best weights to rank the results. | 
					
						
							|  |  |  | #' | 
					
						
							|  |  |  | #' This function finds the optimal parameters to [ranking()] that result in the | 
					
						
							|  |  |  | #' reference genes ranking particulary high. | 
					
						
							|  |  |  | #' | 
					
						
							| 
									
										
										
										
											2021-11-05 14:47:33 +01:00
										 |  |  | #' @param analysis Results from [analyze()] or [ranking()]. | 
					
						
							| 
									
										
										
										
											2021-10-19 13:39:55 +02:00
										 |  |  | #' @param methods Methods to include in the score. | 
					
						
							|  |  |  | #' @param reference_gene_ids IDs of the reference genes. | 
					
						
							| 
									
										
										
										
											2021-10-21 11:42:44 +02:00
										 |  |  | #' @param target The optimization target. It may be one of "mean", "min" or | 
					
						
							|  |  |  | #'   "max" and results in the respective rank being optimized. | 
					
						
							| 
									
										
										
										
											2021-10-19 13:39:55 +02:00
										 |  |  | #' | 
					
						
							| 
									
										
										
										
											2021-11-05 14:47:33 +01:00
										 |  |  | #' @returns Named list pairing method names with their optimal weights. This | 
					
						
							|  |  |  | #'   can be used as an argument to [ranking()]. | 
					
						
							| 
									
										
										
										
											2021-10-19 13:39:55 +02:00
										 |  |  | #' | 
					
						
							|  |  |  | #' @export | 
					
						
							| 
									
										
										
										
											2021-11-05 14:47:33 +01:00
										 |  |  | optimal_weights <- function(analysis, methods, reference_gene_ids, | 
					
						
							|  |  |  |                             target = "mean") { | 
					
						
							|  |  |  |     if (!"geposan_analysis" %chin% class(analysis)) { | 
					
						
							|  |  |  |         stop("Invalid analyis. Use geposan::analyze().") | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-10-19 13:39:55 +02:00
										 |  |  |     # Create the named list from the factors vector. | 
					
						
							|  |  |  |     weights <- function(factors) { | 
					
						
							|  |  |  |         result <- NULL | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         mapply(function(method, factor) { | 
					
						
							|  |  |  |             result[[method]] <<- factor | 
					
						
							|  |  |  |         }, methods, factors) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |         result | 
					
						
							|  |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-10-21 11:42:44 +02:00
										 |  |  |     # Compute the target rank of the reference genes when applying the weights. | 
					
						
							|  |  |  |     target_rank <- function(factors) { | 
					
						
							| 
									
										
										
										
											2021-11-05 14:47:33 +01:00
										 |  |  |         data <- ranking(analysis, weights(factors)) | 
					
						
							| 
									
										
										
										
											2021-10-21 11:42:44 +02:00
										 |  |  | 
 | 
					
						
							|  |  |  |         data[gene %chin% reference_gene_ids, if (target == "min") { | 
					
						
							|  |  |  |             min(rank) | 
					
						
							|  |  |  |         } else if (target == "max") { | 
					
						
							|  |  |  |             max(rank) | 
					
						
							|  |  |  |         } else { | 
					
						
							|  |  |  |             mean(rank) | 
					
						
							|  |  |  |         }] | 
					
						
							| 
									
										
										
										
											2021-10-19 13:39:55 +02:00
										 |  |  |     } | 
					
						
							|  |  |  | 
 | 
					
						
							| 
									
										
										
										
											2021-10-21 11:42:44 +02:00
										 |  |  |     factors <- stats::optim(rep(1.0, length(methods)), target_rank)$par | 
					
						
							| 
									
										
										
										
											2021-10-21 16:21:55 +02:00
										 |  |  |     factors[factors < 0.0] <- 0.0 | 
					
						
							| 
									
										
										
										
											2021-10-19 13:39:55 +02:00
										 |  |  |     total_weight <- sum(factors) | 
					
						
							|  |  |  | 
 | 
					
						
							|  |  |  |     weights(factors / total_weight) | 
					
						
							|  |  |  | } |