mirror of
				https://github.com/johrpan/geposan.git
				synced 2025-10-26 10:47:25 +01:00 
			
		
		
		
	
		
			
				
	
	
		
			30 lines
		
	
	
	
		
			1.1 KiB
		
	
	
	
		
			R
		
	
	
	
	
	
			
		
		
	
	
			30 lines
		
	
	
	
		
			1.1 KiB
		
	
	
	
		
			R
		
	
	
	
	
	
| # Score the mean distance of genes to the telomeres across species.
 | |
| #
 | |
| # A score will be given to each gene such that 0.0 corresponds to the maximal
 | |
| # mean distance across all genes and 1.0 corresponds to a distance of 0.
 | |
| proximity <- function(preset, progress = NULL) {
 | |
|     species_ids <- preset$species_ids
 | |
|     gene_ids <- preset$gene_ids
 | |
| 
 | |
|     cached("proximity", c(species_ids, gene_ids), {
 | |
|         # Prefilter distances by species and gene.
 | |
|         distances <- geposan::distances[
 | |
|             species %chin% preset$species_ids & gene %chin% preset$gene_ids
 | |
|         ]
 | |
| 
 | |
|         # Compute the score as described above.
 | |
| 
 | |
|         distances <- distances[, .(mean_distance = mean(distance)), by = "gene"]
 | |
|         max_distance <- distances[, max(mean_distance)]
 | |
|         distances[, score := 1 - mean_distance / max_distance]
 | |
| 
 | |
|         if (!is.null(progress)) {
 | |
|             # We do everything in one go, so it's not possible to report
 | |
|             # detailed progress information. As the method is relatively quick,
 | |
|             # this should not be a problem.
 | |
|             progress(1.0)
 | |
|         }
 | |
| 
 | |
|         distances[, .(gene, score)]
 | |
|     })
 | |
| }
 |