mirror of
https://github.com/johrpan/ubigen.git
synced 2025-10-26 19:57:24 +01:00
Introduce more variation measures
This commit is contained in:
parent
2eec3285f9
commit
76f81ab6a7
3 changed files with 22 additions and 3 deletions
BIN
data/genes.rda
BIN
data/genes.rda
Binary file not shown.
|
|
@ -33,6 +33,15 @@ results <- data[, .(
|
||||||
above_95 = mean(expression > expression_95)
|
above_95 = mean(expression > expression_95)
|
||||||
), by = "gene"]
|
), by = "gene"]
|
||||||
|
|
||||||
|
results[, `:=`(
|
||||||
|
qcv_expression = iqr_expression / median_expression,
|
||||||
|
qcv_expression_normalized =
|
||||||
|
iqr_expression_normalized / median_expression_normalized,
|
||||||
|
cv_expression = sd_expression / mean_expression,
|
||||||
|
cv_expression_normalized =
|
||||||
|
sd_expression_normalized / mean_expression_normalized
|
||||||
|
)]
|
||||||
|
|
||||||
# Normalize values to the range of 0.0 to 1.0.
|
# Normalize values to the range of 0.0 to 1.0.
|
||||||
results[, `:=`(
|
results[, `:=`(
|
||||||
median_expression_normalized =
|
median_expression_normalized =
|
||||||
|
|
@ -45,6 +54,11 @@ results[, `:=`(
|
||||||
min(iqr_expression_normalized, na.rm = TRUE)) /
|
min(iqr_expression_normalized, na.rm = TRUE)) /
|
||||||
(max(iqr_expression_normalized, na.rm = TRUE) -
|
(max(iqr_expression_normalized, na.rm = TRUE) -
|
||||||
min(iqr_expression_normalized, na.rm = TRUE)),
|
min(iqr_expression_normalized, na.rm = TRUE)),
|
||||||
|
qcv_expression_normalized =
|
||||||
|
(qcv_expression_normalized -
|
||||||
|
min(qcv_expression_normalized, na.rm = TRUE)) /
|
||||||
|
(max(qcv_expression_normalized, na.rm = TRUE) -
|
||||||
|
min(qcv_expression_normalized, na.rm = TRUE)),
|
||||||
mean_expression_normalized =
|
mean_expression_normalized =
|
||||||
(mean_expression_normalized -
|
(mean_expression_normalized -
|
||||||
min(mean_expression_normalized, na.rm = TRUE)) /
|
min(mean_expression_normalized, na.rm = TRUE)) /
|
||||||
|
|
@ -54,7 +68,12 @@ results[, `:=`(
|
||||||
(sd_expression_normalized -
|
(sd_expression_normalized -
|
||||||
min(sd_expression_normalized, na.rm = TRUE)) /
|
min(sd_expression_normalized, na.rm = TRUE)) /
|
||||||
(max(sd_expression_normalized, na.rm = TRUE) -
|
(max(sd_expression_normalized, na.rm = TRUE) -
|
||||||
min(sd_expression_normalized, na.rm = TRUE))
|
min(sd_expression_normalized, na.rm = TRUE)),
|
||||||
|
cv_expression_normalized =
|
||||||
|
(cv_expression_normalized -
|
||||||
|
min(cv_expression_normalized, na.rm = TRUE)) /
|
||||||
|
(max(cv_expression_normalized, na.rm = TRUE) -
|
||||||
|
min(cv_expression_normalized, na.rm = TRUE))
|
||||||
)]
|
)]
|
||||||
|
|
||||||
fwrite(results, file = here("scripts", "output", "results.csv"))
|
fwrite(results, file = here("scripts", "output", "results.csv"))
|
||||||
|
|
|
||||||
|
|
@ -10,8 +10,8 @@ genes <- fread(here("scripts", "input", "genes.csv"))
|
||||||
data <- fread(here("scripts", "output", "results.csv"))
|
data <- fread(here("scripts", "output", "results.csv"))
|
||||||
|
|
||||||
data[, score := 0.5 * above_95 +
|
data[, score := 0.5 * above_95 +
|
||||||
0.25 * mean_expression_normalized +
|
0.25 * median_expression_normalized +
|
||||||
-0.25 * sd_expression_normalized]
|
-0.25 * qcv_expression_normalized]
|
||||||
|
|
||||||
# Normalize scores to be between 0.0 and 1.0.
|
# Normalize scores to be between 0.0 and 1.0.
|
||||||
data[, score := (score - min(score, na.rm = TRUE)) /
|
data[, score := (score - min(score, na.rm = TRUE)) /
|
||||||
|
|
|
||||||
Loading…
Add table
Add a link
Reference in a new issue