Skip to content

Commit 839eb64

Browse files
authored
Merge pull request #71 from diazrenata/diss
Include the 95th percentile of the simulated dissimilarity scores (this directly shows how dissimilar the observed value would need to be to count as "Extreme")
2 parents daad385 + 38972db commit 839eb64

Some content is hidden

Large commits have some content hidden by default. Use the search box below to find content that may be hidden.

65 files changed

+50125
-50938
lines changed

R/metrics.R

+1
Original file line numberDiff line numberDiff line change
@@ -491,6 +491,7 @@ po_central_tendency <- function(fs_df, fs_po_df) {
491491
real_r2 = real_rsq,
492492
best_po_sim = ct_sim,
493493
sim_pos_from_best = mean(ct_pos$prop_off),
494+
sim_pos_from_best_95 = quantile(ct_pos$prop_off, probs = .95, na.rm = T),
494495
sim_r2_from_best = mean(ct_pos$rsq),
495496
sim_r2_from_best_median = median(ct_pos$rsq),
496497
ncomparisons = nrow(ct_pos),

analysis/bbs_pipeline.R

+17-17
Original file line numberDiff line numberDiff line change
@@ -53,27 +53,27 @@ cache$del(key = "lock", namespace = "session")
5353

5454
## Run the pipeline
5555
nodename <- Sys.info()["nodename"]
56-
if(grepl("ufhpc", nodename)) {
57-
print("I know I am on the HiPerGator!")
58-
library(clustermq)
59-
options(clustermq.scheduler = "slurm", clustermq.template = here::here("slurm_clustermq.tmpl"))
60-
## Run the pipeline parallelized for HiPerGator
61-
make(all,
62-
force = TRUE,
63-
cache = cache,
64-
cache_log_file = here::here("analysis", "drake", "cache_log_bbs.txt"),
65-
verbose = 1,
66-
parallelism = "clustermq",
67-
jobs = 100,
68-
caching = "master",
69-
memory_strategy = "autoclean",
70-
garbage_collection = TRUE) # Important for DBI caches!
71-
} else {
56+
# if(grepl("ufhpc", nodename)) {
57+
# print("I know I am on the HiPerGator!")
58+
# library(clustermq)
59+
# options(clustermq.scheduler = "slurm", clustermq.template = here::here("slurm_clustermq.tmpl"))
60+
# ## Run the pipeline parallelized for HiPerGator
61+
# make(all,
62+
# force = TRUE,
63+
# cache = cache,
64+
# cache_log_file = here::here("analysis", "drake", "cache_log_bbs.txt"),
65+
# verbose = 1,
66+
# parallelism = "clustermq",
67+
# jobs = 100,
68+
# caching = "master",
69+
# memory_strategy = "autoclean",
70+
# garbage_collection = TRUE) # Important for DBI caches!
71+
# } else {
7272
library(clustermq)
7373
options(clustermq.scheduler = "multicore")
7474
# Run the pipeline on multiple local cores
7575
system.time(make(all, cache = cache, cache_log_file = here::here("analysis", "drake", "cache_log_bbs.txt"), verbose = 1, memory_strategy = "autoclean"))
76-
}
76+
#}
7777

7878
#system.time(make(all, cache = cache, cache_log_file = here::here("analysis", "drake", "cache_log_bbs.txt")))
7979

analysis/gentry_pipeline.R

+17-17
Original file line numberDiff line numberDiff line change
@@ -51,27 +51,27 @@ cache$del(key = "lock", namespace = "session")
5151

5252
## Run the pipeline
5353
nodename <- Sys.info()["nodename"]
54-
if(grepl("ufhpc", nodename)) {
55-
print("I know I am on the HiPerGator!")
56-
library(clustermq)
57-
options(clustermq.scheduler = "slurm", clustermq.template = here::here("slurm_clustermq.tmpl"))
58-
## Run the pipeline parallelized for HiPerGator
59-
make(all,
60-
force = TRUE,
61-
cache = cache,
62-
cache_log_file = here::here("analysis", "drake", "cache_log_gentry.txt"),
63-
verbose = 1,
64-
parallelism = "clustermq",
65-
jobs = 100,
66-
caching = "master",
67-
memory_strategy = "autoclean",
68-
garbage_collection = TRUE) # Important for DBI caches!
69-
} else {
54+
# if(grepl("ufhpc", nodename)) {
55+
# print("I know I am on the HiPerGator!")
56+
# library(clustermq)
57+
# options(clustermq.scheduler = "slurm", clustermq.template = here::here("slurm_clustermq.tmpl"))
58+
# ## Run the pipeline parallelized for HiPerGator
59+
# make(all,
60+
# force = TRUE,
61+
# cache = cache,
62+
# cache_log_file = here::here("analysis", "drake", "cache_log_gentry.txt"),
63+
# verbose = 1,
64+
# parallelism = "clustermq",
65+
# jobs = 100,
66+
# caching = "master",
67+
# memory_strategy = "autoclean",
68+
# garbage_collection = TRUE) # Important for DBI caches!
69+
# } else {
7070
library(clustermq)
7171
options(clustermq.scheduler = "multicore")
7272
# Run the pipeline on multiple local cores
7373
system.time(make(all, cache = cache, cache_log_file = here::here("analysis", "drake", "cache_log_gentry.txt"), verbose = 1, memory_strategy = "autoclean"))
74-
}
74+
#}
7575

7676
#system.time(make(all, cache = cache, cache_log_file = here::here("analysis", "drake", "cache_log_gentry.txt")))
7777

Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.
Binary file not shown.

analysis/mcdb_pipeline.R

+20-20
Original file line numberDiff line numberDiff line change
@@ -48,30 +48,30 @@ all <- drake_plan(
4848
db <- DBI::dbConnect(RSQLite::SQLite(), here::here("analysis", "drake", "drake-cache-mcdb.sqlite"))
4949
cache <- storr::storr_dbi("datatable", "keystable", db)
5050
cache$del(key = "lock", namespace = "session")
51-
52-
## Run the pipeline
53-
nodename <- Sys.info()["nodename"]
54-
if(grepl("ufhpc", nodename)) {
55-
print("I know I am on the HiPerGator!")
56-
library(clustermq)
57-
options(clustermq.scheduler = "slurm", clustermq.template = here::here("slurm_clustermq.tmpl"))
58-
## Run the pipeline parallelized for HiPerGator
59-
make(all,
60-
force = TRUE,
61-
cache = cache,
62-
cache_log_file = here::here("analysis", "drake", "cache_log_mcdb.txt"),
63-
verbose = 1,
64-
parallelism = "clustermq",
65-
jobs = 20,
66-
caching = "master",
67-
memory_strategy = "autoclean",
68-
garbage_collection = TRUE) # Important for DBI caches!
69-
} else {
51+
#
52+
# ## Run the pipeline
53+
# nodename <- Sys.info()["nodename"]
54+
# if(grepl("ufhpc", nodename)) {
55+
# print("I know I am on the HiPerGator!")
56+
# library(clustermq)
57+
# options(clustermq.scheduler = "slurm", clustermq.template = here::here("slurm_clustermq.tmpl"))
58+
# ## Run the pipeline parallelized for HiPerGator
59+
# make(all,
60+
# force = TRUE,
61+
# cache = cache,
62+
# cache_log_file = here::here("analysis", "drake", "cache_log_mcdb.txt"),
63+
# verbose = 1,
64+
# parallelism = "clustermq",
65+
# jobs = 20,
66+
# caching = "master",
67+
# memory_strategy = "autoclean",
68+
# garbage_collection = TRUE) # Important for DBI caches!
69+
# } else {
7070
library(clustermq)
7171
options(clustermq.scheduler = "multicore")
7272
# Run the pipeline on multiple local cores
7373
system.time(make(all, cache = cache, cache_log_file = here::here("analysis", "drake", "cache_log_mcdb.txt"), verbose = 1, memory_strategy = "autoclean"))
74-
}
74+
#}
7575

7676
DBI::dbDisconnect(db)
7777
rm(cache)

analysis/miscabund_pipeline.R

+17-17
Original file line numberDiff line numberDiff line change
@@ -53,27 +53,27 @@ cache$del(key = "lock", namespace = "session")
5353

5454
# Run the pipeline
5555
nodename <- Sys.info()["nodename"]
56-
if(grepl("ufhpc", nodename)) {
57-
print("I know I am on the HiPerGator!")
58-
library(clustermq)
59-
options(clustermq.scheduler = "slurm", clustermq.template = here::here("slurm_clustermq.tmpl"))
60-
## Run the pipeline parallelized for HiPerGator
61-
make(all,
62-
force = TRUE,
63-
cache = cache,
64-
cache_log_file = here::here("analysis", "drake", "cache_log_miscabund.txt"),
65-
verbose = 1,
66-
parallelism = "clustermq",
67-
jobs = 100,
68-
caching = "master",
69-
memory_strategy = "autoclean",
70-
garbage_collection = TRUE) # Important for DBI caches!
71-
} else {
56+
# if(grepl("ufhpc", nodename)) {
57+
# print("I know I am on the HiPerGator!")
58+
# library(clustermq)
59+
# options(clustermq.scheduler = "slurm", clustermq.template = here::here("slurm_clustermq.tmpl"))
60+
# ## Run the pipeline parallelized for HiPerGator
61+
# make(all,
62+
# force = TRUE,
63+
# cache = cache,
64+
# cache_log_file = here::here("analysis", "drake", "cache_log_miscabund.txt"),
65+
# verbose = 1,
66+
# parallelism = "clustermq",
67+
# jobs = 100,
68+
# caching = "master",
69+
# memory_strategy = "autoclean",
70+
# garbage_collection = TRUE) # Important for DBI caches!
71+
# } else {
7272
library(clustermq)
7373
options(clustermq.scheduler = "multicore")
7474
# Run the pipeline on multiple local cores
7575
system.time(make(all, cache = cache, cache_log_file = here::here("analysis", "drake", "cache_log_miscabund.txt"), verbose = 1, memory_strategy = "autoclean"))
76-
}
76+
#}
7777

7878
#system.time(make(all, cache = cache, cache_log_file = here::here("analysis", "drake", "cache_log_miscabund.txt")))
7979

0 commit comments

Comments
 (0)