Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
5 changes: 5 additions & 0 deletions .devcontainer/devcontainer.json
Original file line number Diff line number Diff line change
Expand Up @@ -13,5 +13,10 @@
"ghcr.io/devcontainers/features/docker-in-docker:2": {},
// For building singularity
"ghcr.io/devcontainers/features/go:1": {}
},
"hostRequirements": {
"cpus": 4,
"memory": "16gb",
"storage": "32gb"
}
}
3 changes: 3 additions & 0 deletions _typos.toml
Original file line number Diff line number Diff line change
Expand Up @@ -2,3 +2,6 @@
# Ignore data files
extend-glob = ["*.txt"]
check-file = false

[default.extend-words]
STIP = "STIP"
9 changes: 4 additions & 5 deletions docs/_static/config/beginner.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -23,13 +23,12 @@ containers:

algorithms:
- name: "pathlinker"
params:
include: true
include: true
runs:
run1:
k: 1

# run2: # uncomment for step 3.2
# k: [10, 100] # uncomment for step 3.2
# run2: # uncomment for step 3.2
# k: [10, 100] # uncomment for step 3.2

# Here we specify which pathways to run and other file location information.
# Assume that if a dataset label does not change, the lists of associated input files do not change
Expand Down
98 changes: 38 additions & 60 deletions docs/_static/config/intermediate.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -21,76 +21,46 @@ containers:
# then myAlg will be run on (a=1,b=0.5),(a=1,b=0.75),(a=2,b=0.5), and (a=2,b=0,75). Pretty neat, but be
# careful: too many parameters might make your runs take a long time.

# TODO: get rid of the algorithms that will take too long to run
algorithms:
- name: "pathlinker"
include: true
runs:
run1:
k: 1
run2:
k: [10, 100]
- name: omicsintegrator1
include: true
runs:
run1:
b: [0.55, 2, 10]
d: 10
g: 1e-3
r: 0.01
w: 0.1
mu: 0.008
k: [1, 10, 100, 1000]

- name: omicsintegrator2
include: true
runs:
run1:
b: 4
g: 0
run2:
b: 2
g: 3
- name: meo
include: true
runs:
run1:
local_search: [true, false]
max_path_length: [2, 3]
rand_restarts: 10
- name: allpairs
include: true
- name: domino
include: true
runs:
run1:
slice_threshold: 0.3
module_threshold: 0.05
b: [4, 10]
g: [0, 3]
w: [0.25, 6]

- name: mincostflow
include: true
runs:
run1:
capacity: 15
flow: 80
run2:
capacity: 1
flow: 6
run3:
capacity: 5
flow: 60
capacity: [15, 30]
flow: [80, 15]

- name: "strwr"
include: true
runs:
run1:
alpha: [0.85]
alpha: 0.85
threshold: [100, 200]

- name: "rwr"
include: true
runs:
run1:
alpha: [0.85]
alpha: 0.85
threshold: [100, 200]

# Here we specify which pathways to run and other file location information.
# Assume that if a dataset label does not change, the lists of associated input files do not change
datasets: # TODO update this based on the dataset that I set up
datasets:
- # Labels can only contain letters, numbers, or underscores
label: egfr
node_files: ["tps-egfr-prizes.txt"] # the input nodes
Expand All @@ -100,33 +70,41 @@ datasets: # TODO update this based on the dataset that I set up
# Relative path from the spras directory where these files live
data_dir: "input"

gold_standards:
- # Labels can only contain letters, numbers, or underscores
label: gs_egfr
node_files: ["gs-egfr.txt"]
data_dir: "input"
# List of dataset labels to compare with the specific gold standard dataset
dataset_labels: ["egfr"]

reconstruction_settings:

# Set where everything is saved
locations:
reconstruction_dir: "output/intermediate"

analysis:
summary:
include: false # set to true for step 4

# Machine learning analysis (e.g. clustering) of the pathway output files for each dataset
ml:
# ml analysis per dataset
include: false # set to true for step 3

# adds ml analysis per algorithm output
# only runs for algorithms with multiple parameter combinations chosen
aggregate_per_algorithm: false
# specify how many principal components to calculate
components: 2
# boolean to show the labels on the pca graph
labels: true
# 'ward', 'complete', 'average', 'single'
# if linkage: ward, must use metric: euclidean
linkage: 'ward'
# 'euclidean', 'manhattan', 'cosine'
metric: 'euclidean'
# controls whether kernel density estimation (KDE) is computed and visualized on top of PCA plots.
# the coordinates of the KDE maximum (kde_peak) are also saved to the PCA coordinates output file.
# KDE needs to be run in order to select a parameter combination with PCA because the maximum kernel density is used
# to pick the 'best' parameter combination.
kde: false
aggregate_per_algorithm: false # set to true for step 4
# overalls a kernel density estimation over pca
kde: false # set to true for step 4
# removes empty pathways from consideration in ml analysis (pca only)
remove_empty_pathways: false
remove_empty_pathways: false # set to true for step 4

evaluation:
# evaluation per dataset-goldstandard pair
# evaluation will not run unless ml include is set to true
include: false # set to true for step 4
# adds evaluation per algorithm per dataset-goldstandard pair
# evaluation per algorithm will not run unless ml include and ml aggregate_per_algorithm are set to true
aggregate_per_algorithm: false # set to true for step 4
Binary file modified docs/_static/images/hac-horizontal.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file modified docs/_static/images/hac-vertical.png
Comment thread
ntalluri marked this conversation as resolved.
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file modified docs/_static/images/jaccard-heatmap.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file modified docs/_static/images/pca-kde.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file modified docs/_static/images/pca.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file modified docs/_static/images/pr-pca-chosen-pathway-per-algorithm-nodes.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Binary file modified docs/_static/images/pr-per-pathway-nodes.png
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Loading
Sorry, something went wrong. Reload?
Sorry, we cannot display this file.
Sorry, this file is invalid so it cannot be displayed.
Loading
Loading