Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion .pre-commit-config.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -11,7 +11,7 @@ repos:
hooks:
- id: black
args: ["--config", "./pyproject.toml"]
language_version: python3.7
language_version: python3

- repo: https://github.com/asottile/seed-isort-config
rev: v2.2.0
Expand Down
Original file line number Diff line number Diff line change
Expand Up @@ -121,3 +121,4 @@ trainer:
- name: micro_auc
seed: 1337
use_gpu: true
initialise_hidden_states: false
Original file line number Diff line number Diff line change
Expand Up @@ -121,3 +121,4 @@ trainer:
- name: micro_auc
seed: 1337
use_gpu: true
initialise_hidden_states: false
Original file line number Diff line number Diff line change
Expand Up @@ -121,3 +121,4 @@ trainer:
- name: micro_auc
seed: 1337
use_gpu: true
initialise_hidden_states: false
Original file line number Diff line number Diff line change
Expand Up @@ -121,3 +121,4 @@ trainer:
- name: micro_auc
seed: 1337
use_gpu: true
initialise_hidden_states: false
Original file line number Diff line number Diff line change
Expand Up @@ -117,3 +117,4 @@ trainer:
- name: micro_auc
seed: 1337
use_gpu: true
initialise_hidden_states: false
Original file line number Diff line number Diff line change
Expand Up @@ -121,3 +121,4 @@ trainer:
- name: micro_auc
seed: 1337
use_gpu: true
initialise_hidden_states: false
1 change: 1 addition & 0 deletions configs/dcan/mimic3_50.yml
Original file line number Diff line number Diff line change
Expand Up @@ -125,3 +125,4 @@ trainer:
- name: micro_auc
seed: 1
use_gpu: true
initialise_hidden_states: false
1 change: 1 addition & 0 deletions configs/dcan/mimic3_50_old.yml
Original file line number Diff line number Diff line change
Expand Up @@ -125,3 +125,4 @@ trainer:
- name: micro_auc
seed: 1
use_gpu: true
initialise_hidden_states: false
1 change: 1 addition & 0 deletions configs/dcan/mimic3_full.yml
Original file line number Diff line number Diff line change
Expand Up @@ -125,3 +125,4 @@ trainer:
- name: micro_auc
seed: 1
use_gpu: true
initialise_hidden_states: false
1 change: 1 addition & 0 deletions configs/dcan/mimic3_full_old.yml
Original file line number Diff line number Diff line change
Expand Up @@ -125,3 +125,4 @@ trainer:
- name: micro_auc
seed: 1
use_gpu: true
initialise_hidden_states: false
1 change: 1 addition & 0 deletions configs/fusion/mimic3_50.yml
Original file line number Diff line number Diff line change
Expand Up @@ -126,3 +126,4 @@ trainer:
- name: micro_auc
seed: 1337
use_gpu: true
initialise_hidden_states: true
1 change: 1 addition & 0 deletions configs/fusion/mimic3_50_old.yml
Original file line number Diff line number Diff line change
Expand Up @@ -126,3 +126,4 @@ trainer:
- name: micro_auc
seed: 1337
use_gpu: true
initialise_hidden_states: false
1 change: 1 addition & 0 deletions configs/fusion/mimic3_full.yml
Original file line number Diff line number Diff line change
Expand Up @@ -126,3 +126,4 @@ trainer:
- name: micro_auc
seed: 1337
use_gpu: true
initialise_hidden_states: false
1 change: 1 addition & 0 deletions configs/fusion/mimic3_full_old.yml
Original file line number Diff line number Diff line change
Expand Up @@ -126,3 +126,4 @@ trainer:
- name: micro_auc
seed: 1337
use_gpu: true
initialise_hidden_states: false
128 changes: 128 additions & 0 deletions configs/gatedcnn_nci/mimic3_50.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,128 @@
# Configuration for the `gatedcnn_nci` model using data under datasets/mimic3_50.
# NOTE(review): nesting indentation is not visible in this view, so the
# comments below describe groups of keys only; confirm the actual nesting
# against the indented file before relying on them.

# Filesystem locations. Every value carries an anchor (&name) so that later
# sections can alias it (*name) instead of repeating the path.
paths:
mimic_dir: &mimic_dir datasets/mimic3/csv
static_dir: &static_dir datasets/mimic3/static
dataset_dir: &dataset_dir datasets/mimic3_50
word2vec_dir: &word2vec_dir datasets/mimic3_50/word2vec
output_dir: &output_dir results/gatedcnn_nci_mimic3_50

# Dataset settings. The keys anchored as &data_common are merged (<<) into the
# train/val/test entries below, which then differ in `data_file`.
dataset:
name: base_dataset
data_common: &data_common
# Column names used for the admission id, the note text and the labels.
column_names:
hadm_id: "HADM_ID"
clinical_note: "TEXT"
labels: "LABELS"
word2vec_dir: *word2vec_dir
pad_token: "<pad>"
unk_token: "<unk>"
dataset_dir: *dataset_dir
label_file: labels.json
max_length: 2500
params:
train:
<<: *data_common
data_file: train.json
val:
<<: *data_common
data_file: val.json
test:
<<: *data_common
data_file: test.json

# Model selection and hyperparameters. The directory values alias the anchors
# declared in the `paths` section.
# NOTE(review): max_length, pad_token and unk_token repeat the values given in
# the dataset section above; keep the two copies in sync.
model:
name: gatedcnn_nci
params:
version: mimic3
dataset_dir: *dataset_dir
mimic_dir: *mimic_dir
static_dir: *static_dir
embed_dir: *word2vec_dir
max_length: 2500
dropout: 0.2
input_dim: 100
hidden_dim: 100
output_dim: 50
bidirectional: false
use_description: true
pad_token: "<pad>"
unk_token: "<unk>"
kernel_size: 3
init_mean: 0
init_std: 0.01
levels: 3

# Trainer settings: data loader, loss, optimizer, stopping criterion,
# checkpoint saver, evaluation metrics and graph (logging) options.
trainer:
name: base_trainer
params:
output_dir: *output_dir
# NOTE(review): shuffle is false; confirm this is intended if this loader
# also feeds the training batches.
data_loader:
batch_size: 16
num_workers: 4
shuffle: false
drop_last: true
loss:
name: BinaryCrossEntropyLoss
params: null
optimizer:
name: adam
params:
lr: 0.0001
weight_decay: 0.0
max_epochs: 200
lr_scheduler: null
# Stopping criterion keyed on prec_at_8 with desired direction `max` and a
# patience of 10.
stopping_criterion:
metric:
name: prec_at_8
desired: max
patience: 10
# Checkpoints are written to the same directory as `output_dir`; the tracked
# metric is prec_at_8 (class prec_at_k, k = 8) with desired direction `max`.
checkpoint_saver:
name: base_saver
params:
checkpoint_dir: *output_dir
interval: 1
max_to_keep: 5
ckpt_fname_format: "ckpt-{}.pth"
best_fname_format: "best-{}.pth"
metric:
name: prec_at_8
class: prec_at_k
params:
k: 8
desired: max
# NOTE(review): the &eval_metrics anchor is not aliased anywhere in the lines
# shown; the `val` metric list further down repeats these names by hand.
eval_metrics: &eval_metrics
- name: prec_at_5
class: prec_at_k
params:
k: 5
- name: prec_at_8
class: prec_at_k
params:
k: 8
- name: macro_f1
- name: micro_f1
- name: macro_auc
- name: micro_auc
# Graph writer (tensorboard) logging into `output_dir`, with separate interval
# and metric settings for train (every 100 steps) and val (every 1 epoch).
graph:
writer:
name: tensorboard
params:
log_dir: *output_dir
train:
interval: 100
interval_unit: step
metric:
- name: loss
val:
interval: 1
interval_unit: epoch
metric:
- name: loss
- name: prec_at_5
- name: prec_at_8
- name: macro_f1
- name: micro_f1
- name: macro_auc
- name: micro_auc
# Seed value, GPU flag and the hidden-state initialisation flag.
seed: 1337
use_gpu: true
initialise_hidden_states: true
128 changes: 128 additions & 0 deletions configs/gatedcnn_nci/mimic3_50_old.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,128 @@
# Configuration for the `gatedcnn_nci` model using data under
# datasets/mimic3_50_old.
# NOTE(review): nesting indentation is not visible in this view, so the
# comments below describe groups of keys only; confirm the actual nesting
# against the indented file before relying on them.

# Filesystem locations. Every value carries an anchor (&name) so that later
# sections can alias it (*name) instead of repeating the path.
paths:
mimic_dir: &mimic_dir datasets/mimic3/csv
static_dir: &static_dir datasets/mimic3/static
dataset_dir: &dataset_dir datasets/mimic3_50_old
word2vec_dir: &word2vec_dir datasets/mimic3_50_old/word2vec
output_dir: &output_dir results/gatedcnn_nci_mimic3_50_old

# Dataset settings. The keys anchored as &data_common are merged (<<) into the
# train/val/test entries below, which then differ in `data_file`.
dataset:
name: base_dataset
data_common: &data_common
# Column names used for the admission id, the note text and the labels.
column_names:
hadm_id: "HADM_ID"
clinical_note: "TEXT"
labels: "LABELS"
word2vec_dir: *word2vec_dir
pad_token: "<pad>"
unk_token: "<unk>"
dataset_dir: *dataset_dir
label_file: labels.json
max_length: 2500
params:
train:
<<: *data_common
data_file: train.json
val:
<<: *data_common
data_file: val.json
test:
<<: *data_common
data_file: test.json

# Model selection and hyperparameters. The directory values alias the anchors
# declared in the `paths` section.
# NOTE(review): max_length, pad_token and unk_token repeat the values given in
# the dataset section above; keep the two copies in sync.
model:
name: gatedcnn_nci
params:
version: mimic3
dataset_dir: *dataset_dir
mimic_dir: *mimic_dir
static_dir: *static_dir
embed_dir: *word2vec_dir
max_length: 2500
dropout: 0.2
input_dim: 100
hidden_dim: 100
output_dim: 50
bidirectional: false
use_description: true
pad_token: "<pad>"
unk_token: "<unk>"
kernel_size: 3
init_mean: 0
init_std: 0.01
levels: 3

# Trainer settings: data loader, loss, optimizer, stopping criterion,
# checkpoint saver, evaluation metrics and graph (logging) options.
trainer:
name: base_trainer
params:
output_dir: *output_dir
# NOTE(review): shuffle is false; confirm this is intended if this loader
# also feeds the training batches.
data_loader:
batch_size: 16
num_workers: 4
shuffle: false
drop_last: true
loss:
name: BinaryCrossEntropyLoss
params: null
# NOTE(review): lr is 0.01 and max_epochs is 100 here, whereas
# configs/gatedcnn_nci/mimic3_50.yml uses 0.0001 and 200; confirm the
# difference is intentional.
optimizer:
name: adam
params:
lr: 0.01
weight_decay: 0.0
max_epochs: 100
lr_scheduler: null
# Stopping criterion keyed on prec_at_8 with desired direction `max` and a
# patience of 10.
stopping_criterion:
metric:
name: prec_at_8
desired: max
patience: 10
# Checkpoints are written to the same directory as `output_dir`; the tracked
# metric is prec_at_8 (class prec_at_k, k = 8) with desired direction `max`.
checkpoint_saver:
name: base_saver
params:
checkpoint_dir: *output_dir
interval: 1
max_to_keep: 5
ckpt_fname_format: "ckpt-{}.pth"
best_fname_format: "best-{}.pth"
metric:
name: prec_at_8
class: prec_at_k
params:
k: 8
desired: max
# NOTE(review): the &eval_metrics anchor is not aliased anywhere in the lines
# shown; the `val` metric list further down repeats these names by hand.
eval_metrics: &eval_metrics
- name: prec_at_5
class: prec_at_k
params:
k: 5
- name: prec_at_8
class: prec_at_k
params:
k: 8
- name: macro_f1
- name: micro_f1
- name: macro_auc
- name: micro_auc
# Graph writer (tensorboard) logging into `output_dir`, with separate interval
# and metric settings for train (every 100 steps) and val (every 1 epoch).
graph:
writer:
name: tensorboard
params:
log_dir: *output_dir
train:
interval: 100
interval_unit: step
metric:
- name: loss
val:
interval: 1
interval_unit: epoch
metric:
- name: loss
- name: prec_at_5
- name: prec_at_8
- name: macro_f1
- name: micro_f1
- name: macro_auc
- name: micro_auc
# Seed value, GPU flag and the hidden-state initialisation flag.
seed: 1337
use_gpu: true
initialise_hidden_states: true
Loading