Skip to content

Commit

Permalink
feat: adapt training procedure to uniref
Browse files (browse the repository at this point in the history)
  • Loading branch information
CFisicaro committed Mar 7, 2022
1 parent 2d2eead commit 058b07a
Show file tree
Hide file tree
Showing 2 changed files with 4 additions and 4 deletions.
4 changes: 2 additions & 2 deletions proteonemo/conf/bert_inference_from_preprocessed_config.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -36,7 +36,7 @@ model:
hidden_size: 768
initializer_range: 0.02
intermediate_size: 3072
- max_position_embeddings: 512
+ max_position_embeddings: 1024
num_attention_heads: 12
num_hidden_layers: 12
type_vocab_size: 2
Expand All @@ -47,7 +47,7 @@ model:

infer_ds:
data_file: '/data/WIKIPEDIA/hdf5_lower_case_1_seq_len_512_max_pred_80_masked_lm_prob_0.15_random_seed_12345_dupe_factor_5/wikicorpus_en/wikicorpus_en_training_0.hdf5' # path to hdf5 file (or directory)
- max_predictions_per_seq: 80
+ max_predictions_per_seq: 160
batch_size: 16
shuffle: false
num_samples: -1
Expand Down
4 changes: 2 additions & 2 deletions proteonemo/conf/bert_pretrained_from_preprocessed_config.yaml
Original file line number Diff line number Diff line change
Expand Up @@ -47,7 +47,7 @@ model:
hidden_size: 768
initializer_range: 0.02
intermediate_size: 3072
- max_position_embeddings: 512
+ max_position_embeddings: 1024
num_attention_heads: 12
num_hidden_layers: 12
type_vocab_size: 2
Expand All @@ -58,7 +58,7 @@ model:

train_ds:
data_file: '/data/WIKIPEDIA/hdf5_lower_case_1_seq_len_512_max_pred_80_masked_lm_prob_0.15_random_seed_12345_dupe_factor_5/wikicorpus_en' # path to hdf5 file (or directory)
- max_predictions_per_seq: 80
+ max_predictions_per_seq: 160
batch_size: 16
shuffle: true
num_samples: -1
Expand Down

0 comments on commit 058b07a

Please sign in to comment.