Skip to content

Commit

Permalink
Merge branch 'comet-integration' of https://github.com/comet-ml/gpt-neox
Browse files Browse the repository at this point in the history
 into comet-integration
  • Loading branch information
Quentin-Anthony committed Sep 9, 2024
2 parents f0a4b70 + 962314e commit c6681b5
Showing 1 changed file with 33 additions and 0 deletions.
33 changes: 33 additions & 0 deletions configs/local_setup_comet.yml
Original file line number Diff line number Diff line change
@@ -0,0 +1,33 @@
# Suggested data paths when using GPT-NeoX locally, with Comet logging enabled.
{
  # Single-dataset path.
  "data_path": "/workspace/gpt-neox-main/data/enwik8/enwik8_text_document",

  # or for weighted datasets:
  # "train-data-paths": ["data/enwik8/enwik8_text_document", "data/enwik8/enwik8_text_document"],
  # "test-data-paths": ["data/enwik8/enwik8_text_document", "data/enwik8/enwik8_text_document"],
  # "valid-data-paths": ["data/enwik8/enwik8_text_document", "data/enwik8/enwik8_text_document"],
  # "train-data-weights": [1., 2.],
  # "test-data-weights": [2., 1.],
  # "valid-data-weights": [0.5, 0.4],

  # If weight_by_num_documents is true, dataset weights are built from a multinomial
  # distribution over groups of data according to the number of documents in each group.
  # WARNING: setting this to true overrides any user-provided weights.
  # "weight_by_num_documents": false,
  # "weighted_sampler_alpha": 0.3,

  # Tokenizer files.
  "vocab_file": "/workspace/gpt-neox-main/data/gpt2-vocab.json",
  "merge_file": "/workspace/gpt-neox-main/data/gpt2-merges.txt",

  # Checkpoint locations (the same directory is used for saving and loading).
  "save": "checkpoints",
  "load": "checkpoints",
  "checkpoint_validation_with_forward_pass": false,

  # Logging output directories.
  "tensorboard_dir": "tensorboard",
  "log_dir": "logs",

  # Comet settings. The values below are placeholders.
  "use_comet": true,
  "comet_workspace": "test_workspace", # CHANGE ME
  "comet_project": "test_project",
  "comet_experiment_name": "test_experiment",
  "comet_tags": ["test_tag1", "test_tag2"],
  # Must be a key/value mapping: a bare key such as {"test_others"} parses as
  # {"test_others": null} in YAML, so give every key an explicit value.
  "comet_others": {"test_others": "test_value"},
}

0 comments on commit c6681b5

Please sign in to comment.