Skip to content

Commit

Permalink
Increase default hparams a bit
Browse files (browse the repository at this point in the history)
  • Loading branch information
jmaczan committed Jul 14, 2024
1 parent 990376a commit 57f3e26
Show file tree
Hide file tree
Showing 2 changed files with 4 additions and 4 deletions.
6 changes: 3 additions & 3 deletions src/gpt.py
Original file line number Diff line number Diff line change
Expand Up @@ -7,11 +7,11 @@
torch.manual_seed(1995)

default_context_window = 256
- default_embedding_dimension = 256
+ default_embedding_dimension = 384
default_vocabulary_size = 300
- default_attention_heads_count = 4
+ default_attention_heads_count = 6
default_transformer_blocks_count = 6
- default_batch_size = 32
+ default_batch_size = 64


class GPT(nn.Module):
Expand Down
2 changes: 1 addition & 1 deletion src/train.py
Original file line number Diff line number Diff line change
Expand Up @@ -14,7 +14,7 @@


default_num_epochs = 50
- default_learning_rate = 3e-4 # 0.001 before, but then I took it from Karpathy's videos
+ default_learning_rate = 3e-4 # 0.001 before, but then I took it from Karpathy's videos

checkpoints_directory = "checkpoints"
os.makedirs(checkpoints_directory, exist_ok=True)
Expand Down

0 comments on commit 57f3e26

Please sign in to comment.