Phi 2.0 - Extra Hyperparameters
# Training hyperparameters
warmup_steps: 100
evals_per_epoch: 4
saves_per_epoch: 1
weight_decay: 0.1

# Debug, DeepSpeed and FSDP settings -- every key here is left empty (null)
debug:
deepspeed:
fsdp:
fsdp_config:

# Token embeddings and special tokens
resize_token_embeddings_to_32x: true
special_tokens:
  pad_token: "<|endoftext|>"

Training Hyperparameters
warmup_steps: 100
warmup_steps: 100
evals_per_epoch: 4
evals_per_epoch: 4
saves_per_epoch: 1
saves_per_epoch: 1
Deepspeed and FSDP
deepspeed:
deepspeed:
fsdp_config:
fsdp_config:
weight_decay: 0.1
weight_decay: 0.1
Special Tokens and Token Embeddings
resize_token_embeddings_to_32x:
resize_token_embeddings_to_32x:
pad_token
pad_token
Last updated
Was this helpful?

