SystemAdmin123 committed on
Commit
ed01ca0
·
verified ·
1 Parent(s): ef68994

Training in progress, step 100

Browse files
Files changed (3) hide show
  1. axolotl_config.yaml +4 -2
  2. model.safetensors +1 -1
  3. training_args.bin +1 -1
axolotl_config.yaml CHANGED
@@ -1,5 +1,5 @@
1
  base_model: trl-internal-testing/tiny-random-LlamaForCausalLM
2
- batch_size: 256
3
  bf16: true
4
  chat_template: tokenizer_default_fallback_alpaca
5
  datasets:
@@ -24,7 +24,7 @@ hub_strategy: checkpoint
24
  learning_rate: 0.0002
25
  logging_steps: 10
26
  lr_scheduler: cosine
27
- max_steps: 20000
28
  micro_batch_size: 32
29
  model_type: AutoModelForCausalLM
30
  num_epochs: 100
@@ -38,6 +38,8 @@ save_total_limit: 1
38
  sequence_len: 2048
39
  tokenizer_type: LlamaTokenizerFast
40
  torch_dtype: bf16
 
 
41
  trust_remote_code: true
42
  val_set_size: 0.1
43
  wandb_entity: ''
 
1
  base_model: trl-internal-testing/tiny-random-LlamaForCausalLM
2
+ batch_size: 128
3
  bf16: true
4
  chat_template: tokenizer_default_fallback_alpaca
5
  datasets:
 
24
  learning_rate: 0.0002
25
  logging_steps: 10
26
  lr_scheduler: cosine
27
+ max_steps: 10000
28
  micro_batch_size: 32
29
  model_type: AutoModelForCausalLM
30
  num_epochs: 100
 
38
  sequence_len: 2048
39
  tokenizer_type: LlamaTokenizerFast
40
  torch_dtype: bf16
41
+ training_args_kwargs:
42
+   hub_private_repo: true
43
  trust_remote_code: true
44
  val_set_size: 0.1
45
  wandb_entity: ''
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ae2287b45658d1cae69b4bfe25e777f022036e8d980148fa7635d454487588a9
3
  size 2066752
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25a257c5b2e34eda80e3d84f1a8cc4247ba163d63b057609915a20d5c03487fe
3
  size 2066752
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:9629b97ec393ef093e4840cb93f3f7c6eafc6cfa1b3cb229133bf54718ca98cb
3
  size 6840
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:11cf48786efac37806223cc8882d4253d84ff8c3599dc92c9fda0e12bc8a651f
3
  size 6840