salmanshahid committed on
Commit
cdde16f
1 Parent(s): ae588f2

Upload training_config.yml with huggingface_hub

Browse files
Files changed (1) hide show
  1. training_config.yml +8 -14
training_config.yml CHANGED
@@ -8,6 +8,7 @@ model:
8
  lora_rank: 8
9
  lora_alpha: 16
10
  perception_tokens: 2
 
11
  tokenizer:
12
  _component_: models.a2a_tokenizer
13
  path: checkpoints/Meta-Llama-3-8B-Instruct/tokenizer.model
@@ -18,28 +19,21 @@ checkpointer:
18
  - consolidated.00.pth
19
  adapter_checkpoint: null
20
  recipe_checkpoint: null
21
- output_dir: output
22
  model_type: LLAMA3
23
  resume_from_checkpoint: false
 
 
 
 
 
24
  dataset:
25
  _component_: ds.EvenBatcher
26
  dataset:
27
  _component_: ds.RoundRobinDataset
28
  datasets:
29
  - _component_: ds.LlavaInstructDataset
30
- ib_embed_path: ds/coco_llava_instruct/*.ib_embed.pt
31
- clip_embed_path: ds/coco_llava_instruct/*.clip_embed.pt
32
- caption_path: ds/coco_llava_instruct/*.caption.pt
33
- train_on_input: false
34
- - _component_: ds.LlavaInstructDataset
35
- ib_embed_path: ds/vision_flan/*.ib_embed.pt
36
- clip_embed_path: ds/vision_flan/*.clip_embed.pt
37
- caption_path: ds/vision_flan/*.caption.pt
38
- train_on_input: false
39
- - _component_: ds.CaptionInstructDataset
40
- ib_embed_path: ds/sam_llava/00.ib_embed.pt
41
- clip_embed_path: ds/sam_llava/00.clip_embed.pt
42
- caption_path: ds/sam_llava/00.caption.pt
43
  train_on_input: false
44
  seed: null
45
  shuffle: true
 
8
  lora_rank: 8
9
  lora_alpha: 16
10
  perception_tokens: 2
11
+ use_clip: false
12
  tokenizer:
13
  _component_: models.a2a_tokenizer
14
  path: checkpoints/Meta-Llama-3-8B-Instruct/tokenizer.model
 
19
  - consolidated.00.pth
20
  adapter_checkpoint: null
21
  recipe_checkpoint: null
22
+ output_dir: output_checkpoints/experiment_1
23
  model_type: LLAMA3
24
  resume_from_checkpoint: false
25
+ interim_checkpoint_steps: 5000
26
+ interim_gen_steps: null
27
+ max_new_tokens: 100
28
+ temperature: 0.6
29
+ top_k: 300
30
  dataset:
31
  _component_: ds.EvenBatcher
32
  dataset:
33
  _component_: ds.RoundRobinDataset
34
  datasets:
35
  - _component_: ds.LlavaInstructDataset
36
+ dataset_path: ds/coco_llava_instruct/output.parquet
 
 
 
 
 
 
 
 
 
 
 
 
37
  train_on_input: false
38
  seed: null
39
  shuffle: true