models: | |
- model: Warit2/GemOmniscien | |
parameters: | |
density: 0.5 | |
weight: 0.5 | |
- model: google/gemma-2b-it | |
parameters: | |
density: 0.5 | |
weight: 0.5 # weight gradient | |
merge_method: ties | |
base_model: Warit2/GemOmniscien | |
parameters: | |
normalize: true | |
int8_mask: true | |
dtype: bfloat16 | |
# models: | |
# - model: unsloth/gemma-7b-bnb-4bit | |
# layer_range: [0, 32] | |
# # no parameters necessary for base model | |
# - model: mistralai/Mistral-7B-v0.1 | |
# layer_range: [24, 32] | |
# merge_method: passthrough | |
# # base_model: unsloth/gemma-7b-bnb-4bit | |
# parameters: | |
# normalize: true | |
# int8_mask: true | |
# dtype: float16 | |
# slices: | |
# - sources: | |
# - model: unsloth/gemma-2b-bnb-4bit | |
# layer_range: [0, 16] | |
# - sources: | |
# - model: NousResearch/Nous-Hermes-llama-2-7b | |
# layer_range: [0, 22] | |
# merge_method: passthrough | |
# dtype: bfloat16 | |
# models: | |
# - model: unsloth/gemma-2b-bnb-4bit | |
# parameters: | |
# density: 0.53 | |
# weight: 0.45 | |
# - model: TinyLlama/TinyLlama-1.1B-Chat-v1.0 | |
# parameters: | |
# weight: 0.5 | |
# merge_method: ties | |
# base_model: unsloth/gemma-2b-bnb-4bit | |
# parameters: | |
# int8_mask: true | |
# dtype: bfloat16 | |