# mergekit configuration: passthrough self-merge of a single model.
#
# Two slices of TheDrummer/Behemoth-123B-v1 are listed in order; their layer
# ranges overlap (layers 18 through 70 appear in both slices).
# NOTE(review): mergekit is understood to treat layer_range as [start, end)
# and to stack slices in the order given -- confirm against the mergekit docs.

# Data type for the output tensors.
dtype: bfloat16

# "passthrough" is the method named here; no weights/densities are configured.
merge_method: passthrough

slices:
# First slice: layer range [0, 70] of the source model.
- sources:
  - layer_range: [0, 70]
    model: TheDrummer/Behemoth-123B-v1
# Second slice: layer range [18, 88] of the same source model.
- sources:
  - layer_range: [18, 88]
    model: TheDrummer/Behemoth-123B-v1