nitky committed on
Commit
6782f94
1 Parent(s): ccdb476

Upload 2 files

Browse files
Files changed (1) hide show
  1. mergekit_config.yml +61 -0
mergekit_config.yml ADDED
@@ -0,0 +1,61 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ merge_method: task_arithmetic
2
+ base_model: mistralai/Mistral-7B-v0.1
3
+ models:
4
+ - model: tokyotech-llm/Swallow-MS-7b-v0.1
5
+ parameters:
6
+ weight:
7
+ - filter: embed_tokens
8
+ value: 1.0
9
+ - value: 0
10
+ dtype: bfloat16
11
+ tokenizer_source: model:tokyotech-llm/Swallow-MS-7b-v0.1
12
+ name: Mistral-7B-v0.1-VE-Swallow-MS
13
+ ---
14
+ merge_method: task_arithmetic
15
+ base_model: nitky/Flavor-7b # private model
16
+ models:
17
+ - model: tokyotech-llm/Swallow-MS-7b-v0.1
18
+ parameters:
19
+ weight:
20
+ - filter: embed_tokens
21
+ value: 1.0
22
+ - value: 0
23
+ dtype: bfloat16
24
+ tokenizer_source: model:tokyotech-llm/Swallow-MS-7b-v0.1
25
+ name: Flavor-7b-VE-Swallow-MS
26
+ ---
27
+ merge_method: task_arithmetic
28
+ base_model: stabilityai/japanese-stablelm-base-gamma-7b
29
+ models:
30
+ - model: tokyotech-llm/Swallow-MS-7b-v0.1
31
+ parameters:
32
+ weight:
33
+ - filter: embed_tokens
34
+ value: 1.0
35
+ - value: 0
36
+ dtype: bfloat16
37
+ tokenizer_source: model:tokyotech-llm/Swallow-MS-7b-v0.1
38
+ name: japanese-stablelm-base-gamma-7b-VE-Swallow-MS
39
+ ---
40
+ merge_method: task_arithmetic
41
+ base_model: Mistral-7B-v0.1-VE-Swallow-MS
42
+ models:
43
+ - model: tokyotech-llm/Swallow-MS-7b-v0.1
44
+ parameters:
45
+ weight: 1.0
46
+ - model: Flavor-7b-VE-Swallow-MS
47
+ parameters:
48
+ weight: 0.5
49
+ - model: japanese-stablelm-base-gamma-7b-VE-Swallow-MS
50
+ parameters:
51
+ weight: -0.5
52
+ dtype: bfloat16
53
+ name: Oumuamua-7b-base-preset
54
+ ---
55
+ merge_method: model_stock
56
+ base_model: Mistral-7B-v0.1-VE-Swallow-MS
57
+ models:
58
+ - model: tokyotech-llm/Swallow-MS-7b-v0.1
59
+ - model: Oumuamua-7b-base-preset
60
+ dtype: bfloat16
61
+ name: Oumuamua-7b-base