File size: 2,791 Bytes
049ec21
cde73c1
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
049ec21
 
 
 
 
 
 
 
 
 
 
cde73c1
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
049ec21
 
 
cde73c1
 
 
 
 
 
 
049ec21
cde73c1
 
049ec21
cde73c1
 
049ec21
cde73c1
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
049ec21
2ce61d3
049ec21
cde73c1
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
import gradio as gr
import yaml

# Markdown text rendered at the top of the page via gr.Markdown.
MARKDOWN_DESCRIPTION = """
# mergekit config.yaml generator

GUI to template a YAML configuration file for mergekit, which you can then copy/paste into [mergekit-gui](https://huggingface.co/spaces/arcee-ai/mergekit-gui) 🔥
"""

# YAML text used as the initial value of the "Merge Parameters" code editor.
# It defines `t` with one value list per filter (self_attn, mlp) followed by
# an unfiltered value of 0.5.
DEFAULT_PARAMETERS = """
t:
- filter: self_attn
  value: [0, 0.5, 0.3, 0.7, 1]
- filter: mlp
  value: [1, 0.5, 0.7, 0.3, 0]
- value: 0.5
"""


def _parse_yaml_field(text, label):
    """Parse *text* as YAML, reporting syntax errors under the field's *label*."""
    try:
        return yaml.safe_load(text)
    except yaml.YAMLError as err:
        # gr.Error is used so the message names the offending field.
        raise gr.Error(f"{label} is not valid YAML: {err}") from err


def _parse_layer_range(text, label):
    """Parse a layer range and check it has the ``[start, end]`` form."""
    layer_range = _parse_yaml_field(text or "", label)
    is_int_pair = (
        isinstance(layer_range, list)
        and len(layer_range) == 2
        # bool is a subclass of int, so YAML true/false must be excluded.
        and all(
            isinstance(bound, int) and not isinstance(bound, bool)
            for bound in layer_range
        )
    )
    if not is_int_pair:
        raise gr.Error(f"{label} must be a list of two integers such as [0, 32].")
    return layer_range


def create_config_yaml(
    model1,
    model1_layers,
    model2,
    model2_layers,
    merge_method,
    base_model,
    parameters,
    dtype,
) -> str:
    """Build the text of a two-model merge configuration as YAML.

    Args:
        model1: Name of the first source model.
        model1_layers: YAML text for the first model's layer range, in the
            ``[start, end]`` form.
        model2: Name of the second source model.
        model2_layers: YAML text for the second model's layer range, in the
            ``[start, end]`` form.
        merge_method: Value written under ``merge_method``.
        base_model: Value written under ``base_model``; omitted when blank.
        parameters: YAML text written (parsed) under ``parameters``; omitted
            when blank or when it parses to nothing (e.g. only comments).
        dtype: Value written under ``dtype``; omitted when blank.

    Returns:
        The configuration serialized with ``yaml.dump``, keys kept in
        insertion order.

    Raises:
        gr.Error: If a layer range is not a list of two integers, or if a
            YAML field cannot be parsed.
    """
    sources = [
        {
            "model": model1,
            "layer_range": _parse_layer_range(model1_layers, "Model 1 Layer Range"),
        },
        {
            "model": model2,
            "layer_range": _parse_layer_range(model2_layers, "Model 2 Layer Range"),
        },
    ]
    dict_config = {
        "slices": [{"sources": sources}],
        "merge_method": merge_method,
    }

    # Optional fields are only emitted when they carry a value, so a blank
    # textbox never produces an empty or null entry in the output.
    base_model = (base_model or "").strip()
    if base_model:
        dict_config["base_model"] = base_model

    if parameters and parameters.strip():
        parsed_parameters = _parse_yaml_field(parameters, "Merge Parameters")
        # Comment-only YAML parses to None; skip it rather than emit null.
        if parsed_parameters is not None:
            dict_config["parameters"] = parsed_parameters

    dtype = (dtype or "").strip()
    if dtype:
        dict_config["dtype"] = dtype

    return yaml.dump(dict_config, sort_keys=False)


# Build the page: a description, the input widgets, a button, and a YAML
# output area. Components are created in the order written below.
# TODO: make sure to add the themes as well
with gr.Blocks() as demo:
    gr.Markdown(MARKDOWN_DESCRIPTION)
    # The two source models and their layer ranges share one gr.Row.
    with gr.Row():
        # NOTE: disabled input, kept from the original for reference.
        # model_name_input = gr.Textbox(label="Model Name", value="my-merge")
        model1_input = gr.Textbox(label="Model 1", value="BioMistral/BioMistral-7B")
        model1_layers_input = gr.Textbox(
            label="Model 1 Layer Range", placeholder="[start, end]", value="[0, 32]"
        )
        model2_input = gr.Textbox(
            label="Model 2", value="CorticalStack/pastiche-crown-clown-7b-dare-dpo"
        )
        model2_layers_input = gr.Textbox(
            label="Model 2 Layer Range", placeholder="[start, end]", value="[0, 32]"
        )
    merge_method_input = gr.Dropdown(
        label="Merge Method", choices=["slerp", "linear"], value="slerp"
    )
    base_model_input = gr.Textbox(label="Base Model", value="BioMistral/BioMistral-7B")
    # YAML editor pre-filled with DEFAULT_PARAMETERS.
    parameters_input = gr.Code(
        language="yaml",
        label="Merge Parameters",
        value=DEFAULT_PARAMETERS,
    )
    dtype_input = gr.Textbox(label="Dtype", value="bfloat16")

    create_button = gr.Button("Create config.yaml", variant="primary")

    # Receives the string returned by create_config_yaml.
    output_zone = gr.Code(language="yaml", lines=10)

    # The inputs list is ordered to match create_config_yaml's parameters:
    # model1, model1_layers, model2, model2_layers, merge_method, base_model,
    # parameters, dtype.
    create_button.click(
        fn=create_config_yaml,
        inputs=[
            model1_input,
            model1_layers_input,
            model2_input,
            model2_layers_input,
            merge_method_input,
            base_model_input,
            parameters_input,
            dtype_input,
        ],
        outputs=[output_zone],
    )

    gr.Markdown("A Space by [1littlecoder](https://huggingface.co/1littlecoder)")

# Runs at module level, so executing or importing this file launches the app.
demo.launch()