my_model_Eperiment2 / config.json
Erica tong
Upload BertForMultilabelSequenceClassification
91026c7 verified
{
"_name_or_path": "distilbert-base-uncased",
"activation": "gelu",
"architectures": [
"BertForMultilabelSequenceClassification"
],
"attention_dropout": 0.1,
"attention_probs_dropout_prob": 0.1,
"classifier_dropout": null,
"dim": 768,
"dropout": 0.1,
"hidden_act": "gelu",
"hidden_dim": 3072,
"hidden_dropout_prob": 0.1,
"hidden_size": 768,
"id2label": {
"0": "sub_labels_01",
"1": "sub_labels_02",
"10": "sub_labels_11",
"11": "sub_labels_12",
"12": "sub_labels_13",
"13": "sub_labels_14",
"14": "sub_labels_15",
"15": "sub_labels_16",
"16": "sub_labels_17",
"17": "sub_labels_18",
"18": "sub_labels_19",
"19": "sub_labels_20",
"2": "sub_labels_03",
"20": "sub_labels_21",
"21": "sub_labels_22",
"22": "sub_labels_23",
"23": "sub_labels_24",
"3": "sub_labels_04",
"4": "sub_labels_05",
"5": "sub_labels_06",
"6": "sub_labels_07",
"7": "sub_labels_08",
"8": "sub_labels_09",
"9": "sub_labels_10"
},
"initializer_range": 0.02,
"intermediate_size": 3072,
"label2id": {
"sub_labels_01": 0,
"sub_labels_02": 1,
"sub_labels_03": 2,
"sub_labels_04": 3,
"sub_labels_05": 4,
"sub_labels_06": 5,
"sub_labels_07": 6,
"sub_labels_08": 7,
"sub_labels_09": 8,
"sub_labels_10": 9,
"sub_labels_11": 10,
"sub_labels_12": 11,
"sub_labels_13": 12,
"sub_labels_14": 13,
"sub_labels_15": 14,
"sub_labels_16": 15,
"sub_labels_17": 16,
"sub_labels_18": 17,
"sub_labels_19": 18,
"sub_labels_20": 19,
"sub_labels_21": 20,
"sub_labels_22": 21,
"sub_labels_23": 22,
"sub_labels_24": 23
},
"layer_norm_eps": 1e-12,
"max_position_embeddings": 512,
"model_type": "bert",
"n_heads": 12,
"n_layers": 6,
"num_attention_heads": 12,
"num_hidden_layers": 12,
"pad_token_id": 0,
"position_embedding_type": "absolute",
"qa_dropout": 0.1,
"seq_classif_dropout": 0.2,
"sinusoidal_pos_embds": false,
"tie_weights_": true,
"torch_dtype": "float32",
"transformers_version": "4.23.1",
"type_vocab_size": 2,
"use_cache": true,
"vocab_size": 30522
}