juanquivilla's picture
Training in progress, step 1000
413cdbf verified
{
"_name_or_path": "microsoft/Phi-3-mini-4k-instruct",
"architectures": [
"Phi3ForTokenClassification"
],
"attention_dropout": 0.0,
"auto_map": {
"AutoConfig": "microsoft/Phi-3-mini-4k-instruct--configuration_phi3.Phi3Config",
"AutoModelForCausalLM": "microsoft/Phi-3-mini-4k-instruct--modeling_phi3.Phi3ForCausalLM"
},
"bos_token_id": 1,
"embd_pdrop": 0.0,
"eos_token_id": 32000,
"hidden_act": "silu",
"hidden_size": 3072,
"id2label": {
"0": "O",
"1": "B-BOD",
"2": "I-BOD",
"3": "B-BUILDING",
"4": "I-BUILDING",
"5": "B-CARDISSUER",
"6": "I-CARDISSUER",
"7": "B-CITY",
"8": "I-CITY",
"9": "B-COUNTRY",
"10": "I-COUNTRY",
"11": "B-DATE",
"12": "I-DATE",
"13": "B-DRIVERLICENSE",
"14": "I-DRIVERLICENSE",
"15": "B-EMAIL",
"16": "I-EMAIL",
"17": "B-GEOCOORD",
"18": "I-GEOCOORD",
"19": "B-GIVENNAME1",
"20": "I-GIVENNAME1",
"21": "B-GIVENNAME2",
"22": "I-GIVENNAME2",
"23": "B-IDCARD",
"24": "I-IDCARD",
"25": "B-IP",
"26": "I-IP",
"27": "B-LASTNAME1",
"28": "I-LASTNAME1",
"29": "B-LASTNAME2",
"30": "I-LASTNAME2",
"31": "B-LASTNAME3",
"32": "I-LASTNAME3",
"33": "B-PASS",
"34": "I-PASS",
"35": "B-PASSPORT",
"36": "I-PASSPORT",
"37": "B-POSTCODE",
"38": "I-POSTCODE",
"39": "B-SECADDRESS",
"40": "I-SECADDRESS",
"41": "B-SEX",
"42": "I-SEX",
"43": "B-SOCIALNUMBER",
"44": "I-SOCIALNUMBER",
"45": "B-STATE",
"46": "I-STATE",
"47": "B-STREET",
"48": "I-STREET",
"49": "B-TEL",
"50": "I-TEL",
"51": "B-TIME",
"52": "I-TIME",
"53": "B-TITLE",
"54": "I-TITLE",
"55": "B-USERNAME",
"56": "I-USERNAME"
},
"initializer_range": 0.02,
"intermediate_size": 8192,
"label2id": {
"B-BOD": 1,
"B-BUILDING": 3,
"B-CARDISSUER": 5,
"B-CITY": 7,
"B-COUNTRY": 9,
"B-DATE": 11,
"B-DRIVERLICENSE": 13,
"B-EMAIL": 15,
"B-GEOCOORD": 17,
"B-GIVENNAME1": 19,
"B-GIVENNAME2": 21,
"B-IDCARD": 23,
"B-IP": 25,
"B-LASTNAME1": 27,
"B-LASTNAME2": 29,
"B-LASTNAME3": 31,
"B-PASS": 33,
"B-PASSPORT": 35,
"B-POSTCODE": 37,
"B-SECADDRESS": 39,
"B-SEX": 41,
"B-SOCIALNUMBER": 43,
"B-STATE": 45,
"B-STREET": 47,
"B-TEL": 49,
"B-TIME": 51,
"B-TITLE": 53,
"B-USERNAME": 55,
"I-BOD": 2,
"I-BUILDING": 4,
"I-CARDISSUER": 6,
"I-CITY": 8,
"I-COUNTRY": 10,
"I-DATE": 12,
"I-DRIVERLICENSE": 14,
"I-EMAIL": 16,
"I-GEOCOORD": 18,
"I-GIVENNAME1": 20,
"I-GIVENNAME2": 22,
"I-IDCARD": 24,
"I-IP": 26,
"I-LASTNAME1": 28,
"I-LASTNAME2": 30,
"I-LASTNAME3": 32,
"I-PASS": 34,
"I-PASSPORT": 36,
"I-POSTCODE": 38,
"I-SECADDRESS": 40,
"I-SEX": 42,
"I-SOCIALNUMBER": 44,
"I-STATE": 46,
"I-STREET": 48,
"I-TEL": 50,
"I-TIME": 52,
"I-TITLE": 54,
"I-USERNAME": 56,
"O": 0
},
"max_position_embeddings": 4096,
"model_type": "phi3",
"num_attention_heads": 32,
"num_hidden_layers": 32,
"num_key_value_heads": 32,
"original_max_position_embeddings": 4096,
"pad_token_id": 32000,
"resid_pdrop": 0.0,
"rms_norm_eps": 1e-05,
"rope_scaling": null,
"rope_theta": 10000.0,
"sliding_window": 2047,
"tie_word_embeddings": false,
"torch_dtype": "bfloat16",
"transformers_version": "4.41.1",
"use_cache": false,
"vocab_size": 32064
}