{
"architectures": [
"UnmaskingQwen3ForTokenClassification"
],
"attention_bias": false,
"attention_dropout": 0.0,
"bos_token_id": 151643,
"eos_token_id": 151645,
"head_dim": 128,
"hidden_act": "silu",
"hidden_size": 1024,
"id2label": {
"0": "O",
"1": "B-unique_identifier",
"2": "I-unique_identifier",
"3": "B-date_of_birth",
"4": "I-date_of_birth",
"5": "B-ssn",
"6": "I-ssn",
"7": "B-date_time",
"8": "I-date_time",
"9": "B-person_name",
"10": "I-person_name",
"11": "B-email",
"12": "I-email",
"13": "B-location",
"14": "I-location",
"15": "B-phone_number",
"16": "I-phone_number",
"17": "B-ipv4",
"18": "I-ipv4",
"19": "B-credit_card_number",
"20": "I-credit_card_number",
"21": "B-user_name",
"22": "I-user_name",
"23": "B-company_name",
"24": "I-company_name",
"25": "B-account_number",
"26": "I-account_number",
"27": "B-api_key",
"28": "I-api_key",
"29": "B-ipv6",
"30": "I-ipv6",
"31": "B-password",
"32": "I-password",
"33": "B-url",
"34": "I-url",
"35": "B-swift_bic",
"36": "I-swift_bic",
"37": "B-cvv",
"38": "I-cvv",
"39": "B-pin",
"40": "I-pin"
},
"initializer_range": 0.02,
"intermediate_size": 3072,
"label2id": {
"B-account_number": 25,
"B-api_key": 27,
"B-company_name": 23,
"B-credit_card_number": 19,
"B-cvv": 37,
"B-date_of_birth": 3,
"B-date_time": 7,
"B-email": 11,
"B-ipv4": 17,
"B-ipv6": 29,
"B-location": 13,
"B-password": 31,
"B-person_name": 9,
"B-phone_number": 15,
"B-pin": 39,
"B-ssn": 5,
"B-swift_bic": 35,
"B-unique_identifier": 1,
"B-url": 33,
"B-user_name": 21,
"I-account_number": 26,
"I-api_key": 28,
"I-company_name": 24,
"I-credit_card_number": 20,
"I-cvv": 38,
"I-date_of_birth": 4,
"I-date_time": 8,
"I-email": 12,
"I-ipv4": 18,
"I-ipv6": 30,
"I-location": 14,
"I-password": 32,
"I-person_name": 10,
"I-phone_number": 16,
"I-pin": 40,
"I-ssn": 6,
"I-swift_bic": 36,
"I-unique_identifier": 2,
"I-url": 34,
"I-user_name": 22,
"O": 0
},
"max_position_embeddings": 40960,
"max_window_layers": 28,
"model_type": "qwen3",
"num_attention_heads": 16,
"num_hidden_layers": 28,
"num_key_value_heads": 8,
"rms_norm_eps": 1e-06,
"rope_scaling": null,
"rope_theta": 1000000,
"sliding_window": null,
"tie_word_embeddings": true,
"torch_dtype": "float32",
"transformers_version": "4.51.3",
"use_cache": true,
"use_sliding_window": false,
"vocab_size": 151936,
"auto_map": {
"AutoModelForTokenClassification": "modeling_unmasking_qwen.UnmaskingQwen3ForTokenClassification"
}
}