{
  "add_cross_attention": false,
  "architectures": [
    "BertForSequenceClassification"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": null,
  "classifier_dropout": null,
  "dtype": "float32",
  "eos_token_id": null,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 384,
  "id2label": {
    "0": "code_generation",
    "1": "code_debugging",
    "2": "math_reasoning",
    "3": "creative_writing",
    "4": "summarization",
    "5": "translation",
    "6": "information_retrieval",
    "7": "data_analysis",
    "8": "web_search",
    "9": "general_chat"
  },
  "initializer_range": 0.02,
  "intermediate_size": 1536,
  "is_decoder": false,
  "label2id": {
    "code_debugging": 1,
    "code_generation": 0,
    "creative_writing": 3,
    "data_analysis": 7,
    "general_chat": 9,
    "information_retrieval": 6,
    "math_reasoning": 2,
    "summarization": 4,
    "translation": 5,
    "web_search": 8
  },
  "layer_norm_eps": 1e-12,
  "max_position_embeddings": 512,
  "model_type": "bert",
  "num_attention_heads": 12,
  "num_hidden_layers": 12,
  "pad_token_id": 0,
  "problem_type": "single_label_classification",
  "tie_word_embeddings": true,
  "transformers_version": "5.1.0",
  "type_vocab_size": 2,
  "use_cache": false,
  "vocab_size": 30522
}