{
  "_name_or_path": "../output/MiniLMv2-userflow-v2-opt",
  "architectures": [
    "RobertaForSequenceClassification"
  ],
  "attention_probs_dropout_prob": 0.1,
  "bos_token_id": 0,
  "classifier_dropout": null,
  "eos_token_id": 2,
  "hidden_act": "gelu",
  "hidden_dropout_prob": 0.1,
  "hidden_size": 384,
  "id2label": {
    "0": "OTHER",
    "1": "agrees_praising_thanking",
    "2": "asks_source",
    "3": "continue",
    "4": "continue_or_finnish_code",
    "5": "improve_or_modify_answer",
    "6": "lack_of_understandment",
    "7": "model_wrong_or_try_again",
    "8": "more_listing_or_expand",
    "9": "repeat_answers_or_question",
    "10": "request_example",
    "11": "user_complains_repetition",
    "12": "user_doubts_answer",
    "13": "user_goodbye",
    "14": "user_reminds_question",
    "15": "user_wants_agent_to_answer",
    "16": "user_wants_explanation",
    "17": "user_wants_more_detail",
    "18": "user_wants_shorter_longer_answer",
    "19": "user_wants_simplier_explanation",
    "20": "user_wants_yes_or_no"
  },
  "initializer_range": 0.02,
  "intermediate_size": 1536,
  "label2id": {
    "OTHER": 0,
    "agrees_praising_thanking": 1,
    "asks_source": 2,
    "continue": 3,
    "continue_or_finnish_code": 4,
    "improve_or_modify_answer": 5,
    "lack_of_understandment": 6,
    "model_wrong_or_try_again": 7,
    "more_listing_or_expand": 8,
    "repeat_answers_or_question": 9,
    "request_example": 10,
    "user_complains_repetition": 11,
    "user_doubts_answer": 12,
    "user_goodbye": 13,
    "user_reminds_question": 14,
    "user_wants_agent_to_answer": 15,
    "user_wants_explanation": 16,
    "user_wants_more_detail": 17,
    "user_wants_shorter_longer_answer": 18,
    "user_wants_simplier_explanation": 19,
    "user_wants_yes_or_no": 20
  },
  "layer_norm_eps": 1e-05,
  "max_position_embeddings": 514,
  "model_type": "roberta",
  "num_attention_heads": 12,
  "num_hidden_layers": 6,
  "pad_token_id": 1,
  "position_embedding_type": "absolute",
  "problem_type": "single_label_classification",
  "torch_dtype": "float32",
  "transformers_version": "4.30.0",
  "type_vocab_size": 1,
  "use_cache": true,
  "vocab_size": 50265
}
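For reference, a minimal sketch of how this config is consumed at inference time with the transformers library. The checkpoint path below is a placeholder assumption (the config's `_name_or_path` points at a local training output, not a published location), and the input text and printed label are illustrative only; the `id2label` mapping above is what resolves the argmax index to one of the 21 intent labels.

```python
# Minimal inference sketch for this 21-way single-label intent classifier.
# Assumes the checkpoint directory "MiniLMv2-userflow-v2-opt" exists locally;
# substitute the actual local path or Hub repo id.
import torch
from transformers import AutoModelForSequenceClassification, AutoTokenizer

model_path = "MiniLMv2-userflow-v2-opt"  # hypothetical path, not confirmed by the config

tokenizer = AutoTokenizer.from_pretrained(model_path)
model = AutoModelForSequenceClassification.from_pretrained(model_path)
model.eval()

text = "Could you give me an example of that?"
inputs = tokenizer(text, return_tensors="pt")

with torch.no_grad():
    logits = model(**inputs).logits  # shape: (1, 21), one score per label

# id2label from the config maps the argmax index back to an intent name,
# e.g. index 10 -> "request_example".
predicted_id = logits.argmax(dim=-1).item()
print(model.config.id2label[predicted_id])
```

Since `problem_type` is `single_label_classification`, taking the argmax over the logits (or a softmax for calibrated-ish probabilities) is the standard decoding step; no thresholding per label is involved.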