sordonia's picture
Upload model
6f6c01c verified
{"base_model": "microsoft/Phi-3.5-mini-instruct", "class_name": "mttl.models.expert_model.MultiExpertModelConfig", "default_expert_name": null, "expert_infos": [{"expert_name": "information_extraction_and_comprehension_tasks", "class_name": "mttl.models.library.expert.ExpertInfo", "expert_task_name": null, "parent_node": null, "expert_config": {"modify_modules": ".*", "class_name": "mttl.models.modifiers.lora.LoRAConfig", "modify_layers": "qkv_proj|o_proj|down_proj|gate_up_proj", "tie_params": null, "lora_rank": 16, "lora_alpha": 32, "lora_dropout": 0.05, "lora_init_b_random": false}, "training_config": null, "expert_model": "microsoft/Phi-3.5-mini-instruct"}, {"expert_name": "information_extraction_and_transformation_tasks", "class_name": "mttl.models.library.expert.ExpertInfo", "expert_task_name": null, "parent_node": null, "expert_config": {"modify_modules": ".*", "class_name": "mttl.models.modifiers.lora.LoRAConfig", "modify_layers": "qkv_proj|o_proj|down_proj|gate_up_proj", "tie_params": null, "lora_rank": 16, "lora_alpha": 32, "lora_dropout": 0.05, "lora_init_b_random": false}, "training_config": null, "expert_model": "microsoft/Phi-3.5-mini-instruct"}, {"expert_name": "diverse_question-answer_tasks_with_contextual_understanding", "class_name": "mttl.models.library.expert.ExpertInfo", "expert_task_name": null, "parent_node": null, "expert_config": {"modify_modules": ".*", "class_name": "mttl.models.modifiers.lora.LoRAConfig", "modify_layers": "qkv_proj|o_proj|down_proj|gate_up_proj", "tie_params": null, "lora_rank": 16, "lora_alpha": 32, "lora_dropout": 0.05, "lora_init_b_random": false}, "training_config": null, "expert_model": "microsoft/Phi-3.5-mini-instruct"}, {"expert_name": "summarization_and_condensation_tasks", "class_name": "mttl.models.library.expert.ExpertInfo", "expert_task_name": null, "parent_node": null, "expert_config": {"modify_modules": ".*", "class_name": "mttl.models.modifiers.lora.LoRAConfig", "modify_layers": "qkv_proj|o_proj|down_proj|gate_up_proj", "tie_params": null, "lora_rank": 16, "lora_alpha": 32, "lora_dropout": 0.05, "lora_init_b_random": false}, "training_config": null, "expert_model": "microsoft/Phi-3.5-mini-instruct"}, {"expert_name": "generating_questions_based_on_given_information", "class_name": "mttl.models.library.expert.ExpertInfo", "expert_task_name": null, "parent_node": null, "expert_config": {"modify_modules": ".*", "class_name": "mttl.models.modifiers.lora.LoRAConfig", "modify_layers": "qkv_proj|o_proj|down_proj|gate_up_proj", "tie_params": null, "lora_rank": 16, "lora_alpha": 32, "lora_dropout": 0.05, "lora_init_b_random": false}, "training_config": null, "expert_model": "microsoft/Phi-3.5-mini-instruct"}, {"expert_name": "answering_specific_questions_based_on_provided_information", "class_name": "mttl.models.library.expert.ExpertInfo", "expert_task_name": null, "parent_node": null, "expert_config": {"modify_modules": ".*", "class_name": "mttl.models.modifiers.lora.LoRAConfig", "modify_layers": "qkv_proj|o_proj|down_proj|gate_up_proj", "tie_params": null, "lora_rank": 16, "lora_alpha": 32, "lora_dropout": 0.05, "lora_init_b_random": false}, "training_config": null, "expert_model": "microsoft/Phi-3.5-mini-instruct"}, {"expert_name": "generating_summaries_and_titles_for_texts", "class_name": "mttl.models.library.expert.ExpertInfo", "expert_task_name": null, "parent_node": null, "expert_config": {"modify_modules": ".*", "class_name": "mttl.models.modifiers.lora.LoRAConfig", "modify_layers": "qkv_proj|o_proj|down_proj|gate_up_proj", "tie_params": null, "lora_rank": 16, "lora_alpha": 32, "lora_dropout": 0.05, "lora_init_b_random": false}, "training_config": null, "expert_model": "microsoft/Phi-3.5-mini-instruct"}, {"expert_name": "summarization_and_title_generation_tasks", "class_name": "mttl.models.library.expert.ExpertInfo", "expert_task_name": null, "parent_node": null, "expert_config": {"modify_modules": ".*", "class_name": "mttl.models.modifiers.lora.LoRAConfig", "modify_layers": "qkv_proj|o_proj|down_proj|gate_up_proj", "tie_params": null, "lora_rank": 16, "lora_alpha": 32, "lora_dropout": 0.05, "lora_init_b_random": false}, "training_config": null, "expert_model": "microsoft/Phi-3.5-mini-instruct"}, {"expert_name": "evaluative_and_interpretative_tasks", "class_name": "mttl.models.library.expert.ExpertInfo", "expert_task_name": null, "parent_node": null, "expert_config": {"modify_modules": ".*", "class_name": "mttl.models.modifiers.lora.LoRAConfig", "modify_layers": "qkv_proj|o_proj|down_proj|gate_up_proj", "tie_params": null, "lora_rank": 16, "lora_alpha": 32, "lora_dropout": 0.05, "lora_init_b_random": false}, "training_config": null, "expert_model": "microsoft/Phi-3.5-mini-instruct"}, {"expert_name": "short_story_continuation_and_completion_tasks", "class_name": "mttl.models.library.expert.ExpertInfo", "expert_task_name": null, "parent_node": null, "expert_config": {"modify_modules": ".*", "class_name": "mttl.models.modifiers.lora.LoRAConfig", "modify_layers": "qkv_proj|o_proj|down_proj|gate_up_proj", "tie_params": null, "lora_rank": 16, "lora_alpha": 32, "lora_dropout": 0.05, "lora_init_b_random": false}, "training_config": null, "expert_model": "microsoft/Phi-3.5-mini-instruct"}, {"expert_name": "generating_and_extracting_textual_content", "class_name": "mttl.models.library.expert.ExpertInfo", "expert_task_name": null, "parent_node": null, "expert_config": {"modify_modules": ".*", "class_name": "mttl.models.modifiers.lora.LoRAConfig", "modify_layers": "qkv_proj|o_proj|down_proj|gate_up_proj", "tie_params": null, "lora_rank": 16, "lora_alpha": 32, "lora_dropout": 0.05, "lora_init_b_random": false}, "training_config": null, "expert_model": "microsoft/Phi-3.5-mini-instruct"}, {"expert_name": "logical_reasoning_and_inference_tasks", "class_name": "mttl.models.library.expert.ExpertInfo", "expert_task_name": null, "parent_node": null, "expert_config": {"modify_modules": ".*", "class_name": "mttl.models.modifiers.lora.LoRAConfig", "modify_layers": "qkv_proj|o_proj|down_proj|gate_up_proj", "tie_params": null, "lora_rank": 16, "lora_alpha": 32, "lora_dropout": 0.05, "lora_init_b_random": false}, "training_config": null, "expert_model": "microsoft/Phi-3.5-mini-instruct"}, {"expert_name": "identifying_and_analyzing_pronoun_references_and_narrators", "class_name": "mttl.models.library.expert.ExpertInfo", "expert_task_name": null, "parent_node": null, "expert_config": {"modify_modules": ".*", "class_name": "mttl.models.modifiers.lora.LoRAConfig", "modify_layers": "qkv_proj|o_proj|down_proj|gate_up_proj", "tie_params": null, "lora_rank": 16, "lora_alpha": 32, "lora_dropout": 0.05, "lora_init_b_random": false}, "training_config": null, "expert_model": "microsoft/Phi-3.5-mini-instruct"}, {"expert_name": "extracting_specific_information_from_textual_contexts", "class_name": "mttl.models.library.expert.ExpertInfo", "expert_task_name": null, "parent_node": null, "expert_config": {"modify_modules": ".*", "class_name": "mttl.models.modifiers.lora.LoRAConfig", "modify_layers": "qkv_proj|o_proj|down_proj|gate_up_proj", "tie_params": null, "lora_rank": 16, "lora_alpha": 32, "lora_dropout": 0.05, "lora_init_b_random": false}, "training_config": null, "expert_model": "microsoft/Phi-3.5-mini-instruct"}, {"expert_name": "concise_question-answering_and_information_extraction", "class_name": "mttl.models.library.expert.ExpertInfo", "expert_task_name": null, "parent_node": null, "expert_config": {"modify_modules": ".*", "class_name": "mttl.models.modifiers.lora.LoRAConfig", "modify_layers": "qkv_proj|o_proj|down_proj|gate_up_proj", "tie_params": null, "lora_rank": 16, "lora_alpha": 32, "lora_dropout": 0.05, "lora_init_b_random": false}, "training_config": null, "expert_model": "microsoft/Phi-3.5-mini-instruct"}, {"expert_name": "diverse_question-answer_and_translation_tasks", "class_name": "mttl.models.library.expert.ExpertInfo", "expert_task_name": null, "parent_node": null, "expert_config": {"modify_modules": ".*", "class_name": "mttl.models.modifiers.lora.LoRAConfig", "modify_layers": "qkv_proj|o_proj|down_proj|gate_up_proj", "tie_params": null, "lora_rank": 16, "lora_alpha": 32, "lora_dropout": 0.05, "lora_init_b_random": false}, "training_config": null, "expert_model": "microsoft/Phi-3.5-mini-instruct"}, {"expert_name": "mathematical_problem_solving_and_calculation_tasks", "class_name": "mttl.models.library.expert.ExpertInfo", "expert_task_name": null, "parent_node": null, "expert_config": {"modify_modules": ".*", "class_name": "mttl.models.modifiers.lora.LoRAConfig", "modify_layers": "qkv_proj|o_proj|down_proj|gate_up_proj", "tie_params": null, "lora_rank": 16, "lora_alpha": 32, "lora_dropout": 0.05, "lora_init_b_random": false}, "training_config": null, "expert_model": "microsoft/Phi-3.5-mini-instruct"}, {"expert_name": "evaluating_and_comparing_textual_information", "class_name": "mttl.models.library.expert.ExpertInfo", "expert_task_name": null, "parent_node": null, "expert_config": {"modify_modules": ".*", "class_name": "mttl.models.modifiers.lora.LoRAConfig", "modify_layers": "qkv_proj|o_proj|down_proj|gate_up_proj", "tie_params": null, "lora_rank": 16, "lora_alpha": 32, "lora_dropout": 0.05, "lora_init_b_random": false}, "training_config": null, "expert_model": "microsoft/Phi-3.5-mini-instruct"}, {"expert_name": "error_identification_and_sequence_validation_tasks", "class_name": "mttl.models.library.expert.ExpertInfo", "expert_task_name": null, "parent_node": null, "expert_config": {"modify_modules": ".*", "class_name": "mttl.models.modifiers.lora.LoRAConfig", "modify_layers": "qkv_proj|o_proj|down_proj|gate_up_proj", "tie_params": null, "lora_rank": 16, "lora_alpha": 32, "lora_dropout": 0.05, "lora_init_b_random": false}, "training_config": null, "expert_model": "microsoft/Phi-3.5-mini-instruct"}, {"expert_name": "text_formatting_and_correction_tasks", "class_name": "mttl.models.library.expert.ExpertInfo", "expert_task_name": null, "parent_node": null, "expert_config": {"modify_modules": ".*", "class_name": "mttl.models.modifiers.lora.LoRAConfig", "modify_layers": "qkv_proj|o_proj|down_proj|gate_up_proj", "tie_params": null, "lora_rank": 16, "lora_alpha": 32, "lora_dropout": 0.05, "lora_init_b_random": false}, "training_config": null, "expert_model": "microsoft/Phi-3.5-mini-instruct"}, {"expert_name": "multilingual_translation_and_interpretation_tasks", "class_name": "mttl.models.library.expert.ExpertInfo", "expert_task_name": null, "parent_node": null, "expert_config": {"modify_modules": ".*", "class_name": "mttl.models.modifiers.lora.LoRAConfig", "modify_layers": "qkv_proj|o_proj|down_proj|gate_up_proj", "tie_params": null, "lora_rank": 16, "lora_alpha": 32, "lora_dropout": 0.05, "lora_init_b_random": false}, "training_config": null, "expert_model": "microsoft/Phi-3.5-mini-instruct"}, {"expert_name": "classification_and_categorization_tasks", "class_name": "mttl.models.library.expert.ExpertInfo", "expert_task_name": null, "parent_node": null, "expert_config": {"modify_modules": ".*", "class_name": "mttl.models.modifiers.lora.LoRAConfig", "modify_layers": "qkv_proj|o_proj|down_proj|gate_up_proj", "tie_params": null, "lora_rank": 16, "lora_alpha": 32, "lora_dropout": 0.05, "lora_init_b_random": false}, "training_config": null, "expert_model": "microsoft/Phi-3.5-mini-instruct"}, {"expert_name": "sentiment_analysis_and_review_classification", "class_name": "mttl.models.library.expert.ExpertInfo", "expert_task_name": null, "parent_node": null, "expert_config": {"modify_modules": ".*", "class_name": "mttl.models.modifiers.lora.LoRAConfig", "modify_layers": "qkv_proj|o_proj|down_proj|gate_up_proj", "tie_params": null, "lora_rank": 16, "lora_alpha": 32, "lora_dropout": 0.05, "lora_init_b_random": false}, "training_config": null, "expert_model": "microsoft/Phi-3.5-mini-instruct"}, {"expert_name": "creative_and_contextual_writing_prompts", "class_name": "mttl.models.library.expert.ExpertInfo", "expert_task_name": null, "parent_node": null, "expert_config": {"modify_modules": ".*", "class_name": "mttl.models.modifiers.lora.LoRAConfig", "modify_layers": "qkv_proj|o_proj|down_proj|gate_up_proj", "tie_params": null, "lora_rank": 16, "lora_alpha": 32, "lora_dropout": 0.05, "lora_init_b_random": false}, "training_config": null, "expert_model": "microsoft/Phi-3.5-mini-instruct"}, {"expert_name": "evaluating_and_comparing_sentence_meanings_and_contexts", "class_name": "mttl.models.library.expert.ExpertInfo", "expert_task_name": null, "parent_node": null, "expert_config": {"modify_modules": ".*", "class_name": "mttl.models.modifiers.lora.LoRAConfig", "modify_layers": "qkv_proj|o_proj|down_proj|gate_up_proj", "tie_params": null, "lora_rank": 16, "lora_alpha": 32, "lora_dropout": 0.05, "lora_init_b_random": false}, "training_config": null, "expert_model": "microsoft/Phi-3.5-mini-instruct"}, {"expert_name": "step-by-step_how-to_guides", "class_name": "mttl.models.library.expert.ExpertInfo", "expert_task_name": null, "parent_node": null, "expert_config": {"modify_modules": ".*", "class_name": "mttl.models.modifiers.lora.LoRAConfig", "modify_layers": "qkv_proj|o_proj|down_proj|gate_up_proj", "tie_params": null, "lora_rank": 16, "lora_alpha": 32, "lora_dropout": 0.05, "lora_init_b_random": false}, "training_config": null, "expert_model": "microsoft/Phi-3.5-mini-instruct"}], "selector_config": {"router_granularity": "*", "class_name": "mttl.models.containers.selectors.arrow_selector.ArrowSelectorConfig", "lora_merge_after": false, "selector_logging": false, "num_experts": 0, "library_id": null, "selector_data_id": null, "router_temp": 1.0, "top_k": 2, "proto_init": "arrow", "input_norm_fn": "id", "proto_norm_fn": "id"}}