{ "lr_encoder": 1e-5, "lr_others": 1e-4, "weight_decay_encoder": 0.01, "weight_decay_other": 0.01, "num_steps": 500000, "warmup_ratio": 0.1, "train_batch_size": 8, "eval_every": 15000, "gradient_accumulation": 8, "eval_batch_size": 32, "num_layers_freeze": null, "early_stopping_patience": null, "early_stopping_delta": 0.0, "save_at": [ 15000, 30000, 45000, 60000, 75000, 90000, 105000, 120000, 135000, 150000, 165000, 180000, 195000, 210000, 225000, 240000, 255000, 270000, 285000, 300000, 315000, 330000, 345000, 360000, 375000, 390000, 405000, 420000, 435000, 450000, 465000, 480000, 495000, 500000 ], "max_saves": 8, "max_width": 6, "model_name": "microsoft/deberta-v3-large", "fine_tune": true, "subtoken_pooling": "first", "hidden_size": 768, "scorer": "dot", "rel_mode": "marker", "span_marker_mode": "markerv1", "refine_prompt": false, "refine_relation": false, "ffn_mul": 4, "dropout": 0.4, "scheduler": "cosine_with_warmup", "loss_func": "binary_cross_entropy_loss", "alpha": 0.6, "gamma": 3, "label_embed_strategy": "both", "use_typed_relations": true, "consistency_loss_weight": 0.1, "enable_ner_module": true, "ner_threshold": 0.5, "ner_fn_loss_weight": 1.5, "ner_loss_weight": 100.0, "rel_loss_weight": 1.0, "ner_threshold_offset": -0.02, "training_phase": "ner_only", "span_f1_target": 0.7, "relation_f1_target": 0.7, "coref_classifier": false, "coref_loss_weight": 10.0, "coreference_label": null, "dataset_name": "custom", "root_dir": "multi_domain", "train_data": [ "data/multi_domain_train_processed.jsonl" ], "eval_data": [ "data/multi_domain_test_processed.jsonl" ], "prev_path": "./ner-glirel-log/saved_at/model_60000", "size_sup": -1, "num_train_rel_types": 40, "num_unseen_rel_types": 15, "top_k": 1, "random_drop": false, "max_len": 512, "eval_threshold": [ 0.1, 0.2, 0.3, 0.5, 0.6, 0.7 ], "max_entity_pair_distance": null, "fixed_relation_types": false, "name": "large", "log_dir": "ner-glirel-log-2/" }