{ "_name_or_path": "answerdotai/ModernBERT-base", "architectures": [ "Adapter" ], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 50281, "classifier_activation": "gelu", "classifier_bias": false, "classifier_dropout": 0.0, "classifier_pooling": "mean", "classifiers_size": [ 3, 2, 2, 2, 2, 2, 1, 2, 3, 2, 2, 2, 3, 3, 3, 3, 3, 3, 2, 2, 3, 2, 2, 2, 2, 2, 6, 2, 2, 2, 2, 2, 3, 3, 3, 3, 3, 3, 3, 2, 2, 2, 2, 3, 3, 3, 3, 3, 3, 3, 3, 2, 2, 2, 2, 2, 2, 16, 100, 13, 100, 8, 3, 3, 2, 3, 2, 4, 3, 2, 3, 2, 2, 2, 2, 2, 3, 2, 3, 2, 4, 3, 3, 3, 2, 3, 1, 2, 2, 3, 13, 2, 2, 3, 2, 2, 3, 3, 3, 3, 2, 3, 3, 2, 3, 2, 2, 2, 2, 2, 3, 4, 3, 3, 2, 2, 3, 3, 2, 2, 2, 2, 2, 4, 3, 2, 2, 2, 3, 3, 3, 2, 3 ], "cls_token_id": 50281, "decoder_bias": true, "deterministic_flash_attn": false, "embedding_dropout": 0.0, "eos_token_id": 50282, "global_attn_every_n_layers": 3, "global_rope_theta": 160000.0, "gradient_checkpointing": false, "hidden_activation": "gelu", "hidden_size": 768, "id2label": { "0": "entailment", "1": "neutral", "2": "contradiction" }, "initializer_cutoff_factor": 2.0, "initializer_range": 0.02, "intermediate_size": 1152, "label2id": { "contradiction": 2, "entailment": 0, "neutral": 1 }, "labels_list": [ [ "entailment", "neutral", "contradiction" ], [ "entailment", "not_entailment" ], [ "entailment", "not_entailment" ], [ "not_entailment", "entailment" ], [ "not_equivalent", "equivalent" ], [ "not_duplicate", "duplicate" ], [], [ "False", "True" ], [ "entailment", "contradiction", "neutral" ], [ "False", "True" ], [ "False", "True" ], [ "entailment", "not_entailment" ], [ "entailment", "neutral", "contradiction" ], [ "entailment", "neutral", "contradiction" ], [ "entailment", "neutral", "contradiction" ], [ "entailment", "neutral", "contradiction" ], [ "A_contradicts_B", "A_entails_B", "A_neutral_B" ], [ "entailment", "neutral", "contradiction" ], [ "entailment", "neutral" ], [ "entailment", "non-entailment" ], [ "entailment", "neutral", "contradiction" ], [ "not-entailed", "entailed" ], [ "not-entailed", "entailed" ], [ "not-entailed", "entailed" ], [ "not-entailed", "entailed" ], [ "not-entailed", "entailed" ], [ "1", "2", "3", "4", "5", "6" ], [ "not-entailed", "entailed" ], [ "not-entailed", "entailed" ], [ "valid", "invalid" ], [ "valid", "invalid" ], [ "valid", "invalid" ], [ "entailment", "neutral", "contradiction" ], [ "entailment", "neutral", "contradiction" ], [ 0, 1, 2 ], [ 0, 1, 2 ], [ 0, 1, 2 ], [ 0, 1, 2 ], [ 0, 1, 2 ], [ 0, 1 ], [ 0, 1 ], [ 0, 1 ], [ 0, 1 ], [ 0, 1, 2 ], [ 0, 1, 2 ], [ 0, 1, 2 ], [ 0, 1, 2 ], [ 0, 1, 2 ], [ 0, 1, 2 ], [ 0, 1, 2 ], [ 0, 1, 2 ], [ 0, 1 ], [ 0, 1 ], [ 0, 1 ], [ "not_paraphrase", "paraphrase" ], [ "unacceptable", "acceptable" ], [ "negative", "positive" ], [ "Synchrony", "Contrast", "Asynchronous", "Conjunction", "List", "Condition", "Pragmatic concession", "Restatement", "Pragmatic cause", "Alternative", "Pragmatic condition", "Pragmatic contrast", "Instantiation", "Exception", "Cause", "Concession" ], [], [ "1", "2", "3", "4", "5", "6", "7", "8", "9", "10", "11", "12", "13" ], [ "Adjustments", "Agreements", "Amendments", "Anti-Corruption Laws", "Applicable Laws", "Approvals", "Arbitration", "Assignments", "Assigns", "Authority", "Authorizations", "Base Salary", "Benefits", "Binding Effects", "Books", "Brokers", "Capitalization", "Change In Control", "Closings", "Compliance With Laws", "Confidentiality", "Consent To Jurisdiction", "Consents", "Construction", "Cooperation", "Costs", "Counterparts", "Death", "Defined Terms", "Definitions", "Disability", "Disclosures", "Duties", "Effective Dates", "Effectiveness", "Employment", "Enforceability", "Enforcements", "Entire Agreements", "Erisa", "Existence", "Expenses", "Fees", "Financial Statements", "Forfeitures", "Further Assurances", "General", "Governing Laws", "Headings", "Indemnifications", "Indemnity", "Insurances", "Integration", "Intellectual Property", "Interests", "Interpretations", "Jurisdictions", "Liens", "Litigations", "Miscellaneous", "Modifications", "No Conflicts", "No Defaults", "No Waivers", "Non-Disparagement", "Notices", "Organizations", "Participations", "Payments", "Positions", "Powers", "Publicity", "Qualifications", "Records", "Releases", "Remedies", "Representations", "Sales", "Sanctions", "Severability", "Solvency", "Specific Performance", "Submission To Jurisdiction", "Subsidiaries", "Successors", "Survival", "Tax Withholdings", "Taxes", "Terminations", "Terms", "Titles", "Transactions With Affiliates", "Use Of Proceeds", "Vacations", "Venues", "Vesting", "Waiver Of Jury Trials", "Waivers", "Warranties", "Withholdings" ], [], [ "negative", "neutral", "positive" ], [ "negative", "neutral", "positive" ], [ "False", "True" ], [ "entailment", "neutral", "contradiction" ], [ "entailment", "neutral" ], [ "contrasting", "entailment", "neutral", "reasoning" ], [ "entailment", "neutral", "contradiction" ], [ "nothate", "hate" ], [ "entailment", "neutral", "contradiction" ], [ "entailment", "neutral" ], [ "strengthener", "weakener" ], [ "strengthener", "weakener" ], [ "entailment", "neutral" ], [ "entailment", "neutral" ], [ "entailment", "neutral", "contradiction" ], [ "contradiction", "entailment" ], [ "entailment", "neutral", "contradiction" ], [ "entailment", "not_entailment" ], [ "entailment", "non-entailment", "not entailment - contradiction", "not entailment - unknown" ], [ "entailment", "neutral", "contradiction" ], [ "entailment", "neutral", "contradiction" ], [ "entailment", "neutral", "contradiction" ], [ "False", "True" ], [ "entailment", "neutral", "contradiction" ], [], [ "entailment", "not-entailment" ], [ "entailment", "not_entailment" ], [ "entailment", "neutral", "contradiction" ], [ "ad hominem", "ad populum", "appeal to emotion", "circular reasoning", "equivocation", "fallacy of credibility", "fallacy of extension", "fallacy of logic", "fallacy of relevance", "false causality", "false dilemma", "faulty generalization", "intentional" ], [ "no", "yes" ], [ false, true ], [ "entailment", "neutral", "contradiction" ], [ "entailment", "neutral" ], [ "entailment", "neutral" ], [ "entailment", "neutral", "contradiction" ], [ "entailment", "neutral", "contradiction" ], [ "DISPROVED", "PROVED", "UNKNOWN" ], [ "DISPROVED", "PROVED", "UNKNOWN" ], [ "entailment", "not_entailment" ], [ "contradict", "neutral", "support" ], [ "entailment", "neutral", "contradiction" ], [ "contradiction", "entailment" ], [ "entailment", "neutral", "contradiction" ], [ "entailment", "not_entailment" ], [ "False", "True" ], [ "entailment", "not entailment" ], [ "False", "True" ], [ "entailment", "not entailment" ], [ "entailment", "neutral", "contradiction" ], [ "contradiction", "entailment", "neutral", "self_contradiction" ], [ "contradiction", "entailment", "neutral" ], [ "contradiction", "entailment", "neutral" ], [ "Contradiction", "Entailment" ], [ "entailment", "not-entailment" ], [ "entailment", "neutral", "contradiction" ], [ "entailment", "neutral", "contradiction" ], [ "entailment", "not_entailment" ], [ "entailment", "non_entailment" ], [ "consistent", "inconsistent" ], [ "entailment", "not_entailment" ], [ "entailment", "not_entailment" ], [ "contrasting", "entailment", "neutral", "reasoning" ], [ "entailment", "neutral", "contradiction" ], [ "No", "Yes" ], [ "No.", "Yes." ], [ "entailment", "not_entailment" ], [ "entailment", "neutral", "contradiction" ], [ "entailment", "neutral", "contradiction" ], [ "entailment", "neutral", "contradiction" ], [ "not-entailed", "entailed" ], [ 0, 1, 2 ] ], "layer_norm_eps": 1e-05, "local_attention": 128, "local_rope_theta": 10000.0, "max_position_embeddings": 2048, "mlp_bias": false, "mlp_dropout": 0.0, "model_type": "modernbert", "norm_bias": false, "norm_eps": 1e-05, "num_attention_heads": 12, "num_hidden_layers": 22, "pad_token_id": 50283, "position_embedding_type": "absolute", "problem_type": "single_label_classification", "reference_compile": true, "sep_token_id": 50282, "sparse_pred_ignore_index": -100, "sparse_prediction": false, "tasks": [ "glue/mnli", "glue/qnli", "glue/rte", "glue/wnli", "glue/mrpc", "glue/qqp", "glue/stsb", "super_glue/boolq", "super_glue/cb", "super_glue/multirc", "super_glue/wic", "super_glue/axg", "anli/a1", "anli/a2", "anli/a3", "sick/label", "sick/entailment_AB", "snli", "scitail/snli_format", "hans", "WANLI", "recast/recast_ner", "recast/recast_sentiment", "recast/recast_verbnet", "recast/recast_megaveridicality", "recast/recast_verbcorner", "recast/recast_kg_relations", "recast/recast_factuality", "recast/recast_puns", "probability_words_nli/reasoning_1hop", "probability_words_nli/usnli", "probability_words_nli/reasoning_2hop", "nan-nli", "nli_fever", "breaking_nli", "conj_nli", "fracas", "dialogue_nli", "mpe", "dnc", "recast_white/fnplus", "recast_white/sprl", "recast_white/dpr", "robust_nli/IS_CS", "robust_nli/LI_LI", "robust_nli/ST_WO", "robust_nli/PI_SP", "robust_nli/PI_CD", "robust_nli/ST_SE", "robust_nli/ST_NE", "robust_nli/ST_LM", "robust_nli_is_sd", "robust_nli_li_ts", "add_one_rte", "paws/labeled_final", "glue/cola", "glue/sst2", "pragmeval/pdtb", "lex_glue/eurlex", "lex_glue/scotus", "lex_glue/ledgar", "lex_glue/unfair_tos", "dynasent/dynabench.dynasent.r1.all/r1", "dynasent/dynabench.dynasent.r2.all/r2", "cycic_classification", "lingnli", "monotonicity-entailment", "scinli", "naturallogic", "dynahate", "syntactic-augmentation-nli", "autotnli", "defeasible-nli/atomic", "defeasible-nli/snli", "help-nli", "nli-veridicality-transitivity", "lonli", "dadc-limit-nli", "folio", "tomi-nli", "puzzte", "temporal-nli", "counterfactually-augmented-snli", "cnli", "boolq-natural-perturbations", "equate", "chaos-mnli-ambiguity", "logiqa-2.0-nli", "mindgames", "ConTRoL-nli", "logical-fallacy", "cladder", "conceptrules_v2", "zero-shot-label-nli", "scone", "monli", "SpaceNLI", "propsegment/nli", "FLD.v2/default", "FLD.v2/star", "SDOH-NLI", "scifact_entailment", "AdjectiveScaleProbe-nli", "resnli", "semantic_fragments_nli", "dataset_train_nli", "nlgraph", "ruletaker", "PARARULE-Plus", "logical-entailment", "nope", "LogicNLI", "contract-nli/contractnli_a/seg", "contract-nli/contractnli_b/full", "nli4ct_semeval2024", "biosift-nli", "SIGA-nli", "FOL-nli", "doc-nli", "mctest-nli", "natural-language-satisfiability", "idioms-nli", "lifecycle-entailment", "MSciNLI", "hover-3way/nli", "seahorse_summarization_evaluation", "missing-item-prediction/contrastive", "Pol_NLI", "synthetic-retrieval-NLI/count", "synthetic-retrieval-NLI/position", "synthetic-retrieval-NLI/binary", "babi_nli", "gen_debiased_nli" ], "torch_dtype": "float32", "transformers_version": "4.48.0.dev0", "vocab_size": 50368 }