| { |
| "_name_or_path": "answerdotai/ModernBERT-large", |
| "architectures": [ |
| "Adapter" |
| ], |
| "attention_bias": false, |
| "attention_dropout": 0.0, |
| "bos_token_id": 50281, |
| "classifier_activation": "gelu", |
| "classifier_bias": false, |
| "classifier_dropout": 0.0, |
| "classifier_pooling": "mean", |
| "classifiers_size": [ |
| 3, |
| 2, |
| 2, |
| 2, |
| 2, |
| 2, |
| 1, |
| 2, |
| 3, |
| 2, |
| 2, |
| 2, |
| 3, |
| 3, |
| 3, |
| 3, |
| 3, |
| 3, |
| 2, |
| 2, |
| 3, |
| 2, |
| 2, |
| 2, |
| 2, |
| 2, |
| 6, |
| 2, |
| 2, |
| 2, |
| 2, |
| 2, |
| 3, |
| 3, |
| 3, |
| 3, |
| 3, |
| 3, |
| 3, |
| 2, |
| 2, |
| 2, |
| 2, |
| 3, |
| 3, |
| 3, |
| 3, |
| 3, |
| 3, |
| 3, |
| 3, |
| 2, |
| 2, |
| 2, |
| 2, |
| 2, |
| 2, |
| 16, |
| 100, |
| 13, |
| 100, |
| 8, |
| 3, |
| 3, |
| 2, |
| 3, |
| 2, |
| 4, |
| 3, |
| 2, |
| 3, |
| 2, |
| 2, |
| 2, |
| 2, |
| 2, |
| 3, |
| 2, |
| 3, |
| 2, |
| 4, |
| 3, |
| 3, |
| 3, |
| 2, |
| 3, |
| 1, |
| 2, |
| 2, |
| 3, |
| 13, |
| 2, |
| 2, |
| 3, |
| 2, |
| 2, |
| 3, |
| 3, |
| 3, |
| 3, |
| 2, |
| 3, |
| 2, |
| 3, |
| 2, |
| 3, |
| 2, |
| 2, |
| 2, |
| 2, |
| 2, |
| 3, |
| 4, |
| 3, |
| 3, |
| 2, |
| 2, |
| 3, |
| 3, |
| 2, |
| 2, |
| 2, |
| 2, |
| 2, |
| 4, |
| 3, |
| 2, |
| 2, |
| 2, |
| 3, |
| 3, |
| 3, |
| 2, |
| 3 |
| ], |
| "cls_token_id": 50281, |
| "decoder_bias": true, |
| "deterministic_flash_attn": false, |
| "embedding_dropout": 0.0, |
| "eos_token_id": 50282, |
| "global_attn_every_n_layers": 3, |
| "global_rope_theta": 160000.0, |
| "gradient_checkpointing": false, |
| "hidden_activation": "gelu", |
| "hidden_size": 1024, |
| "id2label": { |
| "0": "entailment", |
| "1": "neutral", |
| "2": "contradiction" |
| }, |
| "initializer_cutoff_factor": 2.0, |
| "initializer_range": 0.02, |
| "intermediate_size": 2624, |
| "label2id": { |
| "contradiction": 2, |
| "entailment": 0, |
| "neutral": 1 |
| }, |
| "labels_list": [ |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| "entailment", |
| "not_entailment" |
| ], |
| [ |
| "entailment", |
| "not_entailment" |
| ], |
| [ |
| "not_entailment", |
| "entailment" |
| ], |
| [ |
| "not_equivalent", |
| "equivalent" |
| ], |
| [ |
| "not_duplicate", |
| "duplicate" |
| ], |
| [], |
| [ |
| "False", |
| "True" |
| ], |
| [ |
| "entailment", |
| "contradiction", |
| "neutral" |
| ], |
| [ |
| "False", |
| "True" |
| ], |
| [ |
| "False", |
| "True" |
| ], |
| [ |
| "entailment", |
| "not_entailment" |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| "A_contradicts_B", |
| "A_entails_B", |
| "A_neutral_B" |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| "entailment", |
| "neutral" |
| ], |
| [ |
| "entailment", |
| "non-entailment" |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| "not-entailed", |
| "entailed" |
| ], |
| [ |
| "not-entailed", |
| "entailed" |
| ], |
| [ |
| "not-entailed", |
| "entailed" |
| ], |
| [ |
| "not-entailed", |
| "entailed" |
| ], |
| [ |
| "not-entailed", |
| "entailed" |
| ], |
| [ |
| "1", |
| "2", |
| "3", |
| "4", |
| "5", |
| "6" |
| ], |
| [ |
| "not-entailed", |
| "entailed" |
| ], |
| [ |
| "not-entailed", |
| "entailed" |
| ], |
| [ |
| "valid", |
| "invalid" |
| ], |
| [ |
| "valid", |
| "invalid" |
| ], |
| [ |
| "valid", |
| "invalid" |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| 0, |
| 1, |
| 2 |
| ], |
| [ |
| 0, |
| 1, |
| 2 |
| ], |
| [ |
| 0, |
| 1, |
| 2 |
| ], |
| [ |
| 0, |
| 1, |
| 2 |
| ], |
| [ |
| 0, |
| 1, |
| 2 |
| ], |
| [ |
| 0, |
| 1 |
| ], |
| [ |
| 0, |
| 1 |
| ], |
| [ |
| 0, |
| 1 |
| ], |
| [ |
| 0, |
| 1 |
| ], |
| [ |
| 0, |
| 1, |
| 2 |
| ], |
| [ |
| 0, |
| 1, |
| 2 |
| ], |
| [ |
| 0, |
| 1, |
| 2 |
| ], |
| [ |
| 0, |
| 1, |
| 2 |
| ], |
| [ |
| 0, |
| 1, |
| 2 |
| ], |
| [ |
| 0, |
| 1, |
| 2 |
| ], |
| [ |
| 0, |
| 1, |
| 2 |
| ], |
| [ |
| 0, |
| 1, |
| 2 |
| ], |
| [ |
| 0, |
| 1 |
| ], |
| [ |
| 0, |
| 1 |
| ], |
| [ |
| 0, |
| 1 |
| ], |
| [ |
| "not_paraphrase", |
| "paraphrase" |
| ], |
| [ |
| "unacceptable", |
| "acceptable" |
| ], |
| [ |
| "negative", |
| "positive" |
| ], |
| [ |
| "Synchrony", |
| "Contrast", |
| "Asynchronous", |
| "Conjunction", |
| "List", |
| "Condition", |
| "Pragmatic concession", |
| "Restatement", |
| "Pragmatic cause", |
| "Alternative", |
| "Pragmatic condition", |
| "Pragmatic contrast", |
| "Instantiation", |
| "Exception", |
| "Cause", |
| "Concession" |
| ], |
| [], |
| [ |
| "1", |
| "2", |
| "3", |
| "4", |
| "5", |
| "6", |
| "7", |
| "8", |
| "9", |
| "10", |
| "11", |
| "12", |
| "13" |
| ], |
| [ |
| "Adjustments", |
| "Agreements", |
| "Amendments", |
| "Anti-Corruption Laws", |
| "Applicable Laws", |
| "Approvals", |
| "Arbitration", |
| "Assignments", |
| "Assigns", |
| "Authority", |
| "Authorizations", |
| "Base Salary", |
| "Benefits", |
| "Binding Effects", |
| "Books", |
| "Brokers", |
| "Capitalization", |
| "Change In Control", |
| "Closings", |
| "Compliance With Laws", |
| "Confidentiality", |
| "Consent To Jurisdiction", |
| "Consents", |
| "Construction", |
| "Cooperation", |
| "Costs", |
| "Counterparts", |
| "Death", |
| "Defined Terms", |
| "Definitions", |
| "Disability", |
| "Disclosures", |
| "Duties", |
| "Effective Dates", |
| "Effectiveness", |
| "Employment", |
| "Enforceability", |
| "Enforcements", |
| "Entire Agreements", |
| "Erisa", |
| "Existence", |
| "Expenses", |
| "Fees", |
| "Financial Statements", |
| "Forfeitures", |
| "Further Assurances", |
| "General", |
| "Governing Laws", |
| "Headings", |
| "Indemnifications", |
| "Indemnity", |
| "Insurances", |
| "Integration", |
| "Intellectual Property", |
| "Interests", |
| "Interpretations", |
| "Jurisdictions", |
| "Liens", |
| "Litigations", |
| "Miscellaneous", |
| "Modifications", |
| "No Conflicts", |
| "No Defaults", |
| "No Waivers", |
| "Non-Disparagement", |
| "Notices", |
| "Organizations", |
| "Participations", |
| "Payments", |
| "Positions", |
| "Powers", |
| "Publicity", |
| "Qualifications", |
| "Records", |
| "Releases", |
| "Remedies", |
| "Representations", |
| "Sales", |
| "Sanctions", |
| "Severability", |
| "Solvency", |
| "Specific Performance", |
| "Submission To Jurisdiction", |
| "Subsidiaries", |
| "Successors", |
| "Survival", |
| "Tax Withholdings", |
| "Taxes", |
| "Terminations", |
| "Terms", |
| "Titles", |
| "Transactions With Affiliates", |
| "Use Of Proceeds", |
| "Vacations", |
| "Venues", |
| "Vesting", |
| "Waiver Of Jury Trials", |
| "Waivers", |
| "Warranties", |
| "Withholdings" |
| ], |
| [], |
| [ |
| "negative", |
| "neutral", |
| "positive" |
| ], |
| [ |
| "negative", |
| "neutral", |
| "positive" |
| ], |
| [ |
| "False", |
| "True" |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| "entailment", |
| "neutral" |
| ], |
| [ |
| "contrasting", |
| "entailment", |
| "neutral", |
| "reasoning" |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| "nothate", |
| "hate" |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| "entailment", |
| "neutral" |
| ], |
| [ |
| "strengthener", |
| "weakener" |
| ], |
| [ |
| "strengthener", |
| "weakener" |
| ], |
| [ |
| "entailment", |
| "neutral" |
| ], |
| [ |
| "entailment", |
| "neutral" |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| "contradiction", |
| "entailment" |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| "entailment", |
| "not_entailment" |
| ], |
| [ |
| "entailment", |
| "non-entailment", |
| "not entailment - contradiction", |
| "not entailment - unknown" |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| "False", |
| "True" |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [], |
| [ |
| "entailment", |
| "not-entailment" |
| ], |
| [ |
| "entailment", |
| "not_entailment" |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| "ad hominem", |
| "ad populum", |
| "appeal to emotion", |
| "circular reasoning", |
| "equivocation", |
| "fallacy of credibility", |
| "fallacy of extension", |
| "fallacy of logic", |
| "fallacy of relevance", |
| "false causality", |
| "false dilemma", |
| "faulty generalization", |
| "intentional" |
| ], |
| [ |
| "no", |
| "yes" |
| ], |
| [ |
| false, |
| true |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| "entailment", |
| "neutral" |
| ], |
| [ |
| "entailment", |
| "neutral" |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| "DISPROVED", |
| "PROVED", |
| "UNKNOWN" |
| ], |
| [ |
| "DISPROVED", |
| "PROVED", |
| "UNKNOWN" |
| ], |
| [ |
| "entailment", |
| "not_entailment" |
| ], |
| [ |
| "contradict", |
| "neutral", |
| "support" |
| ], |
| [ |
| false, |
| true |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| "contradiction", |
| "entailment" |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| "entailment", |
| "not_entailment" |
| ], |
| [ |
| "False", |
| "True" |
| ], |
| [ |
| "entailment", |
| "not entailment" |
| ], |
| [ |
| "False", |
| "True" |
| ], |
| [ |
| "entailment", |
| "not entailment" |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| "contradiction", |
| "entailment", |
| "neutral", |
| "self_contradiction" |
| ], |
| [ |
| "contradiction", |
| "entailment", |
| "neutral" |
| ], |
| [ |
| "contradiction", |
| "entailment", |
| "neutral" |
| ], |
| [ |
| "Contradiction", |
| "Entailment" |
| ], |
| [ |
| "entailment", |
| "not-entailment" |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| "entailment", |
| "not_entailment" |
| ], |
| [ |
| "entailment", |
| "non_entailment" |
| ], |
| [ |
| "consistent", |
| "inconsistent" |
| ], |
| [ |
| "entailment", |
| "not_entailment" |
| ], |
| [ |
| "entailment", |
| "not_entailment" |
| ], |
| [ |
| "contrasting", |
| "entailment", |
| "neutral", |
| "reasoning" |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| "No", |
| "Yes" |
| ], |
| [ |
| "No.", |
| "Yes." |
| ], |
| [ |
| "entailment", |
| "not_entailment" |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| "entailment", |
| "neutral", |
| "contradiction" |
| ], |
| [ |
| "not-entailed", |
| "entailed" |
| ], |
| [ |
| 0, |
| 1, |
| 2 |
| ] |
| ], |
| "layer_norm_eps": 1e-05, |
| "local_attention": 128, |
| "local_rope_theta": 10000.0, |
| "max_position_embeddings": 2048, |
| "mlp_bias": false, |
| "mlp_dropout": 0.0, |
| "model_type": "modernbert", |
| "norm_bias": false, |
| "norm_eps": 1e-05, |
| "num_attention_heads": 16, |
| "num_hidden_layers": 28, |
| "pad_token_id": 50283, |
| "position_embedding_type": "absolute", |
| "problem_type": "single_label_classification", |
| "reference_compile": true, |
| "sep_token_id": 50282, |
| "sparse_pred_ignore_index": -100, |
| "sparse_prediction": false, |
| "tasks": [ |
| "glue/mnli", |
| "glue/qnli", |
| "glue/rte", |
| "glue/wnli", |
| "glue/mrpc", |
| "glue/qqp", |
| "glue/stsb", |
| "super_glue/boolq", |
| "super_glue/cb", |
| "super_glue/multirc", |
| "super_glue/wic", |
| "super_glue/axg", |
| "anli/a1", |
| "anli/a2", |
| "anli/a3", |
| "sick/label", |
| "sick/entailment_AB", |
| "snli", |
| "scitail/snli_format", |
| "hans", |
| "WANLI", |
| "recast/recast_ner", |
| "recast/recast_sentiment", |
| "recast/recast_verbnet", |
| "recast/recast_megaveridicality", |
| "recast/recast_verbcorner", |
| "recast/recast_kg_relations", |
| "recast/recast_factuality", |
| "recast/recast_puns", |
| "probability_words_nli/reasoning_1hop", |
| "probability_words_nli/usnli", |
| "probability_words_nli/reasoning_2hop", |
| "nan-nli", |
| "nli_fever", |
| "breaking_nli", |
| "conj_nli", |
| "fracas", |
| "dialogue_nli", |
| "mpe", |
| "dnc", |
| "recast_white/fnplus", |
| "recast_white/sprl", |
| "recast_white/dpr", |
| "robust_nli/IS_CS", |
| "robust_nli/LI_LI", |
| "robust_nli/ST_WO", |
| "robust_nli/PI_SP", |
| "robust_nli/PI_CD", |
| "robust_nli/ST_SE", |
| "robust_nli/ST_NE", |
| "robust_nli/ST_LM", |
| "robust_nli_is_sd", |
| "robust_nli_li_ts", |
| "add_one_rte", |
| "paws/labeled_final", |
| "glue/cola", |
| "glue/sst2", |
| "pragmeval/pdtb", |
| "lex_glue/eurlex", |
| "lex_glue/scotus", |
| "lex_glue/ledgar", |
| "lex_glue/unfair_tos", |
| "dynasent/dynabench.dynasent.r1.all/r1", |
| "dynasent/dynabench.dynasent.r2.all/r2", |
| "cycic_classification", |
| "lingnli", |
| "monotonicity-entailment", |
| "scinli", |
| "naturallogic", |
| "dynahate", |
| "syntactic-augmentation-nli", |
| "autotnli", |
| "defeasible-nli/atomic", |
| "defeasible-nli/snli", |
| "help-nli", |
| "nli-veridicality-transitivity", |
| "lonli", |
| "dadc-limit-nli", |
| "folio", |
| "tomi-nli", |
| "puzzte", |
| "temporal-nli", |
| "counterfactually-augmented-snli", |
| "cnli", |
| "boolq-natural-perturbations", |
| "equate", |
| "chaos-mnli-ambiguity", |
| "logiqa-2.0-nli", |
| "mindgames", |
| "ConTRoL-nli", |
| "logical-fallacy", |
| "cladder", |
| "conceptrules_v2", |
| "zero-shot-label-nli", |
| "scone", |
| "monli", |
| "SpaceNLI", |
| "propsegment/nli", |
| "FLD.v2/default", |
| "FLD.v2/star", |
| "SDOH-NLI", |
| "scifact_entailment", |
| "feasibilityQA", |
| "AdjectiveScaleProbe-nli", |
| "resnli", |
| "semantic_fragments_nli", |
| "dataset_train_nli", |
| "nlgraph", |
| "ruletaker", |
| "PARARULE-Plus", |
| "logical-entailment", |
| "nope", |
| "LogicNLI", |
| "contract-nli/contractnli_a/seg", |
| "contract-nli/contractnli_b/full", |
| "nli4ct_semeval2024", |
| "biosift-nli", |
| "SIGA-nli", |
| "FOL-nli", |
| "doc-nli", |
| "mctest-nli", |
| "natural-language-satisfiability", |
| "idioms-nli", |
| "lifecycle-entailment", |
| "MSciNLI", |
| "hover-3way/nli", |
| "seahorse_summarization_evaluation", |
| "missing-item-prediction/contrastive", |
| "Pol_NLI", |
| "synthetic-retrieval-NLI/count", |
| "synthetic-retrieval-NLI/position", |
| "synthetic-retrieval-NLI/binary", |
| "babi_nli", |
| "gen_debiased_nli" |
| ], |
| "torch_dtype": "float32", |
| "transformers_version": "4.48.0.dev0", |
| "vocab_size": 50368 |
| } |
|
|