Edit on GitHub

model = AutoAdapterModel.from_pretrained("bert-base-multilingual-cased")
config = AdapterConfig.load("pfeiffer", non_linearity="gelu", reduction_factor=2)
model.load_adapter("hu/wiki@ukp", config=config)

Description

Properties

Pre-trained model
bert-base-multilingual-cased
Adapter type
Prediction Head
  Yes
Task
Hungarian
Dataset

Architecture

Name
pfeiffer
Non-linearity
gelu
Reduction factor
2
{
  "ln_after": false,
  "ln_before": false,
  "mh_adapter": false,
  "output_adapter": true,
  "adapter_residual_before_ln": false,
  "non_linearity": "gelu",
  "original_ln_after": true,
  "original_ln_before": true,
  "reduction_factor": 2,
  "residual_before_ln": true
}

Author

  Name
Jonas Pfeiffer
  E-Mail
  GitHub
  Twitter

Versions

Identifier Comment Score Download
1 DEFAULT

Citations

Adapter
@inproceedings{pfeiffer20madx,
  title = "{MAD-X}: {A}n {A}dapter-{B}ased {F}ramework for {M}ulti-{T}ask {C}ross-{L}ingual {T}ransfer",
  author = "Pfeiffer, Jonas  and
    Vuli{\'c}, Ivan  and
    Gurevych, Iryna  and
    Ruder, Sebastian",
  booktitle = "Proceedings of the 2020 Conference on Empirical Methods in Natural Language Processing (EMNLP)",
  year = "2020",
  address = "Online",
  publisher = "Association for Computational Linguistics",
  url = "https://www.aclweb.org/anthology/2020.emnlp-main.617",
  pages = "7654--7673",
}
Architecture
@misc{pfeiffer2020adapterfusion,
  title={AdapterFusion: Non-Destructive Task Composition for Transfer Learning},
  author={Jonas Pfeiffer and Aishwarya Kamath and Andreas Rücklé and Kyunghyun Cho and Iryna Gurevych},
  year={2020},
  eprint={2005.00247},
  archivePrefix={arXiv},
  primaryClass={cs.CL}
}