You signed in with another tab or window. Reload to refresh your session.You signed out in another tab or window. Reload to refresh your session.You switched accounts on another tab or window. Reload to refresh your session.Dismiss alert
from mplm_sim import Loader

# Load existing results given model_name and corpus_name
loader = Loader.from_pretrained(model_name='cis-lmu/glot500-base', corpus_name='flores200')

# Or load results from a similarity file
# loader = Loader.from_tsv('your_similarity_file.tsv')

# Get the similarity for a language pair
# using iso3_script codes
sim = loader.get_sim('eng_Latn', 'cmn_Hani')
# or using language names
sim = loader.get_sim('English', 'Chinese')
Executor
from mplm_sim import Executor

# model_name: any text/speech language model supported by Hugging Face
# corpus_name: specific corpus name used for saving results
# corpus_path: path to the multi-parallel corpora; see corpora_demo for file formatting
# corpus_type: text or speech
executor = Executor(model_name='cis-lmu/glot500-base', corpus_name='own',
                    corpus_path='corpora/own', corpus_type='text')

# Run
executor.run()
Citation
@article{DBLP:journals/corr/abs-2305-13684,
author = {Peiqin Lin and
Chengzhi Hu and
Zheyu Zhang and
Andr{\'{e}} F. T. Martins and
Hinrich Sch{\"{u}}tze},
title = {mPLM-Sim: Unveiling Better Cross-Lingual Similarity and Transfer in
Multilingual Pretrained Language Models},
journal = {CoRR},
volume = {abs/2305.13684},
year = {2023},
url = {https://doi.org/10.48550/arXiv.2305.13684},
doi = {10.48550/ARXIV.2305.13684},
eprinttype = {arXiv},
eprint = {2305.13684},
timestamp = {Mon, 05 Jun 2023 15:42:15 +0200},
biburl = {https://dblp.org/rec/journals/corr/abs-2305-13684.bib},
bibsource = {dblp computer science bibliography, https://dblp.org}
}
About
mPLM-Sim: Better Cross-Lingual Similarity and Transfer in Multilingual Pretrained Language Models