% Bibliography database.
%
% Conventions used in this file:
%   - one field per line, author names in "Last, First" form;
%   - titles stored in Title Case, with braces around words whose
%     capitalisation must survive sentence-casing styles;
%   - arXiv-only works are typed as misc and identified through
%     eprint / archivePrefix / primaryClass rather than a fake journal name;
%   - venues that occur more than once are defined once as string macros.
%
% Citation keys are referenced from the documents that use this file and
% must not be renamed.

@string{neurips   = {Advances in Neural Information Processing Systems}}
@string{procnaacl = {Proceedings of {NAACL}}}
@string{prociclr  = {Proceedings of {ICLR}}}

% ---------------------------------------------------------------------------
% Analogy and structure mapping
% ---------------------------------------------------------------------------

@article{Gentner1983,
  author  = {Gentner, Dedre},
  title   = {Structure-Mapping: A Theoretical Framework for Analogy},
  journal = {Cognitive Science},
  year    = {1983},
  volume  = {7},
  number  = {2},
  pages   = {155--170},
}

@book{Holyoak1995,
  author    = {Holyoak, Keith J. and Thagard, Paul},
  title     = {Mental Leaps: Analogy in Creative Thought},
  publisher = {MIT Press},
  year      = {1995},
}

@article{Falkenhainer1989,
  author  = {Falkenhainer, Brian and Forbus, Kenneth D. and Gentner, Dedre},
  title   = {The Structure-Mapping Engine: Algorithm and Examples},
  journal = {Artificial Intelligence},
  year    = {1989},
  volume  = {41},
  number  = {1},
  pages   = {1--63},
}

% ---------------------------------------------------------------------------
% Constrained and controlled decoding
% ---------------------------------------------------------------------------

@inproceedings{Hokamp2017,
  author    = {Hokamp, Chris and Liu, Qun},
  title     = {Lexically Constrained Decoding for Sequence Generation Using Grid Beam Search},
  booktitle = {Proceedings of {ACL}},
  year      = {2017},
  pages     = {1535--1546},
}

@inproceedings{Anderson2017,
  author    = {Anderson, Peter and Fernando, Basura and Johnson, Mark and Gould, Stephen},
  title     = {Guided Open Vocabulary Image Captioning with Constrained Beam Search},
  booktitle = {Proceedings of {EMNLP}},
  year      = {2017},
  pages     = {936--945},
}

% NOTE(review): the fields of Lu2022 do not appear to describe a single paper.
% The title looks like the NAACL 2021 paper by Lu, West, Zellers, Le Bras,
% Bhagavatula and Choi, whereas the year and the co-author Welleck resemble
% the NAACL 2022 follow-up "NeuroLogic A*esque Decoding". Confirm which work
% is being cited and correct author, year and pages accordingly. The data is
% left as found (only formatting and title brace protection were changed).
@inproceedings{Lu2022,
  author    = {Lu, Ximing and Welleck, Sean and Hessel, Jack and Choi, Yejin},
  title     = {{NeuroLogic} Decoding: {(Un)supervised} Neural Text Generation with Predicate Logic Constraints},
  booktitle = procnaacl,
  year      = {2022},
  pages     = {2373--2387},
}

@inproceedings{Dathathri2020,
  author    = {Dathathri, Sumanth and Madotto, Andrea and Lan, Janice and Hung, Jane
               and Frank, Eric and Molino, Piero and Yosinski, Jason and Liu, Rosanne},
  title     = {Plug and Play Language Models: A Simple Approach to Controlled Text Generation},
  booktitle = prociclr,
  year      = {2020},
}

% ---------------------------------------------------------------------------
% Information theory
% ---------------------------------------------------------------------------

@article{Shannon1948,
  author  = {Shannon, Claude E.},
  title   = {A Mathematical Theory of Communication},
  journal = {Bell System Technical Journal},
  year    = {1948},
  volume  = {27},
  pages   = {379--423, 623--656},
}

@article{Kullback1951,
  author  = {Kullback, Solomon and Leibler, Richard A.},
  title   = {On Information and Sufficiency},
  journal = {Annals of Mathematical Statistics},
  year    = {1951},
  volume  = {22},
  number  = {1},
  pages   = {79--86},
}

@article{Lin1991,
  author  = {Lin, Jianhua},
  title   = {Divergence Measures Based on the {Shannon} Entropy},
  journal = {IEEE Transactions on Information Theory},
  year    = {1991},
  volume  = {37},
  number  = {1},
  pages   = {145--151},
}

% ---------------------------------------------------------------------------
% Word embeddings and cross-lingual representations
% ---------------------------------------------------------------------------

@inproceedings{Mikolov2013,
  author    = {Mikolov, Tomas and Sutskever, Ilya and Chen, Kai and Corrado, Greg and Dean, Jeffrey},
  title     = {Distributed Representations of Words and Phrases and their Compositionality},
  booktitle = neurips,
  year      = {2013},
  pages     = {3111--3119},
}

@inproceedings{Conneau2018,
  author    = {Conneau, Alexis and Lample, Guillaume and Ranzato, Marc'Aurelio
               and Denoyer, Ludovic and J{\'e}gou, Herv{\'e}},
  title     = {Word Translation Without Parallel Data},
  booktitle = prociclr,
  year      = {2018},
}

@inproceedings{Devlin2019,
  author    = {Devlin, Jacob and Chang, Ming{-}Wei and Lee, Kenton and Toutanova, Kristina},
  title     = {{BERT}: Pre-training of Deep Bidirectional Transformers for Language Understanding},
  booktitle = procnaacl,
  year      = {2019},
  pages     = {4171--4186},
}

@article{Ruder2019,
  author  = {Ruder, Sebastian and Vuli{\'c}, Ivan and S{\o}gaard, Anders},
  title   = {A Survey of Cross-Lingual Word Embedding Models},
  journal = {Journal of Artificial Intelligence Research},
  year    = {2019},
  volume  = {65},
  pages   = {569--631},
}

% ---------------------------------------------------------------------------
% Large language models
% ---------------------------------------------------------------------------

% Typed as inproceedings (not article) so that it agrees with the other
% entry from the same proceedings series, Mikolov2013.
@inproceedings{Brown2020,
  author    = {Brown, Tom B. and Mann, Benjamin and Ryder, Nick and Subbiah, Melanie
               and Kaplan, Jared and Dhariwal, Prafulla and Neelakantan, Arvind
               and Shyam, Pranav and Sastry, Girish and Askell, Amanda and others},
  title     = {Language Models are Few-Shot Learners},
  booktitle = neurips,
  year      = {2020},
  volume    = {33},
  pages     = {1877--1901},
}

% Typed as inproceedings (not article) so that it agrees with the other
% entry from the same proceedings series, Mikolov2013.
@inproceedings{Ouyang2022,
  author    = {Ouyang, Long and Wu, Jeff and Jiang, Xu and Almeida, Diogo
               and Wainwright, Carroll L. and Mishkin, Pamela and Zhang, Chong
               and Agarwal, Sandhini and Slama, Katarina and Ray, Alex and others},
  title     = {Training Language Models to Follow Instructions with Human Feedback},
  booktitle = neurips,
  year      = {2022},
  volume    = {35},
  pages     = {27730--27744},
}

% The author list is that of arXiv:2302.13971 (the first LLaMA paper, which
% is what the title and identifier refer to), not that of the later Llama 2
% paper (arXiv:2307.09288).
@misc{Touvron2023,
  author        = {Touvron, Hugo and Lavril, Thibaut and Izacard, Gautier and Martinet, Xavier
                   and Lachaux, Marie-Anne and Lacroix, Timoth{\'e}e and Rozi{\`e}re, Baptiste
                   and Goyal, Naman and Hambro, Eric and Azhar, Faisal and Rodriguez, Aurelien
                   and Joulin, Armand and Grave, Edouard and Lample, Guillaume},
  title         = {{LLaMA}: Open and Efficient Foundation Language Models},
  year          = {2023},
  eprint        = {2302.13971},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/abs/2302.13971},
}

% The double braces keep the corporate author as one indivisible name.
@misc{OpenAI2023,
  author        = {{OpenAI}},
  title         = {{GPT-4} Technical Report},
  year          = {2023},
  eprint        = {2303.08774},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/abs/2303.08774},
}

@misc{Alexandrov2024BgGPT,
  author        = {Alexandrov, Anton and Raychev, Veselin and Dimitrov, Dimitar I.
                   and Zhang, Ce and Vechev, Martin and Toutanova, Kristina},
  title         = {{BgGPT} 1.0: Extending {English}-Centric {LLMs} to Other Languages},
  year          = {2024},
  eprint        = {2412.10893},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  url           = {https://arxiv.org/abs/2412.10893},
}