@comment{
default search action
BibTeX records: Young Jin Kim 0001
}
% Phi-4-Mini technical report; CoRR (arXiv) preprint 2503.01743.
% Title braces keep model names from being lowercased by sentence-casing styles.
@article{DBLP:journals/corr/abs-2503-01743,
  author     = {Abouelenin, Abdelrahman and
                Ashfaq, Atabak and
                Atkinson, Adam and
                Awadalla, Hany and
                Bach, Nguyen and
                Bao, Jianmin and
                Benhaim, Alon and
                Cai, Martin and
                Chaudhary, Vishrav and
                Chen, Congcong and
                Chen, Dong and
                Chen, Dongdong and
                Chen, Jun{-}Kun and
                Chen, Weizhu and
                Chen, Yen{-}Chun and
                Chen, Yi{-}ling and
                Dai, Qi and
                Dai, Xiyang and
                Fan, Ruchao and
                Gao, Mei and
                Gao, Min and
                Garg, Amit and
                Goswami, Abhishek and
                Hao, Junheng and
                Hendy, Amr and
                Hu, Yuxuan and
                Jin, Xin and
                Khademi, Mahmoud and
                Kim, Dongwoo and
                Kim, Young Jin and
                Lee, Gina and
                Li, Jinyu and
                Li, Yunsheng and
                Liang, Chen and
                Lin, Xihui and
                Lin, Zeqi and
                Liu, Mengchen and
                Liu, Yang and
                Lopez, Gilsinia and
                Luo, Chong and
                Madan, Piyush and
                Mazalov, Vadim and
                Mitra, Arindam and
                Mousavi, Ali and
                Nguyen, Anh and
                Pan, Jing and
                Perez{-}Becker, Daniel and
                Platin, Jacob and
                Portet, Thomas and
                Qiu, Kai and
                Ren, Bo and
                Ren, Liliang and
                Roy, Sambuddha and
                Shang, Ning and
                Shen, Yelong and
                Singhal, Saksham and
                Som, Subhojit and
                Song, Xia and
                Sych, Tetyana and
                Vaddamanu, Praneetha and
                Wang, Shuohang and
                Wang, Yiming and
                Wang, Zhenghao and
                Wu, Haibin and
                Xu, Haoran and
                Xu, Weijian and
                Yang, Yifan and
                Yang, Ziyi and
                Yu, Donghan and
                Zabir, Ishmam and
                Zhang, Jianwen and
                Zhang, Li Lyna and
                Zhang, Yunan and
                Zhou, Xiren},
  title      = {{Phi-4-Mini} Technical Report: Compact yet Powerful Multimodal Language
                Models via {Mixture-of-LoRAs}},
  journal    = {CoRR},
  volume     = {abs/2503.01743},
  year       = {2025},
  eprinttype = {arXiv},
  eprint     = {2503.01743},
}
% Phi-4-Mini-Reasoning; CoRR (arXiv) preprint 2504.21233.
% The model name is braced so sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-2504-21233,
  author     = {Xu, Haoran and
                Peng, Baolin and
                Awadalla, Hany and
                Chen, Dongdong and
                Chen, Yen{-}Chun and
                Gao, Mei and
                Kim, Young Jin and
                Li, Yunsheng and
                Ren, Liliang and
                Shen, Yelong and
                Wang, Shuohang and
                Xu, Weijian and
                Gao, Jianfeng and
                Chen, Weizhu},
  title      = {{Phi-4-Mini-Reasoning}: Exploring the Limits of Small Reasoning Language
                Models in Math},
  journal    = {CoRR},
  volume     = {abs/2504.21233},
  year       = {2025},
  eprinttype = {arXiv},
  eprint     = {2504.21233},
}
% SlimMoE; CoRR (arXiv) preprint 2506.18349.
% Mixed-case names in the title are braced against style recasing.
@article{DBLP:journals/corr/abs-2506-18349,
  author     = {Li, Zichong and
                Liang, Chen and
                Zhang, Zixuan and
                Hong, Ilgee and
                Kim, Young Jin and
                Chen, Weizhu and
                Zhao, Tuo},
  title      = {{SlimMoE}: Structured Compression of Large {MoE} Models via Expert Slimming
                and Distillation},
  journal    = {CoRR},
  volume     = {abs/2506.18349},
  year       = {2025},
  eprinttype = {arXiv},
  eprint     = {2506.18349},
}
% Decoder-Hybrid-Decoder architecture; CoRR (arXiv) preprint 2507.06607.
% The eprint fields expose the arXiv ID that was only embedded in the volume value.
@article{DBLP:journals/corr/abs-2507-06607,
  author     = {Ren, Liliang and
                Chen, Congcong and
                Xu, Haoran and
                Kim, Young Jin and
                Atkinson, Adam and
                Zhan, Zheng and
                Sun, Jiankai and
                Peng, Baolin and
                Liu, Liyuan and
                Wang, Shuohang and
                Cheng, Hao and
                Gao, Jianfeng and
                Chen, Weizhu and
                Shen, Yelong},
  title      = {Decoder-Hybrid-Decoder Architecture for Efficient Reasoning with Long
                Generation},
  journal    = {CoRR},
  volume     = {abs/2507.06607},
  year       = {2025},
  eprinttype = {arXiv},
  eprint     = {2507.06607},
}
% ICLR 2024 conference paper on machine translation with large language models.
@inproceedings{DBLP:conf/iclr/Xu0SA24,
  author    = {Xu, Haoran and
               Kim, Young Jin and
               Sharaf, Amr and
               Awadalla, Hany Hassan},
  title     = {A Paradigm Shift in Machine Translation: Boosting Translation Performance
               of Large Language Models},
  booktitle = {{ICLR}},
  publisher = {OpenReview.net},
  year      = {2024},
}
% ICML 2024 conference paper on Contrastive Preference Optimization.
% "Van Durme" is given in comma form so the full two-word surname is parsed as the last name.
@inproceedings{DBLP:conf/icml/XuSCTSDM024,
  author    = {Xu, Haoran and
               Sharaf, Amr and
               Chen, Yunmo and
               Tan, Weiting and
               Shen, Lingfeng and
               Van Durme, Benjamin and
               Murray, Kenton and
               Kim, Young Jin},
  title     = {Contrastive Preference Optimization: Pushing the Boundaries of {LLM}
               Performance in Machine Translation},
  booktitle = {{ICML}},
  publisher = {OpenReview.net},
  year      = {2024},
}
% Contrastive Preference Optimization; CoRR (arXiv) preprint 2401.08417.
% "Van Durme" is given in comma form so the full two-word surname is parsed as the last name.
@article{DBLP:journals/corr/abs-2401-08417,
  author     = {Xu, Haoran and
                Sharaf, Amr and
                Chen, Yunmo and
                Tan, Weiting and
                Shen, Lingfeng and
                Van Durme, Benjamin and
                Murray, Kenton and
                Kim, Young Jin},
  title      = {Contrastive Preference Optimization: Pushing the Boundaries of {LLM}
                Performance in Machine Translation},
  journal    = {CoRR},
  volume     = {abs/2401.08417},
  year       = {2024},
  eprinttype = {arXiv},
  eprint     = {2401.08417},
}
% GRIN MoE; CoRR (arXiv) preprint 2409.12136.
% Every mixed-case word in the title is braced; otherwise styles lowercase the inner capitals.
@article{DBLP:journals/corr/abs-2409-12136,
  author     = {Liu, Liyuan and
                Kim, Young Jin and
                Wang, Shuohang and
                Liang, Chen and
                Shen, Yelong and
                Cheng, Hao and
                Liu, Xiaodong and
                Tanaka, Masahiro and
                Wu, Xiaoxia and
                Hu, Wenxiang and
                Chaudhary, Vishrav and
                Lin, Zeqi and
                Zhang, Chengruidong and
                Xue, Jilong and
                Awadalla, Hany and
                Gao, Jianfeng and
                Chen, Weizhu},
  title      = {{GRIN:} {GRadient-INformed} {MoE}},
  journal    = {CoRR},
  volume     = {abs/2409.12136},
  year       = {2024},
  eprinttype = {arXiv},
  eprint     = {2409.12136},
}
% ACL Findings 2023 paper on AutoMoE.
% The system name is braced so sentence-casing styles keep its capitals.
@inproceedings{DBLP:conf/acl/JawaharMLKALABG23,
  author    = {Jawahar, Ganesh and
               Mukherjee, Subhabrata and
               Liu, Xiaodong and
               Kim, Young Jin and
               Abdul{-}Mageed, Muhammad and
               Lakshmanan, Laks V. S. and
               Awadallah, Ahmed Hassan and
               Bubeck, S{\'{e}}bastien and
               Gao, Jianfeng},
  title     = {{AutoMoE}: Heterogeneous Mixture-of-Experts with Adaptive Computation
               for Efficient Neural Machine Translation},
  booktitle = {{ACL} (Findings)},
  pages     = {9116--9132},
  publisher = {Association for Computational Linguistics},
  year      = {2023},
}
% GPT machine translation evaluation; CoRR (arXiv) preprint 2302.09210.
% The eprint fields expose the arXiv ID that was only embedded in the volume value.
@article{DBLP:journals/corr/abs-2302-09210,
  author     = {Hendy, Amr and
                Abdelrehim, Mohamed and
                Sharaf, Amr and
                Raunak, Vikas and
                Gabr, Mohamed and
                Matsushita, Hitokazu and
                Kim, Young Jin and
                Afify, Mohamed and
                Awadalla, Hany Hassan},
  title      = {How Good Are {GPT} Models at Machine Translation? {A} Comprehensive
                Evaluation},
  journal    = {CoRR},
  volume     = {abs/2302.09210},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2302.09210},
}
% FineQuant; CoRR (arXiv) preprint 2308.09723.
% The method name and the acronym are braced against style recasing.
@article{DBLP:journals/corr/abs-2308-09723,
  author     = {Kim, Young Jin and
                Henry, Rawn and
                Fahim, Raffy and
                Awadalla, Hany Hassan},
  title      = {{FineQuant}: Unlocking Efficiency with Fine-Grained Weight-Only Quantization
                for {LLMs}},
  journal    = {CoRR},
  volume     = {abs/2308.09723},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2308.09723},
}
% Task-based MoE for machine translation; CoRR (arXiv) preprint 2308.15772.
% The acronym in the title is braced against style recasing.
@article{DBLP:journals/corr/abs-2308-15772,
  author     = {Pham, Hai and
                Kim, Young Jin and
                Mukherjee, Subhabrata and
                Woodruff, David P. and
                P{\'{o}}czos, Barnab{\'{a}}s and
                Awadalla, Hany Hassan},
  title      = {Task-Based {MoE} for Multitask Multilingual Machine Translation},
  journal    = {CoRR},
  volume     = {abs/2308.15772},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2308.15772},
}
% Machine translation with large language models; CoRR (arXiv) preprint 2309.11674.
% The eprint fields expose the arXiv ID that was only embedded in the volume value.
@article{DBLP:journals/corr/abs-2309-11674,
  author     = {Xu, Haoran and
                Kim, Young Jin and
                Sharaf, Amr and
                Awadalla, Hany Hassan},
  title      = {A Paradigm Shift in Machine Translation: Boosting Translation Performance
                of Large Language Models},
  journal    = {CoRR},
  volume     = {abs/2309.11674},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2309.11674},
}
% Mixture of Quantized Experts; CoRR (arXiv) preprint 2310.02410.
% The acronym in parentheses is braced against style recasing.
@article{DBLP:journals/corr/abs-2310-02410,
  author     = {Kim, Young Jin and
                Fahim, Raffy and
                Awadalla, Hany Hassan},
  title      = {Mixture of Quantized Experts ({MoQE}): Complementary Effect of Low-bit
                Quantization and Robustness},
  journal    = {CoRR},
  volume     = {abs/2310.02410},
  year       = {2023},
  eprinttype = {arXiv},
  eprint     = {2310.02410},
}
% AMTA 2022 conference paper on fast vocabulary projection.
@inproceedings{DBLP:conf/amta/AmerAKMH22,
  author    = {Amer, Hossam and
               Afify, Mohamed and
               Kim, Young Jin and
               Matsushita, Hitokazu and
               Hassan, Hany},
  title     = {Fast Vocabulary Projection Method via Clustering for Multilingual
               Machine Translation on {GPU}},
  booktitle = {{AMTA}},
  pages     = {58--69},
  publisher = {Association for Machine Translation in the Americas},
  year      = {2022},
}
% ICLR 2022 conference paper on sparsely activated Transformers.
@inproceedings{DBLP:conf/iclr/Zuo00KHZGZ22,
  author    = {Zuo, Simiao and
               Liu, Xiaodong and
               Jiao, Jian and
               Kim, Young Jin and
               Hassan, Hany and
               Zhang, Ruofei and
               Gao, Jianfeng and
               Zhao, Tuo},
  title     = {Taming Sparsely Activated Transformer with Stochastic Experts},
  booktitle = {{ICLR}},
  publisher = {OpenReview.net},
  year      = {2022},
}
% ICML 2022 conference paper on Gating Dropout; proceedings series volume 162.
@inproceedings{DBLP:conf/icml/0013KMH22,
  author    = {Liu, Rui and
               Kim, Young Jin and
               Muzio, Alexandre and
               Hassan, Hany},
  title     = {Gating Dropout: Communication-efficient Regularization for Sparsely
               Activated Transformers},
  booktitle = {{ICML}},
  series    = {Proceedings of Machine Learning Research},
  volume    = {162},
  pages     = {13782--13792},
  publisher = {{PMLR}},
  year      = {2022},
}
% Gating Dropout; CoRR (arXiv) preprint 2205.14336.
% The eprint fields expose the arXiv ID that was only embedded in the volume value.
@article{DBLP:journals/corr/abs-2205-14336,
  author     = {Liu, Rui and
                Kim, Young Jin and
                Muzio, Alexandre and
                Mozafari, Barzan and
                Awadalla, Hany Hassan},
  title      = {Gating Dropout: Communication-efficient Regularization for Sparsely
                Activated Transformers},
  journal    = {CoRR},
  volume     = {abs/2205.14336},
  year       = {2022},
  eprinttype = {arXiv},
  eprint     = {2205.14336},
}
% Fast vocabulary projection; CoRR (arXiv) preprint 2208.06874.
% The eprint fields expose the arXiv ID that was only embedded in the volume value.
@article{DBLP:journals/corr/abs-2208-06874,
  author     = {Amer, Hossam and
                Kim, Young Jin and
                Afify, Mohamed and
                Matsushita, Hitokazu and
                Awadalla, Hany Hassan},
  title      = {Fast Vocabulary Projection Method via Clustering for Multilingual
                Machine Translation on {GPU}},
  journal    = {CoRR},
  volume     = {abs/2208.06874},
  year       = {2022},
  eprinttype = {arXiv},
  eprint     = {2208.06874},
}
% AutoMoE; CoRR (arXiv) preprint 2210.07535.
% The system name is braced so sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-2210-07535,
  author     = {Jawahar, Ganesh and
                Mukherjee, Subhabrata and
                Liu, Xiaodong and
                Kim, Young Jin and
                Abdul{-}Mageed, Muhammad and
                Lakshmanan, Laks V. S. and
                Awadallah, Ahmed Hassan and
                Bubeck, S{\'{e}}bastien and
                Gao, Jianfeng},
  title      = {{AutoMoE}: Neural Architecture Search for Efficient Sparsely Activated
                Transformers},
  journal    = {CoRR},
  volume     = {abs/2210.07535},
  year       = {2022},
  eprinttype = {arXiv},
  eprint     = {2210.07535},
}
% Large-scale MoE models in production; CoRR (arXiv) preprint 2211.10017.
% The acronym in the title is braced against style recasing.
@article{DBLP:journals/corr/abs-2211-10017,
  author     = {Kim, Young Jin and
                Henry, Rawn and
                Fahim, Raffy and
                Awadalla, Hany Hassan},
  title      = {Who Says Elephants Can't Run: Bringing Large Scale {MoE} Models into
                Cloud Scale Production},
  journal    = {CoRR},
  volume     = {abs/2211.10017},
  year       = {2022},
  eprinttype = {arXiv},
  eprint     = {2211.10017},
}
% MoE training for multitask multilingual models; CoRR (arXiv) preprint 2109.10465.
% The acronym in the title is braced against style recasing.
@article{DBLP:journals/corr/abs-2109-10465,
  author     = {Kim, Young Jin and
                Awan, Ammar Ahmad and
                Muzio, Alexandre and
                Cruz{-}Salinas, Andr{\'{e}}s Felipe and
                Lu, Liyang and
                Hendy, Amr and
                Rajbhandari, Samyam and
                He, Yuxiong and
                Awadalla, Hany Hassan},
  title      = {Scalable and Efficient {MoE} Training for Multitask Multilingual Models},
  journal    = {CoRR},
  volume     = {abs/2109.10465},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2109.10465},
}
% Sparsely activated Transformers with stochastic experts; CoRR (arXiv) preprint 2110.04260.
% The eprint fields expose the arXiv ID that was only embedded in the volume value.
@article{DBLP:journals/corr/abs-2110-04260,
  author     = {Zuo, Simiao and
                Liu, Xiaodong and
                Jiao, Jian and
                Kim, Young Jin and
                Hassan, Hany and
                Zhang, Ruofei and
                Zhao, Tuo and
                Gao, Jianfeng},
  title      = {Taming Sparsely Activated Transformer with Stochastic Experts},
  journal    = {CoRR},
  volume     = {abs/2110.04260},
  year       = {2021},
  eprinttype = {arXiv},
  eprint     = {2110.04260},
}
% FastFormers; CoRR (arXiv) preprint 2010.13382.
% The system name is braced so sentence-casing styles keep its capitals.
@article{DBLP:journals/corr/abs-2010-13382,
  author     = {Kim, Young Jin and
                Awadalla, Hany Hassan},
  title      = {{FastFormers}: Highly Efficient Transformer Models for Natural Language
                Understanding},
  journal    = {CoRR},
  volume     = {abs/2010.13382},
  year       = {2020},
  eprinttype = {arXiv},
  eprint     = {2010.13382},
}
% Journal article, 2019: time- and space-parallel simulation of air traffic networks.
@article{DBLP:journals/simulation/KimMF19,
  author  = {Kim, Young Jin and
             Mavris, Dimitri and
             Fujimoto, Richard},
  title   = {Time- and space-parallel simulation of air traffic networks},
  journal = {Simul.},
  volume  = {95},
  number  = {12},
  year    = {2019},
}
% 2019 paper on fast neural machine translation; venue given in booktitle.
@inproceedings{DBLP:conf/emnlp/KimJHAHGB19,
  author    = {Kim, Young Jin and
               Junczys{-}Dowmunt, Marcin and
               Hassan, Hany and
               Aji, Alham Fikri and
               Heafield, Kenneth and
               Grundkiewicz, Roman and
               Bogoychev, Nikolay},
  title     = {From Research to Production and Back: Ludicrously Fast Neural Machine
               Translation},
  booktitle = {NGT@EMNLP-IJCNLP},
  pages     = {280--288},
  publisher = {Association for Computational Linguistics},
  year      = {2019},
}
% PhD thesis, 2018.
@phdthesis{DBLP:phd/basesearch/Kim18b,
  author = {Kim, Young Jin},
  title  = {A deep learning and parallel simulation methodology for air traffic
            management},
  school = {Georgia Institute of Technology, Atlanta, GA, {USA}},
  year   = {2018},
}
% WSC 2017 conference paper on time-parallel simulation of air traffic networks.
@inproceedings{DBLP:conf/wsc/KimMF17,
  author    = {Kim, Young Jin and
               Mavris, Dimitri and
               Fujimoto, Richard},
  title     = {Time-parallel simulation of air traffic networks},
  booktitle = {{WSC}},
  pages     = {1013--1024},
  publisher = {{IEEE}},
  year      = {2017},
}
% SysCon 2016 conference paper on selecting more-electric aircraft subsystem technologies.
@inproceedings{DBLP:conf/syscon/CraisseKKCBLGM16,
  author    = {Craisse, Jeremie and
               Kruger, Simon and
               Kim, Young Jin and
               Chakraborty, Imon and
               Briceno, Simon and
               Li, Yongchang and
               Garcia, Elena and
               Mavris, Dimitri N.},
  title     = {Creation of a decision-support methodology for selecting more-electric
               aircraft subsystem technologies},
  booktitle = {SysCon},
  pages     = {1--7},
  publisher = {{IEEE}},
  year      = {2016},
}
@comment{
manage site settings
To protect your privacy, all features that rely on external API calls from your browser are turned off by default. You need to opt in for them to become active. All settings here will be stored as cookies in your web browser. For more information, see our F.A.Q.
}