% Conference paper in the IEEE HPEC 2020 proceedings.
% The funding and copyright fields are non-standard annotation fields kept for
% record only; eventdate holds the conference dates in ISO 8601 range form.
@inproceedings{24701052200f4fda8bccf68b8c2e1cd8,
  author    = {Byun, Chansup and Kepner, Jeremy and Arcand, William and Bestor, David and Bergeron, Bill and Gadepally, Vijay and Houle, Michael and Hubbell, Matthew and Jones, Michael and Kirby, Andrew and Klein, Anna and Michaleas, Peter and Milechin, Lauren and Mullen, Julie and Prout, Andrew and Rosa, Antonio and Samsi, Siddharth and Yee, Charles and Reuther, Albert},
  title     = {Best of Both Worlds: High Performance Interactive and Batch Launching},
  booktitle = {2020 {IEEE} High Performance Extreme Computing Conference, {HPEC} 2020},
  publisher = {Institute of Electrical and Electronics Engineers Inc.},
  year      = {2020},
  month     = sep,
  day       = {22},
  eventdate = {2020-09-21/2020-09-25},
  doi       = {10.1109/HPEC43674.2020.9286142},
  language  = {English},
  keywords  = {cluster utilization, cron job, preemption, scheduling performance, spot jobs},
  abstract  = {Rapid launch of thousands of jobs is essential for effective interactive supercomputing, big data analysis, and AI algorithm development. Achieving thousands of launches per second has required hardware to be available to receive these jobs. This paper presents a novel preemptive approach to implement 'spot' jobs on MIT SuperCloud systems allowing the resources to be fully utilized for both long running batch jobs while still providing fast launch for interactive jobs. The new approach separates the job preemption and scheduling operations and can achieve 100 times faster performance in the scheduling of a job with preemption when compared to using the standard scheduler-provided automatic preemption-based capability. The results demonstrate that the new approach can schedule interactive jobs preemptively at a performance comparable to when the required computing resources are idle and available. The spot job capability can be deployed without disrupting the interactive user experience while increasing the overall system utilization.},
  funding   = {This material is based upon work supported by the Assistant Secretary of Defense for Research and Engineering under Air Force Contract No. FA8721-05-C-0002 and/or FA8702-15-D-0001. Any opinions, findings, conclusions or recommendations expressed in this material are those of the author(s) and do not necessarily reflect the views of the Assistant Secretary of Defense for Research and Engineering.},
  copyright = {Publisher Copyright: {\textcopyright} 2020 IEEE.},
}