@inproceedings{song2026mcptool,author={Song, Moohyun and Kim, Hayoung and Lee, Kyoohyun and Son, Jae Gi and Lee, Kyungyong},title={Orchestrating WASM-based MCP Tool Runtimes for AI Agents across Edge-Cloud Continuum},year={2026},booktitle={Proceedings of the 26th IEEE/ACM International Symposium on Cluster, Cloud and Internet Computing},series={CCGrid '26},note={To appear},keywords={international},}
2025
HybridServe: Adaptive WebAssembly-Container Runtime Selection for Edge Serverless Computing
Seokhyeon Kang*, Moohyun Song*, Taeyoon Kim*, Soohyuk Lee, Jaeseob Han, Hyeokman Kim, and Kyungyong Lee
In Proceedings of the 11th International Workshop on Serverless Computing, 2025
Edge serverless environments with limited CPU, memory, and heterogeneous hardware demand efficient execution under resource constraints. A key challenge in serverless computing is cold start, where a function instance is created and initialized from scratch instead of reusing an already initialized (warm) instance, which is particularly severe in edge environments. Container-based platforms exhibit cold start latencies exceeding hundreds of milliseconds with tens of megabyte images, while WebAssembly (WASM) provides less than ten millisecond initialization and compact binaries, but slower execution. We comprehensively analyze multiple WASM runtimes (Wasmtime, Wasmer, WasmEdge) and their compiler backends, revealing that WASM reduces cold start latency by up to 88.1% and image size by up to 99.17%, while exhibiting 36.15% slower execution and 9.26% higher power consumption for compute-intensive workloads. Based on these complementary characteristics, we propose HybridServe, a dynamic runtime selection framework that leverages WASM during container cold starts while preparing containers in the background. Evaluation on Azure Function Trace demonstrates 43.11% average response time reduction versus WASM-only and 91.9% cold start latency reduction versus container-only deployments, effectively mitigating the performance-isolation trade-off in edge serverless computing.
@inproceedings{kang2025hybridserve,author={Kang, Seokhyeon and Song, Moohyun and Kim, Taeyoon and Lee, Soohyuk and Han, Jaeseob and Kim, Hyeokman and Lee, Kyungyong},title={HybridServe: Adaptive WebAssembly-Container Runtime Selection for Edge Serverless Computing},year={2025},isbn={9798400723025},publisher={Association for Computing Machinery},url={https://doi.org/10.1145/3774899.3775011},doi={10.1145/3774899.3775011},booktitle={Proceedings of the 11th International Workshop on Serverless Computing},pages={1--6},numpages={6},series={WoSC11 '25},keywords={international},}
Multi-Node Spot Instances Availability Score Collection System
Sungkyu Cheon*, Kyumin Kim*, Kyunghwan Kim*, Moohyun Song, and Kyungyong Lee
In Proceedings of the 34th International Symposium on High-Performance Parallel and Distributed Computing, 2025
Spot instances let users access unused cloud resources at significantly reduced costs. While cloud vendors offer availability information, existing tools like Spotlake only provide single-node availability data, which falls short for modern distributed applications. This paper highlighted the limitations of single-node availability data and introduced a multi-node availability dataset collection system. We analyzed the collected data and enhanced Spotlake to share these multi-node datasets publicly for broader use.
@inproceedings{cheon2025multinode,author={Cheon, Sungkyu and Kim, Kyumin and Kim, Kyunghwan and Song, Moohyun and Lee, Kyungyong},title={Multi-Node Spot Instances Availability Score Collection System},year={2025},isbn={9798400718694},publisher={Association for Computing Machinery},url={https://doi.org/10.1145/3731545.3735122},doi={10.1145/3731545.3735122},booktitle={Proceedings of the 34th International Symposium on High-Performance Parallel and Distributed Computing},articleno={33},numpages={2},series={HPDC '25},keywords={international},}
2023
When Serverless Computing Meets Different Degrees of Customization for DNN Inference
Moohyun Song, Yoonseo Hur, and Kyungyong Lee
In Proceedings of the 9th International Workshop on Serverless Computing, 2023
Serverless computing provides a method to develop application services without the burden of run-time execution environment management overhead. Since the initial offerings of serverless computing using function-as-a-service (FaaS), other variants of execution environments have been proposed, such as a special-purpose FaaS (SPF) for deep neural network (DNN) inference and a serverless container service (SCS) for general web applications. This paper qualitatively summarizes the characteristics of a general-purpose FaaS (GPF), SPF, and SCS from the perspective of customizability when setting up execution environments. To judge whether various serverless computing environments can be feasible solutions for an interactive DNN model inference application, we conduct extensive experiments and conclude that there are rooms for performance improvement serverless DNN inference, and allowing a custom environment setup can make the serverless computing platform for an interactive DNN application.
@inproceedings{song2023serverless,author={Song, Moohyun and Hur, Yoonseo and Lee, Kyungyong},title={When Serverless Computing Meets Different Degrees of Customization for DNN Inference},year={2023},isbn={9798400704550},publisher={Association for Computing Machinery},url={https://doi.org/10.1145/3631295.3631400},doi={10.1145/3631295.3631400},booktitle={Proceedings of the 9th International Workshop on Serverless Computing},pages={42--47},numpages={6},series={WoSC '23},keywords={international},}
Domestic Journal
2023
KubEVC-Agent: Kubernetes Edge Vision Cluster Agent for Optimal DNN Inference and Operation
Moohyun Song, Kyumin Kim, Jihun Moon, Yurim Kim, Chaewon Nam, Jongbin Park, and Kyungyong Lee
IEMEK Journal of Embedded Systems and Applications, 2023
@article{song2023kubevc,title={KubEVC-Agent: Kubernetes Edge Vision Cluster Agent for Optimal DNN Inference and Operation},author={Song, Moohyun and Kim, Kyumin and Moon, Jihun and Kim, Yurim and Nam, Chaewon and Park, Jongbin and Lee, Kyungyong},journal={IEMEK Journal of Embedded Systems and Applications},volume={18},number={6},pages={293--301},year={2023},keywords={domestic},}
Domestic Conference
2025
Callisto: Cost-Efficient AI Development Platform Using Spot Instances
Moohyun Song, Taeyoon Kim, Kyumin Kim, and Kyungyong Lee
In Proceedings of the Korea Computer Congress (KCC), 2025
@inproceedings{song2025callisto,title={Callisto: Cost-Efficient AI Development Platform Using Spot Instances},author={Song, Moohyun and Kim, Taeyoon and Kim, Kyumin and Lee, Kyungyong},booktitle={Proceedings of the Korea Computer Congress (KCC)},publisher={Korean Institute of Information Scientists and Engineers},pages={617--619},year={2025},keywords={domestic},}
CostNorm: LLM-based Cloud Cost Optimization AI Agent
Moohyun Song, Woohyeok Park, Yongha Bae, Jongmin Kim, Donghun Kim, and Jangho Kim
@inproceedings{song2025costnorm,title={CostNorm: LLM-based Cloud Cost Optimization AI Agent},author={Song, Moohyun and Park, Woohyeok and Bae, Yongha and Kim, Jongmin and Kim, Donghun and Kim, Jangho},booktitle={Annual Conference of KIPS},publisher={Korea Information Processing Society},pages={56--57},year={2025},keywords={domestic},}
2024
Machine Learning Pipeline Deployment Platform Considering Optimal Performance and Cost
Moohyun Song, Seungwoo Cheon, Kyumin Kim, Yurim Kim, Jihun Moon, and Jungmyung Park
In Proceedings of the Korea Computer Congress (KCC), 2024
@inproceedings{song2024mlpipeline,title={Machine Learning Pipeline Deployment Platform Considering Optimal Performance and Cost},author={Song, Moohyun and Cheon, Seungwoo and Kim, Kyumin and Kim, Yurim and Moon, Jihun and Park, Jungmyung},booktitle={Proceedings of the Korea Computer Congress (KCC)},publisher={Korean Institute of Information Scientists and Engineers},pages={621--623},year={2024},keywords={domestic},}
2023
Optimize Spot Instance Live Migration Using Network Storage in Cloud-Native Environment
Jaeil Hwang, Moohyun Song, Junho Lim, and Kyungyong Lee
In Proceedings of the Korea Computer Congress (KCC), 2023
@inproceedings{hwang2023spot,title={Optimize Spot Instance Live Migration Using Network Storage in Cloud-Native Environment},author={Hwang, Jaeil and Song, Moohyun and Lim, Junho and Lee, Kyungyong},booktitle={Proceedings of the Korea Computer Congress (KCC)},publisher={Korean Institute of Information Scientists and Engineers},pages={1323--1325},year={2023},keywords={domestic},}
Open-Source Automated Software for Deploying Kubernetes Machine Learning Environment
Moohyun Song, Jaegang Choi, and Kyungyong Lee
In Proceedings of the Korea Computer Congress (KCC), 2023
@inproceedings{song2023kubernetes,title={Open-Source Automated Software for Deploying Kubernetes Machine Learning Environment},author={Song, Moohyun and Choi, Jaegang and Lee, Kyungyong},booktitle={Proceedings of the Korea Computer Congress (KCC)},publisher={Korean Institute of Information Scientists and Engineers},pages={435--437},year={2023},keywords={domestic},}