
% Journal article: ComAlign benchmark (Computers, Materials and Continua, vol. 87, no. 2, 2026).
% Cleaned from a publisher export:
%   - authors are separated with " and " and written in "Last, First" form
%   - the camel-case name in the title is brace-protected against style recasing
%   - HTML/MathML markup was stripped from the abstract and the percent sign escaped
%   - the pages field was dropped because the export carried only an empty range ("--");
%     TODO: add the real page range or article number once it is known.
@article{cmc.2026.076083,
  author   = {Li, Shasha and Ji, Bin and Liu, Xiaodong and Ma, Jun and Yu, Jie},
  title    = {{ComAlign}: A Benchmark Aligning Natural Language with Operating System Commands},
  journal  = {Computers, Materials \& Continua},
  volume   = {87},
  number   = {2},
  year     = {2026},
  issn     = {1546-2226},
  doi      = {10.32604/cmc.2026.076083},
  url      = {http://www.techscience.com/cmc/v87n2/66643},
  abstract = {Aligning natural language with operating system (OS) commands allows users to perform complex computer tasks through simple natural language descriptions. However, due to the complex nature of natural language, it still remains challenging to achieve precise alignment. In this paper, we present ComAlign, a Chinese benchmark dataset that pairs Chinese natural language descriptions with corresponding OS commands. ComAlign covers a broad range of 82 distinct OS command types with a total of 1811 natural language descriptions. We elaborate on the construction of ComAlign and construct three baselines to evaluate the alignment accuracy on ComAlign. Experimental results show that even advanced large language models struggle with certain ambiguously phrased OS commands. Specifically, the best performing baseline achieves 46.9\% alignment accuracy. We demonstrate that ComAlign is collected from real-world application scenarios, making it particularly suitable for developing and benchmarking intelligent OS and agent systems that support user-machine interactions through natural language.},
}



