% Paper in the proceedings of the 40th AAAI Conference on Artificial Intelligence (AAAI 2026).
% - Personal names use the unambiguous "Last, First" form with no escaped braces,
%   so multi-part given names ("Ting Jung", "Wei W.", "Matthew E.") typeset cleanly.
% - Braces in the title protect the method name and the acronym from sentence-casing styles.
% - volume/number follow the DOI suffix "v40i40" (volume 40, issue 40);
%   NOTE(review): confirm against the publisher record.
% - booktitle already carries the proceedings name, so no separate series field is given.
@inproceedings{81b19d29b12e4432a0b2fbf11d9be827,
  author    = {Wei, Yangbo and Huang, Zhen and Lu, Shaoqiang and Qian, Junhong and Qin, Dongge and Lin, Ting Jung and Xing, Wei W. and Wu, Chen and He, Lei},
  title     = {{Mixture-of-Trees}: Learning to Select and Weigh Reasoning Paths for Efficient {LLM} Inference},
  booktitle = {Proceedings of the AAAI Conference on Artificial Intelligence},
  editor    = {Koenig, Sven and Jenkins, Chad and Taylor, Matthew E.},
  volume    = {40},
  number    = {40},
  pages     = {33854--33862},
  publisher = {Association for the Advancement of Artificial Intelligence},
  year      = {2026},
  doi       = {10.1609/aaai.v40i40.40677},
  isbn      = {9781577359067},
  language  = {English},
  note      = {Publisher Copyright: {\textcopyright} 2026, Association for the Advancement of Artificial Intelligence (www.aaai.org). All rights reserved.; 40th AAAI Conference on Artificial Intelligence, AAAI 2026 ; Conference date: 20-01-2026 Through 27-01-2026},
  abstract  = {We introduce Mixture-of-Trees (MoT), a novel framework that integrates sparse expert activation with structured tree-based reasoning for efficient LLM inference. MoT employs a learned gating mechanism to selectively activate only the most relevant expert reasoning trees for each problem, where experts use models of varying capacities based on task complexity. The framework features three key innovations: (1) sparse expert activation through unified gating networks, (2) specialized expert trees that leverage domain-specific expertise while optimizing the quality-efficiency trade-off, and (3) collaborative debate mechanisms for conflicting solutions. Additionally, MoT includes a shared baseline tree with early stopping---activated experts perform lightweight validation and terminate early when confidence is high. Experiments across five benchmarks (GSM8K, MATH, AIME 2024, MMLU, HotpotQA) show that MoT achieves 2--7 percentage point accuracy improvements while reducing LLM calls by 37--40\% compared to existing multi-path methods.},
}