@inproceedings{9c45fa1aee96433397d91172a603a58d,
title = "Performance of xLSTM for Semantic Segmentation of Remotely Sensed Images",
abstract = "Recent advancements in autoregressive networks with linear complexity have driven significant research progress, demonstrating exceptional performance in large language models. A representative model is the Extended Long Short-Term Memory (xLSTM), which incorporates gating mechanisms and memory structures, performing comparably to Transformer architectures in long-sequence language tasks. Autoregressive networks such as xLSTM can utilize image serialization to extend their application to visual tasks such as classification and segmentation. Although existing studies have demonstrated Vision-LSTM's impressive results in image classification, its performance in image semantic segmentation remains unverified. Our study represents the first attempt to evaluate the effectiveness of Vision-LSTM in the semantic segmentation of remotely sensed images. This evaluation is based on a specifically designed encoder-decoder architecture named Seg-LSTM, and comparisons with state-of-the-art segmentation networks. Our study found that Vision-LSTM's performance in semantic segmentation was limited and generally inferior to Vision-Transformers-based and Vision-Mamba-based models in most comparative tests. Future research directions for enhancing Vision-LSTM are recommended. The source code is available from https://github.com/zhuqinfeng1999/Seg-LSTM.",
keywords = "High-resolution, Image, Remote Sensing, Semantic Segmentation, Vision-LSTM, xLSTM",
author = "Qinfeng Zhu and Yuanzhi Cai and Lei Fan",
note = "Publisher Copyright: {\textcopyright} 2024 Copyright held by the owner/author(s). Publication rights licensed to ACM.; 7th International Conference on Sensors, Signal and Image Processing, SSIP 2024 ; Conference date: 22-11-2024 Through 24-11-2024",
year = "2025",
month = jul,
day = "7",
doi = "10.1145/3725949.3725967",
language = "English",
series = "ACM International Conference Proceeding Series",
publisher = "Association for Computing Machinery",
pages = "90--96",
booktitle = "7th International Conference on Sensors, Signal and Image Processing, SSIP 2024 - Proceedings",
}