@inproceedings{ffaa108cf7604e2d95c9ce4afce7add0,
title = "SITH: Semantic Interpreter for Transformer Hierarchy",
abstract = "While Transformers and their derivatives have shown strong performance in various NLP tasks, understanding their internal mechanisms remains challenging. Mainstream interpretability research often focuses solely on numerical attributes, neglecting the complex semantic structure inherent in the model. We have developed the SITH(Semantic Interpreter for Transformer Hierarchy) framework to address this issue. We focus on creating universal text representation methods and uncovering the semantic principles of the Transformer's hierarchical structure. We use the convex hull method to represent sequence semantics in an n-dimensional Semantic Euclidean space and define different evaluation indicators through convex hull to analyze semantic quality and quantity changes. Our analysis takes a dual perspective: a multi-layer cumulative perspective and an individual layer-to-layer shift perspective. When applied to machine translation, our results reveal potential semantic processes and emphasize the effectiveness of stacking and hierarchical differences. These insights are valuable for fine-tuning hyperparameters at the encoder and decoder layers.",
keywords = "Convex Hull, Interpretability, Semantic Analysis, Transformer",
author = "Cheng Zhang and Jinxin Lv and Jingxu Cao and Jiachuan Sheng and Dawei Song and Tiancheng Zhang",
note = "Publisher Copyright: {\textcopyright} 2024 IEEE.; 36th IEEE International Conference on Tools with Artificial Intelligence, ICTAI 2024 ; Conference date: 28-10-2024 Through 30-10-2024",
year = "2024",
doi = "10.1109/ICTAI62512.2024.00023",
language = "English",
series = "Proceedings - International Conference on Tools with Artificial Intelligence, ICTAI",
publisher = "IEEE Computer Society",
pages = "102--107",
booktitle = "Proceedings - 2024 IEEE 36th International Conference on Tools with Artificial Intelligence, ICTAI 2024",
address = "United States",
}