@article{xu2024tls, title = {TLS-MWP: A Tensor-based Long-and Short-range Convolution for Multiple Weather Prediction}, author = {Xu, Guangning and Ng, Michael K and Ye, Yunming and Li, Xutao and Song, Ge and Zhang, Bowen and Huang, Zhichao}, journal = {IEEE Transactions on Circuits and Systems for Video Technology}, volume = {34}, number = {9}, pages = {8382-8397}, paperurl = {https://ieeexplore.ieee.org/document/10475377/}, codeurl = {https://github.com/xuguangning1218/TLS_MWP}, corresponding = {Ng, M. K.; Ye, Y.}, year = {2024} }
Weather prediction plays a crucial role in human development. Recently, deep learning has demonstrated promising prospects in weather forecasting by integrating convolutional neural networks (CNNs) and recurrent neural networks (RNNs). However, two main challenges still exist in multiple weather condition prediction. The first challenge considers multiple weather condition correlations in predictions. The second challenge is how to model long- and short-range spatial dependencies under multiple weather conditions. A novel operator named as tensor-based long- and short-range convolution (TLS-Conv) is proposed to address these challenges. Within this operator, the node & relation attention is utilized to identify the contributions of spatial grid points and weather conditions for prediction. Additionally, the adaptive tensor graph convolution (ATGCN) is tailored to dynamically capture long-range spatial dependencies within multiple weather conditions. Finally, the traditional convolution is integrated with the ATGCN to model both long- and short-range spatial dependencies and weather condition correlations. Building upon the TLS-Conv, the tensor-based long- and short-range convolution for multiple weather prediction (TLS-MWP) model is proposed to predict multiple weather conditions. Extensive experiments are conducted under real-world weather conditions to evaluate its performance. These results unequivocally demonstrate that TLS-MWP surpasses previous methods. The code is available on GitHub at: https://github.com/xuguangning1218/TLS_MWP.
@article{XU2024FHDTIE, title = {FHDTIE: Fine-grained Heterogeneous Data Fusion for Tropical Cyclone Intensity Estimation}, journal = {IEEE Transactions on Geoscience and Remote Sensing}, author = {Xu, Guangning and Ng, Michael K and Ye, Yunming and Zhang, Bowen}, paperurl = {#}, codeurl = {https://github.com/xuguangning1218/FHDTIE}, corresponding = {Ng, M. K.; Zhang, B.}, year = {2024} }
A tropical cyclone is a highly destructive extreme weather phenomenon. Estimating intensity of a tropical cyclone can help provide early warnings, guiding specific disaster defense measures. However, two main challenges hinder performance improvement. The first challenge is how to combine heterogeneous tropical cyclone data into a latent space so that the model can leverage the cloud structure of satellite imagery and the comprehensive meteorological information from reanalysis and forecast data for intensity estimation. The second challenge lies in detecting multiple pseudo fine-grained areas for the final estimation, since tropical cyclones are highly diverse extreme weather phenomena. Neglecting any of these pseudo fine-grained areas or relying solely on a single one can potentially result in subpar estimation performance. To address challenges mentioned above, a fine-grained heterogeneous data fusion framework named FHDTIE is proposed. Two key components in this framework can address the aforementioned challenges. One component is the Heterogeneous Data Fuser (HDF), which offers shape matching and channel fusing strategies for heterogeneous data fusion. The other component is called Fine-grained Cluster Features Integrator (FCFI). It utilizes a clustering method to identify multiple pseudo fine-grained areas. Within these areas, the U-Net is used to automatically learn pseudo fine-grained area representations, and then the Graph Neural Network handles information interaction across these representations. Extensive experiments were conducted to demonstrate the robustness and superiority of the proposed fine-grained heterogeneous data fusion framework. The code is available at GitHub: https://github.com/xuguangning1218/FHDTIE.
@article{lin2023spherical, title = {Spherical Neural Operator Network for Global Weather Prediction}, author = {Lin, Kenghong and Li, Xutao and Ye, Yunming and Feng, Shanshan and Zhang, Baoquan and Xu, Guangning and Wang, Ziye}, journal = {IEEE Transactions on Circuits and Systems for Video Technology}, paperurl = {https://ieeexplore.ieee.org/abstract/document/10335752}, corresponding = {Li, X.}, year = {2023} }
Global weather forecast is an important spatial-temporal prediction problem, which can provide numerous societal benefits such as extreme weather forewarning, traffic scheduling, and agricultural planning. Though many spatial-temporal prediction models have been proposed, they suffer from two drawbacks for global weather forecasts, namely 1) ignoring the physical mechanism and spherical characteristics and 2) not effectively exploiting the global and local correlations. To address the above drawbacks, in this paper, we formalize global weather state dynamics as partial differential equations (PDEs) in spherical space and infer the state of the global weather system by solving these PDEs. Specifically, we use Green’s function method to solve the PDEs and find that the solution of the spherical PDEs can be obtained by the spherical convolution. We further proposed a novel Spherical Neural Operator, SNO, which consists of spherical convolution and vanilla convolution. The former is used to solve these PDEs and model the global correlations in spherical space, and the latter is used to capture the local correlations. Upon the operator, a global weather prediction model is developed. Extensive experimental results demonstrate the effectiveness and superiority of our method over state-of-the-art approaches.
@article{xu2023tfg, title = {TFG-Net: Tropical Cyclone Intensity Estimation from a Fine-grained perspective with the Graph convolution neural network}, author = {Xu, Guangning and Li, Yan and Ma, Chi and Li, Xutao and Ye, Yunming and Lin, Qingquan and Huang, Zhichao and Chen, Shidong}, journal = {Engineering Applications of Artificial Intelligence}, volume = {118}, pages = {105673}, paperurl = {https://www.sciencedirect.com/science/article/pii/S0952197622006637}, codeurl = {https://github.com/xuguangning1218/TI_Estimation}, corresponding = {Li, Y.}, year = {2023} }
Tropical Cyclone Intensity Estimation (TIE) is a fundamental study subject for tropical cyclone development, flood or landslide avoidance, etc. Despite considerable efforts, two main challenges remain unresolved in this critical endeavor. The first challenge is that the TIE task is frequently conducted as a coarse-grained recognition problem rather than a fine-grained one. The second challenge is that the prediction fails to consider general wind speed information. To conquer these two challenges, we offer a novel model, namely Tropical cyclone intensity estimation from a Fine-grained perspective with the Graph convolution neural Network (TFG-Net). It is composed of three key components, viz., the Backbone, the Fine-grained Tropical cyclone Features Extractor (FTFE), and the Wind Scale Transition Rule Generator (WTRG), which aim at extracting general spatial features, subtle spatial features, and general wind speed information, respectively. To validate the proposed method, extensive experiments on a well-known real-world tropical dataset named GridSat were carried out. Following the standard benchmark task setting that the model estimates the wind speed from a given satellite image, the proposed TFG-Net reaches 11.12 knots in the RMSE metric, which outperforms 33.33%, 2.54% to the traditional method and the state-of-the-art deep learning method, respectively. The code is available on GitHub:https://github.com/xuguangning1218/TI_Estimation and its reproductive result is available on Code Ocean: https://doi.org/10.24433/CO.6606867.v1.
@article{li2023multi, title = {Multi-relational graph convolutional networks: Generalization guarantees and experiments}, author = {Li, Xutao and Ng, Michael K and Xu, Guangning and Yip, Andy}, journal = {Neural Networks}, volume = {161}, pages = {343--358}, paperurl = {https://www.sciencedirect.com/science/article/pii/S0893608023000576}, corresponding = {Yip, A}, year = {2023} }
The class of multi-relational graph convolutional networks (MRGCNs) is a recent extension of standard graph convolutional networks (GCNs) to handle heterogenous graphs with multiple types of relationships. MRGCNs have been shown to yield results superior than traditional GCNs in various machine learning tasks. The key idea is to introduce a new kind of convolution operated on tensors that can effectively exploit correlations exhibited in multiple relationships. The main objective of this paper is to analyze the algorithmic stability and generalization guarantees of MRGCNs to confirm the usefulness of MRGCNs. Our contributions are of three folds. First, we develop a matrix representation of various tensor operations underneath MRGCNs to simplify the analysis significantly. Next, we prove the uniform stability of MRGCNs and deduce the convergence of the generalization gap to support the usefulness of MRGCNs. The analysis sheds lights on the design of MRGCNs, for instance, how the data should be scaled to achieve the uniform stability of the learning process. Finally, we provide experimental results to demonstrate the stability results.
@article{huang2023multi, title = {Multi-view knowledge graph fusion via knowledge-aware attentional graph neural network}, author = {Huang, Zhichao and Li, Xutao and Ye, Yunming and Zhang, Baoquan and Xu, Guangning and Gan, Wensheng}, journal = {Applied Intelligence}, volume = {53}, number = {4}, pages = {3652--3671}, paperurl = {https://www.sciencedirect.com/science/article/pii/S0893608023000576}, corresponding = {Li, X.; Ye, Y.}, year = {2023} }
The class of multi-relational graph convolutional networks (MRGCNs) is a recent extension of standard graph convolutional networks (GCNs) to handle heterogenous graphs with multiple types of relationships. MRGCNs have been shown to yield results superior than traditional GCNs in various machine learning tasks. The key idea is to introduce a new kind of convolution operated on tensors that can effectively exploit correlations exhibited in multiple relationships. The main objective of this paper is to analyze the algorithmic stability and generalization guarantees of MRGCNs to confirm the usefulness of MRGCNs. Our contributions are of three folds. First, we develop a matrix representation of various tensor operations underneath MRGCNs to simplify the analysis significantly. Next, we prove the uniform stability of MRGCNs and deduce the convergence of the generalization gap to support the usefulness of MRGCNs. The analysis sheds lights on the design of MRGCNs, for instance, how the data should be scaled to achieve the uniform stability of the learning process. Finally, we provide experimental results to demonstrate the stability results.
@article{luo2022reconstitution, title = {The reconstitution predictive network for precipitation nowcasting}, author = {Luo, Chuyao and Xu, Guangning and Li, Xutao and Ye, Yunming}, journal = {Neurocomputing}, volume = {507}, pages = {1--15}, paperurl = {https://www.sciencedirect.com/science/article/pii/S0925231222009195}, codeurl = {https://github.com/luochuyao/RST_LSTM}, corresponding = {Li, X.; Ye, Y.}, year = {2022} }
Precipitation nowcasting is an indispensable task for traffic routing and disaster avoidance. Due to its strenuous movement, even the most recent deep learning techniques in computer vision deliver unsatisfactory performance. The main reason can be attributed to the following two aspects: 1) The traditional convolution in the input has a limited field to extract spatial representation. 2) The convolution in state-to-state connection might lead to mismatch problems and inaccurate strength predictions. To address the two drawbacks, we propose an innovative algorithm the Reconstitute Spatiotemporal LSTM (RST-LSTM) based on Convolutional Recurrent Neural Network (ConvRNN). In the proposed model, we present the local and global reconstitution scheme into the current input and the hidden state respectively. The local reconstitution (LR) can adaptively adjust the perceptual field of convolution so as to extract more useful spatial information and exclude invalid representation. Moreover, in the hidden state, the global reconstitution (GR) is embedded to alleviate the problem of mismatching between the current input and hidden state. Experimental results in MovingMNIST++ show that our approach can achieve the best predictions for those data with more drastic changes in the adjacent time. For radar data in CIKM AnalytiCup 2017 (we name it RadarCIKM in this paper), our method outperforms the state-of-the-art competitors. Furthermore, we notice that GR can promote the nowcasting in the high radar echo region and LR can reduce the error.
@article{xu2022ls, title = {LS-NTP: Unifying long-and short-range spatial correlations for near-surface temperature prediction}, author = {Xu, Guangning and Li, Xutao and Feng, Shanshan and Ye, Yunming and Tu, Zhihua and Lin, Kenghong and Huang, Zhichao}, journal = {Neural Networks}, volume = {155}, pages = {242--257}, paperurl = {https://www.sciencedirect.com/science/article/pii/S0893608022002787}, codeurl = {https://github.com/xuguangning1218/LS_NTP}, corresponding = {Ye, Y.}, year = {2022} }
The near-surface temperature prediction (NTP) is an important spatial–temporal forecast problem, which can be used to prevent temperature crises. Most of the previous approaches fail to explicitly model the long- and short-range spatial correlations simultaneously, which is critical to making an accurate temperature prediction. In this study, both long- and short-range spatial correlations are captured to fill this gap by a novel convolution operator named Long- and Short-range Convolution (LS-Conv). The proposed LS-Conv operator includes three key components, namely, Node-based Spatial Attention (NSA), Long-range Adaptive Graph Constructor (LAGC), and Long- and Short-range Integrator (LSI). To capture long-range spatial correlations, NSA and LAGC are proposed to evaluate node importance aiming at auto-constructing long-range spatial correlations, which is named as Long-range aware Graph Convolution Network (LR-GCN). After that, the Short-range aware Convolution Neural Network (SR-CNN) accounts for the short-range spatial correlations. Finally, LSI is proposed to capture both long- and short-range spatial correlations by intra-unifying LR-GCN and SR-CNN. Upon the proposed LS-Conv operator, a new model called Long- and Short-range for NPT (LS-NTP) is developed. Extensive experiments are conducted on two real-world datasets and the results demonstrate that the proposed method outperforms state-of-the-art techniques. The source code is available on GitHub:https://github.com/xuguangning1218/LS_NTP.
@article{xu2022saf, title = {SAF-Net: A spatio-temporal deep learning method for typhoon intensity prediction}, author = {Xu, Guangning and Lin, Kenghong and Li, Xutao and Ye, Yunming}, journal = {Pattern Recognition Letters}, volume = {155}, pages = {121--127}, paperurl = {https://www.sciencedirect.com/science/article/pii/S0167865521004037}, codeurl = {https://github.com/xuguangning1218/TI_Prediction}, corresponding = {Li, X.; Ye, Y.}, year = {2022} }
A typhoon is a destructive weather system that can cause severe casualties and economic losses. Typhoon intensity (TI) is a measurement to evaluate its ruinous degree. Hence, typhoon intensity prediction is an important research problem and many methods have been proposed. However, most of the existing approaches have very limited capability to combine the 2D Typhoon Structure Domain-expert Knowledge (2D-TSDK) and the 3D Typhoon Structure Data-driven Knowledge (3D-TSDK) for the TI prediction. To address this issue, this paper proposes a spatio-temporal deep learning method named Spatial Attention Fusing Network (SAF-Net). The designed model aims to fuse the 2D-TSDK and the 3D-TSDK by developing a specific Wide & Deep framework. In the data-driven component, a special Spatial Attention (SA) module is designed to automatically select high-response wind speed areas and embedded into a three-branch CNN to exploit the 3D-TSDK. Then, the Wide & Deep framework integrates the 2D-TSDK and the 3D-TSDK for the TI prediction. Comprehensive experiments have been conducted on a real-world dataset, and the result shows that the proposed method outperforms state-of-the-art typhoon intensity prediction methods. The code is available in GitHub:https://github.com/xuguangning1218/TI_Prediction.
@article{xu2022convgru, title = {AM-ConvGRU: A spatio-temporal model for typhoon path prediction}, author = {Xu, Guangning and Xian, Di and Fournier-Viger, Philippe and Li, Xutao and Ye, Yunming and Hu, Xiuqing}, journal = {Neural Computing and Applications}, volume = {34}, number = {8}, pages = {5905--5921}, paperurl = {https://link.springer.com/article/10.1007/s00521-021-06724-x}, codeurl = {https://github.com/xuguangning1218/Typhoon_Path}, corresponding = {Xian, D.; Li, X.}, year = {2022} }
Typhoons are one of the most destructive types of disasters. Several statistical models have been designed to predict their paths to reduce damage, casualties, and economic loss. To further increase prediction accuracy, two key challenges are (1) to extract better nonlinear 3D features of typhoons, which is hard due to their complex high-dimensional properties, and (2) to combine suitable 2D and 3D features in a proper way to improve predictions. To address these challenges, this paper presents a novel spatio-temporal deep learning model named Attention-based Multi ConvGRU (AM-ConvGRU). To automatically select high response isobaric planes of typhoons when considering their whole 3D structures, AM-ConvGRU leverages the Residual Channel Attention Block (RCAB). Furthermore, it integrates a novel model named Multi-ConvGRU to extract large-scale nonlinear spatial features of typhoons. Moreover, the approach relies on a Wide & Deep framework to fuse the traditional Generalized Linear Model (GLM) with the proposed AM-ConvGRU model. To evaluate the designed approach, extensive experiments have been conducted using real-world typhoons data from the Western North Pacific (WNP) basin obtained from both the China Meteorological Administration (CMA) dataset and the EAR-Interim dataset maintained by the European Centre for Medium-Range Weather Forecasts (ECMWF). Results show that the proposed method outperforms state-of-the-art deep learning typhoon prediction methods. The source code is available on GitHub with the following link:https://github.com/xuguangning1218/Typhoon_Path.
@inproceedings{ding2024edda, title = {EDDA: A Encoder-Decoder Data Augmentation Framework for Zero-Shot Stance Detection}, author = {Ding, Daijun and Dong, Li and Huang, Zhichao and Xu, Guangning and Huang, Xu and Liu, Bo and Jing, Liwen and Zhang, Bowen}, booktitle = {Proceedings of the 30th International Conference on Computational Linguistics (COLING)}, paperurl = {https://arxiv.org/abs/2403.15715}, codeurl = {https://github.com/Szu-Ddj/EDDA}, corresponding = {Zhang, B}, year = {2024} }
Stance detection aims to determine the attitude expressed in text towards a given target. Zero-shot stance detection (ZSSD) has emerged to classify stances towards unseen targets during inference. Recent data augmentation techniques for ZSSD increase transferable knowledge between targets through text or target augmentation. However, these methods exhibit limitations. Target augmentation lacks logical connections between generated targets and source text, while text augmentation relies solely on training data, resulting in insufficient generalization. To address these issues, we propose an encoder-decoder data augmentation (EDDA) framework. The encoder leverages large language models and chain-of-thought prompting to summarize texts into target-specific if-then rationales, establishing logical relationships. The decoder generates new samples based on these expressions using a semantic correlation word replacement strategy to increase syntactic diversity. We also analyze the generated expressions to develop a rationale-enhanced network that fully utilizes the augmented data. Experiments on benchmark datasets demonstrate our approach substantially improves over state-of-the-art ZSSD techniques. The proposed EDDA framework increases semantic relevance and syntactic variety in augmented texts while enabling interpretable rationale-based learning.
@inproceedings{xu2023int, title = {Int-GNN: A user intention aware graph neural network for session-based recommendation}, author = {Xu, Guangning and Yang, Jinyang and Guo, Jinjin and Huang, Zhichao and Zhang, Bowen}, booktitle = {ICASSP 2023-2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)}, pages = {1--5}, paperurl = {https://ieeexplore.ieee.org/document/10097031}, codeurl = {https://github.com/xuguangning1218/IntGNN_ICASSP2023}, corresponding = {Huang, Z.; Zhang, B.}, year = {2023} }
Session-Based Recommendation (SBR) is a spotlight research problem. Although many efforts have been made, challenges still exist. The key to unlocking this shackle is the user intention, an intuitive but hard-to-model concept in the anonymous session. Unlike previous research, we suggest mining potential user intention by counting the number of item occurrences in a user session and considering the long interval between item re-interactions. Beyond these, we take user preference, a biased user intention, into account in the prediction stage. Forming these together, we propose a model named user Intention aware Graph Neural Network (Int-GNN) aiming at capturing user intention. Extensive experiments have been conducted on three real-world datasets, and the results show the superiority of our method. The code is available on GitHub: https://github.com/xuguangning1218/IntGNN_ICASSP2023
@inproceedings{zhang2023twitter, title = {Twitter stance detection via neural production systems}, author = {Zhang, Bowen and Ding, Daijun and Xu, Guangning and Guo, Jinjin and Huang, Zhichao and Huang, Xu}, booktitle = {ICASSP 2023-2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)}, pages = {1--5}, paperurl = {https://ieeexplore.ieee.org/document/10094597}, corresponding = {Xu, G.; Zhang, B}, year = {2023} }
Stance detection is an important task, which aims to classify the attitude of an opinionated text toward a given target. In this paper, we develop an interpretable neural production system for stance detection (NPS4SD). NPS4SD is an end-to-end deep learning model, which consists of a set of knowledge rules that are applied by binding with specific entities. NPS4SD consists of two main components: a pretrained model for learning the text representation and a variable binding network (VBN) to bind the knowledge rules with text entities. Extensive experiments are conducted to evaluate the effectiveness of the proposed NPS4SD model on three real-world datasets with in-domain, cross-target and zero-shot setups. Experimental results demonstrate that NPS4SD achieves substantially better performance than the strong competitors for the stance detection task.
@inproceedings{guo2023knowledge, title = {Knowledge-Aware Few Shot Learning for Event Detection from Short Texts}, author = {Guo, Jinjin and Huang, Zhichao and Xu, Guangning and Zhang, Bowen and Duan, Chaoqun}, booktitle = {ICASSP 2023-2023 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)}, pages = {1--5}, paperurl = {https://ieeexplore.ieee.org/document/10095891}, corresponding = {Huang, Z.; Duan, C.}, year = {2023} }
Event detection in a city is crucial for the government to listen to the voice of the citizens, be aware of the real occurrences in a city, and then make wiser policies. However, in reality some important events with few samples are easily to be overwhelmed by the massive information and hard to be recognized, and additionally the limited word description from the short texts even makes the recognition harder. To address the problems, we propose a knowledge-aware event detector by incorporating the external knowledge to detect the events with few examples. The external knowledge incorporation with different semantic relations is capable to enrich the short texts. In addition, we leverage the representative few shot learning framework to formulate the event detection as the text classification problem. The proposed model is evaluated on two widely event-detection datasets. The experiments show a consistent accuracy improvement. The findings validates that our model with the knowledge infusion is effective to detect the few shot events from the short texts.
Guangning Xu
Research Assistant Professor
Hong Kong Baptist Univerity
FSC1004, Hong Kong Baptist Univerity, Kowloon Tong, Kowloon, Hong Kong, China
© 2024 Guangning Xu