Skip to content

Commit 9ae6944

Browse files
committed
Added mtbench to config files and added Benchmark tag
1 parent 6992958 commit 9ae6944

2 files changed

Lines changed: 16 additions & 0 deletions

File tree

components/tag.tsx

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -36,6 +36,10 @@ function PublicationTag({ tag }: { tag: Tag }) {
3636
name = "Geometric and Graph Learning";
3737
color = "warning";
3838
break;
39+
case Tag.Benchmark:
40+
name = "Benchmark";
41+
color = "primary";
42+
break;
3943
}
4044

4145
return (

config/publications.ts

Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -3,6 +3,7 @@ export enum Tag {
33
MultiModalFoundationModel = "Multi-Modal Foundation Model",
44
TrustworthyAI = "Trustworthy AI",
55
Applications = "Applications",
6+
Benchmark = "Benchmark",
67
}
78

89
export interface Publication {
@@ -18,6 +19,17 @@ export interface Publication {
1819
}
1920

2021
export const publications: Publication[] = [
22+
{
23+
title: "MTBench: A Multimodal Time Series Benchmark for Temporal Reasoning and Question Answering",
24+
authors: "Jialin Chen, Aosong Feng, Ziyu Zhao, Juan Garza, Gaukhar Nurbek, Ali Maatouk, Leandros Tassiulas, Yifeng Gao, Rex Ying",
25+
venue: "KDD, 2025",
26+
page: "mtbench",
27+
code: "https://github.com/Graph-and-Geometric-Learning/MTBench",
28+
paper: "",
29+
abstract: "We introduce MTBench, a large-scale benchmark designed to evaluate large language models (LLMs) on time series and text understanding across financial and weather domains. MTBench comprises paired time-series and textual data, including financial news with corresponding stock price movements and weather reports aligned with historical temperature records.",
30+
impact: "We evaluate state-of-the-art LLMs on MTBench, analyzing their effectiveness in modeling the complex relationships between news narratives and temporal patterns. Our findings reveal significant challenges in current models, including difficulties in capturing long-term dependencies, interpreting causality in financial and weather trends, and effectively fusing multimodal information.",
31+
tags: [Tag.Benchmark, Tag.MultiModalFoundationModel],
32+
},
2133
{
2234
title: "Lorentzian Residual Neural Networks",
2335
authors: "Neil He, Menglin Yang, Rex Ying",

0 commit comments

Comments
 (0)