Skip to content

Commit 1cef8bf

Browse files
committed
Add AVMeme-Exam zero shot classification task
1 parent 5f0e107 commit 1cef8bf

2 files changed

Lines changed: 121 additions & 0 deletions

File tree

mteb/tasks/zeroshot_classification/eng/__init__.py

Lines changed: 6 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -2,6 +2,10 @@
22
AVEDatasetVideoZeroShotClassification,
33
AVEDatasetZeroShotClassification,
44
)
5+
from .avmeme_exam_classification import (
6+
AVMemeAudioVideoZeroShotClassification,
7+
AVMemeVideoZeroShotClassification,
8+
)
59
from .birdsnap import BirdsnapZeroShotClassification
610
from .breakfast_classification import BreakfastZeroShotClassification
711
from .caltech101 import Caltech101ZeroShotClassification
@@ -56,6 +60,8 @@
5660
"CLEVR",
5761
"AVEDatasetVideoZeroShotClassification",
5862
"AVEDatasetZeroShotClassification",
63+
"AVMemeAudioVideoZeroShotClassification",
64+
"AVMemeVideoZeroShotClassification",
5965
"BirdsnapZeroShotClassification",
6066
"BreakfastZeroShotClassification",
6167
"CIFAR10ZeroShotClassification",
Lines changed: 115 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,115 @@
1+
from __future__ import annotations
2+
3+
from mteb.abstasks.task_metadata import TaskMetadata
4+
from mteb.abstasks.zeroshot_classification import AbsTaskZeroShotClassification
5+
6+
CITATION = r"""
7+
@inproceedings{jiang2026avmeme,
8+
author = {Jiang, Xilin and Wang, Qiaolin and Wu, Junkai and He, Xiaomin and Xu, Zhongweiyang and Ma, Yinghao and Piao, Minshuo and Yang, Kaiyi and Zheng, Xiuwen and Shimizu, Riki and others},
9+
journal = {arXiv preprint arXiv:2601.17645},
10+
title = {AVMeme Exam: A Multimodal Multilingual Multicultural Benchmark for LLMs' Contextual and Cultural Knowledge and Thinking},
11+
year = {2026},
12+
}
13+
"""
14+
15+
16+
class AVMemeAudioVideoZeroShotClassification(AbsTaskZeroShotClassification):
17+
metadata = TaskMetadata(
18+
name="AVMemeAudioVideoZeroShot",
19+
description="AVMeme Exam is a multimodal, multilingual, and multicultural benchmark of over 1,000 iconic Internet audio-visual memes spanning speech, songs, music, and sound effects. Each meme is paired with a Q&A assessing levels of understanding from surface content to context, emotion, usage, and world knowledge. This zero-shot classification task predicts the sound category of each meme clip.",
20+
reference="https://arxiv.org/pdf/2601.17645",
21+
dataset={
22+
"path": "mteb/AVMeme-Exam",
23+
"revision": "7070d1979d9a4943dd49b2e72858eb1e54f6bd5b",
24+
},
25+
type="VideoZeroshotClassification",
26+
category="va2t",
27+
eval_splits=["test"],
28+
eval_langs=[
29+
"bos-Latn",
30+
"bre-Latn",
31+
"deu-Latn",
32+
"eng-Latn",
33+
"fas-Arab",
34+
"fin-Latn",
35+
"fra-Latn",
36+
"hin-Deva",
37+
"ita-Latn",
38+
"jpn-Jpan",
39+
"kor-Hang",
40+
"por-Latn",
41+
"rus-Cyrl",
42+
"spa-Latn",
43+
"tel-Telu",
44+
"zho-Hans",
45+
],
46+
main_score="accuracy",
47+
date=("2026-01-25", "2026-01-25"),
48+
domains=["Web", "Entertainment", "Music"],
49+
task_subtypes=["Topic classification"],
50+
license="cc-by-4.0",
51+
annotations_creators="human-annotated",
52+
dialect=[],
53+
modalities=["video", "audio"],
54+
sample_creation="found",
55+
bibtex_citation=CITATION,
56+
is_beta=True,
57+
)
58+
input_column_name = ("video", "audio")
59+
label_column_name: str = "category"
60+
61+
def get_candidate_labels(self) -> list[str]:
62+
return [
63+
name for name in self.dataset["test"].features[self.label_column_name].names
64+
]
65+
66+
67+
class AVMemeVideoZeroShotClassification(AbsTaskZeroShotClassification):
68+
metadata = TaskMetadata(
69+
name="AVMemeVideoZeroShot",
70+
description="AVMeme Exam is a multimodal, multilingual, and multicultural benchmark of over 1,000 iconic Internet audio-visual memes spanning speech, songs, music, and sound effects. Each meme is paired with a Q&A assessing levels of understanding from surface content to context, emotion, usage, and world knowledge. This zero-shot classification task predicts the sound category of each meme clip.",
71+
reference="https://arxiv.org/pdf/2601.17645",
72+
dataset={
73+
"path": "mteb/AVMeme-Exam",
74+
"revision": "7070d1979d9a4943dd49b2e72858eb1e54f6bd5b",
75+
},
76+
type="VideoZeroshotClassification",
77+
category="v2t",
78+
eval_splits=["test"],
79+
eval_langs=[
80+
"bos-Latn",
81+
"bre-Latn",
82+
"deu-Latn",
83+
"eng-Latn",
84+
"fas-Arab",
85+
"fin-Latn",
86+
"fra-Latn",
87+
"hin-Deva",
88+
"ita-Latn",
89+
"jpn-Jpan",
90+
"kor-Hang",
91+
"por-Latn",
92+
"rus-Cyrl",
93+
"spa-Latn",
94+
"tel-Telu",
95+
"zho-Hans",
96+
],
97+
main_score="accuracy",
98+
date=("2026-01-25", "2026-01-25"),
99+
domains=["Web", "Entertainment", "Music"],
100+
task_subtypes=["Topic classification"],
101+
license="cc-by-4.0",
102+
annotations_creators="human-annotated",
103+
dialect=[],
104+
modalities=["video"],
105+
sample_creation="found",
106+
bibtex_citation=CITATION,
107+
is_beta=True,
108+
)
109+
input_column_name = "video"
110+
label_column_name: str = "category"
111+
112+
def get_candidate_labels(self) -> list[str]:
113+
return [
114+
name for name in self.dataset["test"].features[self.label_column_name].names
115+
]

0 commit comments

Comments
 (0)