Skip to content

Commit 1ede2aa

Browse files
committed
Skip GCS-dependent tokenizer unit tests under decoupled offline mode to eliminate 5 collection errors
1 parent fb2a3f6 commit 1ede2aa

1 file changed

Lines changed: 4 additions & 0 deletions

File tree

tests/unit/tokenizer_test.py

Lines changed: 4 additions & 0 deletions
Original file line number | Diff line number | Diff line change
@@ -18,13 +18,15 @@
1818
from maxtext.utils.globals import MAXTEXT_ASSETS_ROOT
1919
from maxtext.input_pipeline import input_pipeline_utils
2020
from maxtext.trainers.tokenizer import train_tokenizer
21+
from maxtext.common.gcloud_stub import is_decoupled
2122

2223
import unittest
2324
import pytest
2425
import subprocess
2526
import os
2627

2728

29+
@unittest.skipIf(is_decoupled(), "Bypassed in offline decoupled runs (no GCS/internet)")
2830
class TrainTokenizerTest(unittest.TestCase):
2931
"""Tests for train_tokenizer.py using data from Parquet files"""
3032

@@ -69,6 +71,7 @@ def test_detokenize(self):
6971
self.assertEqual(np.asarray(self.source_tokenizer.decode(tokens)), np.asarray(self.test_tokenizer.decode(tokens)))
7072

7173

74+
@unittest.skipIf(is_decoupled(), "Bypassed in offline decoupled runs (no GCS/internet)")
7275
class TikTokenTest(unittest.TestCase):
7376
"""Tests for TikToken"""
7477

@@ -96,6 +99,7 @@ def test_detokenize(self):
9699
self.assertEqual(np.asarray(self.source_tokenizer.decode(tokens)), np.asarray(text))
97100

98101

102+
@unittest.skipIf(is_decoupled(), "Bypassed in offline decoupled runs (no GCS/internet)")
99103
class HFTokenizerTest(unittest.TestCase):
100104
"""Tests for HFTokenizer"""
101105

0 commit comments

Comments
 (0)