Skip to content

Commit

Permalink
Disable flaky twitter bots dataset loading test. (#3439)
Browse files: browse the repository at this point in the history
  • Loading branch information
justinxzhao committed Aug 11, 2023
1 parent 3691dbe commit 7ecdfa5
Showing 1 changed file with 10 additions and 9 deletions.
19 changes: 10 additions & 9 deletions tests/ludwig/datasets/test_dataset_configs.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -15,15 +15,16 @@ def test_get_config_and_load(tmpdir):
assert df is not None
assert len(df) == 18721 # Expected number of rows in Yosemite temperatures dataset.

# Test loading dataset without 'split' and 'Unnamed: 0' columns in config.
twitter_bots_config = ludwig.datasets._get_dataset_config("twitter_bots")
assert isinstance(twitter_bots_config, DatasetConfig)

twitter_bots_dataset = ludwig.datasets.get_dataset("twitter_bots", cache_dir=tmpdir)
assert isinstance(twitter_bots_dataset, DatasetLoader)
df = twitter_bots_dataset.load()
assert df is not None
assert len(df.columns) == 22 # Expected number of columns in Twitter bots dataset including split column.
# DISABLED: The twitter_bots loading check below is flaky, probably due to the dataset size.
# # Test loading dataset without 'split' and 'Unnamed: 0' columns in config.
# twitter_bots_config = ludwig.datasets._get_dataset_config("twitter_bots")
# assert isinstance(twitter_bots_config, DatasetConfig)

# twitter_bots_dataset = ludwig.datasets.get_dataset("twitter_bots", cache_dir=tmpdir)
# assert isinstance(twitter_bots_dataset, DatasetLoader)
# df = twitter_bots_dataset.load()
# assert df is not None
# assert len(df.columns) == 22 # Expected number of columns in Twitter bots dataset including split column.


def test_get_config_kaggle(tmpdir):
Expand Down

0 comments on commit 7ecdfa5

Please sign in to comment.