Skip to content

Commit

Permalink
Remove audio from media dataset
Browse files: browse the repository at this point in the history
  • Loading branch information
kcz358 committed Dec 27, 2024
1 parent c9c3302 commit 37b753e
Showing 1 changed file with 3 additions and 1 deletion.
4 changes: 3 additions & 1 deletion lmms_eval/api/task.py
Original file line number | Diff line number | Diff line change
Expand Up @@ -29,7 +29,7 @@
import datasets
import numpy as np
from accelerate import Accelerator
-from datasets import DownloadConfig, Image, Sequence
+from datasets import Audio, DownloadConfig, Image, Sequence
from huggingface_hub import snapshot_download
from loguru import logger as eval_logger
from PIL import ImageFile
Expand Down Expand Up @@ -1065,6 +1065,8 @@ def concat_tar_parts(tar_parts, output_tar):
remove_cols.append(feature)
elif isinstance(features[feature], Sequence) and isinstance(features[feature].feature, Image):
remove_cols.append(feature)
+elif isinstance(features[feature], Audio):
+remove_cols.append(feature)
for remove_col in remove_cols:
self.dataset_no_image[doc_name] = self.dataset_no_image[doc_name].remove_columns(remove_col)

Expand Down

0 comments on commit 37b753e

Please sign in to comment.