data_juicer_agents.tools.plan.build_dataset_spec#

build_dataset_spec tool package.

class data_juicer_agents.tools.plan.build_dataset_spec.BuildDatasetSpecInput(*, intent: str, export_path: str, dataset_source: DatasetSource, dataset_profile: Dict[str, Any] = <factory>, modality_hint: str = '', text_keys_hint: List[str] = <factory>, image_key_hint: str = '', audio_key_hint: str = '', video_key_hint: str = '', image_bytes_key_hint: str = '', **extra_data: Any)[源代码]#

基类：BaseModel

model_config = {'extra': 'allow'}#

Configuration for the model; should be a dictionary conforming to pydantic.config.ConfigDict.

intent: str#

export_path: str#

dataset_source: DatasetSource#

dataset_profile: Dict[str, Any]#

modality_hint: str#

text_keys_hint: List[str]#

image_key_hint: str#

audio_key_hint: str#

video_key_hint: str#

image_bytes_key_hint: str#

data_juicer_agents.tools.plan.build_dataset_spec.build_dataset_spec(*, user_intent: str, dataset_source: DatasetSource | None = None, export_path: str, dataset_profile: Dict[str, Any] | None = None, modality_hint: str = '', text_keys_hint: Iterable[Any] | None = None, image_key_hint: str = '', audio_key_hint: str = '', video_key_hint: str = '', image_bytes_key_hint: str = '', **kwargs: Any) → Dict[str, Any][源代码]#

data_juicer_agents.tools.plan.build_dataset_spec#

本页