Source code for data_juicer_agents.tools.plan.build_dataset_spec.input

# -*- coding: utf-8 -*-
"""Input models for build_dataset_spec."""

from __future__ import annotations

from typing import Any, Dict, List

from pydantic import BaseModel, Field


[docs] class BuildDatasetSpecInput(BaseModel): intent: str = Field(description="User intent for the current planning task.") dataset_path: str = Field(description="Input dataset path.") export_path: str = Field(description="Output dataset path.") dataset_profile: Dict[str, Any] = Field( description="Dataset inspection payload returned by inspect_dataset.", ) modality_hint: str = Field(default="", description="Optional explicit modality override.") text_keys_hint: List[str] = Field(default_factory=list, description="Optional text key overrides.") image_key_hint: str = Field(default="", description="Optional image key override.") audio_key_hint: str = Field(default="", description="Optional audio key override.") video_key_hint: str = Field(default="", description="Optional video key override.") image_bytes_key_hint: str = Field(default="", description="Optional image-bytes key override.")