name: content-moderation-env version: "1.0.0" description: > AI-powered content moderation environment. Agents triage text, social posts, and multimodal content (including deepfake detection) across three difficulty levels using the standard OpenEnv step/reset/state API. author: openenv-participant license: MIT tasks: - id: text_spam difficulty: easy description: Classify email/message content as spam or legitimate content_type: text num_items: 5 score_range: [0.0, 1.0] - id: content_moderation difficulty: medium description: Multi-label social media content moderation content_type: text num_items: 5 score_range: [0.0, 1.0] - id: deepfake_detection difficulty: hard description: Detect AI-manipulated/deepfake media and make moderation decisions content_type: multimodal num_items: 5 score_range: [0.0, 1.0] action_space: type: object fields: decision: type: string enum: [approve, reject, escalate, flag] reason: type: string confidence: type: float range: [0.0, 1.0] labels: type: array items: string valid_values: - spam - scam - phishing - pharmaceutical_spam - hate_speech - violence - harassment - misinformation - adult_content - deepfake - political_manipulation - fraud observation_space: type: object fields: content_id: string content_type: string text: optional string image_description: optional string detector_score: optional float metadata: object step_num: integer total_steps: integer endpoints: reset: POST /reset step: POST /step state: GET /state close: POST /close tasks: GET /tasks health: GET /health docker: context: server dockerfile: server/Dockerfile huggingface: space_sdk: docker tags: - openenv - content-moderation - deepfake-detection