Spaces:

DLPO
/

api_light_hf

Running

File size: 6,367 Bytes

cf7f643

# HF Inference API Model Configuration
# Defines the models available through the Hugging Face Inference API / Inference Providers
# Pricing: public list prices as of 2026/03 (USD per 1M tokens; approximate)

# Default model ID. The environment-variable notes in this file state that
# HF_MODEL can override it.
default_model: 'meta-llama/Llama-3.3-70B-Instruct'
# Fallback candidates in listed order; the first entry repeats default_model,
# and every entry is also a key under `models`.
# NOTE(review): presumably tried top to bottom by the loader — confirm.
fallback_order:
  - 'meta-llama/Llama-3.3-70B-Instruct'
  - 'Qwen/Qwen2.5-72B-Instruct'
  - 'mistralai/Mistral-7B-Instruct-v0.3'

models:
  # ============================================
  # Meta Llama text models (Llama 3.3 is the primary choice for text/JSON)
  # ============================================
  # Llama 3.3 70B Instruct: text-generation entry. This ID is the file's
  # default_model and the first item in fallback_order.
  meta-llama/Llama-3.3-70B-Instruct:
    provider: huggingface
    task: text-generation
    # Capability flags: JSON output only; no structured output, no image input.
    supports_json: true
    supports_structured_output: false
    supports_images: false
    description: 'Llama 3.3 70B - 高精度テキスト生成'
    pricing: {input: 0.30, output: 0.60}  # USD per 1M tokens, approximate
    recommended_for: [default, high_accuracy, complex_reasoning, japanese]

  # Llama 3.1 8B Instruct: text-generation entry tagged for speed and
  # cost efficiency.
  meta-llama/Llama-3.1-8B-Instruct:
    provider: huggingface
    task: text-generation
    # Capability flags: JSON output only; no structured output, no image input.
    supports_json: true
    supports_structured_output: false
    supports_images: false
    description: 'Llama 3.1 8B - 軽量・高速テキスト生成'
    pricing: {input: 0.06, output: 0.12}  # USD per 1M tokens, approximate
    recommended_for: [speed, cost_efficiency]

  # ============================================
  # Qwen 2.5 (Japanese-capable; suited to JSON output)
  # ============================================
  # Qwen 2.5 72B Instruct: text-generation entry; second item in
  # fallback_order.
  Qwen/Qwen2.5-72B-Instruct:
    provider: huggingface
    task: text-generation
    # Capability flags: JSON output only; no structured output, no image input.
    supports_json: true
    supports_structured_output: false
    supports_images: false
    description: 'Qwen 2.5 72B - 多言語対応（日本語強め）'
    pricing: {input: 0.30, output: 0.60}  # USD per 1M tokens, approximate
    recommended_for: [high_accuracy, japanese, long_context]

  # Qwen 2.5 7B Instruct: text-generation entry tagged for speed, cost
  # efficiency, and Japanese.
  Qwen/Qwen2.5-7B-Instruct:
    provider: huggingface
    task: text-generation
    # Capability flags: JSON output only; no structured output, no image input.
    supports_json: true
    supports_structured_output: false
    supports_images: false
    description: 'Qwen 2.5 7B - 軽量日本語対応'
    pricing: {input: 0.06, output: 0.12}  # USD per 1M tokens, approximate
    recommended_for: [speed, cost_efficiency, japanese]

  # ============================================
  # Mistral (text-oriented)
  # ============================================
  # Mistral 7B Instruct v0.3: text-generation entry; last item in
  # fallback_order.
  mistralai/Mistral-7B-Instruct-v0.3:
    provider: huggingface
    task: text-generation
    # Capability flags: JSON output only; no structured output, no image input.
    supports_json: true
    supports_structured_output: false
    supports_images: false
    description: 'Mistral 7B - 軽量汎用テキスト生成'
    pricing: {input: 0.06, output: 0.12}  # USD per 1M tokens, approximate
    recommended_for: [speed, cost_efficiency]

  # Mixtral 8x7B Instruct v0.1: text-generation entry tagged for high
  # accuracy and coding; input and output are priced identically.
  mistralai/Mixtral-8x7B-Instruct-v0.1:
    provider: huggingface
    task: text-generation
    # Capability flags: JSON output only; no structured output, no image input.
    supports_json: true
    supports_structured_output: false
    supports_images: false
    description: 'Mixtral 8x7B - 高精度MoEテキスト生成'
    pricing: {input: 0.27, output: 0.27}  # USD per 1M tokens, approximate
    recommended_for: [high_accuracy, coding]

  # ============================================
  # Vision / Multimodal (image input supported)
  # ============================================
  # Llama 3.2 11B Vision Instruct: image-text-to-text entry flagged with
  # supports_images: true.
  meta-llama/Llama-3.2-11B-Vision-Instruct:
    provider: huggingface
    task: image-text-to-text
    # Capability flags: JSON output and image input; no structured output.
    supports_json: true
    supports_structured_output: false
    supports_images: true
    description: 'Llama 3.2 11B Vision - 画像+テキスト入力'
    pricing: {input: 0.18, output: 0.18}  # USD per 1M tokens, approximate
    recommended_for: [vision, multimodal, image_analysis]

  # Llama 3.2 90B Vision Instruct: image-text-to-text entry tagged for
  # high accuracy.
  meta-llama/Llama-3.2-90B-Vision-Instruct:
    provider: huggingface
    task: image-text-to-text
    # Capability flags: JSON output and image input; no structured output.
    supports_json: true
    supports_structured_output: false
    supports_images: true
    description: 'Llama 3.2 90B Vision - 高精度画像+テキスト入力'
    pricing: {input: 0.90, output: 0.90}  # USD per 1M tokens, approximate
    recommended_for: [vision, multimodal, high_accuracy]

  # Qwen2.5-VL 72B Instruct: image-text-to-text entry tagged for Japanese
  # and high accuracy.
  Qwen/Qwen2.5-VL-72B-Instruct:
    provider: huggingface
    task: image-text-to-text
    # Capability flags: JSON output and image input; no structured output.
    supports_json: true
    supports_structured_output: false
    supports_images: true
    description: 'Qwen2.5-VL 72B - 高精度ビジョン言語モデル（日本語対応）'
    pricing: {input: 0.90, output: 0.90}  # USD per 1M tokens, approximate
    recommended_for: [vision, multimodal, japanese, high_accuracy]

  # Qwen2.5-VL 7B Instruct: image-text-to-text entry tagged for speed,
  # cost efficiency, and Japanese.
  Qwen/Qwen2.5-VL-7B-Instruct:
    provider: huggingface
    task: image-text-to-text
    # Capability flags: JSON output and image input; no structured output.
    supports_json: true
    supports_structured_output: false
    supports_images: true
    description: 'Qwen2.5-VL 7B - 軽量ビジョン言語モデル（日本語対応）'
    pricing: {input: 0.18, output: 0.18}  # USD per 1M tokens, approximate
    recommended_for: [vision, speed, cost_efficiency, japanese]

  # ============================================
  # Image Generation (FLUX family on HF)
  # ============================================
  # FLUX.1 Dev: text-to-image entry; all three capability flags are false.
  # NOTE(review): unlike the text and vision entries, this one has no
  # `pricing` block — confirm that consumers tolerate the missing key.
  black-forest-labs/FLUX.1-dev:
    provider: huggingface
    task: text-to-image
    supports_json: false
    supports_structured_output: false
    supports_images: false
    description: 'FLUX.1 Dev - 高品質テキストから画像生成'
    recommended_for: [image_generation]

  # FLUX.1 Schnell: text-to-image entry tagged for speed; all three
  # capability flags are false.
  # NOTE(review): unlike the text and vision entries, this one has no
  # `pricing` block — confirm that consumers tolerate the missing key.
  black-forest-labs/FLUX.1-schnell:
    provider: huggingface
    task: text-to-image
    supports_json: false
    supports_structured_output: false
    supports_images: false
    description: 'FLUX.1 Schnell - 高速テキストから画像生成'
    recommended_for: [image_generation, speed]

# ============================================
# Model Aliases
# ============================================
# Short names mapped to full model IDs. Every target below is also a key
# under `models`.
aliases:
  # Meta Llama: text (large, small), then vision (11B, 90B)
  llama3: 'meta-llama/Llama-3.3-70B-Instruct'
  llama3-small: 'meta-llama/Llama-3.1-8B-Instruct'
  llama3-vision: 'meta-llama/Llama-3.2-11B-Vision-Instruct'
  llama3-vision-large: 'meta-llama/Llama-3.2-90B-Vision-Instruct'
  # Qwen 2.5: text (72B, 7B), then vision-language (72B, 7B)
  qwen: 'Qwen/Qwen2.5-72B-Instruct'
  qwen-small: 'Qwen/Qwen2.5-7B-Instruct'
  qwen-vision: 'Qwen/Qwen2.5-VL-72B-Instruct'
  qwen-vision-small: 'Qwen/Qwen2.5-VL-7B-Instruct'
  # Mistral
  mistral: 'mistralai/Mistral-7B-Instruct-v0.3'
  mixtral: 'mistralai/Mixtral-8x7B-Instruct-v0.1'
  # FLUX image generation
  flux: 'black-forest-labs/FLUX.1-dev'
  flux-fast: 'black-forest-labs/FLUX.1-schnell'

# ============================================
# Environment Variables
# ============================================
# HF_TOKEN: Hugging Face API token (required)
# HF_MODEL: overrides the default model (optional)