# Source: Hugging Face Space DLPO/api_light_hf (status: Sleeping)
# File: api_light_hf/src/config/models.yaml (6.37 kB)
# Last commit: cf7f643 by Renecto, "deploy api_light_hf (2026-03-12 12:47:03)", 5 days ago

	# HF Inference API Model Configuration
	# Hugging Face Inference API / Inference Providers 経由で利用可能なモデルを定義
	# 価格: 2026/03時点の公開価格 (USD per 1M tokens, 目安)

	default_model: meta-llama/Llama-3.3-70B-Instruct
	fallback_order:
	- meta-llama/Llama-3.3-70B-Instruct
	- Qwen/Qwen2.5-72B-Instruct
	- mistralai/Mistral-7B-Instruct-v0.3

	models:
	# ============================================
	# Meta Llama 3.3 (テキスト/JSON向け主力)
	# ============================================
	meta-llama/Llama-3.3-70B-Instruct:
	provider: huggingface
	task: text-generation
	supports_json: true
	supports_structured_output: false
	supports_images: false
	description: "Llama 3.3 70B - 高精度テキスト生成"
	pricing:
	input: 0.30
	output: 0.60
	recommended_for:
	- default
	- high_accuracy
	- complex_reasoning
	- japanese

	meta-llama/Llama-3.1-8B-Instruct:
	provider: huggingface
	task: text-generation
	supports_json: true
	supports_structured_output: false
	supports_images: false
	description: "Llama 3.1 8B - 軽量・高速テキスト生成"
	pricing:
	input: 0.06
	output: 0.12
	recommended_for:
	- speed
	- cost_efficiency

	# ============================================
	# Qwen 2.5 (日本語対応・JSON向け)
	# ============================================
	Qwen/Qwen2.5-72B-Instruct:
	provider: huggingface
	task: text-generation
	supports_json: true
	supports_structured_output: false
	supports_images: false
	description: "Qwen 2.5 72B - 多言語対応（日本語強め）"
	pricing:
	input: 0.30
	output: 0.60
	recommended_for:
	- high_accuracy
	- japanese
	- long_context

	Qwen/Qwen2.5-7B-Instruct:
	provider: huggingface
	task: text-generation
	supports_json: true
	supports_structured_output: false
	supports_images: false
	description: "Qwen 2.5 7B - 軽量日本語対応"
	pricing:
	input: 0.06
	output: 0.12
	recommended_for:
	- speed
	- cost_efficiency
	- japanese

	# ============================================
	# Mistral (テキスト向け)
	# ============================================
	mistralai/Mistral-7B-Instruct-v0.3:
	provider: huggingface
	task: text-generation
	supports_json: true
	supports_structured_output: false
	supports_images: false
	description: "Mistral 7B - 軽量汎用テキスト生成"
	pricing:
	input: 0.06
	output: 0.12
	recommended_for:
	- speed
	- cost_efficiency

	mistralai/Mixtral-8x7B-Instruct-v0.1:
	provider: huggingface
	task: text-generation
	supports_json: true
	supports_structured_output: false
	supports_images: false
	description: "Mixtral 8x7B - 高精度MoEテキスト生成"
	pricing:
	input: 0.27
	output: 0.27
	recommended_for:
	- high_accuracy
	- coding

	# ============================================
	# Vision / Multimodal (画像入力対応)
	# ============================================
	meta-llama/Llama-3.2-11B-Vision-Instruct:
	provider: huggingface
	task: image-text-to-text
	supports_json: true
	supports_structured_output: false
	supports_images: true
	description: "Llama 3.2 11B Vision - 画像+テキスト入力"
	pricing:
	input: 0.18
	output: 0.18
	recommended_for:
	- vision
	- multimodal
	- image_analysis

	meta-llama/Llama-3.2-90B-Vision-Instruct:
	provider: huggingface
	task: image-text-to-text
	supports_json: true
	supports_structured_output: false
	supports_images: true
	description: "Llama 3.2 90B Vision - 高精度画像+テキスト入力"
	pricing:
	input: 0.90
	output: 0.90
	recommended_for:
	- vision
	- multimodal
	- high_accuracy

	Qwen/Qwen2.5-VL-72B-Instruct:
	provider: huggingface
	task: image-text-to-text
	supports_json: true
	supports_structured_output: false
	supports_images: true
	description: "Qwen2.5-VL 72B - 高精度ビジョン言語モデル（日本語対応）"
	pricing:
	input: 0.90
	output: 0.90
	recommended_for:
	- vision
	- multimodal
	- japanese
	- high_accuracy

	Qwen/Qwen2.5-VL-7B-Instruct:
	provider: huggingface
	task: image-text-to-text
	supports_json: true
	supports_structured_output: false
	supports_images: true
	description: "Qwen2.5-VL 7B - 軽量ビジョン言語モデル（日本語対応）"
	pricing:
	input: 0.18
	output: 0.18
	recommended_for:
	- vision
	- speed
	- cost_efficiency
	- japanese

	# ============================================
	# Image Generation (HF FLUX系)
	# ============================================
	black-forest-labs/FLUX.1-dev:
	provider: huggingface
	task: text-to-image
	supports_json: false
	supports_structured_output: false
	supports_images: false
	description: "FLUX.1 Dev - 高品質テキストから画像生成"
	recommended_for:
	- image_generation

	black-forest-labs/FLUX.1-schnell:
	provider: huggingface
	task: text-to-image
	supports_json: false
	supports_structured_output: false
	supports_images: false
	description: "FLUX.1 Schnell - 高速テキストから画像生成"
	recommended_for:
	- image_generation
	- speed

	# ============================================
	# Model Aliases
	# ============================================
	aliases:
	llama3: meta-llama/Llama-3.3-70B-Instruct
	llama3-small: meta-llama/Llama-3.1-8B-Instruct
	llama3-vision: meta-llama/Llama-3.2-11B-Vision-Instruct
	llama3-vision-large: meta-llama/Llama-3.2-90B-Vision-Instruct
	qwen: Qwen/Qwen2.5-72B-Instruct
	qwen-small: Qwen/Qwen2.5-7B-Instruct
	qwen-vision: Qwen/Qwen2.5-VL-72B-Instruct
	qwen-vision-small: Qwen/Qwen2.5-VL-7B-Instruct
	mistral: mistralai/Mistral-7B-Instruct-v0.3
	mixtral: mistralai/Mixtral-8x7B-Instruct-v0.1
	flux: black-forest-labs/FLUX.1-dev
	flux-fast: black-forest-labs/FLUX.1-schnell

	# ============================================
	# Environment Variables
	# ============================================
	# HF_TOKEN: Hugging Face API トークン（必須）
	# HF_MODEL: デフォルトモデルの上書き（任意）