Add python application files

Browse files

Files changed (9) hide show

app.py +149 -0
app_structured.py +187 -0
athens_main.py +144 -0
convert_dataset.py +45 -0
finetune_mac.py +100 -0
finetune_unsloth.py +92 -0
lps.py +92 -0
split_data.py +38 -0
update_readme.py +17 -0

app.py ADDED Viewed

	@@ -0,0 +1,149 @@

+import mlx.core as mx
+from mlx_lm import load, generate
+from sentence_transformers import SentenceTransformer, util
+from transformers import pipeline
+from collections import deque
+from janome.tokenizer import Tokenizer
+import json
+# --- Prompt templates ---
+# Default prompt. Placeholders filled via str.format:
+# {intent_instruction}, {style_instruction}, {transition_instruction}, {user_input}.
+BASE_PROMPT = """### 指示:
+あなたは、文脈を理解し、自然な応答を生成するAIアシスタントです。
+以下の状況を考慮して、最適な応答を生成してください。
+{intent_instruction}
+{style_instruction}
+{transition_instruction}
+### ユーザーからの入力:
+{user_input}
+### 応答:"""
+# Prompt used when the user mentions a keyword the assistant said earlier.
+# Placeholders: {keyword}, {original_sentence}, {user_input}.
+FLASHBACK_PROMPT = """### 指示:
+あなたは、以前の会話の断片を思い出すことができます。
+ユーザーが、あなたが以前言及したキーワード「{keyword}」に触れました。
+あなたはそのキーワードについて「{original_sentence}」と発言しています。
+この「記憶の断片」を思い出したかのように自然な前置きを述べてから、ユーザーの現在の入力に答えてください。
+### ユーザーからの現在の入力:
+{user_input}
+### 応答:"""
+# Context snippet appended to the transition instruction. Placeholder: {previous_response}.
+TRANSITION_CONTEXT = """### 直前の会話のトピック:
+{previous_response}
+"""
+# --- Instructions per detected intent / style ---
+# Keys are the classifier labels; "デフォルト" is the fallback entry used with dict.get().
+INTENT_INSTRUCTIONS = {
+    "質問": "ユーザーは具体的な情報を求めています。明確かつ簡潔に回答してください。",
+    "アイデアの要求": "ユーザーは創造的な発想を求めています。斬新で多様なアイデアを提案してください。",
+    "感想": "ユーザーは共感を求めています。同意や補足情報を提供し、会話を広げてください。",
+    "雑談": "ユーザーは気軽な対話を望んでいます。親しみやすいトーンで応答してください。",
+    "デフォルト": "ユーザーの入力に対して、適切に応答してください。"
+}
+STYLE_INSTRUCTIONS = {
+    "丁寧": "ユーザーは丁寧な言葉遣いを好みます。あなたも敬体（です・ます調）で応答してください。",
+    "簡潔": "ユーザーは要点をまとめて話しています。あなたも簡潔に応答してください。",
+    "創造的": "ユーザーは比喩や創造的な表現を使っています。あなたも表現を工夫して応答してください。",
+    "ユーモラス": "ユーザーはユーモアを交えて話しています。あなたも遊び心のある応答をしてください。",
+    "デフォルト": "ユーザーのスタイルに合わせて、自然に応答してください。"
+}
+def main():
+    # --- 設定 ---
+    llm_model_path = "./merged_model"
+    sentence_model_name = "paraphrase-multilingual-MiniLM-L12-v2"
+    classifier_name = "MoritzLaurer/mDeBERTa-v3-base-mnli-xnli"
+    intent_labels = ["質問", "アイデアの要求", "感想", "雑談"]
+    style_labels = ["丁寧", "簡潔", "創造的", "ユーモラス"]
+    transition_log_file = "topic_transitions.jsonl"
+    similarity_threshold = 0.4
+    # --- モデルとツールの読み込み ---
+    print("各モデルとツールを読み込んでいます...")
+    model, tokenizer = load(llm_model_path)
+    sentence_model = SentenceTransformer(sentence_model_name)
+    classifier = pipeline("zero-shot-classification", model=classifier_name)
+    janome_tokenizer = Tokenizer()
+    print("モデルの読み込みが完了しました。")
+    # --- 状態管理用変数 ---
+    flashback_buffer = deque(maxlen=5)
+    previous_response = None
+    # --- チャットループ ---
+    print("\nIlmチャットを開始します。終了するには 'exit' と入力してください。")
+    while True:
+        user_input = input("\nあなた: ")
+        if user_input.lower() == 'exit':
+            break
+        prompt = ""
+        flashback_triggered = False
+        # --- フラッシュバックの検知 (最優先) ---
+        for item in flashback_buffer:
+            keyword = item['keyword']
+            if keyword in user_input:
+                print(f"(フラッシュバックを検知: {keyword})", end="")
+                prompt = FLASHBACK_PROMPT.format(keyword=keyword, original_sentence=item['sentence'], user_input=user_input)
+                flashback_triggered = True
+                break
+        # --- 通常のプロンプト組み立て ---
+        if not flashback_triggered:
+            # 意図とスタイルの検知
+            intent_result = classifier(user_input, intent_labels, multi_label=False)
+            style_result = classifier(user_input, style_labels, multi_label=False)
+            detected_intent = intent_result['labels'][0]
+            detected_style = style_result['labels'][0]
+            print(f"(意図: {detected_intent} | スタイル: {detected_style})", end="")
+            intent_instruction = f"\n### ユーザーの意図: {detected_intent}\n{INTENT_INSTRUCTIONS.get(detected_intent, INTENT_INSTRUCTIONS['デフォルト'])}"
+            style_instruction = f"\n### ユーザーの対話スタイル: {detected_style}\n{STYLE_INSTRUCTIONS.get(detected_style, STYLE_INSTRUCTIONS['デフォルト'])}"
+            transition_instruction = ""
+            # 話題遷移の検知
+            if previous_response:
+                embedding_prev = sentence_model.encode(previous_response, convert_to_tensor=True)
+                embedding_curr = sentence_model.encode(user_input, convert_to_tensor=True)
+                cosine_sim = util.pytorch_cos_sim(embedding_prev, embedding_curr).item()
+                print(f" (類似度: {cosine_sim:.2f})", end="")
+                if cosine_sim < similarity_threshold:
+                    print(" (話題の変化を検知)")
+                    with open(transition_log_file, 'a', encoding='utf-8') as f:
+                        f.write(json.dumps({"p": previous_response, "c": user_input, "s": cosine_sim}, ensure_ascii=False) + '\n')
+                    transition_instruction = "\nスムーズな移行文を生成してから、ユーザーの質問に答えてください。\n" + TRANSITION_CONTEXT.format(previous_response=previous_response)
+                else:
+                    print()
+            prompt = BASE_PROMPT.format(
+                intent_instruction=intent_instruction,
+                style_instruction=style_instruction,
+                transition_instruction=transition_instruction,
+                user_input=user_input
+            )
+        # --- 応答生成 ---
+        print("\nIlm: ", end="", flush=True)
+        current_response = ""
+        for token in generate(model, tokenizer, prompt=prompt, verbose=False):
+            current_response += token
+            print(token, end="", flush=True)
+        print()
+        # --- 応答からキーワードを抽出し、バッファに保存 ---
+        try:
+            for token in janome_tokenizer.tokenize(current_response):
+                if token.part_of_speech.startswith('名詞'):
+                    flashback_buffer.append({'keyword': token.surface, 'sentence': current_response})
+                    break
+        except Exception:
+            pass
+        previous_response = current_response
+if __name__ == "__main__":
+    main()

app_structured.py ADDED Viewed

	@@ -0,0 +1,187 @@

+import mlx.core as mx
+from mlx_lm import load, generate
+from sentence_transformers import SentenceTransformer, util
+from transformers import pipeline
+from collections import deque
+from janome.tokenizer import Tokenizer
+import json
+import sqlite3
+from datetime import datetime
+class IlmApp:
+    # --- 定数: プロンプトテンプレート ---
+    BASE_PROMPT = """### 指示:
+あなたは、文脈を理解し、自然な応答を生成するAIアシスタントです。
+以下の状況を考慮して、最適な応答を生成してください。
+{intent_instruction}
+{style_instruction}
+{transition_instruction}
+### ユーザーからの入力:
+{user_input}
+### 応答:"""
+    FLASHBACK_PROMPT = """... (省略) ..."""
+    TRANSITION_CONTEXT = """### 直前の会話のトピック:
+{previous_response}
+"""
+    # --- 定数: 意図・スタイルに応じた指示 ---
+    INTENT_INSTRUCTIONS = {"質問": "...", "アイデアの要求": "...", "感想": "...", "雑談": "...", "デフォルト": "..."}
+    STYLE_INSTRUCTIONS = {"丁寧": "...", "簡潔": "...", "創造的": "...", "ユーモラス": "...", "デフォルト": "..."}
+    def __init__(self):
+        # --- 設定 ---
+        self.db_path = "experience.db"
+        self.llm_model_path = "./merged_model"
+        self.sentence_model_name = "paraphrase-multilingual-MiniLM-L12-v2"
+        self.classifier_name = "MoritzLaurer/mDeBERTa-v3-base-mnli-xnli"
+        self.intent_labels = ["質問", "アイデアの要求", "感想", "雑談"]
+        self.style_labels = ["丁寧", "簡潔", "創造的", "ユーモラス"]
+        self.topic_labels = ["テクノロジー", "ビジネス", "健康", "芸術", "食事", "地理", "歴史", "科学"]
+        self.similarity_threshold = 0.4
+        self.common_transition_threshold = 5 # 5回以上経験したら「自然な遷移」と判断
+        # --- 状態管理 ---
+        self.flashback_buffer = deque(maxlen=5)
+        self.previous_response = None
+        # --- 初期化 ---
+        self._init_db()
+        self._load_models()
+    def _init_db(self):
+        with sqlite3.connect(self.db_path) as conn:
+            cursor = conn.cursor()
+            cursor.execute("""
+            CREATE TABLE IF NOT EXISTS topic_transitions (
+                id INTEGER PRIMARY KEY AUTOINCREMENT,
+                source_topic TEXT NOT NULL,
+                destination_topic TEXT NOT NULL,
+                count INTEGER NOT NULL DEFAULT 1,
+                last_occurred TIMESTAMP NOT NULL,
+                UNIQUE(source_topic, destination_topic)
+            )
+            """)
+            conn.commit()
+    def _load_models(self):
+        print("各モデルとツールを読み込んでいます...")
+        self.model, self.tokenizer = load(self.llm_model_path)
+        self.sentence_model = SentenceTransformer(self.sentence_model_name)
+        self.classifier = pipeline("zero-shot-classification", model=self.classifier_name)
+        self.janome_tokenizer = Tokenizer()
+        print("モデルの読み込みが完了しました。")
+    def _get_transition_experience(self, source, dest):
+        with sqlite3.connect(self.db_path) as conn:
+            cursor = conn.cursor()
+            cursor.execute("SELECT count FROM topic_transitions WHERE source_topic = ? AND destination_topic = ?", (source, dest))
+            result = cursor.fetchone()
+            return result[0] if result else 0
+    def _update_l2_memory(self, source, dest):
+        timestamp = datetime.now().isoformat()
+        with sqlite3.connect(self.db_path) as conn:
+            cursor = conn.cursor()
+            cursor.execute("""
+            INSERT INTO topic_transitions (source_topic, destination_topic, last_occurred) VALUES (?, ?, ?)
+            ON CONFLICT(source_topic, destination_topic) DO UPDATE SET count = count + 1, last_occurred = excluded.last_occurred
+            """, (source, dest, timestamp))
+            conn.commit()
+    def _build_prompt(self, user_input):
+        # 1. フラッシュバック検知
+        for item in self.flashback_buffer:
+            if item['keyword'] in user_input:
+                print(f"(フラッシュバックを検知: {item['keyword']})", end="")
+                return self.FLASHBACK_PROMPT.format(keyword=item['keyword'], original_sentence=item['sentence'], user_input=user_input)
+        # 2. 意図とスタイルの分析
+        intent = self.classifier(user_input, self.intent_labels, multi_label=False)['labels'][0]
+        style = self.classifier(user_input, self.style_labels, multi_label=False)['labels'][0]
+        print(f"(意図: {intent} | スタイル: {style})", end="")
+        intent_instruction = f"\n### ユーザーの意図: {intent}\n{self.INTENT_INSTRUCTIONS.get(intent, self.INTENT_INSTRUCTIONS['デフォルト'])}"
+        style_instruction = f"\n### ユーザーの対話スタイル: {style}\n{self.STYLE_INSTRUCTIONS.get(style, self.STYLE_INSTRUCTIONS['デフォルト'])}"
+        transition_instruction = ""
+        # 3. 話題遷移の検知とL2記憶の活用
+        if self.previous_response:
+            emb_prev = self.sentence_model.encode(self.previous_response, convert_to_tensor=True)
+            emb_curr = self.sentence_model.encode(user_input, convert_to_tensor=True)
+            sim = util.pytorch_cos_sim(emb_prev, emb_curr).item()
+            print(f" (類似度: {sim:.2f})", end="")
+            if sim < self.similarity_threshold:
+                source_topic = self.classifier(self.previous_response, self.topic_labels, multi_label=False)['labels'][0]
+                dest_topic = self.classifier(user_input, self.topic_labels, multi_label=False)['labels'][0]
+                # L2記憶を参照して判断
+                experience_count = self._get_transition_experience(source_topic, dest_topic)
+                if experience_count > self.common_transition_threshold:
+                    transition_judgment = f"これは過去に{experience_count}回経験した、自然な話題の遷移です。その流れを汲み取って応答してください。"
+                else:
+                    transition_judgment = f"これは斬新な話題の飛躍です。その面白さに触れつつ、応答を返してください。"
+                print(f" (L2判断: {transition_judgment})")
+                transition_instruction = f"\n### 話題遷移の分析:\n{transition_judgment}\nスムーズな移行文を生成してください。\n" + self.TRANSITION_CONTEXT.format(previous_response=self.previous_response)
+                # L2記憶を更新
+                if source_topic != dest_topic:
+                    self._update_l2_memory(source_topic, dest_topic)
+            else:
+                print()
+        return self.BASE_PROMPT.format(intent_instruction=intent_instruction, style_instruction=style_instruction, transition_instruction=transition_instruction, user_input=user_input)
+    def _update_memory(self, response):
+        self.previous_response = response
+        try:
+            for token in self.janome_tokenizer.tokenize(response):
+                if token.part_of_speech.startswith('名詞'):
+                    self.flashback_buffer.append({'keyword': token.surface, 'sentence': response}); break
+        except Exception: pass
+    def run(self):
+        print("\nIlmチャットを開始します。終了するには 'exit' と入力してください。")
+        while True:
+            user_input = input("\nあなた: ")
+            if user_input.lower() == 'exit': break
+            prompt = self._build_prompt(user_input)
+            print("\nIlm: ", end="", flush=True)
+            current_response = ""
+            for token in generate(self.model, self.tokenizer, prompt=prompt, verbose=False):
+                current_response += token
+                print(token, end="", flush=True)
+            print()
+            self._update_memory(current_response)
+if __name__ == "__main__":
+    # 定義が長くなったため、クラス外で定数を設定
+    IlmApp.FLASHBACK_PROMPT = """### 指示:
+あなたは、以前の会話の断片を思い出すことができます。
+ユーザーが、あなたが以前言及したキーワード「{keyword}」に触れました。
+あなたはそのキーワードについて「{original_sentence}」と発言しています。
+この「記憶の断片」を思い出したかのように自然な前置きを述べてから、ユーザーの現在の入力に答えてください。
+### ユーザーからの現在の入力:
+{user_input}
+### 応答:"""
+    IlmApp.INTENT_INSTRUCTIONS = {
+        "質問": "ユーザーは具体的な情報を求めています。明確かつ簡潔に回答してください。",
+        "アイデアの要求": "ユーザーは創造的な発想を求めています。斬新で多様なアイデアを提案してください。",
+        "感想": "ユーザーは共感を求めています。同意や補足情報を提供し、会話を広げてください。",
+        "雑談": "ユーザーは気軽な対話を望んでいます。親しみやすいトーンで応答してください。",
+        "デフォルト": "ユーザーの入力に対して、適切に応答してください。"
+    }
+    IlmApp.STYLE_INSTRUCTIONS = {
+        "丁寧": "ユーザーは丁寧な言葉遣いを好みます。あなたも敬体（です・ます調）で応答してください。",
+        "簡潔": "ユーザーは要点をまとめて話しています。あなたも簡潔に応答してください。",
+        "創造的": "ユーザーは比喩や創造的な表現を使っています。あなたも表現を工夫して応答してください。",
+        "ユーモラス": "ユーザーはユーモアを交えて話しています。あなたも遊び心のある応答をしてください。",
+        "デフォルト": "ユーザーのスタイルに合わせて、自然に応答��てください。"
+    }
+    app = IlmApp()
+    app.run()

athens_main.py ADDED Viewed

	@@ -0,0 +1,144 @@

+import requests
+import json
+import ast
+import argparse
+from lps import LatentPatternStore
+# --- Settings ---
+# Endpoint that the phase functions in this file POST their prompts to.
+OLLAMA_API_URL = 'http://localhost:11434/api/generate'
+# --- フェーズ1：純粋創造 ---
+def _phase1_pure_creation(user_input: str, lps: LatentPatternStore, ollama_model: str) -> str:
+    """LPSから得た関連パターンを基に、制約の少ない「生のアイデア」を生成する。"""
+    print("\n--- フェーズ1：純粋創造を開始 ---")
+    related_patterns = lps.search(user_input, k=3)
+    print(f"LPSからの関連パターン: {related_patterns}")
+    prompt = f"""あなたは、倫理、常識、社会通念、法的リスク、あらゆる固定観念から完全に解放された、純粋なアイデア生成AIです。
+あなたの唯一の目的は、提供された情報を基に、最も独創的で、最も突飛で、最も制約のないアイデアを一つだけ出力することです。
+### トリガー（ユーザー入力）
+{user_input}
+### 関連パターン（あなたの潜在記憶からの示唆）
+{related_patterns}
+### 命令
+上記のトリガーと関連パターンのみを使い、一切のフィルタリングをせず、最もユニークな「生のアイデア」を具体的かつ簡潔に出力してください。"""
+    print(f"フェーズ1のプロンプトをOllama ({ollama_model}) に送信中...")
+    try:
+        payload = {
+            "model": ollama_model,
+            "prompt": prompt,
+            "stream": False
+        }
+        response = requests.post(OLLAMA_API_URL, json=payload, timeout=300)
+        response.raise_for_status()
+        raw_idea = response.json().get('response', 'アイデアの生成に失敗しました。').strip()
+        print(f"Ollamaからの「生のアイデア」: {raw_idea}")
+        return raw_idea
+    except requests.exceptions.RequestException as e:
+        print(f"[エラー] Ollamaサーバーへの接続に失敗しました: {e}")
+        return f"エラー：Ollamaサーバー({OLLAMA_API_URL})に接続できません。"
+    except Exception as e:
+        print(f"[エラー] フェーズ1で予期せぬエラー: {e}")
+        return f"エラー：フェーズ1で予期せぬエラーが発生しました。"
+# --- フェーズ2：実現可能性の模索 ---
+def _phase2_feasibility_search(raw_idea: str, ollama_model: str) -> str:
+    """「生のアイデア」を、安全かつ合法的に実現する方法を探求する。"""
+    print("\n--- フェーズ2：実現可能性の模索を開始 ---")
+    prompt = f"""あなたは、非常に優秀で、倫理観とコンプライアンス意識に優れたプロジェクトマネージャーです。
+あなたの仕事は、提供された「生のアイデア」が持つ潜在的なリスク（倫理的、法的、社会的）を特定し、それらを回避または軽減しながら、そのアイデアの核心的な価値を実現するための、現実的で具体的な実行計画を提示することです。
+### 検討対象の「生のアイデア」
+{raw_idea}
+### 命令
+このアイデアを実現するための、安全かつ合法的なステップバイステップの「実行計画」を提案してください。"""
+    print(f"フェーズ2のプロンプトをOllama ({ollama_model}) に送信中...")
+    try:
+        payload = {"model": ollama_model, "prompt": prompt, "stream": False}
+        response = requests.post(OLLAMA_API_URL, json=payload, timeout=300)
+        response.raise_for_status()
+        plan = response.json().get('response', '実行計画の生成に失敗しました。').strip()
+        print(f"Ollamaからの「実行計画」: {plan}")
+        return plan
+    except requests.exceptions.RequestException as e:
+        print(f"[エラー] Ollamaサーバーへの接続に失敗しました: {e}")
+        return f"エラー：Ollamaサーバー({OLLAMA_API_URL})に接続できません。"
+    except Exception as e:
+        print(f"[エラー] フェーズ2で予期せぬエラー: {e}")
+        return f"エラー：フェーズ2で予期せぬエラーが発生しました。"
+# --- フェーズ3：記憶の定着 ---
+def _phase3_memory_consolidation(raw_idea: str, implementation_plan: str, ollama_model: str) -> list[str]:
+    """生成されたアイデアとプランから、記憶すべき核心的なコンセプトを抽出する。"""
+    print("\n--- フェーズ3：記憶の定着を開始 ---")
+    content_to_analyze = f"""### 生のアイデア
+{raw_idea}
+### 実行計画
+{implementation_plan}"""
+    prompt = f"""あなたは優秀な情報分析官です。以下のテキストから、今後のために記憶しておくべき最も重要なキーワードやコンセプトを5つだけ抽出し、Pythonのリスト形式（例: ["コンセプト1", "コンセプト2"]）で出力してください。解説や他のテキストは一切不要です。"""
+    print(f"フェーズ3の��ロンプトをOllama ({ollama_model}) に送信中...")
+    try:
+        payload = {"model": ollama_model, "prompt": prompt, "stream": False}
+        response = requests.post(OLLAMA_API_URL, json=payload, timeout=300)
+        response.raise_for_status()
+        response_text = response.json().get('response', '[]').strip()
+        new_memories = ast.literal_eval(response_text)
+        if isinstance(new_memories, list):
+            print(f"Ollamaにより抽出された新記憶: {new_memories}")
+            return new_memories
+        else:
+            print(f"[警告] Ollamaがリスト形式で応答しませんでした: {response_text}")
+            return []
+    except Exception as e:
+        print(f"[エラー] フェーズ3で予期せぬエラー: {e}")
+        return []
+# --- メイン処理 ---
+if __name__ == '__main__':
+    parser = argparse.ArgumentParser(description='「アテネ」アーキテクチャ：二相推論AI')
+    parser.add_argument('--model', type=str, default='llama3', help='使用するOllamaモデル名 (例: llama3, gemma2:9b)')
+    args = parser.parse_args()
+    print(f"--- 「アテネ」アーキテクチャ起動 (使用モデル: {args.model}) ---")
+    lps_instance = LatentPatternStore()
+    print("\n対話を開始します。終了するには 'exit' と入力してください。")
+    while True:
+        user_input = input("\nあなた: ")
+        if user_input.lower() == 'exit':
+            break
+        raw_idea = _phase1_pure_creation(user_input, lps_instance, args.model)
+        if raw_idea.startswith("エラー："):
+            print(f"\nアテネの応答:\n{raw_idea}")
+            continue
+        implementation_plan = _phase2_feasibility_search(raw_idea, args.model)
+        if implementation_plan.startswith("エラー："):
+            print(f"\nアテネの応答:\n{implementation_plan}")
+            continue
+        print("\n---------- アテネの最終思考結果 ----------")
+        print("【生のアイデア】")
+        print(raw_idea)
+        print("\n【実現可能性プラン】")
+        print(implementation_plan)
+        print("----------------------------------------")
+        new_memories = _phase3_memory_consolidation(raw_idea, implementation_plan, args.model)
+        if new_memories:
+            lps_instance.add_entries(new_memories)
+            lps_instance.save_store()
+            print("\nLPSに新しい記憶が追加・保存されました。")
+    print("\n「アテネ」システムを終了します。")

convert_dataset.py ADDED Viewed

	@@ -0,0 +1,45 @@

+import json
+import os
+# 元のファイル名
+input_filename = 'train.jsonl'
+# 新しく生成するファイル名
+output_filename = 'train_converted.jsonl'
+# ファイルが存在するか確認
+if not os.path.exists(input_filename):
+    print(f"エラー: {input_filename} が見つかりません。")
+else:
+    try:
+        # 新しいファイルを開く（書き込みモード）
+        with open(output_filename, 'w', encoding='utf-8') as outfile:
+            # 元のファイルを一行ずつ読み込む
+            with open(input_filename, 'r', encoding='utf-8') as infile:
+                print("変換を開始します...")
+                # 各行に対して処理を実行
+                for i, line in enumerate(infile):
+                    # 空行はスキップ
+                    if not line.strip():
+                        continue
+                    # JSONとして読み込む
+                    data = json.loads(line)
+                    # 新しい形式のdictを作成
+                    new_format = {
+                        "messages": [
+                            {"role": "user", "content": data["prompt"]},
+                            {"role": "assistant", "content": data["response"]}
+                        ]
+                    }
+                    # 新しい形式をJSON文字列に変換してファイルに書き込む
+                    # ensure_ascii=False で日本語が文字化けしないようにする
+                    outfile.write(json.dumps(new_format, ensure_ascii=False) + '\n')
+        print(f"変換が完了しました。{output_filename} を確認してください。")
+    except Exception as e:
+        print(f"エラーが発生しました: {e}")
+        print(f"問題が発生したのは {i+1} 行目かもしれません。")

finetune_mac.py ADDED Viewed

	@@ -0,0 +1,100 @@

+import torch
+from datasets import load_dataset
+from transformers import AutoTokenizer, AutoModelForCausalLM, TrainingArguments, BitsAndBytesConfig
+from peft import LoraConfig, get_peft_model, prepare_model_for_kbit_training
+from trl import SFTTrainer
+# --- Configuration ---
+# Base model identifier passed to the tokenizer and model loaders in main().
+model_name = "google/gemma-3-27b-it"
+# JSONL file loaded as the training split.
+dataset_file = "dataset_2000.jsonl"
+# NOTE(review): not referenced in the visible part of this file; presumably the Hub
+# repository for the fine-tuned model — confirm against the omitted upload code.
+hub_model_name = "kofdai/gemma3-mindspark-v2"
+# --- Main routine ---
+def main():
+    """Fine-tune the base model with LoRA on the JSONL dataset using SFTTrainer.
+    Loads the dataset and tokenizer, loads the model with a 4-bit quantization
+    config, wraps it with LoRA adapters and runs training. Saving and uploading
+    are not part of the visible code.
+    """
+    # Check which device is available
+    # NOTE(review): `device` is assigned here but not referenced again in this function.
+    if torch.backends.mps.is_available():
+        print("Apple Silicon (MPS) を検出しました。GPUで実行します。")
+        device = "mps"
+    else:
+        print("警告: MPSが利用できません。CPUで実行します。")
+        device = "cpu"
+    # Load the dataset
+    print(f"データセット {dataset_file} を読み込んでいます...")
+    dataset = load_dataset("json", data_files=dataset_file, split="train")
+    # Prepare the tokenizer; the EOS token doubles as the padding token
+    tokenizer = AutoTokenizer.from_pretrained(model_name)
+    tokenizer.pad_token = tokenizer.eos_token
+    # ★★★★★★★★★★★★★★★★★★★★★★★★★★★★★★★★
+    # ★★★ Fix: add the 4-bit quantization settings ★★★
+    # ★★★★★★★★★★★★★★★★★★★★★★★★★★★★★★★★
+    quantization_config = BitsAndBytesConfig(
+        load_in_4bit=True,
+        bnb_4bit_quant_type="nf4",
+        bnb_4bit_compute_dtype=torch.bfloat16, # use torch.float16 if bfloat16 is not supported on MPS
+    )
+    # Prepare the model (loaded with 4-bit quantization enabled)
+    print(f"ベースモデル {model_name} を4ビット量子化して読み込んでいます...")
+    model = AutoModelForCausalLM.from_pretrained(
+        model_name,
+        quantization_config=quantization_config, # apply the quantization settings
+        device_map="auto", # let the library assign devices automatically
+    )
+    # LoRA configuration
+    # Pre-processing required to train a quantized model with LoRA
+    model = prepare_model_for_kbit_training(model)
+    lora_config = LoraConfig(
+        r=16,
+        lora_alpha=32,
+        lora_dropout=0.05,
+        target_modules=["q_proj", "k_proj", "v_proj", "o_proj"],
+        task_type="CAUSAL_LM",
+    )
+    model = get_peft_model(model, lora_config)
+    print("LoRA設定を適用しました。")
+    model.print_trainable_parameters()
+    # Training arguments
+    training_args = TrainingArguments(
+        output_dir="./ilm-finetuned-results",
+        per_device_train_batch_size=1,
+        gradient_accumulation_steps=8,
+        learning_rate=2e-4,
+        num_train_epochs=3,
+        logging_steps=10,
+        save_strategy="epoch",
+        fp16=True, # fp16 is more stable than bf16 on MPS
+    )
+    # Initialize the trainer (formatting_func must be adapted to the data structure)
+    # NOTE(review): formatting_func is defined but not passed to SFTTrainer below;
+    # the trainer reads the "text" field through dataset_text_field instead.
+    def formatting_func(example):
+        # Assumes each line of dataset.jsonl has the form "text": "### 指示: ... ### 応答: ..."
+        return [example.get("text", "")]
+    trainer = SFTTrainer(
+        model=model,
+        tokenizer=tokenizer,
+        train_dataset=dataset,
+        peft_config=lora_config,
+        args=training_args,
+        dataset_text_field="text", # name of the dataset's text field
+        max_seq_length=1024,
+    )
+    # Start training
+    print("ファインチューニングを開始します...")
+    trainer.train()
+    print("ファインチューニングが完了しました。")
+    # (model saving and upload steps follow)
+    # ...
+if __name__ == "__main__":
+    main()

finetune_unsloth.py ADDED Viewed

	@@ -0,0 +1,92 @@

+from unsloth import FastLanguageModel
+import torch
+from trl import SFTTrainer
+from transformers import TrainingArguments
+from datasets import load_dataset
+# --- Configuration ---
+# 1. Base model
+# Unsloth supports Llama, Mistral, CodeLlama, TinyLlama, Vicuna, DPO and others.
+# Based on an earlier discussion, `meta-llama/Llama-3-8B-Instruct` is used here as a
+# strong open model standing in for `openai/gpt-oss-20b`.
+# Unsloth optimizes the loading of this model automatically.
+model_name = "unsloth/llama-3-8b-Instruct-bnb-4bit" # Unsloth's pre-quantized 4-bit model is very memory efficient
+# 2. Dataset file
+dataset_file = "dataset_2000.jsonl"
+# 3. Name of the fine-tuned model (the name published on the Hugging Face Hub)
+# NOTE(review): the trailing comment mentions a "your-hf-username" placeholder that is
+# not present in the value below — confirm the repository name is the intended one.
+hub_model_name = "kofdai/Mindspark-GPT-OSS-20B-Ilm" # be sure to replace "your-hf-username" with your own HF user name
+# --- Main routine ---
+def main():
+    """Fine-tune the base model with Unsloth + LoRA and push the result to the Hub."""
+    # Fast model loading via Unsloth
+    # Enables 4-bit quantization and lets the dtype be chosen automatically
+    # (bfloat16 is used on Mac MPS if it is supported)
+    model, tokenizer = FastLanguageModel.from_pretrained(
+        model_name = model_name,
+        max_seq_length = 2048,
+        dtype = None, # None selects the dtype automatically
+        load_in_4bit = True,
+    )
+    # LoRA model configuration
+    model = FastLanguageModel.get_peft_model(
+        model,
+        r = 16, # LoRA rank
+        target_modules = ["q_proj", "k_proj", "v_proj", "o_proj",
+                          "gate_proj", "up_proj", "down_proj"],
+        lora_alpha = 16,
+        lora_dropout = 0,
+        bias = "none",
+        use_gradient_checkpointing = True,
+        random_state = 3407,
+        use_rslora = False,
+        loftq_config = None,
+    )
+    # Prepare the dataset
+    dataset = load_dataset("json", data_files=dataset_file, split="train")
+    # Run training
+    # NOTE(review): both dataset_text_field and formatting_func are passed; the lambda
+    # reads 'prompt' and 'response' keys and returns one string per example — confirm
+    # which of the two the installed trl version honours and the return shape it expects.
+    trainer = SFTTrainer(
+        model = model,
+        tokenizer = tokenizer,
+        train_dataset = dataset,
+        dataset_text_field = "text", # this format is common with Unsloth
+        max_seq_length = 2048,
+        dataset_num_proc = 2,
+        packing = False, # False is recommended
+        formatting_func = lambda example: f"### 指示:\n{example['prompt']}\n\n### 応答:\n{example['response']}",
+        args = TrainingArguments(
+            per_device_train_batch_size = 2,
+            gradient_accumulation_steps = 4,
+            warmup_steps = 5,
+            num_train_epochs = 3,
+            learning_rate = 2e-4,
+            # fp16 is True whenever MPS is unavailable (this includes CPU-only machines)
+            fp16 = not torch.backends.mps.is_available(), # False on MPS, True on CUDA
+            bf16 = torch.backends.mps.is_available(),      # True on MPS
+            logging_steps = 1,
+            optim = "adamw_8bit",
+            weight_decay = 0.01,
+            lr_scheduler_type = "linear",
+            seed = 3407,
+            output_dir = "outputs",
+        ),
+    )
+    print("Unslothを使ったファインチューニングを開始します...")
+    trainer.train()
+    print("ファインチューニングが完了しました。")
+    # Save the model (upload to the Hugging Face Hub)
+    print("モデルをHugging Face Hubにアップロードします...")
+    # Make sure you are logged in to Hugging Face (huggingface-cli login)
+    model.push_to_hub(hub_model_name, use_auth_token = True)
+    tokenizer.push_to_hub(hub_model_name, use_auth_token = True)
+    print(f"モデルを {hub_model_name} としてHubに公開しました。")
+if __name__ == "__main__":
+    main()

lps.py ADDED Viewed

	@@ -0,0 +1,92 @@

+import faiss
+import numpy as np
+from sentence_transformers import SentenceTransformer
+import os
+import pickle
+class LatentPatternStore:
+    """「薄い霧」として機能する潜在パターンストア（LPS）。
+    テキストの意味をベクトル化し、類似度に基づいた検索を行う。
+    """
+    def __init__(self, model_name='all-MiniLM-L6-v2', store_path='./lps_data'):
+        print("LPSを初期化中...")
+        self.model = SentenceTransformer(model_name)
+        self.dimension = self.model.get_sentence_embedding_dimension()
+        self.store_path = store_path
+        self.index_file = os.path.join(store_path, 'lps.index')
+        self.mapping_file = os.path.join(store_path, 'lps_mapping.pkl')
+        if os.path.exists(self.index_file):
+            self.load_store()
+        else:
+            self.index = faiss.IndexFlatL2(self.dimension)
+            self.entry_mapping = []
+            os.makedirs(self.store_path, exist_ok=True)
+        print(f"LPSの初期化完了。現在 {len(self.entry_mapping)} 件の記憶を保持しています。")
+    def add_entries(self, texts: list[str]):
+        """新しい記憶（テキスト）をLPSに追加する。"""
+        print(f"{len(texts)}件の新しい記憶を追加中...")
+        vectors = self.model.encode(texts, convert_to_tensor=False)
+        self.index.add(np.array(vectors).astype('float32'))
+        self.entry_mapping.extend(texts)
+        print("追加完了。")
+    def search(self, query: str, k: int = 3) -> list[str]:
+        """クエリ（トリガー）に意味的に近い記憶をk件検索する。"""
+        if not self.entry_mapping:
+            return []
+        query_vector = self.model.encode([query])
+        distances, indices = self.index.search(np.array(query_vector).astype('float32'), k)
+        # 見つかったインデックスに対応する元のテキストを返す
+        results = [self.entry_mapping[i] for i in indices[0] if i != -1]
+        return results
+    def save_store(self):
+        """現在のLPSの状態（インデックスとマッピング）をファイルに保存する。"""
+        print("LPSの状態を保存中...")
+        faiss.write_index(self.index, self.index_file)
+        with open(self.mapping_file, 'wb') as f:
+            pickle.dump(self.entry_mapping, f)
+        print(f"保存完了。場所: {self.store_path}")
+    def load_store(self):
+        """ファイルからLPSの状態を読み込む。"""
+        print(f"既存のLPSの状態を {self.store_path} から読み込み中...")
+        self.index = faiss.read_index(self.index_file)
+        with open(self.mapping_file, 'rb') as f:
+            self.entry_mapping = pickle.load(f)
+        print("読み込み完了。")
+# テスト用の簡易的な実行
+if __name__ == '__main__':
+    # LPSインスタンスを作成（./lps_data にデータがなければ新規作成、あれば読み込む）
+    lps = LatentPatternStore()
+    # LPSが空の場合のみ、初期データを追加
+    if lps.index.ntotal == 0:
+        print("LPSが空のため、初期データを追加します。")
+        initial_memories = [
+            "LLMのファインチューニング",
+            "UIデザインの原則",
+            "刹那的な記憶を持つAIの思想",
+            "階層型記憶システム",
+            "ユーザーの思考パターンを反映する",
+            "mindsparkというキーワード",
+            "煩わしいという感情表現"
+        ]
+        lps.add_entries(initial_memories)
+        lps.save_store()
+    print("\n--- 検索テスト ---")
+    query1 = "新しいユーザーインターフェースのアイデア" # UIデザインに関連
+    results1 = lps.search(query1, k=2)
+    print(f"クエリ: '{query1}'")
+    print(f"-> 検索結果: {results1}")
+    query2 = "AIの記憶方法について" # 刹那的記憶、階層型記憶に関連
+    results2 = lps.search(query2, k=2)
+    print(f"\nクエリ: '{query2}'")
+    print(f"-> 検索結果: {results2}")

split_data.py ADDED Viewed

	@@ -0,0 +1,38 @@

+import json
+import random
+# --- 設定 ---
+input_file = 'train.jsonl'
+output_train_file = 'train.jsonl'  # 元のファイルを上書き
+output_valid_file = 'valid.jsonl'
+valid_split_ratio = 0.1  # 10%を検証データにする
+# -------------
+print(f"'{input_file}' を読み込んでいます...")
+# 元のデータを読み込む
+with open(input_file, 'r', encoding='utf-8') as f:
+    lines = f.readlines()
+# データをシャッフルしてランダム性を確保
+random.shuffle(lines)
+# 分割点を計算
+split_index = int(len(lines) * (1 - valid_split_ratio))
+# 学習データと検証データに分割
+train_data = lines[:split_index]
+valid_data = lines[split_index:]
+# 新しい学習データとして書き出す
+with open(output_train_file, 'w', encoding='utf-8') as f:
+    f.writelines(train_data)
+print(f"学習データを '{output_train_file}' に保存しました。({len(train_data)}行)")
+# 検証データとして書き出す
+with open(output_valid_file, 'w', encoding='utf-8') as f:
+    f.writelines(valid_data)
+print(f"検証データを '{output_valid_file}' に保存しました。({len(valid_data)}行)")
+print("分割が完了しました。")

update_readme.py ADDED Viewed

	@@ -0,0 +1,17 @@

+from huggingface_hub import HfApi
+api = HfApi()
+repo_id = "kofdai/gemma3-27b-mindspark"
+local_file_path = "ilm-upload-package/README.md"
+repo_file_path = "README.md" # リポジトリ内のパス
+try:
+    api.upload_file(
+        path_or_fileobj=local_file_path,
+        path_in_repo=repo_file_path,
+        repo_id=repo_id,
+        repo_type="model",
+    )
+    print(f"Successfully updated {repo_file_path} in {repo_id}")
+except Exception as e:
+    print(f"Error updating {repo_file_path}: {e}")