HyukII
/

text-emotion-model

@@ -1,186 +0,0 @@
-{
-  "cells": [
-    {
-      "cell_type": "code",
-      "execution_count": 1,
-      "metadata": {
-        "id": "HtXIxG2kUpgO"
-      },
-      "outputs": [
-        {
-          "name": "stderr",
-          "output_type": "stream",
-          "text": [
-            "/home/2021111971/.conda/envs/gpu_env/lib/python3.11/site-packages/tqdm/auto.py:21: TqdmWarning: IProgress not found. Please update jupyter and ipywidgets. See https://ipywidgets.readthedocs.io/en/stable/user_install.html\n",
-            "  from .autonotebook import tqdm as notebook_tqdm\n",
-            "2025-08-17 15:05:50.559882: E external/local_xla/xla/stream_executor/cuda/cuda_fft.cc:467] Unable to register cuFFT factory: Attempting to register factory for plugin cuFFT when one has already been registered\n",
-            "WARNING: All log messages before absl::InitializeLog() is called are written to STDERR\n",
-            "E0000 00:00:1755410750.582529   76530 cuda_dnn.cc:8579] Unable to register cuDNN factory: Attempting to register factory for plugin cuDNN when one has already been registered\n",
-            "E0000 00:00:1755410750.589567   76530 cuda_blas.cc:1407] Unable to register cuBLAS factory: Attempting to register factory for plugin cuBLAS when one has already been registered\n",
-            "W0000 00:00:1755410750.608699   76530 computation_placer.cc:177] computation placer already registered. Please check linkage and avoid linking the same target more than once.\n",
-            "W0000 00:00:1755410750.608723   76530 computation_placer.cc:177] computation placer already registered. Please check linkage and avoid linking the same target more than once.\n",
-            "W0000 00:00:1755410750.608726   76530 computation_placer.cc:177] computation placer already registered. Please check linkage and avoid linking the same target more than once.\n",
-            "W0000 00:00:1755410750.608728   76530 computation_placer.cc:177] computation placer already registered. Please check linkage and avoid linking the same target more than once.\n",
-            "2025-08-17 15:05:50.614673: I tensorflow/core/platform/cpu_feature_guard.cc:210] This TensorFlow binary is optimized to use available CPU instructions in performance-critical operations.\n",
-            "To enable the following instructions: AVX2 FMA, in other operations, rebuild TensorFlow with the appropriate compiler flags.\n"
-          ]
-        },
-        {
-          "name": "stdout",
-          "output_type": "stream",
-          "text": [
-            "cuda\n"
-          ]
-        }
-      ],
-      "source": [
-        "from transformers import AutoTokenizer, AutoModelForSequenceClassification\n",
-        "import torch, json, os\n",
-        "import torch.nn.functional as F\n",
-        "import re\n",
-        "\n",
-        "\n",
-        "# Directory holding the fine-tuned model, the tokenizer files and label_map.json.\n",
-        "# Set the EMOTION_MODEL_DIR environment variable to point somewhere else;\n",
-        "# when it is unset (or empty) the original location below is used.\n",
-        "LOAD_DIR = os.environ.get(\"EMOTION_MODEL_DIR\") or \"/home/2021111971/todai/model2/final_model\"\n",
-        "\n",
-        "try:\n",
-        "    tok = AutoTokenizer.from_pretrained(LOAD_DIR)\n",
-        "    model = AutoModelForSequenceClassification.from_pretrained(LOAD_DIR).eval()\n",
-        "except Exception as e:\n",
-        "    # Print a hint about the path, then re-raise so the original traceback is kept.\n",
-        "    print(f\"Error loading model or tokenizer from {LOAD_DIR}: {e}\")\n",
-        "    print(\"Please ensure the path is correct and the directory contains the necessary model files.\")\n",
-        "    raise\n",
-        "\n",
-        "\n",
-        "# Use the GPU when torch reports one, otherwise fall back to the CPU.\n",
-        "device = \"cuda\" if torch.cuda.is_available() else \"cpu\"\n",
-        "print(device)\n",
-        "model.to(device)\n",
-        "\n",
-        "# JSON object keys are strings, so the class ids are cast back to int here.\n",
-        "with open(os.path.join(LOAD_DIR, \"label_map.json\"), \"r\", encoding=\"utf-8\") as f:\n",
-        "    lm = json.load(f)\n",
-        "id2label = {int(k): v for k, v in lm[\"id2label\"].items()}\n",
-        "num_labels = len(id2label)"
-      ]
-    },
-    {
-      "cell_type": "code",
-      "execution_count": 2,
-      "metadata": {
-        "id": "VE8FmoqOUq3p"
-      },
-      "outputs": [],
-      "source": [
-        "\n",
-        "# ==== 2) Single-text prediction ====\n",
-        "def predict_emotion_and_print(text, max_len=256):\n",
-        "    \"\"\"Print the probability of every emotion label for a single text.\n",
-        "\n",
-        "    The text is tokenized (truncated to max_len tokens), run through the model\n",
-        "    without gradient tracking, and the softmax of the logits is printed as\n",
-        "    percentages, highest first. Nothing is returned.\n",
-        "    \"\"\"\n",
-        "    with torch.no_grad():\n",
-        "        batch = tok(text, truncation=True, padding=True, max_length=max_len, return_tensors=\"pt\").to(device)\n",
-        "        logits = model(**batch).logits\n",
-        "        # Only the first row of the output is used.\n",
-        "        probs = F.softmax(logits, dim=-1).cpu().numpy()[0]\n",
-        "\n",
-        "    pct_by_label = {}\n",
-        "    for idx in range(num_labels):\n",
-        "        pct_by_label[id2label[idx]] = float(probs[idx] * 100)\n",
-        "    ranked = sorted(pct_by_label.items(), key=lambda item: -item[1])\n",
-        "\n",
-        "    print(\"=== 감정 분석 결과 ===\")\n",
-        "    for label, pct in ranked:\n",
-        "        print(f\"{label:<5} : {pct:.2f}%\")\n",
-        "    print(\"======================\")\n"
-      ]
-    },
-    {
-      "cell_type": "code",
-      "execution_count": 3,
-      "metadata": {
-        "id": "-O-jiHwiUvFx"
-      },
-      "outputs": [],
-      "source": [
-        "# ==== 3) Diary (multiple sentences) -> per-sentence aggregation ====\n",
-        "# (predict each sentence, then turn the per-label counts into percentages)\n",
-        "def split_sents(text):\n",
-        "    \"\"\"Split text into non-empty, whitespace-stripped sentences.\n",
-        "\n",
-        "    A sentence ends at a period, question mark, exclamation mark or newline;\n",
-        "    the delimiters themselves are dropped.\n",
-        "    \"\"\"\n",
-        "    stripped = (piece.strip() for piece in re.split(r'[.?!\\n]', text))\n",
-        "    return [piece for piece in stripped if piece]\n",
-        "\n",
-        "def analyze_diary_percent(diary_text, max_len=256, return_details=False):\n",
-        "    \"\"\"Classify each sentence of a diary and report the share of sentences per emotion.\n",
-        "\n",
-        "    The text is split with split_sents, every sentence is classified on its own\n",
-        "    (argmax over the logits), and a label's percentage is the number of sentences\n",
-        "    assigned to it divided by the number of sentences. The report is printed.\n",
-        "\n",
-        "    Args:\n",
-        "        diary_text: Diary text; may contain several sentences.\n",
-        "        max_len: Maximum token length passed to the tokenizer (longer input is truncated).\n",
-        "        return_details: When True, also return the per-sentence predictions.\n",
-        "\n",
-        "    Returns:\n",
-        "        A dict mapping each label to its percentage (rounded to 2 decimals).\n",
-        "        With return_details=True, a tuple (percentages, details) where details is\n",
-        "        a list of (sentence, label) pairs. When the text contains no sentence the\n",
-        "        dict (and the list) are empty.\n",
-        "    \"\"\"\n",
-        "    sents = split_sents(diary_text)\n",
-        "    if not sents:\n",
-        "        print(\"문장이 없습니다.\")\n",
-        "        return ({}, []) if return_details else {}\n",
-        "\n",
-        "    counts = {id2label[i]: 0 for i in range(num_labels)}\n",
-        "    details = []\n",
-        "\n",
-        "    with torch.no_grad():\n",
-        "        for s in sents:\n",
-        "            enc = tok(s, truncation=True, padding=True, max_length=max_len, return_tensors=\"pt\").to(device)\n",
-        "            logits = model(**enc).logits\n",
-        "            pred = int(logits.argmax(-1).cpu().numpy()[0])\n",
-        "            lab = id2label[pred]\n",
-        "            counts[lab] += 1\n",
-        "            if return_details:\n",
-        "                details.append((s, lab))\n",
-        "\n",
-        "    # sents is non-empty and every sentence adds one count, so total >= 1 here.\n",
-        "    total = sum(counts.values())\n",
-        "    # Iterate in id2label order so that labels with equal percentages keep that order when sorted.\n",
-        "    perc = {lab: round((counts.get(lab, 0) / total) * 100, 2) for lab in id2label.values()}\n",
-        "\n",
-        "    print(\"=== 텍스트 기반 감정 분석 ===\")\n",
-        "    for lab, pct in sorted(perc.items(), key=lambda x: -x[1]):\n",
-        "        print(f\"{lab:<5}: {pct:5.2f}% \")\n",
-        "    print(\"============================\")\n",
-        "\n",
-        "    # Previously the computed results were discarded; hand them back to the caller.\n",
-        "    if return_details:\n",
-        "        return perc, details\n",
-        "    return perc\n",
-        "\n"
-      ]
-    },
-    {
-      "cell_type": "code",
-      "execution_count": 4,
-      "metadata": {
-        "colab": {
-          "base_uri": "https://localhost:8080/"
-        },
-        "id": "dXzmKSI2UjOu",
-        "outputId": "02d6ce57-ce23-489a-f1ca-0a052ceb2dee"
-      },
-      "outputs": [
-        {
-          "name": "stdout",
-          "output_type": "stream",
-          "text": [
-            "=== 텍스트 기반 감정 분석 ===\n",
-            "기쁨   : 66.67% \n",
-            "슬픔   : 33.33% \n",
-            "당황   :  0.00% \n",
-            "분노   :  0.00% \n",
-            "불안   :  0.00% \n",
-            "상처   :  0.00% \n",
-            "============================\n"
-          ]
-        }
-      ],
-      "source": [
-        "# Sample diary entry: one sentence per line, with a leading and a trailing newline.\n",
-        "# NOTE(review): \"쇠사\" below looks like a typo for \"퇴사\"; left unchanged because the text is model input.\n",
-        "diary_text = (\n",
-        "    \"\\n\"\n",
-        "    \"아침에 프로젝트 승인 소식을 듣고 너무 기뻤다.\\n\"\n",
-        "    \"하지만 오후에는 친한 동료가 쇠사를 고민한다는 말을 듣고 마음이 먹먹해졌다.\\n\"\n",
-        "    \"퇴근길 노을을 보며 오늘 하루를 감사한 마음으로 마무리했다.\\n\"\n",
-        ")\n",
-        "\n",
-        "# The report is printed by the function; the trailing semicolon keeps the cell from echoing a return value.\n",
-        "analyze_diary_percent(diary_text);\n"
-      ]
-    }
-  ],
-  "metadata": {
-    "colab": {
-      "provenance": []
-    },
-    "kernelspec": {
-      "display_name": "gpu_env",
-      "language": "python",
-      "name": "python3"
-    },
-    "language_info": {
-      "codemirror_mode": {
-        "name": "ipython",
-        "version": 3
-      },
-      "file_extension": ".py",
-      "mimetype": "text/x-python",
-      "name": "python",
-      "nbconvert_exporter": "python",
-      "pygments_lexer": "ipython3",
-      "version": "3.11.13"
-    }
-  },
-  "nbformat": 4,
-  "nbformat_minor": 0
-}