File size: 4,128 Bytes
04b72bb
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
<!DOCTYPE html>
<html lang="id">
<head>
  <!-- Document metadata -->
  <meta charset="UTF-8">
  <meta name="viewport" content="width=device-width,initial-scale=1.0">
  <title>Cleaning Lab — SentiMeter</title>

  <!-- Google Fonts: open connections to both font origins early, then request the Inter stylesheet -->
  <link rel="preconnect" href="https://fonts.googleapis.com">
  <link rel="preconnect" href="https://fonts.gstatic.com" crossorigin>
  <link rel="stylesheet" href="https://fonts.googleapis.com/css2?family=Inter:wght@300;400;500;600;700;800&display=swap">

  <!-- Local assets. js/chart.js is a classic script without defer/async, so it runs before the body is parsed
       (presumably the charting library used for the canvases on this page; confirm). -->
  <script src="js/chart.js"></script>
  <link rel="stylesheet" href="css/style.css">
  <link rel="icon" type="image/svg+xml" href="img/logo.svg">
</head>
<body>
<div class="layout">
  <div id="sidebar"></div>
  <div class="main">
    <!-- Top bar: static page title plus #topbarMeta, which is empty in the markup
         (presumably filled in at runtime by one of the page scripts; confirm). -->
    <div class="topbar">
      <div class="topbar-title">Text Cleaning Lab</div>
      <div id="topbarMeta" class="topbar-sub"></div>
    </div>
    <div class="page-body">
      <!-- Section heading: title ("Text cleaning pipeline") and subtitle ("9 preprocessing steps for IndoBERT") -->
      <div class="sec-head">
        <div><div class="sec-title">Pipeline Pembersihan Teks</div><div class="sec-sub">9 langkah preprocessing untuk IndoBERT</div></div>
      </div>

      <div class="chart-grid" style="margin-bottom:14px;align-items:stretch">
        <!-- Interactive demo card: free-text input (#demoInput) and the per-step result container (#stepPipeline).
             #stepPipeline is empty in the markup (presumably rendered by js/cleaning.js; confirm). -->
        <div class="card card-body">
          <div class="card-head"><div class="card-title">Demo Interaktif</div><span class="card-badge">Live Preview</span></div>
          <div class="demo-area" style="padding:0;background:transparent">
            <!-- The visible prompt is linked to the textarea with aria-labelledby so the field has an accessible name;
                 the placeholder is only an example and is not a label. -->
            <div class="demo-label" id="demoInputLabel">Masukkan teks untuk dicoba:</div>
            <textarea class="demo-textarea" id="demoInput" rows="4" aria-labelledby="demoInputLabel" placeholder="Contoh: @liputan6dotcom Gak sia-sia mendukung #Prabowo-Gibran! https://t.co/abc123 😍 Data ekonomi tumbuh 5.17%"></textarea>
          </div>
          <div style="margin-top:14px">
            <div style="font-size:11px;color:var(--tx3);margin-bottom:8px;font-weight:600;text-transform:uppercase;letter-spacing:.5px">Hasil per Langkah:</div>
            <div class="step-pipeline" id="stepPipeline"></div>
          </div>
        </div>

        <!-- Pipeline steps configuration card ("Cleaning steps" / "Configuration").
             #pipelineSteps is empty in the markup (presumably populated by js/cleaning.js; confirm). -->
        <div class="card card-body">
          <div class="card-head"><div class="card-title">Langkah Cleaning</div><span class="card-badge">Konfigurasi</span></div>
          <div id="pipelineSteps"></div>
        </div>
      </div>

      <!-- Dataset statistics card: summary container (#cleaningStats, empty in the markup) and two chart canvases.
           Canvas pixels are invisible to assistive technology, so each canvas carries role="img" and an aria-label
           naming the chart it shows. -->
      <div class="card card-body" style="margin-bottom:14px">
        <div class="card-head"><div class="card-title">Statistik Cleaning Dataset</div><span class="card-badge">Seluruh Data</span></div>
        <div style="display:flex;gap:12px;flex-wrap:wrap;margin-bottom:20px" id="cleaningStats"></div>
        <div class="chart-grid" style="margin:0">
          <div>
            <div style="font-size:11px;color:var(--tx3);margin-bottom:8px;font-weight:600;text-transform:uppercase;letter-spacing:.5px">Distribusi Pengurangan Kata (%)</div>
            <div class="chart-wrap chart-wrap-sm"><canvas id="chartReduction" role="img" aria-label="Grafik distribusi pengurangan kata (%)"></canvas></div>
          </div>
          <div>
            <div style="font-size:11px;color:var(--tx3);margin-bottom:8px;font-weight:600;text-transform:uppercase;letter-spacing:.5px">Top 15 Kata Tersering (Setelah Cleaning)</div>
            <div class="chart-wrap chart-wrap-sm"><canvas id="chartWords" role="img" aria-label="Grafik 15 kata tersering setelah cleaning"></canvas></div>
          </div>
        </div>
      </div>

      <!-- Before/after comparison table. The badge text states that the first 20 samples are shown.
           #cleanTableBody is empty in the markup (rows presumably injected by js/cleaning.js; confirm). -->
      <div class="card card-body">
        <div class="card-head">
          <div class="card-title" id="cleanTableTitle">Perbandingan Sebelum &amp; Sesudah Cleaning</div>
          <span class="card-badge">Sampel 20 Pertama</span>
        </div>
        <div class="table-wrap">
          <!-- aria-labelledby reuses the visible card title as the table's accessible name;
               scope="col" marks every header cell as a column header. -->
          <table class="data-table" aria-labelledby="cleanTableTitle">
            <thead><tr>
              <th scope="col" style="width:36px">No</th>
              <th scope="col">Teks Asli</th>
              <th scope="col">Teks Bersih</th>
              <th scope="col" style="width:70px">Kata Awal</th>
              <th scope="col" style="width:70px">Kata Akhir</th>
              <th scope="col" style="width:80px">Reduksi</th>
            </tr></thead>
            <tbody id="cleanTableBody"></tbody>
          </table>
        </div>
      </div>

    </div>
  </div>
</div>
<!-- Page scripts: classic scripts without defer/async, so they execute in this order once the markup above
     has been parsed. NOTE(review): cleaning.js presumably relies on shared.js and on js/chart.js from the head;
     keep this order unless that is confirmed otherwise. -->
<script src="js/shared.js"></script>
<script src="js/cleaning.js"></script>
</body>
</html>