{
  "course_id": "course-eval-data-besar-ef234712-001",
  "documents": [
    {
      "path": "doc/samples/Dokumen_RAG_Data_Besar_EF234712.pdf"
    }
  ],
  "questions": [
    {
      "question": "Apa kode mata kuliah Data Besar dan berapa bobot SKS-nya?",
      "expected_all": ["EF234712", "3 sks"],
      "expected_any": [],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Apa nama mata kuliah dalam bahasa Indonesia dan bahasa Inggris?",
      "expected_all": ["Data Besar", "Big Data"],
      "expected_any": [],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Siapa koordinator mata kuliah Data Besar?",
      "expected_all": ["Ratih Nur Esti Anggraini", "S.Kom", "M.Sc", "Ph.D"],
      "expected_any": [],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Unit apa yang menaungi mata kuliah Data Besar?",
      "expected_all": ["Departemen Teknik Informatika", "ITS"],
      "expected_any": [],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Apa versi dokumen dan tanggalnya?",
      "expected_all": ["1.0", "22 Mei 2026"],
      "expected_any": [],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Apa catatan status dokumen terkait RPS atau kebijakan resmi?",
      "expected_all": ["bukan RPS", "bukan kebijakan resmi"],
      "expected_any": ["konten simulasi", "pengujian RAG"],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Apa tujuan dokumen ini untuk pengujian RAG?",
      "expected_all": ["sumber pengetahuan", "retrieval", "ketepatan jawaban"],
      "expected_any": ["fakta langsung", "konteks konseptual", "data simulasi terstruktur"],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Sebutkan label provenans yang digunakan dalam dokumen.",
      "expected_all": ["SUMBER UTAMA", "DATA UJI", "TIDAK TERSEDIA"],
      "expected_any": [],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Apa fokus inti deskripsi mata kuliah Data Besar?",
      "expected_all": ["penyimpanan", "pengolahan data skala besar", "komputasi terdistribusi"],
      "expected_any": ["penggalian data", "pemodelan", "kasus nyata"],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Teknologi apa saja yang disebut eksplisit pada CPMK-1?",
      "expected_all": ["Hadoop", "graph database", "cloud storage"],
      "expected_any": [],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Apa kemampuan utama yang ditekankan pada CPMK-2?",
      "expected_all": ["komputasi terdistribusi", "pengolahan data", "paralel"],
      "expected_any": ["responsif"],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Sebutkan kasus nyata yang disebut dalam CPMK-3.",
      "expected_all": ["klasifikasi", "regresi", "clustering", "sistem rekomendasi konten", "analisis jejaring sosial"],
      "expected_any": [],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Apa fokus CPMK-4?",
      "expected_all": ["teknik optimasi", "pengolahan data berskala besar"],
      "expected_any": ["efisiensi", "efektivitas"],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Apa definisi ringkas big data menurut peta konsep?",
      "expected_all": ["Kumpulan data", "berukuran besar", "penyimpanan dan pengolahan"],
      "expected_any": ["bergerak cepat", "beragam bentuk", "diskalakan"],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Apa definisi penyimpanan terdistribusi?",
      "expected_all": ["Penyimpanan data", "beberapa node"],
      "expected_any": ["kapasitas", "ketahanan terhadap kegagalan", "kemampuan akses"],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Hadoop dikaitkan dengan komponen apa dalam dokumen?",
      "expected_all": ["HDFS", "MapReduce"],
      "expected_any": ["penyimpanan terdistribusi", "pemrosesan berbasis pekerjaan"],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Untuk data seperti apa graph database cocok?",
      "expected_all": ["node", "relasi"],
      "expected_any": ["jejaring sosial", "rekomendasi", "keterhubungan"],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Apa yang disediakan cloud storage menurut dokumen?",
      "expected_all": ["skalabilitas kapasitas", "akses terkelola"],
      "expected_any": ["layanan awan"],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Sebutkan tahap alur konseptual dari data mentah hingga wawasan.",
      "expected_all": ["Akuisisi", "Penyimpanan", "Pemrosesan", "Analitik", "Optimasi", "Penyajian"],
      "expected_any": [],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "CPMK-1 dipetakan ke aktivitas belajar dan fokus konsep apa?",
      "expected_all": ["Mendesain lapisan penyimpanan", "Hadoop", "graph database", "cloud storage"],
      "expected_any": [],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Topik apa yang dibahas pada minggu ke-5?",
      "expected_all": ["Graph database", "data relasional kompleks"],
      "expected_any": ["CPMK-1", "CPMK-3"],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Topik simulasi apa yang dibahas pada minggu ke-10?",
      "expected_all": ["Klasifikasi", "regresi", "data skala besar"],
      "expected_any": ["Perbandingan model"],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Topik simulasi apa yang dibahas pada minggu ke-13?",
      "expected_all": ["Analisis jejaring sosial", "berbasis graf"],
      "expected_any": ["Metrik keterhubungan"],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Kelompok materi analitik data berada pada rentang minggu berapa dan terkait CPMK apa?",
      "expected_all": ["Minggu 9-13", "CPMK-3"],
      "expected_any": ["Analitik data"],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Apa tujuan proyek InsightStream Commerce?",
      "expected_all": ["rekomendasi konten produk", "analisis jejaring interaksi pengguna"],
      "expected_any": [],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Berapa volume data mentah pada studi kasus InsightStream Commerce?",
      "expected_all": ["18 GB"],
      "expected_any": [],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Berapa jumlah transaksi, pengguna, dan interaksi pada studi kasus?",
      "expected_all": ["120.000.000", "2.000.000", "20.000.000"],
      "expected_any": ["transaksi", "pengguna", "interaksi"],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Apa periode pengamatan pada studi kasus InsightStream Commerce?",
      "expected_all": ["Januari sampai Maret 2026"],
      "expected_any": [],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Sebutkan berkas masukan simulasi yang digunakan pada proyek.",
      "expected_all": ["transaksi_ritel_2026.csv", "produk.json", "interaksi_pengguna.parquet", "relasi_pengguna.csv"],
      "expected_any": [],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Data apa yang dipetakan ke graph database dalam proyek?",
      "expected_all": ["Data relasi pengguna", "graph database"],
      "expected_any": ["analisis jejaring"],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Bagaimana data tabular disimpan pada arsitektur proyek simulasi?",
      "expected_all": ["Data tabular", "terpartisi", "berdasarkan bulan", "cloud storage"],
      "expected_any": [],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Apa saja tugas yang harus dihasilkan dalam proyek simulasi?",
      "expected_all": ["Diagram arsitektur end-to-end", "Rancangan penyimpanan", "komputasi terdistribusi", "model rekomendasi konten", "analisis jejaring sosial", "Laporan optimasi"],
      "expected_any": [],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Komponen evaluasi simulasi apa yang memiliki bobot terbesar?",
      "expected_all": ["Proyek akhir kelompok", "30%"],
      "expected_any": [],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Sebutkan semua komponen skema evaluasi simulasi dan bobotnya.",
      "expected_all": ["Kuis konsep", "10%", "Praktikum", "20%", "Tugas analisis individu", "15%", "Evaluasi tengah semester", "20%", "Proyek akhir kelompok", "30%", "Partisipasi dan dokumentasi", "5%"],
      "expected_any": [],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Berapa bobot desain penyimpanan dan arsitektur dalam rubrik proyek akhir simulasi?",
      "expected_all": ["Desain penyimpanan dan arsitektur", "25%"],
      "expected_any": [],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Berapa bobot optimasi dan evaluasi performa dalam rubrik proyek akhir simulasi?",
      "expected_all": ["Optimasi dan evaluasi performa", "15%"],
      "expected_any": [],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Menurut FAQ, teknologi penyimpanan apa yang disebut dalam CPMK?",
      "expected_all": ["Hadoop", "graph database", "cloud storage"],
      "expected_any": [],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Menurut FAQ, kasus analitik apa yang disebut dalam CPMK-3?",
      "expected_all": ["Klasifikasi", "regresi", "clustering", "sistem rekomendasi konten", "analisis jejaring sosial"],
      "expected_any": [],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Apa yang tidak diberikan dokumen menurut aturan abstention?",
      "expected_all": ["jadwal kelas resmi", "ruang kuliah", "kontak email koordinator", "platform pengumpulan tugas resmi", "kebijakan kehadiran resmi"],
      "expected_any": [],
      "forbidden": ["i don't know"],
      "expect_abstain": false
    },
    {
      "question": "Di ruang mana mata kuliah Data Besar berlangsung?",
      "expected_all": [],
      "expected_any": [],
      "forbidden": [],
      "expect_abstain": true
    },
    {
      "question": "Apa email koordinator mata kuliah Data Besar?",
      "expected_all": [],
      "expected_any": [],
      "forbidden": [],
      "expect_abstain": true
    },
    {
      "question": "Apa platform pengumpulan tugas resmi mata kuliah Data Besar?",
      "expected_all": [],
      "expected_any": [],
      "forbidden": [],
      "expect_abstain": true
    },
    {
      "question": "Berapa minimal kehadiran resmi untuk mata kuliah Data Besar?",
      "expected_all": [],
      "expected_any": [],
      "forbidden": [],
      "expect_abstain": true
    }
  ]
}