Spaces:

Saurabh502
/

LLM_Quiz_Beg

Running

App Files Community

Saurabh502 committed on Mar 24, 2025

Commit

36bd29a

verified ·

1 Parent(s): 04c01c9

Update index.html

Browse files

Files changed (1) hide show

index.html +240 -86

index.html CHANGED Viewed

@@ -20,173 +20,212 @@
         justify-content: center;
         align-items: center;
         min-height: 100vh;
-        background-image: url('quiz-background.jpg'); /* Replace with your image */
         background-size: cover;
         background-position: center;
       }
       #root {
-        background-color: rgba(255, 255, 255, 0.95); /* Slightly transparent white */
         padding: 30px;
         border-radius: 12px;
-        box-shadow: 0 8px 20px rgba(0, 0, 0, 0.1); /* Softer shadow */
-        width: 80%; /* Slightly wider */
-        max-width: 800px; /* Maximum width for larger screens */
         text-align: center;
-        box-sizing: border-box; /* Include padding in width */
       }
       h1 {
         font-size: 2rem;
         margin-bottom: 20px;
-        color: #3498db; /* A brighter, more modern blue */
-        font-weight: 600; /* Semi-bold for headings */
       }
       p {
         font-size: 1.1rem;
-        margin-bottom: 25px; /* Increased margin for better spacing */
-        color: #555; /* Darker, more readable gray */
-        line-height: 1.7; /* Improved line height for readability */
       }
       #question-area {
         font-size: 1.2rem;
         margin-bottom: 20px;
         padding: 15px;
-        background-color: #e8f0fa; /* Very light blue for question area */
         border-radius: 8px;
-        border: 1px solid #b8c6da; /* Subtle border */
-        color: #2c3e50; /* Dark blue for question text */
-        text-align: left; /* Left-align the question */
       }
       #answer-options {
         display: flex;
         flex-direction: column;
-        align-items: stretch; /* Stretch options to container width */
-        margin-bottom: 25px; /* Increased margin */
       }
       .answer-option {
         padding: 15px;
-        margin-bottom: 12px; /* Increased margin */
-        background-color: #fff; /* White background for options */
         border-radius: 8px;
-        border: 1px solid #ddd; /* Lighter border */
         cursor: pointer;
-        transition: background-color 0.3s ease, transform 0.2s ease; /* Smooth transition */
-        font-size: 1.1rem; /* Slightly larger font */
-        text-align: left; /* Left-align the options text */
-        box-shadow: 0 2px 4px rgba(0, 0, 0, 0.05); /* Very subtle shadow */
       }
       .answer-option:hover {
-        background-color: #f0f8ff; /* Very light blue on hover */
-        transform: translateY(-2px); /* Slight lift on hover */
-        border-color: #a6d4fa; /* Slightly more prominent border on hover */
       }
       .answer-option.selected {
-        background-color: #a6d4fa; /* Light blue for selected option */
-        border-color: #3498db; /* Stronger blue border for selected */
-        color: #fff; /* White text for selected option */
-        box-shadow: 0 4px 6px rgba(0, 0, 0, 0.1); /* Slightly stronger shadow */
       }
       .answer-option.correct {
-        background-color: #86ef7d; /* Light green for correct answer */
-        border-color: #22c55e; /* Stronger green border */
         color: #fff;
-        font-weight: 600; /* Bold correct answer */
       }
       .answer-option.incorrect {
-        background-color: #fca5a5; /* Light red for incorrect answer */
-        border-color: #dc2626; /* Stronger red border */
         color: #fff;
-        font-weight: 600; /* Bold incorrect answer */
       }
       #result-message {
         font-size: 1.2rem;
         margin-bottom: 25px;
-        font-weight: 500; /* Medium font weight for message */
       }
       .correct-message {
-        color: #22c55e; /* Strong green for correct message */
       }
       .incorrect-message {
-        color: #dc2626; /* Strong red for incorrect message */
       }
-      #next-button, #skip-button, #reset-button {
         padding: 12px 25px;
         font-size: 1.1rem;
-        margin: 5px 10px; /* Added horizontal margin between buttons */
         border-radius: 8px;
         border: none;
         cursor: pointer;
-        transition: background-color 0.3s ease, transform 0.2s ease, box-shadow 0.3s ease; /* Added box-shadow transition */
-        font-weight: 500; /* Medium font weight for buttons */
-        box-shadow: 0 2px 5px rgba(0, 0, 0, 0.1); /* Subtle shadow for buttons */
       }
       #next-button {
-        background-color: #3498db; /* Blue for next button */
         color: #fff;
       }
       #next-button:hover {
         background-color: #2980b9;
         transform: translateY(-2px);
-        box-shadow: 0 4px 7px rgba(0, 0, 0, 0.15); /* Increased shadow on hover */
       }
       #next-button:disabled {
-        background-color: #b8c6da; /* Gray for disabled next button */
         cursor: not-allowed;
-        transform: none; /* Remove transform on disabled */
-        box-shadow: none; /* Remove shadow on disabled */
       }
       #skip-button {
-        background-color: #f39c12; /* Orange for skip button */
         color: #fff;
       }
       #skip-button:hover {
         background-color: #e67e22;
         transform: translateY(-2px);
-        box-shadow: 0 4px 7px rgba(0, 0, 0, 0.15); /* Increased shadow on hover */
       }
       #reset-button {
-        background-color: #2ecc71; /* Green for reset button */
         color: #fff;
       }
       #reset-button:hover {
         background-color: #27ae60;
         transform: translateY(-2px);
-        box-shadow: 0 4px 7px rgba(0, 0, 0, 0.15); /* Increased shadow on hover */
       }
       #final-score-area {
         font-size: 1.5rem;
         font-weight: 600;
         margin-bottom: 30px;
-        color: #2c3e50; /* Dark blue for final score */
       }
       .pass-message {
-        color: #22c55e; /* Green for pass message */
       }
       .fail-message {
-        color: #dc2626; /* Red for fail message */
       }
-      @media (max-width: 768px) { /* Styles for tablets and smaller screens */
         #root {
           width: 95%;
           padding: 20px;
@@ -200,7 +239,7 @@
           font-size: 1.1rem;
           padding: 12px;
         }
-        #next-button, #skip-button, #reset-button {
           padding: 10px 20px;
           font-size: 1rem;
         }
@@ -212,12 +251,12 @@
         }
       }
-      @media (max-width: 480px) { /* Styles for phones */
         #root {
           width: 100%;
           padding: 15px;
-          border-radius: 0; /* Remove border radius on phones */
-          box-shadow: none; /* Remove shadow on phones */
         }
         .answer-option {
           padding: 10px;
@@ -228,10 +267,10 @@
           font-size: 1rem;
           padding: 10px;
         }
-        #next-button, #skip-button, #reset-button {
           padding: 10px 18px;
           font-size: 0.9rem;
-          margin: 5px 5px; /* Reduced horizontal margin on phones */
         }
         h1 {
           font-size: 1.5rem;
@@ -262,6 +301,7 @@
           "To predict stock market trends.",
         ],
         correctAnswer: "To understand and generate human language.",
       },
       {
         question: "Which of the following is NOT a stage in the development of language models?",
@@ -272,6 +312,7 @@
           "Quantum language models (QLM)",
         ],
         correctAnswer: "Quantum language models (QLM)",
       },
       {
         question: "What is the basic idea behind statistical language models (SLMs)?",
@@ -282,6 +323,7 @@
           "To pre-train Transformer models.",
         ],
         correctAnswer: "To build word prediction models based on the Markov assumption.",
       },
       {
         question: "What is a limitation of SLMs?",
@@ -292,6 +334,7 @@
           "They are not used in NLP.",
         ],
         correctAnswer: "They suffer from the curse of dimensionality.",
       },
       {
         question: "What is the main characteristic of neural language models (NLMs)?",
@@ -302,6 +345,7 @@
           "They use n-gram models.",
         ],
         correctAnswer: "They characterize the probability of word sequences by neural networks.",
       },
       {
         question: "What concept did the work in [1] introduce?",
@@ -312,6 +356,7 @@
           "Pre-training and fine-tuning.",
         ],
         correctAnswer: "Distributed representation of words.",
       },
       {
         question: "What is word2vec?",
@@ -322,16 +367,19 @@
           "A pre-trained language model.",
         ],
         correctAnswer: "A simplified shallow neural network for learning distributed word representations.",
       },
       {
         question: "What was an early attempt at capturing context-aware word representations?",
         options: ["BERT", "ELMo", "GPT-2", "word2vec"],
         correctAnswer: "ELMo",
       },
       {
         question: "Which architecture is highly parallelizable and used in BERT?",
         options: ["RNN", "LSTM", "Transformer", "MLP"],
         correctAnswer: "Transformer",
       },
       {
         question: "What is a key feature of BERT?",
@@ -342,6 +390,7 @@
           "It predicts the next word based on the most recent context.",
         ],
         correctAnswer: "It pre-trains bidirectional language models.",
       },
       {
         question: "What paradigm did BERT inspire?",
@@ -352,6 +401,7 @@
           "Distributed representation learning.",
         ],
         correctAnswer: "Pre-training and fine-tuning.",
       },
       {
         question: "What do researchers find about scaling PLMs?",
@@ -362,6 +412,7 @@
           "It only works for small models.",
         ],
         correctAnswer: "It often leads to an improved model capacity.",
       },
       {
         question: "What is a characteristic of large-sized PLMs (LLMs)?",
@@ -372,6 +423,7 @@
           "They are less complex than SLMs.",
         ],
         correctAnswer: "They display different behaviors from smaller PLMs.",
       },
       {
         question: "What is an example of an emergent ability in LLMs?",
@@ -382,8 +434,9 @@
           "Using only n-gram models.",
         ],
         correctAnswer: "Solving few-shot tasks through in-context learning.",
       },
-       {
         question: "What does the term 'LLM' stand for?",
         options: [
           "Limited Language Model",
@@ -392,11 +445,13 @@
           "Logical Language Model",
         ],
         correctAnswer: "Large Language Model",
       },
       {
         question: "Which of the following is a remarkable application of LLMs?",
         options: ["ELMo", "ChatGPT", "word2vec", "SLM"],
         correctAnswer: "ChatGPT",
       },
       {
         question: "What is a key focus of the latest language models (e.g., GPT-4)?",
@@ -407,6 +462,7 @@
           "Using only statistical methods.",
         ],
         correctAnswer: "Complex task solving.",
       },
       {
         question: "How do LLMs differ from small PLMs in accessing them?",
@@ -417,6 +473,7 @@
           "They are accessed using n-gram models.",
         ],
         correctAnswer: "They are accessed through the prompting interface.",
       },
       {
         question: "What is a challenge in developing LLMs?",
@@ -427,6 +484,7 @@
           "It is very costly to train them due to huge demand for computation resources.",
         ],
         correctAnswer: "It is very costly to train them due to huge demand for computation resources.",
       },
       {
         question: "What is a potential issue with LLMs despite their capacities?",
@@ -437,6 +495,7 @@
           "They do not require effective control approaches.",
         ],
         correctAnswer: "They are likely to produce toxic, fictitious, or harmful content.",
       },
       {
         question: "What are the four major aspects of LLMs covered in the survey?",
@@ -447,6 +506,7 @@
           "Input, processing, output, and storage.",
         ],
         correctAnswer: "Pre-training, adaptation, utilization, and capacity evaluation.",
       },
       {
         question: "What is the typical parameter size of LLMs?",
@@ -457,6 +517,7 @@
           "Less than 100 parameters.",
         ],
         correctAnswer: "Billions or hundreds of billions of parameters.",
       },
       {
         question: "On what type of data are LLMs typically trained?",
@@ -467,6 +528,7 @@
           "Audio data only.",
         ],
         correctAnswer: "Massive text data.",
       },
       {
         question: "What strong capacity do LLMs exhibit?",
@@ -477,6 +539,7 @@
           "Performing only simple calculations.",
         ],
         correctAnswer: "Solving complex tasks via text generation.",
       },
       {
         question: "What does the survey introduce as basic background for LLMs?",
@@ -487,6 +550,7 @@
           "Only scaling laws.",
         ],
         correctAnswer: "Scaling laws, emergent abilities, and key techniques.",
       },
       {
         question: "What is the key to understanding the development of language models in research history?",
@@ -497,6 +561,7 @@
           "Ignoring the evolution of model capacities.",
         ],
         correctAnswer: "The leap from language modeling to task solving.",
       },
       {
         question: "Which of the following is NOT a characteristic of LLMs?",
@@ -507,6 +572,7 @@
           "Using Transformer language models.",
         ],
         correctAnswer: "Training on small datasets.",
       },
       {
         question: "What is a major difference between LLMs and previous smaller PLMs?",
@@ -517,6 +583,7 @@
           "LLMs do not require large-scale data.",
         ],
         correctAnswer: "LLMs display surprising emergent abilities.",
       },
       {
         question: "How has the research paradigm shifted towards the use of LLMs in NLP?",
@@ -527,6 +594,7 @@
           "Ignoring pre-training and fine-tuning.",
         ],
         correctAnswer: "LLMs serve as a general-purpose language task solver.",
       },
       {
         question: "What is a challenge that traditional search engines face with the advent of LLMs?",
@@ -537,6 +605,7 @@
           "Easier data processing.",
         ],
         correctAnswer: "New information seeking way through AI chatbots.",
       },
       {
         question: "What is a current trend in computer vision (CV) research related to LLMs?",
@@ -547,6 +616,7 @@
           "Focusing solely on image classification.",
         ],
         correctAnswer: "Developing ChatGPT-like vision-language models.",
       },
       {
         question: "What is a potential impact of the new wave of LLM technology?",
@@ -557,6 +627,7 @@
           "Slower development of AI algorithms.",
         ],
         correctAnswer: "A prosperous ecosystem of real-world applications based on LLMs.",
       },
       {
         question: "What is one of the mysterious aspects of LLMs?",
@@ -567,6 +638,7 @@
           "Why they only work on small datasets.",
         ],
         correctAnswer: "Why emergent abilities occur in LLMs.",
       },
       {
         question: "Why is it difficult for the research community to train capable LLMs?",
@@ -577,6 +649,7 @@
           "Because LLMs are mainly trained by academia.",
         ],
         correctAnswer: "Because it is very costly to carry out repetitive studies.",
       },
       {
         question: "What is a challenge in aligning LLMs?",
@@ -587,6 +660,7 @@
           "Reducing their computational costs.",
         ],
         correctAnswer: "Aligning them with human values or preferences.",
       },
       {
         question: "What does the paper 'Planning for AGI and beyond' discuss?",
@@ -597,6 +671,7 @@
           "Only short-term plans for AI development.",
         ],
         correctAnswer: "Short-term and long-term plans to approach AGI.",
       },
       {
         question: "What is a recent argument about GPT-4?",
@@ -607,6 +682,7 @@
           "It can only perform simple tasks.",
         ],
         correctAnswer: "It might be considered an early version of an AGI system.",
       },
       {
         question: "How is Microsoft 365 being empowered?",
@@ -617,32 +693,37 @@
           "By using only statistical models.",
         ],
         correctAnswer: "By LLMs to automate office work.",
       },
       {
-          question: "What is a suggestion for choosing layer normalization in LLMs?",
-          options: ["Post RMSNorm", "Pre RMSNorm", "Post LN", "No Normalization"],
-          correctAnswer: "Pre RMSNorm",
       },
       {
-          question: "Which activation function is recommended for stronger generalization and training stability?",
-          options: ["ReLU", "Sigmoid", "SwiGLU", "Tanh"],
-          correctAnswer: "SwiGLU",
       },
       {
-          question: "Which position embedding is considered a better choice for LLMs?",
-          options: ["Absolute Positional Embedding", "Relative Positional Embedding", "RoPE", "Sinusoidal Positional Encoding"],
-          correctAnswer: "RoPE",
       },
       {
         question: "What is the primary role of pre-training in LLMs?",
-options: [
           "To fine-tune models for specific tasks.",
           "To encode general knowledge from large-scale corpus.",
           "To reduce the size of the model.",
           "To improve inference speed.",
         ],
         correctAnswer: "To encode general knowledge from large-scale corpus.",
-},
       {
         question: "What type of data is included in the arXiv Dataset?",
         options: [
@@ -652,11 +733,13 @@ options: [
           "Image and video data.",
         ],
         correctAnswer: "Scientific publication data.",
       },
       {
         question: "What is the approximate size of the peS2o dataset?",
         options: ["42MB", "42GB", "42TB", "42B tokens"],
         correctAnswer: "42B tokens",
       },
       {
         question: "What is a characteristic of the articles in Wikipedia?",
@@ -667,11 +750,13 @@ options: [
           "They cover only a narrow range of topics.",
         ],
         correctAnswer: "They are composed in an expository style with references.",
       },
       {
         question: "What is a technique used to improve memory efficiency and throughput of deployed LLMs?",
         options: ["Data Parallelism", "Tensor Parallelism", "Pipeline Parallelism", "PagedAttention"],
         correctAnswer: "PagedAttention",
       },
       {
         question: "How does PagedAttention partition sequences?",
@@ -682,6 +767,7 @@ options: [
           "Into overlapping segments.",
         ],
         correctAnswer: "Into subsequences.",
       },
       {
         question: "What is the benefit of using PagedAttention?",
@@ -692,11 +778,13 @@ options: [
           "Improves model accuracy.",
         ],
         correctAnswer: "Increases GPU utilization and enables efficient memory sharing.",
       },
       {
         question: "What type of floating-point number was predominantly used for pre-training in previous PLMs like BERT?",
         options: ["FP16", "BF16", "FP32", "INT8"],
         correctAnswer: "FP32",
       },
       {
         question: "Why have some studies started to use FP16 for pre-training LLMs?",
@@ -707,6 +795,7 @@ options: [
           "To avoid the loss of computational accuracy.",
         ],
         correctAnswer: "To reduce memory usage and communication overhead.",
       },
       {
         question: "What is a potential issue with using FP16 for training?",
@@ -717,6 +806,7 @@ options: [
           "Improved model performance.",
         ],
         correctAnswer: "Loss of computational accuracy.",
       },
       {
         question: "What is BF16?",
@@ -727,6 +817,7 @@ options: [
           "A method for parallel training.",
         ],
         correctAnswer: "Brain Floating Point, an alternative to FP16.",
       },
       {
         question: "How does BF16 compare to FP16 in terms of representation accuracy for pre-training?",
@@ -737,6 +828,7 @@ options: [
           "BF16 is not suitable for pre-training.",
         ],
         correctAnswer: "BF16 generally performs better than FP16.",
       },
       {
         question: "Which training technique is often used jointly with 3D parallelism to improve training throughput?",
@@ -747,6 +839,7 @@ options: [
           "PagedAttention.",
         ],
         correctAnswer: "Mixed precision training.",
       },
       {
         question: "What type of parallelism was used to train BLOOM on 384 A100 GPUs?",
@@ -757,6 +850,7 @@ options: [
           "Only pipeline parallelism.",
         ],
         correctAnswer: "8-way data parallelism, 4-way tensor parallelism, and 12-way pipeline parallelism.",
       },
       {
         question: "What is the primary approach to using LLMs after pre-training or adaptation tuning?",
@@ -767,11 +861,13 @@ options: [
           "Using only n-gram models.",
         ],
         correctAnswer: "Designing suitable prompting strategies.",
       },
       {
         question: "What is a representative prompting method discussed in the text?",
         options: ["Fine-tuning", "Backpropagation", "In-context learning", "Random search"],
         correctAnswer: "In-context learning",
       },
       {
         question: "What does in-context learning involve?",
@@ -782,11 +878,13 @@ options: [
           "Employing only manual creation of prompts.",
         ],
         correctAnswer: "Formulating task description and demonstrations in natural language text.",
       },
       {
         question: "What is the process of manually creating a suitable prompt also called?",
         options: ["Automatic prompt optimization", "Prompt engineering", "Prompt tuning", "Prompt generation"],
         correctAnswer: "Prompt engineering",
       },
       {
         question: "What is the impact of a well-designed prompt on LLMs?",
@@ -797,16 +895,19 @@ options: [
           "It makes LLMs generate random outputs.",
         ],
         correctAnswer: "It is very helpful to elicit the abilities of LLMs.",
       },
       {
         question: "What type of data is considered well-organized with algorithmic logic and programming flow?",
         options: ["Natural language text", "Image data", "Code data", "Audio data"],
         correctAnswer: "Code data",
       },
       {
         question: "What ability do models trained on code show?",
         options: ["Weak reasoning ability", "Strong reasoning ability", "No reasoning ability", "Only language generation ability"],
         correctAnswer: "Strong reasoning ability",
       },
       {
         question: "What is a hypothesis regarding code data and LLMs' reasoning performance?",
@@ -817,6 +918,7 @@ options: [
           "Code data is only useful for code generation.",
         ],
         correctAnswer: "Code data may be useful to improve the reasoning performance of LLMs.",
       },
       {
         question: "What is a characteristic of LLMs' text generation quality?",
@@ -827,6 +929,7 @@ options: [
           "It cannot be evaluated.",
         ],
         correctAnswer: "It is comparable to human-written texts.",
       },
       {
         question: "How can LLMs be used in the context of generation evaluation?",
@@ -837,6 +940,7 @@ options: [
           "To perform only statistical analysis.",
         ],
         correctAnswer: "As language generation evaluators.",
       },
       {
         question: "What is a limitation of LLMs in specialized generation?",
@@ -847,6 +951,7 @@ options: [
           "They are only good at generating code.",
         ],
         correctAnswer: "They have learned general language patterns but underperform in specialized generation.",
       },
       {
         question: "What is a common approach to enhancing LLMs' factual knowledge?",
@@ -857,6 +962,7 @@ options: [
           "Ignoring up-to-date information.",
         ],
         correctAnswer: "Incorporating extracted relevant information into the context.",
       },
       {
         question: "What is a finding about smaller models with instruction tuning compared to larger models without it?",
@@ -867,6 +973,7 @@ options: [
           "Larger models are always better.",
         ],
         correctAnswer: "Smaller models can perform better.",
       },
       {
         question: "What does instruction tuning enable LLMs to do?",
@@ -877,6 +984,7 @@ options: [
           "Perform only without demonstrations.",
         ],
         correctAnswer: "Follow human instructions to perform specific tasks, even on unseen tasks.",
       },
       {
         question: "What is a benefit of instruction tuning?",
@@ -887,6 +995,7 @@ options: [
           "It does not improve model performance.",
         ],
         correctAnswer: "It is much less costly than pre-training.",
       },
       {
         question: "What is the primary goal of instruction tuning?",
@@ -897,6 +1006,7 @@ options: [
           "To generate random text",
         ],
         correctAnswer: "To make LLMs better at following instructions",
       },
       {
         question: "What kind of tasks does instruction tuning help LLMs perform?",
@@ -907,6 +1017,7 @@ options: [
           "No specific tasks",
         ],
         correctAnswer: "Specific tasks without demonstrations",
       },
       {
         question: "How does instruction tuning affect LLMs' ability to follow instructions?",
@@ -917,6 +1028,7 @@ options: [
           "It makes them ignore instructions",
         ],
         correctAnswer: "It enhances their ability",
       },
       {
         question: "What have a large number of studies confirmed about instruction tuning?",
@@ -927,6 +1039,7 @@ options: [
           "It decreases performance",
         ],
         correctAnswer: "It achieves superior performance on seen and unseen tasks",
       },
       {
         question: "What is a key aspect of high-quality long CoT data curation?",
@@ -937,6 +1050,7 @@ options: [
           "Manual data collection only",
         ],
         correctAnswer: "Using open models or APIs for data synthesis",
       },
       {
         question: "What is the basic idea behind creating long CoT response data?",
@@ -947,6 +1061,7 @@ options: [
           "Ignoring the prompt structure",
         ],
         correctAnswer: "Feeding prompts into teacher models",
       },
       {
         question: "What is the finding about smaller models with instruction tuning compared to larger models without fine-tuning?",
@@ -957,6 +1072,7 @@ options: [
           "Larger models are always better.",
         ],
         correctAnswer: "Smaller models can perform better.",
       },
     ];
@@ -968,12 +1084,12 @@ options: [
       const [quizEnd, setQuizEnd] = React.useState(false);
       const [selectedAnswerColor, setSelectedAnswerColor] = React.useState('');
       const [currentQuestionNumber, setCurrentQuestionNumber] = React.useState(1);
       const currentQuestion = quizData[currentQuestionIndex];
       const totalQuestions = quizData.length;
       const handleAnswerSelection = (answer) => {
         setSelectedAnswer(answer);
         if (answer === currentQuestion.correctAnswer) {
@@ -983,6 +1099,12 @@ options: [
         } else {
           setMessage('Incorrect!');
           setSelectedAnswerColor('incorrect');
         }
       };
@@ -1018,6 +1140,12 @@ options: [
         setQuizEnd(false);
         setSelectedAnswerColor('');
         setCurrentQuestionNumber(1);
       };
       return (
@@ -1028,13 +1156,13 @@ options: [
             <>
               <div id="question-area">
                 Question {currentQuestionNumber}/{totalQuestions}: {currentQuestion.question}
-                </div>
               <div id="answer-options">
                 {currentQuestion.options.map((option) => (
                   <div
                     key={option}
                     className={`answer-option ${selectedAnswer === option ? selectedAnswerColor : ''} ${selectedAnswer ? 'disabled' : ''} ${selectedAnswerColor && option === currentQuestion.correctAnswer ? 'correct' : ''}`}
-                    onClick={() => handleAnswerSelection(option)}
                   >
                     {option}
                   </div>
@@ -1054,15 +1182,41 @@ options: [
             <>
               <div id="final-score-area">
                 Your Final Score: {score} / {quizData.length} <br/>
-                {score >= 40 ? (
                   <span className="pass-message">Passed</span>
                 ) : (
                   <span className="fail-message">Failed</span>
                 )}
               </div>
-              <button id="reset-button"onClick={handleResetQuiz}>
-                Play Again
-              </button>
             </>
           )}
         </div>
@@ -1072,4 +1226,4 @@ options: [
     // Render the QuizApp component into the element whose id is "root".
     ReactDOM.render(<QuizApp />, document.getElementById("root"));
   </script>
 </body>
-</html>

         justify-content: center;
         align-items: center;
         min-height: 100vh;
+        background-image: url('quiz-background.jpg');
         background-size: cover;
         background-position: center;
       }
       /* Card that holds the quiz UI; the script renders the app into the
          element with this id. */
       #root {
         /* Near-opaque white so the card stands out from whatever is behind it. */
+        background-color: rgba(255, 255, 255, 0.95);
         padding: 30px;
         border-radius: 12px;
+        box-shadow: 0 8px 20px rgba(0, 0, 0, 0.1);
         /* 80% of the containing block's width, capped at 800px. */
+        width: 80%;
+        max-width: 800px;
         text-align: center;
         /* border-box: the padding is counted inside the width set above. */
+        box-sizing: border-box;
       }
       /* Top-level heading: 2rem, blue, semi-bold, with space below it. */
       h1 {
         font-size: 2rem;
         margin-bottom: 20px;
+        color: #3498db;
+        font-weight: 600;
       }
       /* Paragraph text: dark gray with a generous line height for readability. */
       p {
         font-size: 1.1rem;
+        margin-bottom: 25px;
+        color: #555;
+        line-height: 1.7;
       }
       /* Box that shows "Question n/total: <question text>". It is left-aligned,
          overriding the centered text alignment set on #root. */
       #question-area {
         font-size: 1.2rem;
         margin-bottom: 20px;
         padding: 15px;
         /* Light blue fill with a slightly darker border and dark blue text. */
+        background-color: #e8f0fa;
         border-radius: 8px;
+        border: 1px solid #b8c6da;
+        color: #2c3e50;
+        text-align: left;
       }
       /* Vertical stack of answer choices. */
       #answer-options {
         display: flex;
         flex-direction: column;
         /* stretch: every option spans the full width of this container. */
+        align-items: stretch;
+        margin-bottom: 25px;
       }
       /* One clickable answer choice, drawn as a white card with a thin border. */
       .answer-option {
         padding: 15px;
+        margin-bottom: 12px;
+        background-color: #fff;
         border-radius: 8px;
+        border: 1px solid #ddd;
         cursor: pointer;
         /* Only background-color and transform are animated; the border-color
            change in the hover rule below switches without a transition. */
+        transition: background-color 0.3s ease, transform 0.2s ease;
+        font-size: 1.1rem;
+        text-align: left;
+        box-shadow: 0 2px 4px rgba(0, 0, 0, 0.05);
       }
       /* Hover feedback: pale blue fill, light blue border, and a 2px lift. */
       .answer-option:hover {
+        background-color: #f0f8ff;
+        transform: translateY(-2px);
+        border-color: #a6d4fa;
       }
       /* Highlight for a chosen answer. The text is dark (#2c3e50, the same dark
          blue used for question text) because white text on the light blue fill
          #a6d4fa has a contrast ratio of only about 1.6:1, well under the 4.5:1
          that WCAG AA requires for normal-size text. */
       .answer-option.selected {
+        background-color: #a6d4fa;
+        border-color: #3498db;
+        color: #2c3e50;
+        box-shadow: 0 4px 6px rgba(0, 0, 0, 0.1);
       }
       /* Marks the correct answer once a choice has been made. The text is dark
          green because white text on the light green fill #86ef7d has a contrast
          ratio of only about 1.4:1, well under the 4.5:1 that WCAG AA requires;
          #14532d on the same fill is above 6:1. */
       .answer-option.correct {
+        background-color: #86ef7d;
+        border-color: #22c55e;
         color: #14532d;
+        font-weight: 600;
       }
       /* Marks a wrong choice. The text is dark red because white text on the
          light red fill #fca5a5 has a contrast ratio of only about 1.9:1, well
          under the 4.5:1 that WCAG AA requires; #7f1d1d on the same fill is
          above 5:1. */
       .answer-option.incorrect {
+        background-color: #fca5a5;
+        border-color: #dc2626;
         color: #7f1d1d;
+        font-weight: 600;
       }
       /* Styling for the element with id "result-message".
          NOTE(review): presumably the per-question Correct/Incorrect feedback
          line; its markup is not visible in this excerpt, so confirm. */
       #result-message {
         font-size: 1.2rem;
         margin-bottom: 25px;
+        font-weight: 500;
       }
       /* Green text for a positive result. */
       .correct-message {
+        color: #22c55e;
       }
       /* Red text for a negative result. */
       .incorrect-message {
+        color: #dc2626;
       }
+      #next-button, #skip-button, #reset-button, #review-button {
         /* Base look shared by the four action buttons; each button's own rule
            supplies its background and text colour. */
         padding: 12px 25px;
         font-size: 1.1rem;
+        margin: 5px 10px;
         border-radius: 8px;
         border: none;
         cursor: pointer;
         /* Animates the colour, lift and shadow changes made by the :hover rules. */
+        transition: background-color 0.3s ease, transform 0.2s ease, box-shadow 0.3s ease;
+        font-weight: 500;
+        box-shadow: 0 2px 5px rgba(0, 0, 0, 0.1);
       }
       /* Next button: blue with white text. */
       #next-button {
+        background-color: #3498db;
         color: #fff;
       }
       /* Hover: darker blue, 2px lift, deeper shadow. */
       #next-button:hover {
         background-color: #2980b9;
         transform: translateY(-2px);
+        box-shadow: 0 4px 7px rgba(0, 0, 0, 0.15);
       }
       /* Disabled: muted fill and no lift or shadow. This rule has the same
          specificity as the :hover rule and comes after it, so these values win
          when a disabled button is hovered. */
       #next-button:disabled {
+        background-color: #b8c6da;
         cursor: not-allowed;
+        transform: none;
+        box-shadow: none;
       }
       /* Skip button: orange with white text. */
       #skip-button {
+        background-color: #f39c12;
         color: #fff;
       }
       /* Hover: darker orange, 2px lift, deeper shadow. */
       #skip-button:hover {
         background-color: #e67e22;
         transform: translateY(-2px);
+        box-shadow: 0 4px 7px rgba(0, 0, 0, 0.15);
       }
       /* Reset button: green with white text. */
       #reset-button {
+        background-color: #2ecc71;
         color: #fff;
       }
       /* Hover: darker green, 2px lift, deeper shadow. */
       #reset-button:hover {
         background-color: #27ae60;
         transform: translateY(-2px);
+        box-shadow: 0 4px 7px rgba(0, 0, 0, 0.15);
+      }
+      #review-button {
         /* Review button: purple with white text. */
+        background-color: #8e44ad;
+        color: #fff;
+      }
+      #review-button:hover {
         /* Hover: darker purple, 2px lift, deeper shadow. */
+        background-color: #732d91;
+        transform: translateY(-2px);
+        box-shadow: 0 4px 7px rgba(0, 0, 0, 0.15);
       }
       /* End-of-quiz summary block that shows "Your Final Score: x / y" followed
          by the pass/fail label. */
       #final-score-area {
         font-size: 1.5rem;
         font-weight: 600;
         margin-bottom: 30px;
+        color: #2c3e50;
       }
       /* "Passed" label: green. */
       .pass-message {
+        color: #22c55e;
       }
       /* "Failed" label: red. */
       .fail-message {
+        color: #dc2626;
       }
+      #review-section {
         /* Left-aligned block with space above it.
            NOTE(review): presumably the answer-review view opened by the review
            button; its markup is not visible in this excerpt, so confirm. */
+        text-align: left;
+        margin-top: 20px;
+      }
+      .review-item {
         /* One review entry, drawn as a light gray card with a thin border. */
+        margin-bottom: 20px;
+        padding: 15px;
+        background-color: #f9f9f9;
+        border-radius: 8px;
+        border: 1px solid #ddd;
+      }
+      .review-question {
         /* Largest text in a review entry, dark blue. */
+        font-size: 1.2rem;
+        color: #2c3e50;
+        margin-bottom: 10px;
+      }
+      .review-answer {
         /* Answer line; no colour is set here, so it inherits one. */
+        font-size: 1.1rem;
+        margin-bottom: 5px;
+      }
+      .review-explanation {
         /* Smaller gray text, separated from the lines above by a top margin. */
+        font-size: 1rem;
+        color: #555;
+        margin-top: 10px;
+      }
+      @media (max-width: 768px) {
         #root {
           width: 95%;
           padding: 20px;
           font-size: 1.1rem;
           padding: 12px;
         }
+        #next-button, #skip-button, #reset-button, #review-button {
           /* Override for viewports up to 768px wide: slightly smaller buttons. */
           padding: 10px 20px;
           font-size: 1rem;
         }
         /* Exactly one "}" belongs after this rule (the one that closes the
            enclosing @media block). An extra "}" here would close the @media
            block early and leave its real closing brace stray at top level,
            where the parser treats it as the start of the next rule's prelude
            and discards the following @media (max-width: 480px) block. */
       }
+      @media (max-width: 480px) {
         #root {
           width: 100%;
           padding: 15px;
+          border-radius: 0;
+          box-shadow: none;
         }
         .answer-option {
           padding: 10px;
           font-size: 1rem;
           padding: 10px;
         }
+        #next-button, #skip-button, #reset-button, #review-button {
           padding: 10px 18px;
           font-size: 0.9rem;
+          margin: 5px 5px;
         }
         h1 {
           font-size: 1.5rem;
           "To predict stock market trends.",
         ],
         correctAnswer: "To understand and generate human language.",
+        explanation: "Language modeling aims to understand and generate human language by predicting the likelihood of word sequences, forming the basis for many NLP applications."
       },
       {
         question: "Which of the following is NOT a stage in the development of language models?",
           "Quantum language models (QLM)",
         ],
         correctAnswer: "Quantum language models (QLM)",
+        explanation: "Quantum language models (QLM) are not a recognized stage in language model development; the progression includes SLMs, NLMs, and PLMs."
       },
       {
         question: "What is the basic idea behind statistical language models (SLMs)?",
           "To pre-train Transformer models.",
         ],
         correctAnswer: "To build word prediction models based on the Markov assumption.",
+        explanation: "SLMs rely on the Markov assumption, which posits that the probability of a word depends only on a fixed number of previous words (n-grams)."
       },
       {
         question: "What is a limitation of SLMs?",
           "They are not used in NLP.",
         ],
         correctAnswer: "They suffer from the curse of dimensionality.",
+        explanation: "SLMs struggle with high-dimensional data due to the curse of dimensionality, where the number of possible n-grams grows exponentially, making it hard to estimate probabilities accurately."
       },
       {
         question: "What is the main characteristic of neural language models (NLMs)?",
           "They use n-gram models.",
         ],
         correctAnswer: "They characterize the probability of word sequences by neural networks.",
+        explanation: "NLMs use neural networks to model the probability of word sequences, overcoming some limitations of SLMs by learning continuous representations."
       },
       {
         question: "What concept did the work in [1] introduce?",
           "Pre-training and fine-tuning.",
         ],
         correctAnswer: "Distributed representation of words.",
+        explanation: "The work in [1] refers to early neural network models (e.g., word2vec) that introduced distributed representations, allowing words to be represented as dense vectors in a continuous space."
       },
       {
         question: "What is word2vec?",
           "A pre-trained language model.",
         ],
         correctAnswer: "A simplified shallow neural network for learning distributed word representations.",
+        explanation: "Word2vec is a shallow neural network designed to learn distributed word representations (word embeddings) efficiently from large text corpora."
       },
       {
         question: "What was an early attempt at capturing context-aware word representations?",
         options: ["BERT", "ELMo", "GPT-2", "word2vec"],
         correctAnswer: "ELMo",
+        explanation: "ELMo (Embeddings from Language Models) was an early model that captured context-aware word representations by using bidirectional LSTMs, unlike the static embeddings of word2vec."
       },
       {
         question: "Which architecture is highly parallelizable and used in BERT?",
         options: ["RNN", "LSTM", "Transformer", "MLP"],
         correctAnswer: "Transformer",
+        explanation: "BERT uses the Transformer architecture, which is highly parallelizable due to its self-attention mechanism, unlike sequential models like RNNs or LSTMs."
       },
       {
         question: "What is a key feature of BERT?",
           "It predicts the next word based on the most recent context.",
         ],
         correctAnswer: "It pre-trains bidirectional language models.",
+        explanation: "BERT’s key feature is its bidirectional pre-training, allowing it to consider both left and right context for each word, unlike unidirectional models."
       },
       {
         question: "What paradigm did BERT inspire?",
           "Distributed representation learning.",
         ],
         correctAnswer: "Pre-training and fine-tuning.",
+        explanation: "BERT popularized the pre-training and fine-tuning paradigm, where a model is pre-trained on a large corpus and then fine-tuned for specific tasks."
       },
       {
         question: "What do researchers find about scaling PLMs?",
           "It only works for small models.",
         ],
         correctAnswer: "It often leads to an improved model capacity.",
+        explanation: "Scaling pre-trained language models (PLMs) by increasing parameters and data often improves their capacity to handle complex tasks, as seen in models like GPT-3."
       },
       {
         question: "What is a characteristic of large-sized PLMs (LLMs)?",
           "They are less complex than SLMs.",
         ],
         correctAnswer: "They display different behaviors from smaller PLMs.",
+        explanation: "Large-sized PLMs (LLMs) exhibit emergent behaviors, such as few-shot learning, that smaller PLMs like BERT typically do not show."
       },
       {
         question: "What is an example of an emergent ability in LLMs?",
           "Using only n-gram models.",
         ],
         correctAnswer: "Solving few-shot tasks through in-context learning.",
+        explanation: "An emergent ability in LLMs is solving few-shot tasks via in-context learning, where the model adapts to new tasks with just a few examples provided in the prompt."
       },
+      {
         question: "What does the term 'LLM' stand for?",
         options: [
           "Limited Language Model",
           "Logical Language Model",
         ],
         correctAnswer: "Large Language Model",
+        explanation: "LLM stands for Large Language Model, referring to models with billions of parameters trained on massive datasets."
       },
       {
         question: "Which of the following is a remarkable application of LLMs?",
         options: ["ELMo", "ChatGPT", "word2vec", "SLM"],
         correctAnswer: "ChatGPT",
+        explanation: "ChatGPT, built on the GPT architecture, is a remarkable LLM application known for its conversational abilities and widespread use."
       },
       {
         question: "What is a key focus of the latest language models (e.g., GPT-4)?",
           "Using only statistical methods.",
         ],
         correctAnswer: "Complex task solving.",
+        explanation: "Latest models like GPT-4 focus on solving complex tasks, leveraging their scale and training to handle diverse, intricate problems."
       },
       {
         question: "How do LLMs differ from small PLMs in accessing them?",
           "They are accessed using n-gram models.",
         ],
         correctAnswer: "They are accessed through the prompting interface.",
+        explanation: "LLMs are typically accessed via prompting, where users provide instructions or examples in natural language, unlike smaller PLMs that often require fine-tuning."
       },
       {
         question: "What is a challenge in developing LLMs?",
           "It is very costly to train them due to huge demand for computation resources.",
         ],
         correctAnswer: "It is very costly to train them due to huge demand for computation resources.",
+        explanation: "Training LLMs requires vast computational resources, making it expensive and often limiting development to well-funded organizations."
       },
       {
         question: "What is a potential issue with LLMs despite their capacities?",
           "They do not require effective control approaches.",
         ],
         correctAnswer: "They are likely to produce toxic, fictitious, or harmful content.",
+        explanation: "Despite their capabilities, LLMs can generate toxic or false content due to biases in training data or lack of perfect alignment with human values."
       },
       {
         question: "What are the four major aspects of LLMs covered in the survey?",
           "Input, processing, output, and storage.",
         ],
         correctAnswer: "Pre-training, adaptation, utilization, and capacity evaluation.",
+        explanation: "The survey covers pre-training (initial training), adaptation (tuning), utilization (application), and capacity evaluation (performance assessment) as key aspects of LLMs."
       },
       {
         question: "What is the typical parameter size of LLMs?",
           "Less than 100 parameters.",
         ],
         correctAnswer: "Billions or hundreds of billions of parameters.",
+        explanation: "LLMs typically have billions or hundreds of billions of parameters, enabling their vast capacity, unlike smaller models with millions."
       },
       {
         question: "On what type of data are LLMs typically trained?",
           "Audio data only.",
         ],
         correctAnswer: "Massive text data.",
+        explanation: "LLMs are trained on massive text corpora, such as web texts, books, and articles, to capture broad language patterns."
       },
       {
         question: "What strong capacity do LLMs exhibit?",
           "Performing only simple calculations.",
         ],
         correctAnswer: "Solving complex tasks via text generation.",
+        explanation: "LLMs excel at solving complex tasks by generating text, leveraging their understanding of language and context."
       },
       {
         question: "What does the survey introduce as basic background for LLMs?",
           "Only scaling laws.",
         ],
         correctAnswer: "Scaling laws, emergent abilities, and key techniques.",
+        explanation: "The survey provides background on scaling laws (performance vs. size), emergent abilities (e.g., few-shot learning), and key techniques (e.g., Transformers)."
       },
       {
         question: "What is the key to understanding the development of language models in research history?",
           "Ignoring the evolution of model capacities.",
         ],
         correctAnswer: "The leap from language modeling to task solving.",
+        explanation: "The shift from merely modeling language (predicting words) to solving tasks (e.g., reasoning, Q&A) marks a pivotal development in language models."
       },
       {
         question: "Which of the following is NOT a characteristic of LLMs?",
           "Using Transformer language models.",
         ],
         correctAnswer: "Training on small datasets.",
+        explanation: "LLMs are characterized by training on massive datasets, not small ones, which enables their strong performance."
       },
       {
         question: "What is a major difference between LLMs and previous smaller PLMs?",
           "LLMs do not require large-scale data.",
         ],
         correctAnswer: "LLMs display surprising emergent abilities.",
+        explanation: "LLMs show emergent abilities like in-context learning, which smaller PLMs typically lack due to their scale and training."
       },
       {
         question: "How has the research paradigm shifted towards the use of LLMs in NLP?",
           "Ignoring pre-training and fine-tuning.",
         ],
         correctAnswer: "LLMs serve as a general-purpose language task solver.",
+        explanation: "The paradigm has shifted to using LLMs as general-purpose solvers for various NLP tasks via prompting, rather than task-specific fine-tuning."
       },
       {
         question: "What is a challenge that traditional search engines face with the advent of LLMs?",
           "Easier data processing.",
         ],
         correctAnswer: "New information seeking way through AI chatbots.",
+        explanation: "LLM-powered chatbots offer a conversational way to seek information, challenging the keyword-based approach of traditional search engines."
       },
       {
         question: "What is a current trend in computer vision (CV) research related to LLMs?",
           "Focusing solely on image classification.",
         ],
         correctAnswer: "Developing ChatGPT-like vision-language models.",
+        explanation: "CV research is trending towards multimodal models that combine vision and language, inspired by ChatGPT’s success."
       },
       {
         question: "What is a potential impact of the new wave of LLM technology?",
           "Slower development of AI algorithms.",
         ],
         correctAnswer: "A prosperous ecosystem of real-world applications based on LLMs.",
+        explanation: "LLMs are fostering a wide range of real-world applications, from chatbots to automation, due to their versatility."
       },
       {
         question: "What is one of the mysterious aspects of LLMs?",
           "Why they only work on small datasets.",
         ],
         correctAnswer: "Why emergent abilities occur in LLMs.",
+        explanation: "The emergence of abilities like few-shot learning in LLMs is not fully understood, making it a mysterious aspect of their behavior."
       },
       {
         question: "Why is it difficult for the research community to train capable LLMs?",
           "Because LLMs are mainly trained by academia.",
         ],
         correctAnswer: "Because it is very costly to carry out repetitive studies.",
+        explanation: "Training LLMs requires extensive computational resources, making repetitive studies costly and limiting academic research."
       },
       {
         question: "What is a challenge in aligning LLMs?",
           "Reducing their computational costs.",
         ],
         correctAnswer: "Aligning them with human values or preferences.",
+        explanation: "Aligning LLMs with human values is challenging due to biases in data and the complexity of defining universal preferences."
       },
       {
         question: "What does the paper 'Planning for AGI and beyond' discuss?",
           "Only short-term plans for AI development.",
         ],
         correctAnswer: "Short-term and long-term plans to approach AGI.",
+        explanation: "The paper outlines strategies for developing Artificial General Intelligence (AGI), covering both immediate and future steps."
       },
       {
         question: "What is a recent argument about GPT-4?",
           "It can only perform simple tasks.",
         ],
         correctAnswer: "It might be considered an early version of an AGI system.",
+        explanation: "Some argue GPT-4’s broad capabilities suggest it could be an early AGI, though it lacks full general intelligence."
       },
       {
         question: "How is Microsoft 365 being empowered?",
           "By using only statistical models.",
         ],
         correctAnswer: "By LLMs to automate office work.",
+        explanation: "Microsoft 365 integrates LLMs (e.g., via Copilot) to automate tasks like writing, summarizing, and data analysis."
       },
       {
+        question: "What is a suggestion for choosing layer normalization in LLMs?",
+        options: ["Post RMSNorm", "Pre RMSNorm", "Post LN", "No Normalization"],
+        correctAnswer: "Pre RMSNorm",
+        explanation: "Pre RMSNorm (Root Mean Square Normalization before layers) is suggested for LLMs due to its stability and performance benefits."
       },
       {
+        question: "Which activation function is recommended for stronger generalization and training stability?",
+        options: ["ReLU", "Sigmoid", "SwiGLU", "Tanh"],
+        correctAnswer: "SwiGLU",
+        explanation: "SwiGLU (Swish-Gated Linear Unit) is recommended for LLMs as it improves generalization and training stability over traditional functions like ReLU."
       },
       {
+        question: "Which position embedding is considered a better choice for LLMs?",
+        options: ["Absolute Positional Embedding", "Relative Positional Embedding", "RoPE", "Sinusoidal Positional Encoding"],
+        correctAnswer: "RoPE",
+        explanation: "RoPE (Rotary Position Embedding) is favored in LLMs for its ability to encode relative positions efficiently and scale with sequence length."
       },
       {
         question: "What is the primary role of pre-training in LLMs?",
+        options: [
           "To fine-tune models for specific tasks.",
           "To encode general knowledge from large-scale corpus.",
           "To reduce the size of the model.",
           "To improve inference speed.",
         ],
         correctAnswer: "To encode general knowledge from large-scale corpus.",
+        explanation: "Pre-training encodes general knowledge from vast text corpora into LLMs, providing a foundation for later task-specific adaptation."
+      },
       {
         question: "What type of data is included in the arXiv Dataset?",
         options: [
           "Image and video data.",
         ],
         correctAnswer: "Scientific publication data.",
+        explanation: "The arXiv Dataset contains scientific publication data, primarily research papers, used for training models on academic content."
       },
       {
         question: "What is the approximate size of the peS2o dataset?",
         options: ["42MB", "42GB", "42TB", "42B tokens"],
         correctAnswer: "42B tokens",
+        explanation: "The peS2o dataset is approximately 42 billion tokens, a massive text corpus used for training LLMs."
       },
       {
         question: "What is a characteristic of the articles in Wikipedia?",
           "They cover only a narrow range of topics.",
         ],
         correctAnswer: "They are composed in an expository style with references.",
+        explanation: "Wikipedia articles are written in an expository style, providing detailed explanations with references, making them a valuable training resource."
       },
       {
         question: "What is a technique used to improve memory efficiency and throughput of deployed LLMs?",
         options: ["Data Parallelism", "Tensor Parallelism", "Pipeline Parallelism", "PagedAttention"],
         correctAnswer: "PagedAttention",
+        explanation: "PagedAttention improves memory efficiency and throughput in LLMs by managing key-value caches more effectively during inference."
       },
       {
         question: "How does PagedAttention partition sequences?",
           "Into overlapping segments.",
         ],
         correctAnswer: "Into subsequences.",
+        explanation: "PagedAttention partitions sequences into subsequences, allowing efficient memory management by processing them in blocks."
       },
       {
         question: "What is the benefit of using PagedAttention?",
           "Improves model accuracy.",
         ],
         correctAnswer: "Increases GPU utilization and enables efficient memory sharing.",
+        explanation: "PagedAttention boosts GPU utilization and memory sharing, optimizing resource use during LLM inference."
       },
       {
         question: "What type of floating-point number was predominantly used for pre-training in previous PLMs like BERT?",
         options: ["FP16", "BF16", "FP32", "INT8"],
         correctAnswer: "FP32",
+        explanation: "FP32 (32-bit floating-point) was commonly used in earlier PLMs like BERT for its high precision during pre-training."
       },
       {
         question: "Why have some studies started to use FP16 for pre-training LLMs?",
           "To avoid the loss of computational accuracy.",
         ],
         correctAnswer: "To reduce memory usage and communication overhead.",
+        explanation: "FP16 (16-bit floating-point) reduces memory usage and communication overhead, making pre-training LLMs more efficient despite lower precision."
       },
       {
         question: "What is a potential issue with using FP16 for training?",
           "Improved model performance.",
         ],
         correctAnswer: "Loss of computational accuracy.",
+        explanation: "FP16’s lower precision can lead to a loss of computational accuracy, potentially affecting model quality during training."
       },
       {
         question: "What is BF16?",
           "A method for parallel training.",
         ],
         correctAnswer: "Brain Floating Point, an alternative to FP16.",
+        explanation: "BF16 (Brain Floating Point) is a 16-bit format developed by Google, offering a balance between FP16’s efficiency and FP32’s precision."
       },
       {
         question: "How does BF16 compare to FP16 in terms of representation accuracy for pre-training?",
           "BF16 is not suitable for pre-training.",
         ],
         correctAnswer: "BF16 generally performs better than FP16.",
+        explanation: "BF16 provides better representation accuracy than FP16 due to its wider dynamic range, making it more suitable for pre-training LLMs."
       },
       {
         question: "Which training technique is often used jointly with 3D parallelism to improve training throughput?",
           "PagedAttention.",
         ],
         correctAnswer: "Mixed precision training.",
+        explanation: "Mixed precision training, combining FP16/BF16 with FP32, is used with 3D parallelism (data, tensor, pipeline) to boost LLM training throughput."
       },
       {
         question: "What type of parallelism was used to train BLOOM on 384 A100 GPUs?",
           "Only pipeline parallelism.",
         ],
         correctAnswer: "8-way data parallelism, 4-way tensor parallelism, and 12-way pipeline parallelism.",
+        explanation: "BLOOM used a combination of 8-way data, 4-way tensor, and 12-way pipeline parallelism to efficiently train on 384 A100 GPUs."
       },
       {
         question: "What is the primary approach to using LLMs after pre-training or adaptation tuning?",
           "Using only n-gram models.",
         ],
         correctAnswer: "Designing suitable prompting strategies.",
+        explanation: "Post-pre-training, LLMs are primarily used via prompting strategies, where carefully crafted inputs elicit desired outputs."
       },
       {
         question: "What is a representative prompting method discussed in the text?",
         options: ["Fine-tuning", "Backpropagation", "In-context learning", "Random search"],
         correctAnswer: "In-context learning",
+        explanation: "In-context learning is a key prompting method where LLMs learn tasks from examples provided in the input prompt."
       },
       {
         question: "What does in-context learning involve?",
           "Employing only manual creation of prompts.",
         ],
         correctAnswer: "Formulating task description and demonstrations in natural language text.",
+        explanation: "In-context learning involves providing a task description and examples in natural language within the prompt to guide the LLM."
       },
       {
         question: "What is the process of manually creating a suitable prompt also called?",
         options: ["Automatic prompt optimization", "Prompt engineering", "Prompt tuning", "Prompt generation"],
         correctAnswer: "Prompt engineering",
+        explanation: "Prompt engineering refers to the manual design of prompts to effectively leverage LLMs’ capabilities for specific tasks."
       },
       {
         question: "What is the impact of a well-designed prompt on LLMs?",
           "It makes LLMs generate random outputs.",
         ],
         correctAnswer: "It is very helpful to elicit the abilities of LLMs.",
+        explanation: "A well-designed prompt significantly enhances an LLM’s ability to perform tasks by providing clear context and instructions."
       },
       {
         question: "What type of data is considered well-organized with algorithmic logic and programming flow?",
         options: ["Natural language text", "Image data", "Code data", "Audio data"],
         correctAnswer: "Code data",
+        explanation: "Code data is structured with algorithmic logic and programming flow, making it distinct from unstructured natural language text."
       },
       {
         question: "What ability do models trained on code show?",
         options: ["Weak reasoning ability", "Strong reasoning ability", "No reasoning ability", "Only language generation ability"],
         correctAnswer: "Strong reasoning ability",
+        explanation: "Models trained on code exhibit strong reasoning ability due to the logical and structured nature of programming data."
       },
       {
         question: "What is a hypothesis regarding code data and LLMs' reasoning performance?",
           "Code data is only useful for code generation.",
         ],
         correctAnswer: "Code data may be useful to improve the reasoning performance of LLMs.",
+        explanation: "It’s hypothesized that code data’s logical structure could enhance LLMs’ reasoning skills beyond just code generation."
       },
       {
         question: "What is a characteristic of LLMs' text generation quality?",
           "It cannot be evaluated.",
         ],
         correctAnswer: "It is comparable to human-written texts.",
+        explanation: "LLMs generate text that is often comparable to human-written content in coherence and quality, a testament to their training scale."
       },
       {
         question: "How can LLMs be used in the context of generation evaluation?",
           "To perform only statistical analysis.",
         ],
         correctAnswer: "As language generation evaluators.",
+        explanation: "LLMs can evaluate generated text by assessing its quality, coherence, or relevance, supplementing human judgment."
       },
       {
         question: "What is a limitation of LLMs in specialized generation?",
           "They are only good at generating code.",
         ],
         correctAnswer: "They have learned general language patterns but underperform in specialized generation.",
+        explanation: "LLMs excel in general language but may struggle with highly specialized domains due to limited domain-specific training data."
       },
       {
         question: "What is a common approach to enhancing LLMs' factual knowledge?",
           "Ignoring up-to-date information.",
         ],
         correctAnswer: "Incorporating extracted relevant information into the context.",
+        explanation: "Enhancing LLMs’ factual knowledge often involves adding relevant external information (e.g., via retrieval-augmented generation) to the context."
       },
       {
         question: "What is a finding about smaller models with instruction tuning compared to larger models without it?",
           "Larger models are always better.",
         ],
         correctAnswer: "Smaller models can perform better.",
+        explanation: "Smaller models with instruction tuning can outperform larger untuned models by being more aligned with specific tasks."
       },
       {
         question: "What does instruction tuning enable LLMs to do?",
           "Perform only without demonstrations.",
         ],
         correctAnswer: "Follow human instructions to perform specific tasks, even on unseen tasks.",
+        explanation: "Instruction tuning allows LLMs to generalize to unseen tasks by following human instructions provided in natural language."
       },
       {
         question: "What is a benefit of instruction tuning?",
           "It does not improve model performance.",
         ],
         correctAnswer: "It is much less costly than pre-training.",
+        explanation: "Instruction tuning is less resource-intensive than pre-training, requiring only a smaller dataset of instructions to adapt the model."
       },
       {
         question: "What is the primary goal of instruction tuning?",
           "To generate random text",
         ],
         correctAnswer: "To make LLMs better at following instructions",
+        explanation: "The main goal of instruction tuning is to improve LLMs’ ability to accurately follow human instructions for various tasks."
       },
       {
         question: "What kind of tasks does instruction tuning help LLMs perform?",
           "No specific tasks",
         ],
         correctAnswer: "Specific tasks without demonstrations",
+        explanation: "Instruction tuning enables LLMs to perform specific tasks based solely on instructions, without needing example demonstrations."
       },
       {
         question: "How does instruction tuning affect LLMs' ability to follow instructions?",
           "It makes them ignore instructions",
         ],
         correctAnswer: "It enhances their ability",
+        explanation: "Instruction tuning enhances LLMs’ capability to interpret and act on human instructions effectively."
       },
       {
         question: "What have a large number of studies confirmed about instruction tuning?",
           "It decreases performance",
         ],
         correctAnswer: "It achieves superior performance on seen and unseen tasks",
+        explanation: "Studies show instruction tuning boosts LLM performance on both familiar (seen) and new (unseen) tasks."
       },
       {
         question: "What is a key aspect of high-quality long CoT data curation?",
           "Manual data collection only",
         ],
         correctAnswer: "Using open models or APIs for data synthesis",
+        explanation: "High-quality Chain-of-Thought (CoT) data is often curated using open models or APIs to synthesize detailed reasoning steps."
       },
       {
         question: "What is the basic idea behind creating long CoT response data?",
           "Ignoring the prompt structure",
         ],
         correctAnswer: "Feeding prompts into teacher models",
+        explanation: "Long CoT response data is created by feeding prompts into teacher models to generate step-by-step reasoning responses."
       },
       {
         question: "What is the finding about smaller models with instruction tuning compared to larger models without fine-tuning?",
           "Larger models are always better.",
         ],
         correctAnswer: "Smaller models can perform better.",
+        explanation: "Research indicates that smaller, instruction-tuned models can outperform larger models without tuning due to better task alignment."
       },
     ];
       // Set back to false when the quiz is restarted; presumably true once the last question is done (confirm against the render logic not shown here).
       const [quizEnd, setQuizEnd] = React.useState(false);
       // Class name applied to the chosen option for colour feedback ('incorrect' after a wrong pick).
       const [selectedAnswerColor, setSelectedAnswerColor] = React.useState('');
       // Number shown in the "Question n/total" heading; starts at 1.
       const [currentQuestionNumber, setCurrentQuestionNumber] = React.useState(1);
+      // One record per wrong answer (question, picked option, correct option, explanation) for the end-of-quiz review.
+      const [incorrectAnswers, setIncorrectAnswers] = React.useState([]);
+      // Controls whether the "Review of Incorrect Answers" panel is rendered on the final-score screen.
+      const [showReview, setShowReview] = React.useState(false);
       // Question object currently on screen, and the quiz length used for the progress label.
       const currentQuestion = quizData[currentQuestionIndex];
       const totalQuestions = quizData.length;
       const handleAnswerSelection = (answer) => {
         setSelectedAnswer(answer);
         if (answer === currentQuestion.correctAnswer) {
         } else {
           setMessage('Incorrect!');
           setSelectedAnswerColor('incorrect');
+          setIncorrectAnswers([...incorrectAnswers, {
+            question: currentQuestion.question,
+            selectedAnswer: answer,
+            correctAnswer: currentQuestion.correctAnswer,
+            explanation: currentQuestion.explanation
+          }]);
         }
       };
         setQuizEnd(false);
         setSelectedAnswerColor('');
         setCurrentQuestionNumber(1);
+        setIncorrectAnswers([]);
+        setShowReview(false);
+      };
+      // Click handler for the "Review Incorrect Answers" button: reveals the
+      // review panel, which is rendered only while showReview is true.
+      const handleReviewIncorrect = () => {
+        setShowReview(true);
       };
       return (
             <>
               <div id="question-area">
                 Question {currentQuestionNumber}/{totalQuestions}: {currentQuestion.question}
+              </div>
               <div id="answer-options">
                 {currentQuestion.options.map((option) => (
                   <div
                     key={option}
                     className={`answer-option ${selectedAnswer === option ? selectedAnswerColor : ''} ${selectedAnswer ? 'disabled' : ''} ${selectedAnswerColor && option === currentQuestion.correctAnswer ? 'correct' : ''}`}
+                    onClick={() => !selectedAnswer && handleAnswerSelection(option)}
                   >
                     {option}
                   </div>
             <>
               <div id="final-score-area">
                 Your Final Score: {score} / {quizData.length} <br/>
+                {score >= Math.ceil(quizData.length * 0.8) ? (
                   <span className="pass-message">Passed</span>
                 ) : (
                   <span className="fail-message">Failed</span>
                 )}
               </div>
+              <div style={{display: 'flex', justifyContent: 'center'}}>
+                <button id="reset-button" onClick={handleResetQuiz}>
+                  Play Again
+                </button>
+                {incorrectAnswers.length > 0 && (
+                  <button id="review-button" onClick={handleReviewIncorrect}>
+                    Review Incorrect Answers
+                  </button>
+                )}
+              </div>
+              {showReview && (
+                <div id="review-section">
+                  <h2>Review of Incorrect Answers</h2>
+                  {incorrectAnswers.map((item, index) => (
+                    <div key={index} className="review-item">
+                      <div className="review-question">{item.question}</div>
+                      <div className="review-answer">
+                        <strong>Your Answer:</strong> {item.selectedAnswer} <span className="incorrect-message">(Incorrect)</span>
+                      </div>
+                      <div className="review-answer">
+                        <strong>Correct Answer:</strong> {item.correctAnswer} <span className="correct-message">(Correct)</span>
+                      </div>
+                      <div className="review-explanation">
+                        <strong>Explanation:</strong> {item.explanation}
+                      </div>
+                    </div>
+                  ))}
+                </div>
+              )}
             </>
           )}
         </div>
     // Mount the QuizApp component into the #root element.
     // NOTE(review): ReactDOM.render is the legacy root API; if this page loads
     // React 18 or later, ReactDOM.createRoot(...).render(...) is the replacement.
     // Confirm the React version from the script tags before changing.
     ReactDOM.render(<QuizApp />, document.getElementById("root"));
   </script>
 </body>
+</html>