[ { "band": "A", "query": "attention is all you need", "description": "Landmark transformer paper by Vaswani et al.", "rewrite": "Transformer self-attention mechanisms Vaswani et al", "latency_ms": 4127.867400005925, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "1706.03762", "title": "Attention Is All You Need", "category": "?" }, { "rank": 2, "arxiv_id": "1912.11959", "title": "Is Attention All What You Need? -- An Empirical Investigation on Convolution-Based Active Memory and Self-Attention", "category": "?" }, { "rank": 3, "arxiv_id": "2404.01183", "title": "Positioning is All You Need", "category": "?" }, { "rank": 4, "arxiv_id": "2502.05383", "title": "Is attention all you need to solve the correlated electron problem?", "category": "?" }, { "rank": 5, "arxiv_id": "2405.06478", "title": "Attention is all they need: Cognitive science and the (techno)political economy of attention in humans and machines", "category": "?" }, { "rank": 6, "arxiv_id": "2304.04556", "title": "Attention: Marginal Probability is All You Need?", "category": "?" }, { "rank": 7, "arxiv_id": "2501.05730", "title": "Element-wise Attention Is All You Need", "category": "?" }, { "rank": 8, "arxiv_id": "1906.02792", "title": "Attention is all you need for Videos: Self-attention based Video Summarization using Universal Transformers", "category": "?" }, { "rank": 9, "arxiv_id": "2408.02692", "title": "Attention is all you need for an improved CNN-based flash flood susceptibility modeling. The case of the ungauged Rheraya watershed, Morocco", "category": "?" }, { "rank": 10, "arxiv_id": "2501.09166", "title": "Attention is All You Need Until You Need Retention", "category": "?" } ], "expected_id": "1706.03762", "expected_found": true, "expected_rank": 1, "topic_diversity": 0 }, { "band": "A", "query": "BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding", "description": "Full BERT title \u2014 should be exact #1", "rewrite": null, "latency_ms": 1612.3626999906264, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "1810.04805", "title": "BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding", "category": "?" }, { "rank": 2, "arxiv_id": "2210.12440", "title": "Spectrum-BERT: Pre-training of Deep Bidirectional Transformers for Spectral Classification of Chinese Liquors", "category": "?" }, { "rank": 3, "arxiv_id": "2106.08254", "title": "BEiT: BERT Pre-Training of Image Transformers", "category": "?" }, { "rank": 4, "arxiv_id": "1909.04120", "title": "Span Selection Pre-training for Question Answering", "category": "?" }, { "rank": 5, "arxiv_id": "2401.15861", "title": "BPDec: Unveiling the Potential of Masked Language Modeling Decoder in BERT pretraining", "category": "?" }, { "rank": 6, "arxiv_id": "1909.10351", "title": "TinyBERT: Distilling BERT for Natural Language Understanding", "category": "?" }, { "rank": 7, "arxiv_id": "2011.07208", "title": "Utilizing Bidirectional Encoder Representations from Transformers for Answer Selection", "category": "?" }, { "rank": 8, "arxiv_id": "1905.05583", "title": "How to Fine-Tune BERT for Text Classification?", "category": "?" }, { "rank": 9, "arxiv_id": "1906.08237", "title": "XLNet: Generalized Autoregressive Pretraining for Language Understanding", "category": "?" }, { "rank": 10, "arxiv_id": "2112.07571", "title": "Epigenomic language models powered by Cerebras", "category": "?" } ], "expected_id": "1810.04805", "expected_found": true, "expected_rank": 1, "topic_diversity": 0 }, { "band": "A", "query": "Deep Residual Learning for Image Recognition", "description": "ResNet \u2014 the most-cited CV paper", "rewrite": "Deep Residual Learning Image Recognition ConvNets ResNet", "latency_ms": 2775.4920000443235, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "1512.03385", "title": "Deep Residual Learning for Image Recognition", "category": "?" }, { "rank": 2, "arxiv_id": "1604.01335", "title": "Deep Cross Residual Learning for Multitask Visual Recognition", "category": "?" }, { "rank": 3, "arxiv_id": "1805.00325", "title": "Study of Residual Networks for Image Recognition", "category": "?" }, { "rank": 4, "arxiv_id": "2505.01632", "title": "Transfer Learning-Based Deep Residual Learning for Speech Recognition in Clean and Noisy Environments", "category": "?" }, { "rank": 5, "arxiv_id": "2004.04989", "title": "Improved Residual Networks for Image and Video Recognition", "category": "?" }, { "rank": 6, "arxiv_id": "1604.08671", "title": "Deep Edge Guided Recurrent Residual Learning for Image Super-Resolution", "category": "?" }, { "rank": 7, "arxiv_id": "1707.08866", "title": "Deep Residual Learning for Weakly-Supervised Relation Extraction", "category": "?" }, { "rank": 8, "arxiv_id": "1706.08807", "title": "Recurrent Residual Learning for Action Recognition", "category": "?" }, { "rank": 9, "arxiv_id": "2211.12320", "title": "A Cross-Residual Learning for Image Recognition", "category": "?" }, { "rank": 10, "arxiv_id": "2107.05318", "title": "R3L: Connecting Deep Reinforcement Learning to Recurrent Neural Networks for Image Denoising via Residual Recovery", "category": "?" } ], "expected_id": "1512.03385", "expected_found": true, "expected_rank": 1, "topic_diversity": 0 }, { "band": "F", "query": "how do transformers work in NLP", "description": "Newcomer asking about transformer basics", "rewrite": "Transformer architecture self-attention mechanisms NLP deep learning sequence modeling", "latency_ms": 2065.812500019092, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2406.16893", "title": "A Survey on Transformers in NLP with Focus on Efficiency", "category": "?" }, { "rank": 2, "arxiv_id": "1910.06764", "title": "Stabilizing Transformers for Reinforcement Learning", "category": "?" }, { "rank": 3, "arxiv_id": "2204.05673", "title": "What do Toothbrushes do in the Kitchen? How Transformers Think our World is Structured", "category": "?" }, { "rank": 4, "arxiv_id": "2410.13732", "title": "Reducing the Transformer Architecture to a Minimum", "category": "?" }, { "rank": 5, "arxiv_id": "2306.07303", "title": "A Comprehensive Survey on Applications of Transformers for Deep Learning Tasks", "category": "?" }, { "rank": 6, "arxiv_id": "2202.07856", "title": "The NLP Task Effectiveness of Long-Range Transformers", "category": "?" }, { "rank": 7, "arxiv_id": "2310.10930", "title": "Enhanced Transformer Architecture for Natural Language Processing", "category": "?" }, { "rank": 8, "arxiv_id": "1907.00570", "title": "Do Transformer Attention Heads Provide Transparency in Abstractive Summarization?", "category": "?" }, { "rank": 9, "arxiv_id": "1906.06755", "title": "Theoretical Limitations of Self-Attention in Neural Sequence Models", "category": "?" }, { "rank": 10, "arxiv_id": "2105.08050", "title": "Pay Attention to MLPs", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "F", "query": "what is reinforcement learning from human feedback", "description": "Beginner asking about RLHF \u2014 should surface Ouyang/InstructGPT/Christiano", "rewrite": null, "latency_ms": 1188.2260999991558, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2312.14925", "title": "A Survey of Reinforcement Learning from Human Feedback", "category": "?" }, { "rank": 2, "arxiv_id": "2504.12501", "title": "Reinforcement Learning from Human Feedback", "category": "?" }, { "rank": 3, "arxiv_id": "2504.14732", "title": "Reinforcement Learning from Multi-level and Episodic Human Feedback", "category": "?" }, { "rank": 4, "arxiv_id": "2502.05434", "title": "Sample-Efficient Reinforcement Learning from Human Feedback via Information-Directed Sampling", "category": "?" }, { "rank": 5, "arxiv_id": "2211.11602", "title": "Improving Multimodal Interactive Agents with Reinforcement Learning from Human Feedback", "category": "?" }, { "rank": 6, "arxiv_id": "2410.02504", "title": "Dual Active Learning for Reinforcement Learning from Human Feedback", "category": "?" }, { "rank": 7, "arxiv_id": "2303.02891", "title": "Perspectives on the Social Impacts of Reinforcement Learning with Human Feedback", "category": "?" }, { "rank": 8, "arxiv_id": "2310.13639", "title": "Contrastive Preference Learning: Learning from Human Feedback without RL", "category": "?" }, { "rank": 9, "arxiv_id": "1707.07402", "title": "Reinforcement Learning for Bandit Neural Machine Translation with Simulated Human Feedback", "category": "?" }, { "rank": 10, "arxiv_id": "1805.10627", "title": "Reliability and Learnability of Human Bandit Feedback for Sequence-to-Sequence Reinforcement Learning", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "F", "query": "explain how neural networks learn", "description": "Very basic \u2014 should return foundational/survey papers", "rewrite": "deep learning neural networks backpropagation optimization stochastic gradient descent", "latency_ms": 2098.3753000036813, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2204.07291", "title": "The training response law explains how deep neural networks learn", "category": "?" }, { "rank": 2, "arxiv_id": "1901.07538", "title": "Unsupervised Learning of Neural Networks to Explain Neural Networks (extended abstract)", "category": "?" }, { "rank": 3, "arxiv_id": "1805.07468", "title": "Unsupervised Learning of Neural Networks to Explain Neural Networks", "category": "?" }, { "rank": 4, "arxiv_id": "2310.09838", "title": "Explaining How a Neural Network Play the Go Game and Let People Learn", "category": "?" }, { "rank": 5, "arxiv_id": "2307.02129", "title": "How Deep Neural Networks Learn Compositional Data: The Random Hierarchy Model", "category": "?" }, { "rank": 6, "arxiv_id": "2303.14937", "title": "LEURN: Learning Explainable Univariate Rules with Neural Networks", "category": "?" }, { "rank": 7, "arxiv_id": "1902.08160", "title": "Topology of Learning in Artificial Neural Networks", "category": "?" }, { "rank": 8, "arxiv_id": "1502.04042", "title": "Abstract Learning via Demodulation in a Deep Neural Network", "category": "?" }, { "rank": 9, "arxiv_id": "1911.05640", "title": "Neural Network Processing Neural Networks: An efficient way to learn higher order functions", "category": "?" }, { "rank": 10, "arxiv_id": "2206.01717", "title": "A Theoretical Analysis on Feature Learning in Neural Networks: Emergence from Inputs and Advantage over Fixed Features", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "F", "query": "what are diffusion models and how do they generate images", "description": "Beginner asking about DDPM/Stable Diffusion family", "rewrite": null, "latency_ms": 1032.1455000084825, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2302.09378", "title": "Modelos Generativos basados en Mecanismos de Difusi\\'on", "category": "?" }, { "rank": 2, "arxiv_id": "2302.01394", "title": "Understanding and contextualising diffusion models", "category": "?" }, { "rank": 3, "arxiv_id": "2305.19066", "title": "Nested Diffusion Processes for Anytime Image Generation", "category": "?" }, { "rank": 4, "arxiv_id": "2209.10948", "title": "Implementing and Experimenting with Diffusion Models for Text-to-Image Generation", "category": "?" }, { "rank": 5, "arxiv_id": "2411.07449", "title": "Tracing the Roots: Leveraging Temporal Dynamics in Diffusion Trajectories for Origin Attribution", "category": "?" }, { "rank": 6, "arxiv_id": "2303.05275", "title": "Detecting Images Generated by Diffusers", "category": "?" }, { "rank": 7, "arxiv_id": "2212.00235", "title": "VIDM: Video Implicit Diffusion Models", "category": "?" }, { "rank": 8, "arxiv_id": "2301.13188", "title": "Extracting Training Data from Diffusion Models", "category": "?" }, { "rank": 9, "arxiv_id": "2306.08103", "title": "Generating Images with 3D Annotations Using Diffusion Models", "category": "?" }, { "rank": 10, "arxiv_id": "2306.05182", "title": "Interactive Fashion Content Generation Using LLMs and Latent Diffusion Models", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "F", "query": "how does GPT-4 work", "description": "Newcomer asking about GPT-4 \u2014 should surface the technical report", "rewrite": "GPT-4 architecture transformer large language model multimodal processing", "latency_ms": 2233.0756000010297, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2305.03195", "title": "Gpt-4: A Review on Advancements and Opportunities in Natural Language Processing", "category": "?" }, { "rank": 2, "arxiv_id": "2303.08774", "title": "GPT-4 Technical Report", "category": "?" }, { "rank": 3, "arxiv_id": "2304.10592", "title": "MiniGPT-4: Enhancing Vision-Language Understanding with Advanced Large Language Models", "category": "?" }, { "rank": 4, "arxiv_id": "2411.17976", "title": "The importance of visual modelling languages in generative software engineering", "category": "?" }, { "rank": 5, "arxiv_id": "2503.23601", "title": "Exploring GPT-4 for Robotic Agent Strategy with Real-Time State Feedback and a Reactive Behaviour Framework", "category": "?" }, { "rank": 6, "arxiv_id": "2409.15981", "title": "GPT-4 as a Homework Tutor can Improve Student Engagement and Learning Outcomes", "category": "?" }, { "rank": 7, "arxiv_id": "2402.17396", "title": "Benchmarking GPT-4 on Algorithmic Problems: A Systematic Evaluation of Prompting Strategies", "category": "?" }, { "rank": 8, "arxiv_id": "2310.11458", "title": "GPT-4 as an interface between researchers and computational software: improving usability and reproducibility", "category": "?" }, { "rank": 9, "arxiv_id": "2305.04160", "title": "X-LLM: Bootstrapping Advanced Large Language Models by Treating Multi-Modalities as Foreign Languages", "category": "?" }, { "rank": 10, "arxiv_id": "2311.15732", "title": "GPT4Vis: What Can GPT-4 Do for Zero-shot Visual Recognition?", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "G", "query": "contrastive learning for self-supervised visual representations", "description": "Should return SimCLR, MoCo, BYOL, DINO etc.", "rewrite": "Contrastive learning self-supervised visual representation learning CNNs", "latency_ms": 1839.8786999750882, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2202.03968", "title": "Self-supervised Contrastive Learning for Cross-domain Hyperspectral Image Representation", "category": "?" }, { "rank": 2, "arxiv_id": "2301.12541", "title": "Supervised and Contrastive Self-Supervised In-Domain Representation Learning for Dense Prediction Problems in Remote Sensing", "category": "?" }, { "rank": 3, "arxiv_id": "2210.03163", "title": "Brief Introduction to Contrastive Learning Pretext Tasks for Visual Representation", "category": "?" }, { "rank": 4, "arxiv_id": "2204.13386", "title": "Self-supervised Contrastive Learning for Audio-Visual Action Recognition", "category": "?" }, { "rank": 5, "arxiv_id": "2208.04278", "title": "Self-Supervised Contrastive Representation Learning for 3D Mesh Segmentation", "category": "?" }, { "rank": 6, "arxiv_id": "2401.12024", "title": "Multimodal Visual-Tactile Representation Learning through Self-Supervised Contrastive Pre-Training", "category": "?" }, { "rank": 7, "arxiv_id": "2112.05760", "title": "Learning Representations with Contrastive Self-Supervised Learning for Histopathology Applications", "category": "?" }, { "rank": 8, "arxiv_id": "2103.13517", "title": "A Broad Study on the Transferability of Visual Representations with Contrastive Learning", "category": "?" }, { "rank": 9, "arxiv_id": "2106.15788", "title": "Exploring Localization for Self-supervised Fine-grained Contrastive Learning", "category": "?" }, { "rank": 10, "arxiv_id": "2105.05682", "title": "Multi-Scale Contrastive Siamese Networks for Self-Supervised Graph Representation Learning", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "G", "query": "knowledge distillation from large language models to smaller ones", "description": "Distillation pipeline \u2014 DistilBERT, TinyBERT, knowledge distillation surveys", "rewrite": null, "latency_ms": 1139.147799985949, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2306.08543", "title": "MiniLLM: Knowledge Distillation of Large Language Models", "category": "?" }, { "rank": 2, "arxiv_id": "2504.13825", "title": "Feature Alignment and Representation Transfer in Knowledge Distillation for Large Language Models", "category": "?" }, { "rank": 3, "arxiv_id": "2504.14366", "title": "Empirical Evaluation of Knowledge Distillation from Transformers to Subquadratic Language Models", "category": "?" }, { "rank": 4, "arxiv_id": "2412.19449", "title": "Feature Alignment-Based Knowledge Distillation for Efficient Compression of Large Language Models", "category": "?" }, { "rank": 5, "arxiv_id": "2403.06414", "title": "Evolving Knowledge Distillation with Large Language Models and Active Learning", "category": "?" }, { "rank": 6, "arxiv_id": "2406.17328", "title": "Dual-Space Knowledge Distillation for Large Language Models", "category": "?" }, { "rank": 7, "arxiv_id": "2002.00733", "title": "Generation-Distillation for Efficient Natural Language Understanding in Low-Data Settings", "category": "?" }, { "rank": 8, "arxiv_id": "2402.04616", "title": "Beyond Answers: Transferring Reasoning Capabilities to Smaller LLMs Using Multi-Teacher Knowledge Distillation", "category": "?" }, { "rank": 9, "arxiv_id": "2505.15442", "title": "On the Generalization vs Fidelity Paradox in Knowledge Distillation", "category": "?" }, { "rank": 10, "arxiv_id": "2409.12500", "title": "LLMR: Knowledge Distillation with a Large Language Model-Induced Reward", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "G", "query": "graph neural networks for molecular property prediction", "description": "GNN + chemistry \u2014 SchNet, DimeNet, MPNN papers", "rewrite": null, "latency_ms": 1286.9488000287674, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2208.04852", "title": "Graph neural networks for the prediction of molecular structure-property relationships", "category": "?" }, { "rank": 2, "arxiv_id": "1909.00259", "title": "Gated Graph Recursive Neural Networks for Molecular Property Prediction", "category": "?" }, { "rank": 3, "arxiv_id": "2008.12187", "title": "Graph Neural Network Architecture Search for Molecular Property Prediction", "category": "?" }, { "rank": 4, "arxiv_id": "2005.13607", "title": "Multi-View Graph Neural Networks for Molecular Property Prediction", "category": "?" }, { "rank": 5, "arxiv_id": "2410.12156", "title": "FragNet: A Graph Neural Network for Molecular Property Prediction with Four Layers of Interpretability", "category": "?" }, { "rank": 6, "arxiv_id": "2410.11323", "title": "KA-GNN: Kolmogorov-Arnold Graph Neural Networks for Molecular Property Prediction", "category": "?" }, { "rank": 7, "arxiv_id": "2104.06046", "title": "Which Hyperparameters to Optimise? An Investigation of Evolutionary Hyperparameter Optimisation in Graph Neural Network For Molecular Property Prediction", "category": "?" }, { "rank": 8, "arxiv_id": "2106.15529", "title": "On Graph Neural Network Ensembles for Large-Scale Molecular Property Prediction", "category": "?" }, { "rank": 9, "arxiv_id": "2012.01981", "title": "Advanced Graph and Sequence Neural Networks for Molecular Property Prediction and Drug Discovery", "category": "?" }, { "rank": 10, "arxiv_id": "2405.05205", "title": "Hybrid Quantum Graph Neural Network for Molecular Property Prediction", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "G", "query": "efficient inference for large language models quantization pruning", "description": "LLM compression \u2014 GPTQ, AWQ, SparseGPT, pruning surveys", "rewrite": null, "latency_ms": 1113.6418000096455, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2402.09748", "title": "Model Compression and Efficient Inference for Large Language Models: A Survey", "category": "?" }, { "rank": 2, "arxiv_id": "2410.17170", "title": "Self-calibration for Language Model Quantization and Pruning", "category": "?" }, { "rank": 3, "arxiv_id": "2412.11629", "title": "QPruner: Probabilistic Decision Quantization for Structured Pruning in Large Language Models", "category": "?" }, { "rank": 4, "arxiv_id": "2412.11494", "title": "FTP: A Fine-grained Token-wise Pruner for Large Language Models via Token Routing", "category": "?" }, { "rank": 5, "arxiv_id": "2402.02834", "title": "Shortened LLaMA: Depth Pruning for Large Language Models with Comparison of Retraining Methods", "category": "?" }, { "rank": 6, "arxiv_id": "2309.09507", "title": "Pruning Large Language Models via Accuracy Predictor", "category": "?" }, { "rank": 7, "arxiv_id": "2102.11289", "title": "Ps and Qs: Quantization-aware pruning for efficient low latency neural network inference", "category": "?" }, { "rank": 8, "arxiv_id": "2502.15796", "title": "Pruning as a Defense: Reducing Memorization in Large Language Models", "category": "?" }, { "rank": 9, "arxiv_id": "2502.04348", "title": "Prompt-based Depth Pruning of Large Language Models", "category": "?" }, { "rank": 10, "arxiv_id": "2503.15369", "title": "EfficientLLaVA:Generalizable Auto-Pruning for Large Vision-language Models", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "G", "query": "causal inference in observational studies with machine learning", "description": "Causal ML \u2014 double ML, causal forests, CATE estimation", "rewrite": null, "latency_ms": 967.5587000092492, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2202.12813", "title": "Causal discovery for observational sciences using supervised machine learning", "category": "?" }, { "rank": 2, "arxiv_id": "2002.02770", "title": "A Survey on Causal Inference", "category": "?" }, { "rank": 3, "arxiv_id": "2011.12508", "title": "Causal inference using deep neural networks", "category": "?" }, { "rank": 4, "arxiv_id": "2101.00878", "title": "The Value Added of Machine Learning to Causal Inference: Evidence from Revisited Studies", "category": "?" }, { "rank": 5, "arxiv_id": "2009.10982", "title": "An Introduction to Proximal Causal Learning", "category": "?" }, { "rank": 6, "arxiv_id": "2012.06865", "title": "From controlled to undisciplined data: estimating causal effects in the era of data science using a potential outcome framework", "category": "?" }, { "rank": 7, "arxiv_id": "1805.06826", "title": "The Blessings of Multiple Causes", "category": "?" }, { "rank": 8, "arxiv_id": "1910.09648", "title": "Causal bootstrapping", "category": "?" }, { "rank": 9, "arxiv_id": "2009.13472", "title": "Targeted VAE: Variational and Targeted Learning for Causal Inference", "category": "?" }, { "rank": 10, "arxiv_id": "2406.02584", "title": "A Scoping Review of Earth Observation and Machine Learning for Causal Inference: Implications for the Geography of Poverty", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "G", "query": "multi-task learning with shared representations", "description": "MTL surveys, hard/soft parameter sharing, task relationships", "rewrite": "Multi-task learning shared representations transfer learning joint optimization", "latency_ms": 1785.949699988123, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "1603.02185", "title": "Distributed Multi-Task Learning with Shared Representation", "category": "?" }, { "rank": 2, "arxiv_id": "1603.02041", "title": "Learning Shared Representations in Multi-task Reinforcement Learning", "category": "?" }, { "rank": 3, "arxiv_id": "2102.06177", "title": "Multi-Task Reinforcement Learning with Context-based Representations", "category": "?" }, { "rank": 4, "arxiv_id": "2206.12441", "title": "Joint Representation Training in Sequential Tasks with Shared Structure", "category": "?" }, { "rank": 5, "arxiv_id": "2202.10066", "title": "Multi-task Representation Learning with Stochastic Linear Bandits", "category": "?" }, { "rank": 6, "arxiv_id": "2409.16651", "title": "Learning Representation for Multitask learning through Self Supervised Auxiliary learning", "category": "?" }, { "rank": 7, "arxiv_id": "1804.08139", "title": "Same Representation, Different Attentions: Shareable Sentence Representation Learning from Multiple Tasks", "category": "?" }, { "rank": 8, "arxiv_id": "2304.01354", "title": "Functional Knowledge Transfer with Self-supervised Representation Learning", "category": "?" }, { "rank": 9, "arxiv_id": "1812.00500", "title": "Multi-task Learning of Hierarchical Vision-Language Representation", "category": "?" }, { "rank": 10, "arxiv_id": "2309.16921", "title": "YOLOR-Based Multi-Task Learning", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "H", "query": "how to fine-tune a pre-trained language model for classification", "description": "Practical fine-tuning \u2014 ULMFiT, how-to-fine-tune-BERT papers", "rewrite": null, "latency_ms": 1168.5913000255823, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2004.11493", "title": "UHH-LT at SemEval-2020 Task 12: Fine-Tuning of Pre-Trained Transformer Networks for Offensive Language Detection", "category": "?" }, { "rank": 2, "arxiv_id": "2305.19249", "title": "Preserving Pre-trained Features Helps Calibrate Fine-tuned Language Models", "category": "?" }, { "rank": 3, "arxiv_id": "2305.00350", "title": "POUF: Prompt-oriented unsupervised fine-tuning for large pre-trained models", "category": "?" }, { "rank": 4, "arxiv_id": "2305.18324", "title": "Regex-augmented Domain Transfer Topic Classification based on a Pre-trained Language Model: An application in Financial Domain", "category": "?" }, { "rank": 5, "arxiv_id": "1907.05338", "title": "To Tune or Not To Tune? How About the Best of Both Worlds?", "category": "?" }, { "rank": 6, "arxiv_id": "1910.11959", "title": "FineText: Text Classification via Attention-based Language Model Fine-tuning", "category": "?" }, { "rank": 7, "arxiv_id": "2004.03829", "title": "Exploring Versatile Generative Language Model Via Parameter-Efficient Transfer Learning", "category": "?" }, { "rank": 8, "arxiv_id": "2004.14218", "title": "Exploring Fine-tuning Techniques for Pre-trained Cross-lingual Models via Continual Learning", "category": "?" }, { "rank": 9, "arxiv_id": "2105.12192", "title": "NukeLM: Pre-Trained and Fine-Tuned Language Models for the Nuclear and Energy Domains", "category": "?" }, { "rank": 10, "arxiv_id": "2210.16771", "title": "Parameter-Efficient Tuning Makes a Good Classification Head", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "H", "query": "implementing attention mechanism from scratch", "description": "Implementation-level detail \u2014 attention tutorials, scaled dot product", "rewrite": "Self-Attention Mechanism Implementation Transformer Architecture", "latency_ms": 1706.720200018026, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2503.15758", "title": "ATTENTION2D: Communication Efficient Distributed Self-Attention Mechanism", "category": "?" }, { "rank": 2, "arxiv_id": "2204.13154", "title": "Attention Mechanism in Neural Networks: Where it Comes and Where it Goes", "category": "?" }, { "rank": 3, "arxiv_id": "2502.19214", "title": "A Hybrid Transformer Architecture with a Quantized Self-Attention Mechanism Applied to Molecular Generation", "category": "?" }, { "rank": 4, "arxiv_id": "1811.05544", "title": "An Introductory Survey on Attention Mechanisms in NLP Problems", "category": "?" }, { "rank": 5, "arxiv_id": "1803.02155", "title": "Self-Attention with Relative Position Representations", "category": "?" }, { "rank": 6, "arxiv_id": "2103.05103", "title": "Image Captioning using Multiple Transformers for Self-Attention Mechanism", "category": "?" }, { "rank": 7, "arxiv_id": "2102.03902", "title": "Nystr\\\"omformer: A Nystr\\\"om-Based Algorithm for Approximating Self-Attention", "category": "?" }, { "rank": 8, "arxiv_id": "2108.05340", "title": "Person Re-identification via Attention Pyramid", "category": "?" }, { "rank": 9, "arxiv_id": "2006.04768", "title": "Linformer: Self-Attention with Linear Complexity", "category": "?" }, { "rank": 10, "arxiv_id": "2004.11207", "title": "Self-Attention Attribution: Interpreting Information Interactions Inside Transformer", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "H", "query": "best practices for training stable diffusion models", "description": "Practical SD training \u2014 latent diffusion, classifier-free guidance", "rewrite": null, "latency_ms": 955.2253999863751, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2302.00670", "title": "Stable Target Field for Reduced Variance Score Estimation in Diffusion Models", "category": "?" }, { "rank": 2, "arxiv_id": "2502.05625", "title": "Training-Free Constrained Generation With Stable Diffusion Models", "category": "?" }, { "rank": 3, "arxiv_id": "2306.01984", "title": "DYffusion: A Dynamics-informed Diffusion Model for Spatiotemporal Forecasting", "category": "?" }, { "rank": 4, "arxiv_id": "2411.14430", "title": "Stable Flow: Vital Layers for Training-Free Image Editing", "category": "?" }, { "rank": 5, "arxiv_id": "2303.16509", "title": "HoloDiffusion: Training a 3D Diffusion Model using 2D Images", "category": "?" }, { "rank": 6, "arxiv_id": "2312.02696", "title": "Analyzing and Improving the Training Dynamics of Diffusion Models", "category": "?" }, { "rank": 7, "arxiv_id": "2402.07802", "title": "Towards a mathematical theory for consistency training in diffusion models", "category": "?" }, { "rank": 8, "arxiv_id": "2403.05056", "title": "Stealing Stable Diffusion Prior for Robust Monocular Depth Estimation", "category": "?" }, { "rank": 9, "arxiv_id": "2310.13545", "title": "ScaleLong: Towards More Stable Training of Diffusion Model via Scaling Network Long Skip Connection", "category": "?" }, { "rank": 10, "arxiv_id": "2407.01014", "title": "An Expectation-Maximization Algorithm for Training Clean Diffusion Models from Corrupted Observations", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "H", "query": "building a retrieval augmented generation system", "description": "RAG \u2014 should surface the Lewis et al. RAG paper, REALM, etc.", "rewrite": "retrieval-augmented generation RAG language models knowledge retrieval architectures", "latency_ms": 1782.7779999934137, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2409.13707", "title": "Retrieval Augmented Generation-Based Incident Resolution Recommendation System for IT Support", "category": "?" }, { "rank": 2, "arxiv_id": "2410.15944", "title": "Developing Retrieval Augmented Generation (RAG) based LLM Systems from PDFs: An Experience Report", "category": "?" }, { "rank": 3, "arxiv_id": "2503.18016", "title": "Retrieval Augmented Generation and Understanding in Vision: A Survey and New Outlook", "category": "?" }, { "rank": 4, "arxiv_id": "2503.10677", "title": "A Survey on Knowledge-Oriented Retrieval-Augmented Generation", "category": "?" }, { "rank": 5, "arxiv_id": "2403.00820", "title": "Retrieval Augmented Generation Systems: Automatic Dataset Creation, Evaluation and Boolean Agent Setup", "category": "?" }, { "rank": 6, "arxiv_id": "2402.19473", "title": "Retrieval-Augmented Generation for AI-Generated Content: A Survey", "category": "?" }, { "rank": 7, "arxiv_id": "2406.13249", "title": "R^2AG: Incorporating Retrieval Information into Retrieval Augmented Generation", "category": "?" }, { "rank": 8, "arxiv_id": "2501.15915", "title": "Parametric Retrieval Augmented Generation", "category": "?" }, { "rank": 9, "arxiv_id": "2407.13193", "title": "Retrieval-Augmented Generation for Natural Language Processing: A Survey", "category": "?" }, { "rank": 10, "arxiv_id": "2401.15884", "title": "Corrective Retrieval Augmented Generation", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "H", "query": "how to do distributed training with PyTorch across GPUs", "description": "Distributed training \u2014 ZeRO, Megatron, FSDP, DeepSpeed papers", "rewrite": null, "latency_ms": 967.3073999583721, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2006.15704", "title": "PyTorch Distributed: Experiences on Accelerating Data Parallel Training", "category": "?" }, { "rank": 2, "arxiv_id": "2101.07956", "title": "PyTorch-Direct: Enabling GPU Centric Data Access for Very Large Graph Neural Network Training with Irregular Accesses", "category": "?" }, { "rank": 3, "arxiv_id": "2302.09406", "title": "{\\ae}net-PyTorch: a GPU-supported implementation for machine learning atomic potentials training", "category": "?" }, { "rank": 4, "arxiv_id": "2309.06497", "title": "A Distributed Data-Parallel PyTorch Implementation of the Distributed Shampoo Optimizer for Training Neural Networks At-Scale", "category": "?" }, { "rank": 5, "arxiv_id": "2103.13262", "title": "FastMoE: A Fast Mixture-of-Expert Training System", "category": "?" }, { "rank": 6, "arxiv_id": "2410.06511", "title": "TorchTitan: One-stop PyTorch native solution for production ready LLM pre-training", "category": "?" }, { "rank": 7, "arxiv_id": "2206.06356", "title": "Modern Distributed Data-Parallel Large-Scale Pre-training Strategies For NLP models", "category": "?" }, { "rank": 8, "arxiv_id": "1811.05233", "title": "Massively Distributed SGD: ImageNet/ResNet-50 Training in a Flash", "category": "?" }, { "rank": 9, "arxiv_id": "2412.06041", "title": "PyPOD-GP: Using PyTorch for Accelerated Chip-Level Thermal Simulation of the GPU", "category": "?" }, { "rank": 10, "arxiv_id": "2304.14226", "title": "TorchBench: Benchmarking PyTorch with High API Surface Coverage", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "I", "query": "transformer vs CNN for image classification", "description": "ViT vs ResNet/EfficientNet \u2014 should surface comparison papers", "rewrite": "Transformer CNN image classification comparison Vision Transformer ViT", "latency_ms": 1903.2504000351764, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2406.03478", "title": "Convolutional Neural Networks and Vision Transformers for Fashion MNIST Classification: A Literature Review", "category": "?" }, { "rank": 2, "arxiv_id": "2504.08481", "title": "A Hybrid Fully Convolutional CNN-Transformer Model for Inherently Interpretable Medical Image Classification", "category": "?" }, { "rank": 3, "arxiv_id": "2108.09038", "title": "Is it Time to Replace CNNs with Transformers for Medical Images?", "category": "?" }, { "rank": 4, "arxiv_id": "2108.09147", "title": "Convolutional Neural Network (CNN) vs Vision Transformer (ViT) for Digital Holography", "category": "?" }, { "rank": 5, "arxiv_id": "2112.00965", "title": "Vision Pair Learning: An Efficient Training Framework for Image Classification", "category": "?" }, { "rank": 6, "arxiv_id": "2406.00237", "title": "A Comparative Study of CNN, ResNet, and Vision Transformers for Multi-Classification of Chest Diseases", "category": "?" }, { "rank": 7, "arxiv_id": "2110.14731", "title": "Vision Transformer for Classification of Breast Ultrasound Images", "category": "?" }, { "rank": 8, "arxiv_id": "2409.12026", "title": "On Vision Transformers for Classification Tasks in Side-Scan Sonar Imagery", "category": "?" }, { "rank": 9, "arxiv_id": "2103.05940", "title": "TransMed: Transformers Advance Multi-modal Medical Image Classification", "category": "?" }, { "rank": 10, "arxiv_id": "2108.03414", "title": "Vision Transformer for femur fracture classification", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "I", "query": "survey of large language models", "description": "LLM surveys \u2014 Zhao et al. survey, Minaee survey", "rewrite": "large language models survey LLMs BERT transformer architectures evaluation benchmarks", "latency_ms": 2101.066200004425, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2411.11072", "title": "Multilingual Large Language Models: A Systematic Survey", "category": "?" }, { "rank": 2, "arxiv_id": "2406.10833", "title": "A Comprehensive Survey of Scientific Large Language Models and Their Applications in Scientific Discovery", "category": "?" }, { "rank": 3, "arxiv_id": "2309.15025", "title": "Large Language Model Alignment: A Survey", "category": "?" }, { "rank": 4, "arxiv_id": "2311.05876", "title": "Trends in Integration of Knowledge and Large Language Models: A Survey and Taxonomy of Methods, Benchmarks, and Applications", "category": "?" }, { "rank": 5, "arxiv_id": "2404.15777", "title": "A Comprehensive Survey on Evaluating Large Language Model Applications in the Medical Industry", "category": "?" }, { "rank": 6, "arxiv_id": "2412.03220", "title": "Survey of different Large Language Model Architectures: Trends, Benchmarks, and Challenges", "category": "?" }, { "rank": 7, "arxiv_id": "2505.15957", "title": "Towards Holistic Evaluation of Large Audio-Language Models: A Comprehensive Survey", "category": "?" }, { "rank": 8, "arxiv_id": "2405.19323", "title": "Are Large Language Models Chameleons? An Attempt to Simulate Social Surveys", "category": "?" }, { "rank": 9, "arxiv_id": "2309.17447", "title": "A Large Language Model Approach to Educational Survey Feedback Analysis", "category": "?" }, { "rank": 10, "arxiv_id": "2310.19736", "title": "Evaluating Large Language Models: A Comprehensive Survey", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "I", "query": "comparison of object detection architectures YOLO vs DETR", "description": "YOLO family vs transformer-based detection", "rewrite": null, "latency_ms": 1010.0513999932446, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2504.13099", "title": "RF-DETR Object Detection vs YOLOv12 : A Study of Transformer-based and CNN-based Architectures for Single-Class and Multi-Class Greenfruit Detection in Complex Orchard Environments Under Label Ambiguity", "category": "?" }, { "rank": 2, "arxiv_id": "2211.06588", "title": "DEYO: DETR with YOLO for Step-by-Step Object Detection", "category": "?" }, { "rank": 3, "arxiv_id": "2304.08069", "title": "DETRs Beat YOLOs on Real-time Object Detection", "category": "?" }, { "rank": 4, "arxiv_id": "2309.11851", "title": "DEYOv3: DETR with YOLO for Real-time Object Detection", "category": "?" }, { "rank": 5, "arxiv_id": "2402.16370", "title": "DEYO: DETR with YOLO for End-to-End Object Detection", "category": "?" }, { "rank": 6, "arxiv_id": "2504.18586", "title": "A Decade of You Only Look Once (YOLO) for Object Detection", "category": "?" }, { "rank": 7, "arxiv_id": "2406.03459", "title": "LW-DETR: A Transformer Replacement to YOLO for Real-Time Detection", "category": "?" }, { "rank": 8, "arxiv_id": "2312.12314", "title": "First qualitative observations on deep learning vision model YOLO and DETR for automated driving in Austria", "category": "?" }, { "rank": 9, "arxiv_id": "2310.08772", "title": "Investigating the Robustness and Properties of Detection Transformers (DETR) Toward Difficult Images", "category": "?" }, { "rank": 10, "arxiv_id": "2502.12524", "title": "YOLOv12: Attention-Centric Real-Time Object Detectors", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "I", "query": "GAN vs diffusion models for image generation", "description": "Generative model comparison \u2014 StyleGAN, DDPM, score matching", "rewrite": null, "latency_ms": 889.1186999971978, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2410.17966", "title": "A Wavelet Diffusion GAN for Image Super-Resolution", "category": "?" }, { "rank": 2, "arxiv_id": "2403.19645", "title": "GANTASTIC: GAN-based Transfer of Interpretable Directions for Disentangled Image Editing in Text-to-Image Diffusion Models", "category": "?" }, { "rank": 3, "arxiv_id": "2307.08702", "title": "Diffusion Models Beat GANs on Image Classification", "category": "?" }, { "rank": 4, "arxiv_id": "2105.05233", "title": "Diffusion Models Beat GANs on Image Synthesis", "category": "?" }, { "rank": 5, "arxiv_id": "2405.04356", "title": "Diffusion-driven GAN Inversion for Multi-Modal Face Image Generation", "category": "?" }, { "rank": 6, "arxiv_id": "2209.11047", "title": "MIDMs: Matching Interleaved Diffusion Models for Exemplar-based Image Translation", "category": "?" }, { "rank": 7, "arxiv_id": "2302.08908", "title": "LayoutDiffuse: Adapting Foundational Diffusion Models for Layout-to-Image Generation", "category": "?" }, { "rank": 8, "arxiv_id": "2503.23127", "title": "Galaxy Imaging with Generative Models: Insights from a Two-Models Framework", "category": "?" }, { "rank": 9, "arxiv_id": "2301.03396", "title": "Diffused Heads: Diffusion Models Beat GANs on Talking-Face Generation", "category": "?" }, { "rank": 10, "arxiv_id": "2211.16152", "title": "Wavelet Diffusion Models are fast and scalable Image Generators", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "I", "query": "review of federated learning privacy methods", "description": "FL surveys \u2014 McMahan, differential privacy in FL", "rewrite": "Federated learning privacy preservation methods differential privacy homomorphism", "latency_ms": 1966.5430000168271, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2302.04208", "title": "Exploratory Analysis of Federated Learning Methods with Differential Privacy on MIMIC-III", "category": "?" }, { "rank": 2, "arxiv_id": "2109.13012", "title": "Federated Deep Learning with Bayesian Privacy", "category": "?" }, { "rank": 3, "arxiv_id": "2102.05883", "title": "Privacy-Preserving Self-Taught Federated Learning for Heterogeneous Data", "category": "?" }, { "rank": 4, "arxiv_id": "2408.15621", "title": "Convergent Differential Privacy Analysis for General Federated Learning: the $f$-DP Perspective", "category": "?" }, { "rank": 5, "arxiv_id": "2402.00342", "title": "Survey of Privacy Threats and Countermeasures in Federated Learning", "category": "?" }, { "rank": 6, "arxiv_id": "2206.03396", "title": "Group privacy for personalized federated learning", "category": "?" }, { "rank": 7, "arxiv_id": "2311.10832", "title": "Exploring Machine Learning Models for Federated Learning: A Review of Approaches, Performance, and Limitations", "category": "?" }, { "rank": 8, "arxiv_id": "2405.03636", "title": "The Federation Strikes Back: A Survey of Federated Learning Privacy Attacks, Defenses, Applications, and Policy Landscape", "category": "?" }, { "rank": 9, "arxiv_id": "2007.00914", "title": "Federated Learning and Differential Privacy: Software tools analysis, the Sherpa.ai FL framework and methodological guidelines for preserving data privacy", "category": "?" }, { "rank": 10, "arxiv_id": "2501.14453", "title": "Optimal Strategies for Federated Learning Maintaining Client Privacy", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "J", "query": "mixture of experts models scaling", "description": "MoE \u2014 Switch Transformer, Mixtral, GShard", "rewrite": "Mixture of Experts MoE deep learning scalable architectures sparse gating", "latency_ms": 1488.4431999525987, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2502.05172", "title": "Joint MoE Scaling Laws: Mixture of Experts Can Be Memory Efficient", "category": "?" }, { "rank": 2, "arxiv_id": "2303.07226", "title": "Scaling Vision-Language Models with Sparse Mixture of Experts", "category": "?" }, { "rank": 3, "arxiv_id": "2310.07188", "title": "Adaptive Gating in Mixture-of-Experts based Language Models", "category": "?" }, { "rank": 4, "arxiv_id": "2402.07871", "title": "Scaling Laws for Fine-Grained Mixture of Experts", "category": "?" }, { "rank": 5, "arxiv_id": "2401.17118", "title": "Explainable data-driven modeling via mixture of experts: towards effective blending of grey and black-box models", "category": "?" }, { "rank": 6, "arxiv_id": "2407.06204", "title": "A Survey on Mixture of Experts in Large Language Models", "category": "?" }, { "rank": 7, "arxiv_id": "2404.02852", "title": "Toward Inference-optimal Mixture-of-Expert Large Language Models", "category": "?" }, { "rank": 8, "arxiv_id": "2503.00634", "title": "Efficiently Editing Mixture-of-Experts Models with Compressed Experts", "category": "?" }, { "rank": 9, "arxiv_id": "2410.09039", "title": "Semi-Supervised Learning of Noisy Mixture of Experts Models", "category": "?" }, { "rank": 10, "arxiv_id": "2404.08985", "title": "T-REX: Mixture-of-Rank-One-Experts with Semantic-aware Intuition for Multi-task Large Language Model Finetuning", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "J", "query": "test-time compute scaling for reasoning", "description": "New paradigm \u2014 o1-style reasoning, tree search at inference", "rewrite": "test-time compute efficient reasoning scalable inference methods", "latency_ms": 2332.4564999784343, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2504.00869", "title": "m1: Unleash the Potential of Test-Time Scaling for Medical Reasoning with Large Language Models", "category": "?" }, { "rank": 2, "arxiv_id": "2502.05171", "title": "Scaling up Test-Time Compute with Latent Reasoning: A Recurrent Depth Approach", "category": "?" }, { "rank": 3, "arxiv_id": "2502.18080", "title": "Towards Thinking-Optimal Scaling of Test-Time Compute for LLM Reasoning", "category": "?" }, { "rank": 4, "arxiv_id": "2504.02890", "title": "Scaling Test-time Compute for Low-resource Languages: Multilingual Reasoning in LLMs", "category": "?" }, { "rank": 5, "arxiv_id": "2505.14733", "title": "The Energy Cost of Reasoning: Analyzing Energy Usage in LLMs with Test-time Compute", "category": "?" }, { "rank": 6, "arxiv_id": "2505.19187", "title": "LIMOPro: Reasoning Refinement for Efficient and Effective Test-time Scaling", "category": "?" }, { "rank": 7, "arxiv_id": "2503.19877", "title": "Scaling Evaluation-time Compute with Reasoning Models as Process Evaluators", "category": "?" }, { "rank": 8, "arxiv_id": "2504.01317", "title": "Adaptive Rectification Sampling for Test-Time Compute Scaling", "category": "?" }, { "rank": 9, "arxiv_id": "2501.19393", "title": "s1: Simple test-time scaling", "category": "?" }, { "rank": 10, "arxiv_id": "2502.13962", "title": "Is That Your Final Answer? Test-Time Scaling Improves Selective Question Answering", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "J", "query": "multimodal large language models vision and text", "description": "GPT-4V, LLaVA, Flamingo, multimodal LLMs", "rewrite": null, "latency_ms": 977.2495999932289, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2411.14279", "title": "Looking Beyond Text: Reducing Language bias in Large Vision-Language Models via Multimodal Dual-Attention and Soft-Image Guidance", "category": "?" }, { "rank": 2, "arxiv_id": "2311.17647", "title": "Text as Images: Can Multimodal Large Language Models Follow Printed Instructions in Pixels?", "category": "?" }, { "rank": 3, "arxiv_id": "2410.01744", "title": "Leopard: A Vision Language Model For Text-Rich Multi-Image Tasks", "category": "?" }, { "rank": 4, "arxiv_id": "2412.02104", "title": "Explainable and Interpretable Multimodal Large Language Models: A Comprehensive Survey", "category": "?" }, { "rank": 5, "arxiv_id": "2407.10996", "title": "Visualization Literacy of Multimodal Large Language Models: A Comparative Study", "category": "?" }, { "rank": 6, "arxiv_id": "2411.09273", "title": "Cross-Modal Consistency in Multimodal Large Language Models", "category": "?" }, { "rank": 7, "arxiv_id": "2402.01345", "title": "Skip \\n: A Simple Method to Reduce Hallucination in Large Vision-Language Models", "category": "?" }, { "rank": 8, "arxiv_id": "2502.04395", "title": "Time-VLM: Exploring Multimodal Vision-Language Models for Augmented Time Series Forecasting", "category": "?" }, { "rank": 9, "arxiv_id": "2403.08773", "title": "Veagle: Advancements in Multimodal Representation Learning", "category": "?" }, { "rank": 10, "arxiv_id": "2407.04681", "title": "Rethinking Visual Prompting for Multimodal Large Language Models with External Knowledge", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "J", "query": "state space models as alternative to transformers", "description": "S4, Mamba, H3 \u2014 structured state space models", "rewrite": null, "latency_ms": 970.7190000335686, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2404.09516", "title": "State Space Model for New-Generation Network Alternative to Transformers: A Survey", "category": "?" }, { "rank": 2, "arxiv_id": "2404.16112", "title": "Mamba-360: Survey of State Space Models as Transformer Alternative for Long Sequence Modelling: Methods, Applications, and Challenges", "category": "?" }, { "rank": 3, "arxiv_id": "2402.01032", "title": "Repeat After Me: Transformers are Better than State Space Models at Copying", "category": "?" }, { "rank": 4, "arxiv_id": "2501.16237", "title": "Application of Structured State Space Models to High energy physics with locality-sensitive hashing", "category": "?" }, { "rank": 5, "arxiv_id": "2411.15685", "title": "State-Space Large Audio Language Models", "category": "?" }, { "rank": 6, "arxiv_id": "2404.08819", "title": "The Illusion of State in State-Space Models", "category": "?" }, { "rank": 7, "arxiv_id": "2412.14354", "title": "State Space Models are Strong Text Rerankers", "category": "?" }, { "rank": 8, "arxiv_id": "2405.17394", "title": "The Expressive Capacity of State Space Models: A Formal Language Perspective", "category": "?" }, { "rank": 9, "arxiv_id": "2302.14120", "title": "Diagonal State Space Augmented Transformers for Speech Recognition", "category": "?" }, { "rank": 10, "arxiv_id": "2407.05489", "title": "How Effective are State Space Models for Machine Translation?", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "J", "query": "constitutional AI and AI safety alignment techniques", "description": "Anthropic constitutional AI, RLHF alternatives, safety", "rewrite": null, "latency_ms": 925.6349000497721, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2502.15861", "title": "C3AI: Crafting and Evaluating Constitutions for Constitutional AI", "category": "?" }, { "rank": 2, "arxiv_id": "2501.17112", "title": "Decoding Human Preferences in Alignment: An Improved Approach to Inverse Constitutional AI", "category": "?" }, { "rank": 3, "arxiv_id": "2503.05748", "title": "Alignment, Agency and Autonomy in Frontier AI: A Systems Engineering Perspective", "category": "?" }, { "rank": 4, "arxiv_id": "2503.17365", "title": "How Effective Is Constitutional AI in Small LLMs? A Study on DeepSeek-R1 and Its Peers", "category": "?" }, { "rank": 5, "arxiv_id": "2502.16691", "title": "Toward Responsible Federated Large Language Models: Leveraging a Safety Filter and Constitutional AI", "category": "?" }, { "rank": 6, "arxiv_id": "2411.04127", "title": "Combining Theory of Mind and Kindness for Self-Supervised Human-AI Alignment", "category": "?" }, { "rank": 7, "arxiv_id": "2311.08706", "title": "Aligned: A Platform-based Process for Alignment", "category": "?" }, { "rank": 8, "arxiv_id": "2101.06060", "title": "The Challenge of Value Alignment: from Fairer Algorithms to AI Safety", "category": "?" }, { "rank": 9, "arxiv_id": "2403.18341", "title": "IterAlign: Iterative Constitutional Alignment of Large Language Models", "category": "?" }, { "rank": 10, "arxiv_id": "2410.17271", "title": "Rules, Cases, and Reasoning: Positivist Legal Theory as a Framework for Pluralistic AI Alignment", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "J", "query": "sparse attention mechanisms for long context", "description": "Longformer, BigBird, sparse transformers for 100K+ context", "rewrite": "sparse attention transformers long-range dependencies contextualization", "latency_ms": 1455.3994999732822, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2502.20766", "title": "FlexPrefill: A Context-Aware Sparse Attention Mechanism for Efficient Long-Sequence Inference", "category": "?" }, { "rank": 2, "arxiv_id": "2502.12216", "title": "Tactic: Adaptive Sparse Attention with Clustering and Distribution Fitting for Long-Context LLMs", "category": "?" }, { "rank": 3, "arxiv_id": "2502.01659", "title": "Longer Attention Span: Increasing Transformer Context Length with Sparse Graph Processing Techniques", "category": "?" }, { "rank": 4, "arxiv_id": "2504.16795", "title": "Random Long-Context Access for Mamba via Hardware-aligned Hierarchical Sparse Attention", "category": "?" }, { "rank": 5, "arxiv_id": "2109.01915", "title": "Sparse Spatial Attention Network for Semantic Segmentation", "category": "?" }, { "rank": 6, "arxiv_id": "2412.06198", "title": "SparseAccelerate: Efficient Long-Context Inference for Mid-Range GPUs", "category": "?" }, { "rank": 7, "arxiv_id": "2406.05678", "title": "SinkLoRA: Enhanced Efficiency and Chat Capabilities for Long-Context Large Language Models", "category": "?" }, { "rank": 8, "arxiv_id": "2009.06097", "title": "Cluster-Former: Clustering-based Sparse Transformer for Long-Range Dependency Encoding", "category": "?" }, { "rank": 9, "arxiv_id": "2406.15486", "title": "SampleAttention: Near-Lossless Acceleration of Long Context LLM Inference with Adaptive Structured Sparse Attention", "category": "?" }, { "rank": 10, "arxiv_id": "2406.16747", "title": "Sparser is Faster and Less is More: Efficient Sparse Attention for Long-Range Transformers", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "K", "query": "deep learning for protein structure prediction", "description": "AlphaFold, ESMFold, protein language models", "rewrite": "deep learning protein structure prediction AlphaFold convolutional neural networks", "latency_ms": 1523.7058000057004, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2503.13522", "title": "Advanced Deep Learning Methods for Protein Structure Prediction and Design", "category": "?" }, { "rank": 2, "arxiv_id": "2504.01490", "title": "Deep Learning-Driven Protein Structure Prediction and Design: Key Model Developments by Nobel Laureates and Multi-Domain Applications", "category": "?" }, { "rank": 3, "arxiv_id": "2107.12243", "title": "Protein-RNA interaction prediction with deep learning: Structure matters", "category": "?" }, { "rank": 4, "arxiv_id": "2211.14939", "title": "Applying Deep Reinforcement Learning to the HP Model for Protein Structure Prediction", "category": "?" }, { "rank": 5, "arxiv_id": "2012.09741", "title": "On the performance of deep learning for numerical optimization: an application to protein structure prediction", "category": "?" }, { "rank": 6, "arxiv_id": "2002.05643", "title": "DeepSurf: A surface-based deep learning approach for the prediction of ligand binding sites on proteins", "category": "?" }, { "rank": 7, "arxiv_id": "2412.20329", "title": "Protein Structure Prediction in the 3D HP Model Using Deep Reinforcement Learning", "category": "?" }, { "rank": 8, "arxiv_id": "1610.07187", "title": "Learning Deep Architectures for Interaction Prediction in Structure-based Virtual Screening", "category": "?" }, { "rank": 9, "arxiv_id": "2009.00133", "title": "Unsupervised and Supervised Structure Learning for Protein Contact Prediction", "category": "?" }, { "rank": 10, "arxiv_id": "1910.02845", "title": "Combining docking pose rank and structure with deep learning improves protein-ligand binding mode prediction", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "K", "query": "natural language processing for legal document analysis", "description": "Legal NLP \u2014 contract analysis, legal BERT, court opinion mining", "rewrite": null, "latency_ms": 1012.3439999879338, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2204.07182", "title": "Analysing similarities between legal court documents using natural language processing approaches based on Transformers", "category": "?" }, { "rank": 2, "arxiv_id": "2110.15709", "title": "LegalNLP -- Natural Language Processing methods for the Brazilian Legal Language", "category": "?" }, { "rank": 3, "arxiv_id": "2503.12100", "title": "Large Language Models in Legislative Content Analysis: A Dataset from the Polish Parliament", "category": "?" }, { "rank": 4, "arxiv_id": "1311.6063", "title": "NILE: Fast Natural Language Processing for Electronic Health Records", "category": "?" }, { "rank": 5, "arxiv_id": "2404.06751", "title": "Leveraging open-source models for legal language modeling and analysis: a case study on the Indian constitution", "category": "?" }, { "rank": 6, "arxiv_id": "2203.08244", "title": "Toward Improving Attentive Neural Networks in Legal Text Processing", "category": "?" }, { "rank": 7, "arxiv_id": "2410.21306", "title": "Natural Language Processing for the Legal Domain: A Survey of Tasks, Datasets, Models, and Challenges", "category": "?" }, { "rank": 8, "arxiv_id": "2309.05500", "title": "NeCo@ALQAC 2023: Legal Domain Knowledge Acquisition for Low-Resource Languages through Data Enrichment", "category": "?" }, { "rank": 9, "arxiv_id": "1806.03688", "title": "LexNLP: Natural language processing and information extraction for legal and regulatory texts", "category": "?" }, { "rank": 10, "arxiv_id": "1709.05563", "title": "Data Innovation for International Development: An overview of natural language processing for qualitative data analysis", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "K", "query": "machine learning for climate change prediction", "description": "Climate ML \u2014 weather forecasting, carbon modeling", "rewrite": "climate change prediction machine learning modeling uncertainty quantification", "latency_ms": 2138.445299991872, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "1806.11037", "title": "Using machine learning to parameterize moist convection: potential for modeling of climate, climate change and extreme events", "category": "?" }, { "rank": 2, "arxiv_id": "2112.08440", "title": "Climate-Invariant Machine Learning", "category": "?" }, { "rank": 3, "arxiv_id": "2311.09413", "title": "Leveraging machine learning to enhance climate models: a review", "category": "?" }, { "rank": 4, "arxiv_id": "2503.08163", "title": "XAI4Extremes: An interpretable machine learning framework for understanding extreme-weather precursors under climate change", "category": "?" }, { "rank": 5, "arxiv_id": "2310.09162", "title": "Quantum Machine Learning in Climate Change and Sustainability: a Review", "category": "?" }, { "rank": 6, "arxiv_id": "2207.07390", "title": "Machine learning applications for weather and climate need greater focus on extremes", "category": "?" }, { "rank": 7, "arxiv_id": "1906.05433", "title": "Tackling Climate Change with Machine Learning", "category": "?" }, { "rank": 8, "arxiv_id": "2310.03180", "title": "Accessing Convective Hazards Frequency Shift with Climate Change using Physics-Informed Machine Learning", "category": "?" }, { "rank": 9, "arxiv_id": "2107.07997", "title": "Uncertainty Prediction for Machine Learning Models of Material Properties", "category": "?" }, { "rank": 10, "arxiv_id": "1303.2739", "title": "Machine Learning for Bioclimatic Modelling", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "K", "query": "using transformers for time series forecasting", "description": "Time series transformers \u2014 Informer, Autoformer, PatchTST", "rewrite": "Transformer time series forecasting Prophet LSTM Seq2Seq", "latency_ms": 1477.9143999912776, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2207.05397", "title": "Dateformer: Time-modeling Transformer for Longer-term Series Forecasting", "category": "?" }, { "rank": 2, "arxiv_id": "2206.04038", "title": "Scaleformer: Iterative Multi-scale Refining Transformers for Time Series Forecasting", "category": "?" }, { "rank": 3, "arxiv_id": "2402.06638", "title": "Transformers with Attentive Federated Aggregation for Time Series Stock Forecasting", "category": "?" }, { "rank": 4, "arxiv_id": "2501.02735", "title": "Sequence Complementor: Complementing Transformers For Time Series Forecasting with Learnable Sequences", "category": "?" }, { "rank": 5, "arxiv_id": "2411.01419", "title": "PSformer: Parameter-efficient Transformer with Segment Attention for Time Series Forecasting", "category": "?" }, { "rank": 6, "arxiv_id": "2209.03945", "title": "W-Transformers : A Wavelet-based Transformer Framework for Univariate Time Series Forecasting", "category": "?" }, { "rank": 7, "arxiv_id": "2210.17393", "title": "Probabilistic Decomposition Transformer for Time Series Forecasting", "category": "?" }, { "rank": 8, "arxiv_id": "2503.09791", "title": "Minimal Time Series Transformer", "category": "?" }, { "rank": 9, "arxiv_id": "2408.02279", "title": "DRFormer: Multi-Scale Transformer Utilizing Diverse Receptive Fields for Long Time-Series Forecasting", "category": "?" }, { "rank": 10, "arxiv_id": "2310.01232", "title": "Modality-aware Transformer for Financial Time series Forecasting", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "K", "query": "reinforcement learning for robotics manipulation", "description": "RL + robotics \u2014 sim-to-real transfer, dexterous manipulation", "rewrite": "reinforcement learning robotics manipulation control policy optimization deep learning", "latency_ms": 1636.6290000150912, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2102.04148", "title": "Deep Reinforcement Learning for the Control of Robotic Manipulation: A Focussed Mini-Review", "category": "?" }, { "rank": 2, "arxiv_id": "1701.08878", "title": "Deep Reinforcement Learning for Robotic Manipulation-The state of the art", "category": "?" }, { "rank": 3, "arxiv_id": "1610.00633", "title": "Deep Reinforcement Learning for Robotic Manipulation with Asynchronous Off-Policy Updates", "category": "?" }, { "rank": 4, "arxiv_id": "1803.10371", "title": "Reinforcement learning for non-prehensile manipulation: Transfer from simulation to physical system", "category": "?" }, { "rank": 5, "arxiv_id": "1910.07294", "title": "Reinforcement Learning for Robotic Manipulation using Simulated Locomotion Demonstrations", "category": "?" }, { "rank": 6, "arxiv_id": "2107.13356", "title": "Value-Based Reinforcement Learning for Continuous Control Robotic Manipulation in Multi-Task Sparse Reward Settings", "category": "?" }, { "rank": 7, "arxiv_id": "2210.08126", "title": "Geometric Reinforcement Learning For Robotic Manipulation", "category": "?" }, { "rank": 8, "arxiv_id": "2311.11287", "title": "Tactile Active Inference Reinforcement Learning for Efficient Robotic Manipulation Skill Acquisition", "category": "?" }, { "rank": 9, "arxiv_id": "1704.03073", "title": "Data-efficient Deep Reinforcement Learning for Dexterous Manipulation", "category": "?" }, { "rank": 10, "arxiv_id": "2304.06055", "title": "Exploiting Symmetry and Heuristic Demonstrations in Off-policy Reinforcement Learning for Robotic Manipulation", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "L", "query": "AI ethics", "description": "Very broad \u2014 should return survey-level papers on AI ethics/fairness/bias", "rewrite": "AI ethics fairness accountability transparency explainability bias mitigation", "latency_ms": 1728.8928999914788, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2302.12149", "title": "Beyond Bias and Compliance: Towards Individual Agency and Plurality of Ethics in AI", "category": "?" }, { "rank": 2, "arxiv_id": "2403.14681", "title": "AI Ethics: A Bibliometric Analysis, Critical Issues, and Key Gaps", "category": "?" }, { "rank": 3, "arxiv_id": "2109.07906", "title": "Ethics of AI: A Systematic Literature Review of Principles and Challenges", "category": "?" }, { "rank": 4, "arxiv_id": "2304.08275", "title": "Implementing Responsible AI: Tensions and Trade-Offs Between Ethics Aspects", "category": "?" }, { "rank": 5, "arxiv_id": "2207.01493", "title": "AI Ethics: An Empirical Study on the Views of Practitioners and Lawmakers", "category": "?" }, { "rank": 6, "arxiv_id": "2307.10057", "title": "Ethics in the Age of AI: An Analysis of AI Practitioners' Awareness and Challenges", "category": "?" }, { "rank": 7, "arxiv_id": "2503.18842", "title": "Three Kinds of AI Ethics", "category": "?" }, { "rank": 8, "arxiv_id": "2206.09514", "title": "Ethics in AI through the Practitioner's View: A Grounded Theory Literature Review", "category": "?" }, { "rank": 9, "arxiv_id": "2403.05551", "title": "A Bibliometric View of AI Ethics Development", "category": "?" }, { "rank": 10, "arxiv_id": "2501.08497", "title": "Addressing Intersectionality, Explainability, and Ethics in AI-Driven Diagnostics: A Rebuttal and Call for Transdiciplinary Action", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "L", "query": "embedding", "description": "Single word \u2014 highly ambiguous. Word2Vec? Sentence embeddings? Image embeddings?", "rewrite": "word embeddings neural language models representation learning", "latency_ms": 1689.5794000010937, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "1607.06532", "title": "Novel Word Embedding and Translation-based Language Modeling for Extractive Speech Summarization", "category": "?" }, { "rank": 2, "arxiv_id": "1608.05852", "title": "Learning Word Embeddings from Intrinsic and Extrinsic Views", "category": "?" }, { "rank": 3, "arxiv_id": "1611.05962", "title": "Word and Document Embeddings based on Neural Network Approaches", "category": "?" }, { "rank": 4, "arxiv_id": "1502.05746", "title": "Binary Embedding: Fundamental Limits and Fast Algorithm", "category": "?" }, { "rank": 5, "arxiv_id": "1701.05291", "title": "Heterogeneous Information Network Embedding for Meta Path based Proximity", "category": "?" }, { "rank": 6, "arxiv_id": "2309.11824", "title": "Word Embedding with Neural Probabilistic Prior", "category": "?" }, { "rank": 7, "arxiv_id": "1412.6448", "title": "Embedding Word Similarity with Neural Machine Translation", "category": "?" }, { "rank": 8, "arxiv_id": "1705.03556", "title": "Relevance-based Word Embedding", "category": "?" }, { "rank": 9, "arxiv_id": "1910.03505", "title": "Investigating the Effectiveness of Representations Based on Word-Embeddings in Active Learning for Labelling Text Datasets", "category": "?" }, { "rank": 10, "arxiv_id": "1705.07368", "title": "Mixed Membership Word Embeddings for Computational Social Science", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "L", "query": "language model", "description": "Broad \u2014 should return influential LM papers or surveys", "rewrite": "neural language models NLP transformer architectures deep learning", "latency_ms": 1597.907799994573, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "1606.00499", "title": "Generalizing and Hybridizing Count-based and Neural Language Models", "category": "?" }, { "rank": 2, "arxiv_id": "2205.01398", "title": "Neural language models for network configuration: Opportunities and reality check", "category": "?" }, { "rank": 3, "arxiv_id": "1502.01446", "title": "Beyond Word-based Language Model in Statistical Machine Translation", "category": "?" }, { "rank": 4, "arxiv_id": "1909.04985", "title": "Learning Dynamic Author Representations with Temporal Language Models", "category": "?" }, { "rank": 5, "arxiv_id": "2412.03220", "title": "Survey of different Large Language Model Architectures: Trends, Benchmarks, and Challenges", "category": "?" }, { "rank": 6, "arxiv_id": "1801.08771", "title": "Modeling of languages for tensor manipulation", "category": "?" }, { "rank": 7, "arxiv_id": "2111.00610", "title": "Towards Language Modelling in the Speech Domain Using Sub-word Linguistic Units", "category": "?" }, { "rank": 8, "arxiv_id": "2205.05128", "title": "Human Language Modeling", "category": "?" }, { "rank": 9, "arxiv_id": "2109.08270", "title": "Language Models as a Knowledge Source for Cognitive Agents", "category": "?" }, { "rank": 10, "arxiv_id": "2110.10470", "title": "Interpreting Deep Learning Models in Natural Language Processing: A Review", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "L", "query": "generate images from text", "description": "Casual \u2014 should surface DALL-E, Stable Diffusion, Imagen", "rewrite": "text-to-image synthesis generative models diffusion transformers", "latency_ms": 1434.7260000067763, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "1806.11302", "title": "Generate the corresponding Image from Text Description using Modified GAN-CLS Algorithm", "category": "?" }, { "rank": 2, "arxiv_id": "2309.00810", "title": "RenAIssance: A Survey into AI Text-to-Image Generation in the Era of Large Model", "category": "?" }, { "rank": 3, "arxiv_id": "2209.10948", "title": "Implementing and Experimenting with Diffusion Models for Text-to-Image Generation", "category": "?" }, { "rank": 4, "arxiv_id": "1910.04056", "title": "Text-to-Image Synthesis Based on Machine Generated Captions", "category": "?" }, { "rank": 5, "arxiv_id": "2303.07909", "title": "Text-to-image Diffusion Models in Generative AI: A Survey", "category": "?" }, { "rank": 6, "arxiv_id": "2407.06079", "title": "Layered Diffusion Model for One-Shot High Resolution Text-to-Image Synthesis", "category": "?" }, { "rank": 7, "arxiv_id": "1904.01310", "title": "DM-GAN: Dynamic Memory Generative Adversarial Networks for Text-to-Image Synthesis", "category": "?" }, { "rank": 8, "arxiv_id": "2505.10046", "title": "Exploring the Deep Fusion of Large Language Models and Diffusion Transformers for Text-to-Image Synthesis", "category": "?" }, { "rank": 9, "arxiv_id": "1612.03242", "title": "StackGAN: Text to Photo-realistic Image Synthesis with Stacked Generative Adversarial Networks", "category": "?" }, { "rank": 10, "arxiv_id": "2407.06642", "title": "Powerful and Flexible: Personalized Text-to-Image Generation via Reinforcement Learning", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "L", "query": "make AI more safe", "description": "Very casual \u2014 should surface alignment/safety papers", "rewrite": "AI safety robustness adversarial attacks fairness transparency explainability", "latency_ms": 1531.0878999880515, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2504.16110", "title": "Security-First AI: Foundations for Robust and Trustworthy Systems", "category": "?" }, { "rank": 2, "arxiv_id": "2405.06624", "title": "Towards Guaranteed Safe AI: A Framework for Ensuring Robust and Reliable AI Systems", "category": "?" }, { "rank": 3, "arxiv_id": "2403.10462", "title": "Safety Cases: How to Justify the Safety of Advanced AI Systems", "category": "?" }, { "rank": 4, "arxiv_id": "2309.12321", "title": "A Case for AI Safety via Law", "category": "?" }, { "rank": 5, "arxiv_id": "2409.07878", "title": "Mapping Technical Safety Research at AI Companies: A literature review and incentives analysis", "category": "?" }, { "rank": 6, "arxiv_id": "2408.12935", "title": "Trustworthy, Responsible, and Safe AI: A Comprehensive Architectural Framework for AI Safety with Challenges and Mitigations", "category": "?" }, { "rank": 7, "arxiv_id": "2411.18526", "title": "NeuroAI for AI Safety", "category": "?" }, { "rank": 8, "arxiv_id": "2201.10436", "title": "Safe AI -- How is this Possible?", "category": "?" }, { "rank": 9, "arxiv_id": "2502.09288", "title": "AI Safety for Everyone", "category": "?" }, { "rank": 10, "arxiv_id": "2410.21572", "title": "Safety cases for frontier AI", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "M", "query": "improvements to the original transformer architecture", "description": "Post-Vaswani improvements \u2014 Reformer, Performer, ALiBi, RoPE", "rewrite": "Transformer-XL BERT RoBERTa DistilBERT efficient attention mechanisms", "latency_ms": 1451.1854000156745, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2410.23182", "title": "ProTransformer: Robustify Transformers via Plug-and-Play Paradigm", "category": "?" }, { "rank": 2, "arxiv_id": "2305.14768", "title": "Dual Path Transformer with Partition Attention", "category": "?" }, { "rank": 3, "arxiv_id": "2503.18565", "title": "Distil-xLSTM: Learning Attention Mechanisms through Recurrent Structures", "category": "?" }, { "rank": 4, "arxiv_id": "2503.15983", "title": "InhibiDistilbert: Knowledge Distillation for a ReLU and Addition-based Transformer", "category": "?" }, { "rank": 5, "arxiv_id": "2501.06098", "title": "ELFATT: Efficient Linear Fast Attention for Vision Transformers", "category": "?" }, { "rank": 6, "arxiv_id": "2311.12678", "title": "Interpretation of the Transformer and Improvement of the Extractor", "category": "?" }, { "rank": 7, "arxiv_id": "2004.05150", "title": "Longformer: The Long-Document Transformer", "category": "?" }, { "rank": 8, "arxiv_id": "2503.16726", "title": "EDiT: Efficient Diffusion Transformers with Linear Compressed Attention", "category": "?" }, { "rank": 9, "arxiv_id": "1906.05714", "title": "A Multiscale Visualization of Attention in the Transformer Model", "category": "?" }, { "rank": 10, "arxiv_id": "2210.11909", "title": "Boosting vision transformers for image retrieval", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "M", "query": "papers that cite ResNet and extend residual connections", "description": "ResNet extensions \u2014 DenseNet, ResNeXt, WideResNet, SE-Net", "rewrite": null, "latency_ms": 859.7527000238188, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "1904.01367", "title": "Why ResNet Works? Residuals Generalize", "category": "?" }, { "rank": 2, "arxiv_id": "1805.07477", "title": "Norm-Preservation: Why Residual Networks Can Become Extremely Deep?", "category": "?" }, { "rank": 3, "arxiv_id": "1910.09599", "title": "On the space-time expressivity of ResNets", "category": "?" }, { "rank": 4, "arxiv_id": "1707.08866", "title": "Deep Residual Learning for Weakly-Supervised Relation Extraction", "category": "?" }, { "rank": 5, "arxiv_id": "1804.10123", "title": "IamNN: Iterative and Adaptive Mobile Neural Network for Efficient Image Classification", "category": "?" }, { "rank": 6, "arxiv_id": "1905.10944", "title": "Identity Connections in Residual Nets Improve Noise Stability", "category": "?" }, { "rank": 7, "arxiv_id": "1611.01186", "title": "Demystifying ResNet", "category": "?" }, { "rank": 8, "arxiv_id": "1805.09585", "title": "Residual Networks as Geodesic Flows of Diffeomorphisms", "category": "?" }, { "rank": 9, "arxiv_id": "2109.12556", "title": "Frequency Disentangled Residual Network", "category": "?" }, { "rank": 10, "arxiv_id": "2004.04989", "title": "Improved Residual Networks for Image and Video Recognition", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "M", "query": "alternatives to RLHF for aligning language models", "description": "DPO, SPIN, KTO \u2014 methods that bypass reward modeling", "rewrite": null, "latency_ms": 1012.4404999660328, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2406.15567", "title": "SAIL: Self-Improving Efficient Online Alignment of Large Language Models", "category": "?" }, { "rank": 2, "arxiv_id": "2302.05206", "title": "The Wisdom of Hindsight Makes Language Models Better Instruction Followers", "category": "?" }, { "rank": 3, "arxiv_id": "2305.06176", "title": "Fine-tuning Language Models with Generative Adversarial Reward Modelling", "category": "?" }, { "rank": 4, "arxiv_id": "2408.14874", "title": "Inverse-Q*: Token Level Reinforcement Learning for Aligning Large Language Models Without Preference Data", "category": "?" }, { "rank": 5, "arxiv_id": "2406.05587", "title": "Creativity Has Left the Chat: The Price of Debiasing Language Models", "category": "?" }, { "rank": 6, "arxiv_id": "2407.04181", "title": "Orchestrating LLMs with Different Personalizations", "category": "?" }, { "rank": 7, "arxiv_id": "2401.11458", "title": "Linear Alignment: A Closed-form Solution for Aligning Human Preferences without Tuning and Feedback", "category": "?" }, { "rank": 8, "arxiv_id": "2403.16649", "title": "CLHA: A Simple yet Effective Contrastive Learning Framework for Human Alignment", "category": "?" }, { "rank": 9, "arxiv_id": "2405.17956", "title": "Unified Preference Optimization: Language Model Alignment Beyond the Preference Frontier", "category": "?" }, { "rank": 10, "arxiv_id": "2306.02231", "title": "Fine-Tuning Language Models with Advantage-Induced Policy Alignment", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 }, { "band": "M", "query": "BERT variants for low resource languages", "description": "mBERT, XLM-R, AfricanBERT, ArabBERT \u2014 multilingual BERT variants", "rewrite": "Multilingual BERT low-resource languages adaptation transfer learning", "latency_ms": 1428.8215999840759, "n_results": 10, "results": [ { "rank": 1, "arxiv_id": "2012.02462", "title": "Fine-tuning BERT for Low-Resource Natural Language Understanding via Active Learning", "category": "?" }, { "rank": 2, "arxiv_id": "2402.14408", "title": "Transferring BERT Capabilities from High-Resource to Low-Resource Languages Using Vocabulary Matching", "category": "?" }, { "rank": 3, "arxiv_id": "2204.05814", "title": "MuCoT: Multilingual Contrastive Training for Question-Answering in Low-resource Languages", "category": "?" }, { "rank": 4, "arxiv_id": "2004.13640", "title": "Extending Multilingual BERT to Low-Resource Languages", "category": "?" }, { "rank": 5, "arxiv_id": "2005.09093", "title": "Are All Languages Created Equal in Multilingual BERT?", "category": "?" }, { "rank": 6, "arxiv_id": "2012.15562", "title": "UNKs Everywhere: Adapting Multilingual Language Models to New Scripts", "category": "?" }, { "rank": 7, "arxiv_id": "2409.10965", "title": "Cross-lingual transfer of multilingual models on low resource African Languages", "category": "?" }, { "rank": 8, "arxiv_id": "2212.12510", "title": "MicroBERT: Effective Training of Low-resource Monolingual BERTs through Parameter Reduction and Multitask Learning", "category": "?" }, { "rank": 9, "arxiv_id": "2408.03172", "title": "Leveraging Parameter Efficient Training Methods for Low Resource Text Classification: A Case Study in Marathi", "category": "?" }, { "rank": 10, "arxiv_id": "1907.00409", "title": "Evaluating Language Model Finetuning Techniques for Low-resource Languages", "category": "?" } ], "expected_id": null, "expected_found": null, "expected_rank": null, "topic_diversity": 0 } ]