Spaces:

amarck
/

Researcher

Sleeping

File size: 8,502 Bytes

a0f27fa
 
 
 
 
430d0f8
a0f27fa
 
 
 
 
 
430d0f8
a0f27fa
 
 
 
 
 
430d0f8
a0f27fa
 
 
 
 
 
430d0f8
a0f27fa
 
 
 
 
 
430d0f8
a0f27fa
 
 
 
 
 
430d0f8
a0f27fa
 
 
 
 
 
430d0f8
a0f27fa
 
 
 
 
 
430d0f8
a0f27fa
 
 
 
 
 
430d0f8
a0f27fa
 
 
 
 
 
430d0f8
a0f27fa
 
 
 
 
 
430d0f8
a0f27fa
 
 
 
 
 
430d0f8
a0f27fa
 
 
 
 
 
430d0f8
a0f27fa
 
 
 
 
 
430d0f8
a0f27fa
 
 
 
 
 
430d0f8
a0f27fa
 
 
 
 
 
430d0f8
a0f27fa
 
 
 
 
 
430d0f8
a0f27fa
 
 
 
 
 
430d0f8
a0f27fa
 
 
 
 
 
430d0f8
a0f27fa
 
 
 
 
 
430d0f8
a0f27fa
 
 
 
 
 
430d0f8
a0f27fa
 
 
 
 
 
430d0f8
a0f27fa
 
 
 
 
 
430d0f8
a0f27fa
 
 
 
 
 
430d0f8
a0f27fa
 
 
 
 
 
430d0f8
a0f27fa
 
 
 
 
 
430d0f8
a0f27fa
 
 
 
 
 
430d0f8
a0f27fa
 
 
 
 
 
430d0f8
a0f27fa
 
 
 
 
 
430d0f8
a0f27fa
 
 
 
 
 
430d0f8
a0f27fa

[
  {
    "arxiv_id": "2401.04088",
    "title": "DeepSeek-Coder-V2: Breaking the Barrier of Closed-Source Models in Code Intelligence",
    "domain": "aiml",
    "categories": ["cs.CL", "cs.SE", "cs.AI"],
    "summary": "Open-source code LLM matching GPT-4 Turbo on coding benchmarks with MoE architecture."
  },
  {
    "arxiv_id": "2403.05530",
    "title": "GaLore: Memory-Efficient LLM Training by Gradient Low-Rank Projection",
    "domain": "aiml",
    "categories": ["cs.LG", "cs.CL"],
    "summary": "Reduces memory usage for LLM training via gradient projection, enabling 7B training on consumer GPUs."
  },
  {
    "arxiv_id": "2402.13616",
    "title": "World Model on Million-Length Video and Language with RingAttention",
    "domain": "aiml",
    "categories": ["cs.CV", "cs.CL", "cs.LG"],
    "summary": "Trains world models on million-token video sequences using ring attention for long context."
  },
  {
    "arxiv_id": "2403.03206",
    "title": "The Claude 3 Model Family",
    "domain": "aiml",
    "categories": ["cs.CL", "cs.AI"],
    "summary": "Multimodal LLM family with strong vision capabilities and extended context windows."
  },
  {
    "arxiv_id": "2402.17764",
    "title": "Sora: A Review on Background, Technology, Limitations, and Opportunities",
    "domain": "aiml",
    "categories": ["cs.CV", "cs.AI"],
    "summary": "Analysis of video generation model capabilities, architecture, and limitations."
  },
  {
    "arxiv_id": "2401.02954",
    "title": "MoE-Mamba: Efficient Selective State Space Models with Mixture of Experts",
    "domain": "aiml",
    "categories": ["cs.LG", "cs.CL"],
    "summary": "Combines Mamba state-space model with mixture-of-experts for efficient scaling."
  },
  {
    "arxiv_id": "2403.09611",
    "title": "Quiet-STaR: Language Models Can Teach Themselves to Think Before Speaking",
    "domain": "aiml",
    "categories": ["cs.CL", "cs.AI", "cs.LG"],
    "summary": "Self-taught reasoning where LLMs learn to generate internal rationale tokens."
  },
  {
    "arxiv_id": "2402.01032",
    "title": "OLMo: Accelerating the Science of Language Models",
    "domain": "aiml",
    "categories": ["cs.CL", "cs.AI"],
    "summary": "Fully open-source LLM with released weights, code, data, and training logs."
  },
  {
    "arxiv_id": "2403.14608",
    "title": "ReALM: Reference Resolution As Language Modeling",
    "domain": "aiml",
    "categories": ["cs.CL", "cs.AI"],
    "summary": "Resolves onscreen and conversational references using LLMs for device agents."
  },
  {
    "arxiv_id": "2402.14261",
    "title": "Griffin: Mixing Gated Linear Recurrences with Local Attention for Efficient Language Models",
    "domain": "aiml",
    "categories": ["cs.LG", "cs.CL"],
    "summary": "Hybrid architecture combining gated linear RNNs with local attention, matching transformer quality."
  },
  {
    "arxiv_id": "2401.14196",
    "title": "GPTQ: Accurate Post-Training Quantization for Generative Pre-trained Transformers",
    "domain": "aiml",
    "categories": ["cs.LG", "cs.CL"],
    "summary": "One-shot quantization method reducing LLM size to 3-4 bits with minimal accuracy loss."
  },
  {
    "arxiv_id": "2403.07691",
    "title": "Stealing Part of a Production Language Model",
    "domain": "security",
    "categories": ["cs.CR", "cs.LG", "cs.AI"],
    "summary": "Extracts internal architecture details from production LLM APIs through crafted queries."
  },
  {
    "arxiv_id": "2402.06132",
    "title": "SoK: Where's the Bug? A Study of Bug Localization Tools",
    "domain": "security",
    "categories": ["cs.CR", "cs.SE"],
    "summary": "Systematizes bug localization approaches and evaluates 23 tools on real-world CVEs."
  },
  {
    "arxiv_id": "2401.16727",
    "title": "A Survey of Side-Channel Attacks on Intel SGX",
    "domain": "security",
    "categories": ["cs.CR"],
    "summary": "Comprehensive analysis of side-channel attacks targeting Intel SGX enclaves."
  },
  {
    "arxiv_id": "2403.02783",
    "title": "SyzVegas: Beating Kernel Fuzzing Odds with Reinforcement Learning",
    "domain": "security",
    "categories": ["cs.CR", "cs.SE"],
    "summary": "RL-guided kernel fuzzer that outperforms Syzkaller in bug discovery rate."
  },
  {
    "arxiv_id": "2402.15483",
    "title": "BSIMM: An Empirical Study of 130 Software Security Programs",
    "domain": "security",
    "categories": ["cs.CR", "cs.SE"],
    "summary": "Large-scale study of enterprise security maturity across 130 organizations."
  },
  {
    "arxiv_id": "2403.14469",
    "title": "Reverse Engineering eBPF Programs: Challenges and Approaches",
    "domain": "security",
    "categories": ["cs.CR", "cs.OS"],
    "summary": "Novel techniques for reverse engineering eBPF bytecode in Linux kernel security."
  },
  {
    "arxiv_id": "2401.09577",
    "title": "WiFi-Based Keystroke Inference Attack Using Adversarial CSI Perturbation",
    "domain": "security",
    "categories": ["cs.CR", "cs.NI"],
    "summary": "Exploits WiFi channel state information to infer keystrokes from nearby devices."
  },
  {
    "arxiv_id": "2402.08787",
    "title": "Binary Code Similarity Detection via Graph Neural Networks",
    "domain": "security",
    "categories": ["cs.CR", "cs.SE", "cs.LG"],
    "summary": "GNN-based approach to detect similar binary functions across compilers and architectures."
  },
  {
    "arxiv_id": "2403.01218",
    "title": "Practical Exploitation of DNS Rebinding in IoT Devices",
    "domain": "security",
    "categories": ["cs.CR", "cs.NI"],
    "summary": "Demonstrates DNS rebinding attacks against 15 popular IoT devices in home networks."
  },
  {
    "arxiv_id": "2401.15491",
    "title": "GPU.zip: Side Channel Attacks on GPU-Based Graphical Data Compression",
    "domain": "security",
    "categories": ["cs.CR"],
    "summary": "First cross-origin pixel-stealing attack through GPU hardware data compression."
  },
  {
    "arxiv_id": "2402.03367",
    "title": "CryptoFuzz: Fully Automated Testing of Cryptographic API Misuse",
    "domain": "security",
    "categories": ["cs.CR", "cs.SE"],
    "summary": "Automated fuzzer detecting cryptographic API misuse patterns in Java applications."
  },
  {
    "arxiv_id": "2403.08946",
    "title": "Video Generation Models as World Simulators",
    "domain": "aiml",
    "categories": ["cs.CV", "cs.AI", "cs.LG"],
    "summary": "Explores how video generation models learn physical world dynamics as implicit simulators."
  },
  {
    "arxiv_id": "2402.05929",
    "title": "V-JEPA: Video Joint Embedding Predictive Architecture",
    "domain": "aiml",
    "categories": ["cs.CV", "cs.LG"],
    "summary": "Self-supervised video representation learning that predicts in latent space rather than pixel space."
  },
  {
    "arxiv_id": "2401.10020",
    "title": "AlphaGeometry: Solving Olympiad Geometry without Human Demonstrations",
    "domain": "aiml",
    "categories": ["cs.AI", "cs.LG"],
    "summary": "AI system solving IMO-level geometry problems through neurosymbolic reasoning."
  },
  {
    "arxiv_id": "2403.04132",
    "title": "Design2Code: How Far Are We From Automating Front-End Engineering?",
    "domain": "aiml",
    "categories": ["cs.CV", "cs.CL", "cs.SE"],
    "summary": "Benchmarks multimodal LLMs on converting visual designs to functional HTML/CSS code."
  },
  {
    "arxiv_id": "2402.14905",
    "title": "YOLOv9: Learning What You Want to Learn Using Programmable Gradient Information",
    "domain": "aiml",
    "categories": ["cs.CV"],
    "summary": "New YOLO architecture using programmable gradient information for better object detection."
  },
  {
    "arxiv_id": "2401.06066",
    "title": "MagicVideo-V2: Multi-Stage High-Aesthetic Video Generation",
    "domain": "aiml",
    "categories": ["cs.CV", "cs.AI"],
    "summary": "Multi-stage video generation pipeline producing high-quality aesthetic videos from text."
  },
  {
    "arxiv_id": "2402.01680",
    "title": "Grandmaster-Level Chess Without Search",
    "domain": "aiml",
    "categories": ["cs.AI", "cs.LG"],
    "summary": "Transformer achieving grandmaster chess play through pure pattern recognition without tree search."
  },
  {
    "arxiv_id": "2403.04706",
    "title": "SWE-agent: Agent-Computer Interfaces Enable Automated Software Engineering",
    "domain": "aiml",
    "categories": ["cs.SE", "cs.CL", "cs.AI"],
    "summary": "LLM agent that autonomously fixes GitHub issues by interacting with code repositories."
  }
]