Spaces:

LOOFYYLO
/

laa-algorithms-demo

Build error

App Files Files Community

laa-algorithms-demo / laa_core /src /lib.rs

LOOFYYLO

Upload laa_core/src/lib.rs with huggingface_hub

ef6a679 verified 2 months ago

raw

history blame contribute delete

17 kB


	use pyo3::prelude::*;
	use rand::Rng;
	use std::collections::HashMap;

	/// Learning-augmented decision rule for the Ski Rental problem.
	///
	/// On every day of a season of unknown length the skier either keeps renting or buys
	/// the skis once for `buy_cost`. The day number is compared directly against a cost
	/// threshold, so renting is implicitly priced at one unit per day. A prediction of the
	/// season length, weighted by a trust factor, shifts the day from which buying is
	/// recommended.
	#[pyclass]
	pub struct SkiRental {
	    /// One-off purchase price, in the same unit as one day of renting.
	    buy_cost: f64,
	}

	#[pymethods]
	impl SkiRental {
	    /// Builds a `SkiRental` rule for the given purchase price.
	    ///
	    /// # Arguments
	    ///
	    /// * `buy_cost` - Price of buying the skis. With `trust == 0.0` this is exactly the
	    ///   day number from which `decide` recommends buying.
	    #[new]
	    pub fn new(buy_cost: f64) -> Self {
	        Self { buy_cost }
	    }

	    /// Reports whether the skis should be bought on the given day.
	    ///
	    /// The buy threshold is the weighted average
	    /// `(1 - trust) * buy_cost + trust * min(prediction, buy_cost)`;
	    /// buying is recommended as soon as `day` reaches it.
	    ///
	    /// # Arguments
	    ///
	    /// * `day` - Current day of the season (1-indexed).
	    /// * `prediction` - Predicted total number of ski days.
	    /// * `trust` - Weight given to the prediction, typically within `[0.0, 1.0]`:
	    ///   `0.0` ignores the prediction, `1.0` uses only the (capped) prediction.
	    ///   The value is not validated or clamped.
	    ///
	    /// # Returns
	    ///
	    /// `true` to buy, `false` to keep renting.
	    pub fn decide(&self, day: u32, prediction: f64, trust: f64) -> bool {
	        // A prediction above the purchase price never moves the threshold past it.
	        let capped_prediction = prediction.min(self.buy_cost);
	        let fallback_weight = 1.0 - trust;
	        let buy_from_day = fallback_weight * self.buy_cost + trust * capped_prediction;
	        f64::from(day) >= buy_from_day
	    }
	}

	/// Randomized, learning-augmented decision rule for the Ski Rental problem.
	///
	/// Instead of switching from renting to buying at a fixed day, every call to
	/// [`RandomizedSkiRental::decide`] draws an independent random decision whose buy
	/// probability grows with the current day and with a prediction-dependent threshold.
	#[pyclass]
	pub struct RandomizedSkiRental {
	    /// One-off purchase price, in the same unit as one day of renting.
	    buy_cost: f64,
	}

	#[pymethods]
	impl RandomizedSkiRental {
	    /// Builds a `RandomizedSkiRental` rule for the given purchase price.
	    ///
	    /// # Arguments
	    ///
	    /// * `buy_cost` - Price of buying the skis.
	    #[new]
	    pub fn new(buy_cost: f64) -> Self {
	        Self { buy_cost }
	    }

	    /// Randomly decides whether to buy the skis on the given day.
	    ///
	    /// The buy probability is `day * threshold / (buy_cost^2 * e)`, limited to
	    /// `[0.0, 1.0]`, where
	    /// `threshold = (1 - trust) * buy_cost + trust * min(prediction, buy_cost)`.
	    /// Each call samples afresh from the thread-local random number generator.
	    ///
	    /// # Arguments
	    ///
	    /// * `day` - Current day of the season (1-indexed).
	    /// * `prediction` - Predicted total number of ski days.
	    /// * `trust` - Weight given to the prediction, typically within `[0.0, 1.0]`.
	    ///
	    /// # Returns
	    ///
	    /// `true` to buy, `false` to keep renting.
	    pub fn decide(&self, day: u32, prediction: f64, trust: f64) -> bool {
	        // Predictions above the purchase price all lead to the same threshold.
	        let capped_prediction = prediction.min(self.buy_cost);
	        let threshold = (1.0 - trust) * self.buy_cost + trust * capped_prediction;

	        // Rent paid so far, at one unit per day.
	        let rent_paid = f64::from(day);
	        let normaliser = self.buy_cost * self.buy_cost * std::f64::consts::E;
	        let raw_probability = rent_paid * threshold / normaliser;

	        // `max` followed by `min` (rather than `clamp`) maps a NaN ratio, e.g. from a
	        // zero `buy_cost`, to 0.0, so `gen_bool` always receives a valid probability.
	        let buy_probability = raw_probability.max(0.0).min(1.0);

	        rand::thread_rng().gen_bool(buy_probability)
	    }
	}

	/// Implements a learning-augmented caching algorithm.
	///
	/// The cache has a fixed capacity. When a new item does not fit, the item whose
	/// predicted next access lies furthest in the future is evicted, instead of relying on
	/// recency alone as LRU (Least Recently Used) does.
	#[pyclass]
	pub struct Caching {
	    /// Maximum number of items the cache may hold.
	    cache_size: usize,
	    /// Predicted next-access time per item ID; smaller means sooner.
	    predictions: HashMap<u32, u32>,
	}

	#[pymethods]
	impl Caching {
	    /// Creates a new `Caching` instance.
	    ///
	    /// # Arguments
	    ///
	    /// * `cache_size` - The maximum number of items the cache can hold.
	    /// * `predictions` - A map where keys are item IDs and values are the predicted
	    ///   time of the next access. Lower values indicate sooner access.
	    #[new]
	    pub fn new(cache_size: usize, predictions: HashMap<u32, u32>) -> Self {
	        Caching {
	            cache_size,
	            predictions,
	        }
	    }

	    /// Processes an item access and returns the updated cache contents.
	    ///
	    /// * If `item` is already cached, the cache is returned unchanged.
	    /// * If it is not cached and there is room, it is appended.
	    /// * Otherwise the cached item with the latest predicted next access is removed
	    ///   and `item` is appended. Items without a prediction count as `u32::MAX`
	    ///   (evicted first); on ties the item closest to the front of `cache` is evicted.
	    /// * A zero-capacity, empty cache is returned unchanged: there is nothing to evict
	    ///   and nothing can be stored.
	    ///
	    /// # Arguments
	    ///
	    /// * `item` - The unique identifier of the item being accessed.
	    /// * `cache` - The current items in the cache.
	    ///
	    /// # Returns
	    ///
	    /// A tuple `(bool, Vec<u32>)`:
	    /// * `.0` - `true` when no eviction was needed (the item was already cached, or it
	    ///   was inserted into free space); `false` when the cache was full.
	    /// * `.1` - The state of the cache after the access.
	    pub fn decide(&self, item: u32, cache: Vec<u32>) -> (bool, Vec<u32>) {
	        // `cache` is owned by this call, so it can be updated in place without a copy.
	        let mut new_cache = cache;
	        if new_cache.contains(&item) {
	            return (true, new_cache);
	        }

	        if new_cache.len() < self.cache_size {
	            new_cache.push(item);
	            return (true, new_cache);
	        }

	        // `max_by_key` keeps the last of several equal maxima; scanning in reverse
	        // therefore selects the first such entry in cache order.
	        let victim = new_cache
	            .iter()
	            .enumerate()
	            .rev()
	            .max_by_key(|&(_, id)| self.predictions.get(id).copied().unwrap_or(u32::MAX))
	            .map(|(index, _)| index);

	        // `victim` is `None` only for an empty cache, i.e. when `cache_size` is 0;
	        // removing from it would panic, so the cache is left as it is.
	        if let Some(index) = victim {
	            new_cache.remove(index);
	            new_cache.push(item);
	        }
	        (false, new_cache)
	    }
	}

	/// Learning-augmented decision rule for the one-way trading problem.
	///
	/// An asset is to be converted at the most favourable moment. The rule trades once
	/// the current price reaches a threshold obtained by blending a fixed reference price
	/// with a predicted future price.
	#[pyclass]
	pub struct OnewayTrading {
	    /// Reference price used for the prediction-free part of the threshold.
	    buy_price: f64,
	}

	#[pymethods]
	impl OnewayTrading {
	    /// Builds an `OnewayTrading` rule around a reference price.
	    ///
	    /// # Arguments
	    ///
	    /// * `buy_price` - Reference price; with `trust == 0.0` it is the trade threshold.
	    #[new]
	    pub fn new(buy_price: f64) -> Self {
	        Self { buy_price }
	    }

	    /// Reports whether the trade should be executed at the current price.
	    ///
	    /// The threshold is `(1 - trust) * buy_price + trust * prediction`; the trade is
	    /// executed when `current_price` is at least that high.
	    ///
	    /// # Arguments
	    ///
	    /// * `current_price` - Current market price of the asset.
	    /// * `prediction` - Predicted future price of the asset.
	    /// * `trust` - Weight given to the prediction, typically within `[0.0, 1.0]`.
	    ///   The value is not validated or clamped.
	    ///
	    /// # Returns
	    ///
	    /// `true` to trade now, `false` to wait.
	    pub fn decide(&self, current_price: f64, prediction: f64, trust: f64) -> bool {
	        let reference_share = (1.0 - trust) * self.buy_price;
	        let forecast_share = trust * prediction;
	        current_price >= reference_share + forecast_share
	    }
	}

	/// Implements a learning-augmented scheduling algorithm (makespan minimization).
	///
	/// Jobs are distributed over a fixed number of identical machines. They are
	/// processed in ascending order of their *predicted* length and each one is placed on
	/// the machine that currently carries the smallest total *actual* load.
	#[pyclass]
	pub struct Scheduling {
	    /// Number of identical machines jobs can be assigned to.
	    num_machines: usize,
	}

	#[pymethods]
	impl Scheduling {
	    /// Creates a new `Scheduling` instance.
	    ///
	    /// # Arguments
	    ///
	    /// * `num_machines` - The number of identical machines available for processing jobs.
	    #[new]
	    pub fn new(num_machines: usize) -> Self {
	        Scheduling { num_machines }
	    }

	    /// Assigns a list of jobs to the available machines.
	    ///
	    /// Jobs are ordered by predicted length (ties keep their input order) and each is
	    /// given to the least-loaded machine, preferring the lowest machine ID on ties.
	    ///
	    /// # Arguments
	    ///
	    /// * `job_lengths` - The true, actual lengths of the jobs.
	    /// * `predictions` - The predicted lengths of the jobs, in the same order as
	    ///   `job_lengths`. A job without a matching prediction is scheduled after all
	    ///   predicted jobs; surplus predictions are ignored.
	    ///
	    /// # Returns
	    ///
	    /// A vector where the element at index `i` is the machine ID
	    /// (0 to `num_machines - 1`) assigned to job `i`. Empty when there are no jobs.
	    ///
	    /// # Panics
	    ///
	    /// Panics if there is at least one job but `num_machines` is zero, because no
	    /// valid machine ID exists in that case.
	    pub fn decide(&self, job_lengths: Vec<u32>, predictions: Vec<u32>) -> Vec<usize> {
	        let job_count = job_lengths.len();
	        if job_count == 0 {
	            return Vec::new();
	        }
	        assert!(
	            self.num_machines > 0,
	            "cannot schedule {} job(s) on zero machines",
	            job_count
	        );

	        // Job indices in scheduling order. The sort is stable, so jobs with equal
	        // predictions keep their input order; a missing prediction sorts last.
	        let mut order: Vec<usize> = (0..job_count).collect();
	        order.sort_by_key(|&job| predictions.get(job).copied().unwrap_or(u32::MAX));

	        let mut assignments = vec![0; job_count];
	        // Loads are summed in u64 so that many long u32 jobs cannot overflow.
	        let mut machine_loads = vec![0u64; self.num_machines];

	        for job in order {
	            // `min_by_key` returns the first minimum, i.e. the lowest machine ID.
	            let machine = machine_loads
	                .iter()
	                .enumerate()
	                .min_by_key(|&(_, load)| *load)
	                .map(|(id, _)| id)
	                .expect("num_machines was checked to be non-zero");
	            assignments[job] = machine;
	            machine_loads[machine] += u64::from(job_lengths[job]);
	        }
	        assignments
	    }
	}

	/// Implements a learning-augmented search algorithm.
	///
	/// The algorithm locates the maximum value in a list, starting its scan at a
	/// predicted index and wrapping around, so that a correct prediction is the first
	/// element examined.
	#[pyclass]
	pub struct Search {
	    // Stored for future extensions only; `decide` does not read it, hence the allow.
	    #[allow(dead_code)]
	    max_value: u32,
	}

	#[pymethods]
	impl Search {
	    /// Creates a new `Search` instance.
	    ///
	    /// # Arguments
	    ///
	    /// * `max_value` - The theoretical maximum possible value in the search space.
	    ///   It is stored but not used by `decide`.
	    #[new]
	    pub fn new(max_value: u32) -> Self {
	        Search { max_value }
	    }

	    /// Finds the index of the maximum value in a list.
	    ///
	    /// The scan starts at `prediction` (or at index 0 when `prediction` is out of
	    /// range), runs to the end of the list and then wraps around to the front. Among
	    /// several equal maxima, the one encountered first in that scan order wins; this
	    /// also holds when every value is zero.
	    ///
	    /// # Arguments
	    ///
	    /// * `values` - The values to search through.
	    /// * `prediction` - The predicted index of the maximum value.
	    ///
	    /// # Returns
	    ///
	    /// The index of the maximum value, or `0` when `values` is empty.
	    pub fn decide(&self, values: Vec<u32>, prediction: u32) -> usize {
	        let len = values.len();
	        // Widening u32 -> usize (lossless on 32- and 64-bit targets); comparing in
	        // usize avoids truncating `len` to u32.
	        let predicted = prediction as usize;
	        let start = if predicted < len { predicted } else { 0 };

	        // `None` means "nothing examined yet", so a maximum of 0 is handled like any
	        // other value instead of being confused with an initial sentinel.
	        let mut best: Option<(usize, u32)> = None;
	        for index in (start..len).chain(0..start) {
	            let value = values[index];
	            let improves = match best {
	                Some((_, current_max)) => value > current_max,
	                None => true,
	            };
	            if improves {
	                best = Some((index, value));
	            }
	        }
	        best.map_or(0, |(index, _)| index)
	    }
	}

	/// Defines the Python module for the Learning-Augmented Algorithms core library.
	///
	/// Registers every class defined in this file (`SkiRental`, `RandomizedSkiRental`,
	/// `Caching`, `OnewayTrading`, `Scheduling`, `Search`) on the module `m`, so that
	/// they can be imported from Python.
	///
	/// Any error returned by `add_class` is propagated to the caller through `?`.
	#[pymodule]
	fn laa_core(m: &Bound<'_, PyModule>) -> PyResult<()> {
	m.add_class::<SkiRental>()?;
	m.add_class::<RandomizedSkiRental>()?;
	m.add_class::<Caching>()?;
	m.add_class::<OnewayTrading>()?;
	m.add_class::<Scheduling>()?;
	m.add_class::<Search>()?;
	Ok(())
	}

	#[cfg(test)]
	mod tests {
	    use super::*;

	    // With zero trust the threshold is the purchase price itself.
	    #[test]
	    fn test_ski_rental_no_trust() {
	        let rule = SkiRental::new(100.0);
	        assert!(!rule.decide(99, 10.0, 0.0));
	        assert!(rule.decide(100, 10.0, 0.0));
	    }

	    // With full trust the threshold is the prediction.
	    #[test]
	    fn test_ski_rental_full_trust_good_prediction() {
	        let rule = SkiRental::new(100.0);
	        assert!(!rule.decide(24, 25.0, 1.0));
	        assert!(rule.decide(25, 25.0, 1.0));
	    }

	    // A prediction of 120 is capped at the purchase price, so the threshold is 100.
	    #[test]
	    fn test_ski_rental_full_trust_bad_prediction() {
	        let rule = SkiRental::new(100.0);
	        assert!(!rule.decide(99, 120.0, 1.0));
	        assert!(rule.decide(100, 120.0, 1.0));
	    }

	    // Accessing a cached item leaves the cache untouched.
	    #[test]
	    fn test_caching_hit() {
	        let policy = Caching::new(3, HashMap::new());
	        let before = vec![1, 2, 3];
	        let (flag, after) = policy.decide(2, before.clone());
	        assert!(flag);
	        assert_eq!(after, before);
	    }

	    // A new item is appended while there is free space; the flag stays `true`.
	    #[test]
	    fn test_caching_miss_no_eviction() {
	        let policy = Caching::new(3, HashMap::new());
	        let (flag, after) = policy.decide(3, vec![1, 2]);
	        assert!(flag);
	        assert_eq!(after, vec![1, 2, 3]);
	    }

	    // Item 3 has the latest predicted access (15) and is therefore evicted.
	    #[test]
	    fn test_caching_miss_with_eviction() {
	        let mut predictions = HashMap::new();
	        for (item, next_access) in [(1, 10), (2, 5), (3, 15)] {
	            predictions.insert(item, next_access);
	        }
	        let policy = Caching::new(3, predictions);
	        let (flag, after) = policy.decide(4, vec![1, 2, 3]);
	        assert!(!flag);
	        assert_eq!(after, vec![1, 2, 4]);
	    }

	    // With zero trust the threshold is the reference price.
	    #[test]
	    fn test_oneway_trading_no_trust() {
	        let rule = OnewayTrading::new(100.0);
	        assert!(!rule.decide(99.0, 120.0, 0.0));
	        assert!(rule.decide(100.0, 120.0, 0.0));
	    }

	    // With full trust the threshold is the predicted price.
	    #[test]
	    fn test_oneway_trading_full_trust() {
	        let rule = OnewayTrading::new(100.0);
	        assert!(!rule.decide(119.0, 120.0, 1.0));
	        assert!(rule.decide(120.0, 120.0, 1.0));
	    }

	    // Jobs are placed in predicted order 0, 1, 2 onto the least-loaded machine.
	    #[test]
	    fn test_scheduling() {
	        let scheduler = Scheduling::new(2);
	        let actual = vec![10, 5, 12];
	        let predicted = vec![5, 10, 12];
	        assert_eq!(scheduler.decide(actual, predicted), vec![0, 1, 1]);
	    }

	    // The prediction points straight at the maximum.
	    #[test]
	    fn test_search() {
	        let finder = Search::new(100);
	        let found = finder.decide(vec![10, 5, 12, 50, 99], 4);
	        assert_eq!(found, 4);
	    }

	    // Monte-Carlo check of the average cost ratio against the offline optimum.
	    #[test]
	    fn test_randomized_ski_rental_statistical() {
	        let buy_cost = 100.0;
	        let num_simulations = 10000;
	        let trust = 0.8;
	        let mut rng = rand::thread_rng();
	        let mut ratio_sum = 0.0;

	        for _ in 0..num_simulations {
	            let ski_days: u32 = rng.gen_range(1..150);
	            // Multiplicative noise of up to +/-30% on the true season length.
	            let noise = rng.gen_range(0.7..1.3);
	            let prediction = (ski_days as f64 * noise).max(1.0);
	            let rule = RandomizedSkiRental::new(buy_cost);

	            // The first "buy" answer is final; without one, every day was rented.
	            let alg_cost = (1..=ski_days)
	                .find(|&day| rule.decide(day, prediction, trust))
	                .map_or(ski_days as f64, |day| (day - 1) as f64 + buy_cost);

	            let optimal_cost = (ski_days as f64).min(buy_cost);
	            ratio_sum += alg_cost / optimal_cost;
	        }

	        let avg_ratio = ratio_sum / num_simulations as f64;
	        assert!(avg_ratio < 1.7, "Average ratio was {}", avg_ratio);
	    }
	}