File size: 5,824 Bytes
36143bb ef06a73 45324e0 ef06a73 36143bb 45324e0 ef06a73 36143bb ef06a73 36143bb 45324e0 36143bb 14c0f62 45324e0 995601f 36143bb 8a23004 995601f 36143bb ef06a73 36143bb ef06a73 36143bb ef06a73 36143bb 14c0f62 36143bb 14c0f62 36143bb c1298ea 36143bb c1298ea 36143bb c1298ea ef06a73 36143bb ef06a73 36143bb ef06a73 45324e0 36143bb ef06a73 36143bb ef06a73 36143bb ef06a73 36143bb ef06a73 36143bb ef06a73 36143bb ef06a73 | 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121 122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137 138 139 140 141 142 143 144 145 146 147 148 149 150 151 152 153 154 155 156 157 158 159 160 161 162 163 164 165 166 167 168 169 170 171 172 173 174 175 176 177 178 179 180 181 182 183 184 185 186 187 188 189 190 191 192 193 194 195 196 197 198 199 200 201 202 203 | use std::path::{Path, PathBuf};
use std::sync::Arc;
use std::time::Duration;
use anyhow::{Context, Result};
use camino::Utf8PathBuf;
use reqwest_middleware::{ClientBuilder, ClientWithMiddleware};
use reqwest_retry::{RetryTransientMiddleware, policies::ExponentialBackoff};
use tokio::sync::broadcast;
use crate::downloads::Downloads;
use crate::packages::PackageCatalog;
/// `User-Agent` value of the form `<crate name>/<crate version>`, assembled at
/// compile time from Cargo's `CARGO_PKG_NAME` and `CARGO_PKG_VERSION` variables.
const USER_AGENT: &str = concat!(env!("CARGO_PKG_NAME"), "/", env!("CARGO_PKG_VERSION"));
/// Reference-counted handle to the middleware-wrapped HTTP client; cloning it
/// only clones the `Arc`.
pub type RuntimeHttpClient = Arc<ClientWithMiddleware>;
/// Compute-device preference a [`Runtime`] is created with.
#[derive(Debug, Clone, Copy, PartialEq, Eq)]
pub enum ComputePolicy {
    /// GPU is preferred; `Runtime::wants_gpu` reports `true` for this variant.
    // NOTE(review): presumably consumers fall back to CPU when no GPU is
    // usable — confirm against the code that reads `wants_gpu`.
    PreferGpu,
    /// CPU only; `Runtime::wants_gpu` reports `false` for this variant.
    CpuOnly,
}
/// Tunables used when building the runtime's HTTP client.
#[derive(Debug, Clone)]
pub struct RuntimeHttpConfig {
    /// Connection timeout, in whole seconds.
    pub connect_timeout_secs: u64,
    /// Read timeout, in whole seconds.
    pub read_timeout_secs: u64,
    /// Maximum number of retries handed to the retry policy.
    pub max_retries: u32,
}
impl Default for RuntimeHttpConfig {
fn default() -> Self {
Self {
connect_timeout_secs: 20,
read_timeout_secs: 300,
max_retries: 3,
}
}
}
impl RuntimeHttpConfig {
    /// Builds the shared HTTP client described by this configuration.
    ///
    /// The underlying `reqwest` client carries the crate's `USER_AGENT` and the
    /// configured connect/read timeouts; it is then wrapped with a
    /// transient-error retry middleware using exponential backoff capped at
    /// `max_retries`.
    ///
    /// # Errors
    /// Returns an error if the underlying `reqwest` client cannot be built.
    pub fn build_client(&self) -> Result<RuntimeHttpClient> {
        let connect_timeout = Duration::from_secs(self.connect_timeout_secs);
        let read_timeout = Duration::from_secs(self.read_timeout_secs);

        let plain_client = reqwest::Client::builder()
            .user_agent(USER_AGENT)
            .connect_timeout(connect_timeout)
            .read_timeout(read_timeout)
            .build()?;

        let retry_policy = ExponentialBackoff::builder().build_with_max_retries(self.max_retries);
        let retrying_client = ClientBuilder::new(plain_client)
            .with(RetryTransientMiddleware::new_with_policy(retry_policy))
            .build();

        Ok(Arc::new(retrying_client))
    }
}
// FIXME: move this function to a more appropriate place, e.g. a `config` module
pub fn default_app_data_root() -> Utf8PathBuf {
// Env-override (tests, CI, portable installs).
if let Ok(v) = std::env::var("KOHARU_DATA_ROOT")
&& !v.is_empty()
{
return Utf8PathBuf::from(v);
}
if let Ok(exe) = std::env::current_exe()
&& let Some(root) = exe.parent()
&& root.join("config.toml").is_file()
{
return Utf8PathBuf::from_path_buf(root.to_path_buf())
.unwrap_or_else(|path| Utf8PathBuf::from(path.to_string_lossy().into_owned()));
}
let root = dirs::data_local_dir()
.or_else(dirs::data_dir)
.unwrap_or_else(std::env::temp_dir)
.join("Koharu");
Utf8PathBuf::from_path_buf(root)
.unwrap_or_else(|path| Utf8PathBuf::from(path.to_string_lossy().into_owned()))
}
/// Handle to the shared runtime state.
///
/// Cloning copies only the `Arc`, so every clone refers to the same
/// `RuntimeInner`.
#[derive(Clone)]
pub struct Runtime {
    /// Shared state behind the handle.
    inner: Arc<RuntimeInner>,
}
/// State shared by all clones of a `Runtime`.
struct RuntimeInner {
    /// Root directory the runtime was constructed with.
    root: PathBuf,
    /// Compute preference the runtime was constructed with.
    compute: ComputePolicy,
    /// Download manager created when the runtime is constructed.
    downloads: Downloads,
    /// Package catalog obtained from `PackageCatalog::discover()`.
    packages: PackageCatalog,
}
impl Runtime {
    /// Creates a runtime rooted at `root` with the default HTTP settings.
    ///
    /// # Errors
    /// Propagates any error from [`Runtime::new_with_http`].
    pub fn new(root: impl Into<PathBuf>, compute: ComputePolicy) -> Result<Self> {
        let http = RuntimeHttpConfig::default();
        Self::new_with_http(root, compute, http)
    }

    /// Creates a runtime rooted at `root` with explicit HTTP settings.
    ///
    /// The download manager is given `<root>/runtime/.downloads` and
    /// `<root>/models/huggingface`; the package catalog comes from
    /// `PackageCatalog::discover()`.
    ///
    /// # Errors
    /// Returns an error if `Downloads::new` fails.
    pub fn new_with_http(
        root: impl Into<PathBuf>,
        compute: ComputePolicy,
        http: RuntimeHttpConfig,
    ) -> Result<Self> {
        let root: PathBuf = root.into();
        let downloads_dir = root.join("runtime").join(".downloads");
        let huggingface_dir = root.join("models").join("huggingface");

        let downloads = Downloads::new(downloads_dir, huggingface_dir, &http)?;
        let packages = PackageCatalog::discover();

        let inner = RuntimeInner {
            root,
            compute,
            downloads,
            packages,
        };
        Ok(Self {
            inner: Arc::new(inner),
        })
    }

    /// Root directory this runtime was constructed with.
    pub fn root(&self) -> &Path {
        self.inner.root.as_path()
    }

    /// `true` when the runtime was created with [`ComputePolicy::PreferGpu`].
    pub fn wants_gpu(&self) -> bool {
        self.inner.compute == ComputePolicy::PreferGpu
    }

    /// HTTP client handle obtained from the download manager.
    pub fn http_client(&self) -> RuntimeHttpClient {
        let downloads = &self.inner.downloads;
        downloads.client()
    }

    /// Receiver for download progress events, obtained from the download manager.
    pub fn subscribe_downloads(&self) -> broadcast::Receiver<koharu_core::DownloadProgress> {
        let downloads = &self.inner.downloads;
        downloads.subscribe()
    }

    /// A clone of the download manager.
    pub fn downloads(&self) -> Downloads {
        let downloads = &self.inner.downloads;
        downloads.clone()
    }

    /// Creates the on-disk directory layout, then runs the package catalog's
    /// bootstrap step.
    ///
    /// Directories created (in order): `runtime`, `runtime/.downloads`,
    /// `models`, `models/huggingface`, all under [`Runtime::root`].
    ///
    /// # Errors
    /// Returns an error naming the directory that could not be created, or
    /// whatever `prepare_bootstrap` reports.
    pub async fn prepare(&self) -> Result<()> {
        // NOTE(review): `std::fs` blocks the executor thread; acceptable for a
        // handful of mkdirs, but worth revisiting if this list grows.
        {
            // Scoped so the path temporaries are dropped before the await below.
            let base = self.root();
            let runtime_dir = base.join("runtime");
            let downloads_dir = runtime_dir.join(".downloads");
            let models_dir = base.join("models");
            let huggingface_dir = models_dir.join("huggingface");

            for dir in [&runtime_dir, &downloads_dir, &models_dir, &huggingface_dir] {
                std::fs::create_dir_all(dir)
                    .with_context(|| format!("failed to create `{}`", dir.display()))?;
            }
        }

        let packages = &self.inner.packages;
        packages.prepare_bootstrap(self).await
    }

    /// Directory of the llama runtime, as resolved by `crate::llama::runtime_dir`.
    ///
    /// # Errors
    /// Propagates any error from `crate::llama::runtime_dir`.
    pub fn llama_directory(&self) -> Result<PathBuf> {
        crate::llama::runtime_dir(self)
    }
}
/// Alias for [`Runtime`].
// NOTE(review): presumably kept so code written against the `RuntimeManager`
// name keeps compiling — confirm before removing.
pub type RuntimeManager = Runtime;
#[cfg(test)]
mod tests {
    use std::fs;

    use anyhow::Result;

    use super::*;

    /// Builds a CPU-only runtime rooted at `root` and runs `prepare` on it.
    async fn prepared_runtime(root: &Path) -> Result<Runtime> {
        let runtime = Runtime::new(root, ComputePolicy::CpuOnly)?;
        runtime.prepare().await?;
        Ok(runtime)
    }

    // NOTE(review): both tests are `#[ignore]`d — presumably because `prepare`
    // needs network access or real native libraries; confirm before enabling.

    /// After `prepare`, the llama runtime directory exists under the temp root.
    #[tokio::test]
    #[ignore]
    async fn prepares_llama_runtime_into_configured_root() -> Result<()> {
        let tempdir = tempfile::tempdir()?;
        let runtime = prepared_runtime(tempdir.path()).await?;

        let llama_dir = runtime.llama_directory()?;
        assert!(llama_dir.exists());
        Ok(())
    }

    /// Loading the same library by bare file name twice succeeds while the
    /// first handle is still alive.
    #[tokio::test]
    #[ignore]
    async fn repeated_basename_loads_succeed_after_prepare() -> Result<()> {
        let tempdir = tempfile::tempdir()?;
        let runtime = prepared_runtime(tempdir.path()).await?;
        let dir = runtime.llama_directory()?;

        // First directory entry whose file name mentions "llama"; unreadable
        // entries are skipped.
        let candidate = fs::read_dir(&dir)?
            .flatten()
            .map(|entry| entry.file_name().to_string_lossy().into_owned())
            .find(|name| name.contains("llama"));
        let Some(lib_name) = candidate else {
            anyhow::bail!("no llama library found");
        };

        // Both handles stay bound until the end of the test so the second load
        // happens while the first is still held.
        let _first = crate::load_library_by_name(&lib_name)?;
        let _second = crate::load_library_by_name(&lib_name)?;
        Ok(())
    }
}
|