2023-05-02 04:58:21 -04:00
|
|
|
//! This module provides the functionality to cache the search results fetched and aggregated
|
|
|
|
//! from the upstream search engines in a json format.
|
|
|
|
|
2023-08-27 13:50:42 -04:00
|
|
|
use error_stack::Report;
|
2023-09-13 17:19:44 -04:00
|
|
|
#[cfg(feature = "memory-cache")]
|
2023-09-09 12:17:29 -04:00
|
|
|
use mini_moka::sync::Cache as MokaCache;
|
2023-09-13 17:19:44 -04:00
|
|
|
#[cfg(feature = "memory-cache")]
|
2023-09-09 12:17:29 -04:00
|
|
|
use std::time::Duration;
|
|
|
|
use tokio::sync::Mutex;
|
2023-08-27 13:50:42 -04:00
|
|
|
|
2023-09-14 14:26:08 -04:00
|
|
|
use crate::{config::parser::Config, models::aggregation_models::SearchResults};
|
2023-09-11 17:20:05 -04:00
|
|
|
|
2023-09-17 12:56:48 -04:00
|
|
|
use super::error::CacheError;
|
2023-09-13 17:19:44 -04:00
|
|
|
#[cfg(feature = "redis-cache")]
|
2023-09-12 16:14:54 -04:00
|
|
|
use super::redis_cacher::RedisCache;
|
2023-05-02 04:58:21 -04:00
|
|
|
|
2023-11-28 01:17:35 -05:00
|
|
|
/// Abstraction trait for common methods provided by a cache backend.
|
|
|
|
#[async_trait::async_trait]
|
|
|
|
pub trait Cacher: Send + Sync {
|
|
|
|
// A function that builds the cache from the given configuration.
|
2023-09-17 05:47:02 -04:00
|
|
|
///
|
|
|
|
/// # Arguments
|
|
|
|
///
|
|
|
|
/// * `config` - It takes the config struct as an argument.
|
|
|
|
///
|
|
|
|
/// # Returns
|
|
|
|
///
|
2023-11-28 01:17:35 -05:00
|
|
|
/// It returns a newly initialized backend based on the feature enabled by the user.
|
|
|
|
async fn build(config: &Config) -> Self
|
|
|
|
where
|
|
|
|
Self: Sized;
|
2023-09-17 05:47:02 -04:00
|
|
|
|
2023-09-09 12:17:29 -04:00
|
|
|
/// A function which fetches the cached json results as json string.
|
2023-05-02 04:58:21 -04:00
|
|
|
///
|
|
|
|
/// # Arguments
|
|
|
|
///
|
|
|
|
/// * `url` - It takes an url as a string.
|
2023-09-17 05:47:02 -04:00
|
|
|
///
|
|
|
|
/// # Error
|
|
|
|
///
|
|
|
|
/// Returns the `SearchResults` from the cache if the program executes normally otherwise
|
|
|
|
/// returns a `CacheError` if the results cannot be retrieved from the cache.
|
2023-11-28 01:17:35 -05:00
|
|
|
async fn cached_results(&mut self, url: &str) -> Result<SearchResults, Report<CacheError>>;
|
2023-05-02 04:58:21 -04:00
|
|
|
|
2023-09-09 12:17:29 -04:00
|
|
|
/// A function which caches the results by using the `url` as the key and
|
|
|
|
/// `json results` as the value and stores it in the cache
|
2023-05-02 04:58:21 -04:00
|
|
|
///
|
|
|
|
/// # Arguments
|
|
|
|
///
|
|
|
|
/// * `json_results` - It takes the json results string as an argument.
|
|
|
|
/// * `url` - It takes the url as a String.
|
2023-09-17 05:47:02 -04:00
|
|
|
///
|
|
|
|
/// # Error
|
|
|
|
///
|
|
|
|
/// Returns a unit type if the program caches the given search results without a failure
|
|
|
|
/// otherwise it returns a `CacheError` if the search results cannot be cached due to a
|
|
|
|
/// failure.
|
2023-11-28 01:17:35 -05:00
|
|
|
async fn cache_results(
|
|
|
|
&mut self,
|
|
|
|
search_results: &SearchResults,
|
|
|
|
url: &str,
|
|
|
|
) -> Result<(), Report<CacheError>>;
|
|
|
|
|
|
|
|
/// A helper function which computes the hash of the url and formats and returns it as string.
|
|
|
|
///
|
|
|
|
/// # Arguments
|
|
|
|
///
|
|
|
|
/// * `url` - It takes an url as string.
|
|
|
|
fn hash_url(&self, url: &str) -> String {
|
|
|
|
blake3::hash(url.as_bytes()).to_string()
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
#[cfg(feature = "redis-cache")]
#[async_trait::async_trait]
impl Cacher for RedisCache {
    /// Creates the redis backend from `config.redis_url` and `config.cache_expiry_time`.
    ///
    /// # Panics
    ///
    /// Panics if `RedisCache::new` returns an error.
    async fn build(config: &Config) -> Self {
        log::info!(
            "Initialising redis cache. Listening to {}",
            &config.redis_url
        );
        // NOTE(review): the literal `5` is presumably the connection pool size; confirm
        // against the signature of `RedisCache::new`.
        let connection = RedisCache::new(&config.redis_url, 5, config.cache_expiry_time).await;
        connection.expect("Redis cache configured")
    }

    /// Reads the json stored under the hashed url and deserializes it into `SearchResults`.
    async fn cached_results(&mut self, url: &str) -> Result<SearchResults, Report<CacheError>> {
        let key = self.hash_url(url);
        let json = self.cached_json(key.as_str()).await?;
        let results = serde_json::from_str::<SearchResults>(&json)
            .map_err(|_| CacheError::SerializationError)?;
        Ok(results)
    }

    /// Serializes the results to json and stores them under the hashed url.
    async fn cache_results(
        &mut self,
        search_results: &SearchResults,
        url: &str,
    ) -> Result<(), Report<CacheError>> {
        let serialized = serde_json::to_string(search_results)
            .map_err(|_| CacheError::SerializationError)?;
        let key = self.hash_url(url);
        self.cache_json(&serialized, &key).await
    }
}
|
|
|
|
|
|
|
|
/// Cache backend which keeps the search results in the memory of the running process.
#[cfg(feature = "memory-cache")]
pub struct InMemoryCache {
    /// The underlying store, mapping a hashed url to its `SearchResults`.
    cache: MokaCache<String, SearchResults>,
}
|
|
|
|
|
|
|
|
#[cfg(feature = "memory-cache")]
#[async_trait::async_trait]
impl Cacher for InMemoryCache {
    /// Creates an in-memory cache whose time to live is `config.cache_expiry_time` seconds.
    async fn build(config: &Config) -> Self {
        log::info!("Initialising in-memory cache");

        let time_to_live = Duration::from_secs(config.cache_expiry_time.into());
        InMemoryCache {
            cache: MokaCache::builder().time_to_live(time_to_live).build(),
        }
    }

    /// Returns the results stored under the hashed url, or `CacheError::MissingValue` when
    /// the cache holds no entry for it.
    async fn cached_results(&mut self, url: &str) -> Result<SearchResults, Report<CacheError>> {
        let key = self.hash_url(url);
        self.cache
            .get(&key)
            .ok_or_else(|| Report::new(CacheError::MissingValue))
    }

    /// Stores a clone of the results under the hashed url; this backend always returns `Ok`.
    async fn cache_results(
        &mut self,
        search_results: &SearchResults,
        url: &str,
    ) -> Result<(), Report<CacheError>> {
        let key = self.hash_url(url);
        let owned_results = search_results.clone();
        self.cache.insert(key, owned_results);
        Ok(())
    }
}
|
|
|
|
|
|
|
|
/// Cache backend which combines the in-memory and the redis based caches.
///
/// The hybrid cache uses both cache types to improve availability: results are written to
/// both caches, and a lookup which fails on the redis cache is retried against the
/// in-memory cache.
#[cfg(all(feature = "memory-cache", feature = "redis-cache"))]
pub struct HybridCache {
    /// The in-memory backend, used as the fallback for lookups.
    memory_cache: InMemoryCache,
    /// The redis backend, queried first on lookups.
    redis_cache: RedisCache,
}
|
|
|
|
|
|
|
|
#[cfg(all(feature = "memory-cache", feature = "redis-cache"))]
#[async_trait::async_trait]
impl Cacher for HybridCache {
    /// Builds both the in-memory and the redis backend from the same configuration.
    async fn build(config: &Config) -> Self {
        log::info!("Initialising hybrid cache");
        HybridCache {
            memory_cache: InMemoryCache::build(config).await,
            redis_cache: RedisCache::build(config).await,
        }
    }

    /// Looks the url up in the redis cache and falls back to the in-memory cache when the
    /// redis lookup returns an error.
    ///
    /// # Errors
    ///
    /// Returns the error of the in-memory lookup when neither cache yields the results.
    async fn cached_results(&mut self, url: &str) -> Result<SearchResults, Report<CacheError>> {
        match self.redis_cache.cached_results(url).await {
            Ok(results) => Ok(results),
            Err(_) => self.memory_cache.cached_results(url).await,
        }
    }

    /// Stores the results in both caches.
    ///
    /// # Errors
    ///
    /// Returns a `CacheError` when either cache fails to store the results. A redis failure
    /// is still reported to the caller, but by then the in-memory cache already holds the
    /// results.
    async fn cache_results(
        &mut self,
        search_results: &SearchResults,
        url: &str,
    ) -> Result<(), Report<CacheError>> {
        // Write the in-memory cache first: if redis were written first and failed, the early
        // return would leave the in-memory cache empty and the fallback in `cached_results`
        // could never serve the results while redis is unavailable.
        self.memory_cache.cache_results(search_results, url).await?;
        self.redis_cache.cache_results(search_results, url).await
    }
}
|
|
|
|
|
|
|
|
/// Dummy cache backend which stores nothing.
pub struct DisabledCache;
|
|
|
|
|
|
|
|
#[async_trait::async_trait]
|
|
|
|
impl Cacher for DisabledCache {
|
|
|
|
async fn build(_config: &Config) -> Self {
|
|
|
|
log::info!("Caching is disabled");
|
|
|
|
DisabledCache
|
|
|
|
}
|
|
|
|
|
|
|
|
async fn cached_results(&mut self, _url: &str) -> Result<SearchResults, Report<CacheError>> {
|
|
|
|
Err(Report::new(CacheError::MissingValue))
|
|
|
|
}
|
|
|
|
|
|
|
|
async fn cache_results(
|
2023-05-14 20:20:43 -04:00
|
|
|
&mut self,
|
2023-09-17 05:47:02 -04:00
|
|
|
_search_results: &SearchResults,
|
|
|
|
_url: &str,
|
2023-09-17 12:56:48 -04:00
|
|
|
) -> Result<(), Report<CacheError>> {
|
2023-11-28 01:17:35 -05:00
|
|
|
Ok(())
|
2023-09-09 12:17:29 -04:00
|
|
|
}
|
|
|
|
}
|
2023-05-02 04:58:21 -04:00
|
|
|
|
2023-09-09 12:17:29 -04:00
|
|
|
/// A structure to efficiently share the cache between threads - as it is protected by a Mutex.
|
|
|
|
pub struct SharedCache {
|
2023-09-14 14:26:08 -04:00
|
|
|
/// The internal cache protected from concurrent access by a mutex
|
2023-11-28 01:17:35 -05:00
|
|
|
cache: Mutex<Box<dyn Cacher>>,
|
2023-09-09 12:17:29 -04:00
|
|
|
}
|
2023-05-02 04:58:21 -04:00
|
|
|
|
2023-09-09 12:17:29 -04:00
|
|
|
impl SharedCache {
|
2023-09-17 05:47:02 -04:00
|
|
|
/// A function that creates a new `SharedCache` from a Cache implementation.
|
|
|
|
///
|
|
|
|
/// # Arguments
|
|
|
|
///
|
|
|
|
/// * `cache` - It takes the `Cache` enum variant as an argument with the prefered cache type.
|
|
|
|
///
|
|
|
|
/// Returns a newly constructed `SharedCache` struct.
|
2023-11-28 01:17:35 -05:00
|
|
|
pub fn new(cache: impl Cacher + 'static) -> Self {
|
2023-09-09 12:17:29 -04:00
|
|
|
Self {
|
2023-11-28 01:17:35 -05:00
|
|
|
cache: Mutex::new(Box::new(cache)),
|
2023-08-27 13:50:42 -04:00
|
|
|
}
|
2023-05-02 04:58:21 -04:00
|
|
|
}
|
2023-09-09 12:17:29 -04:00
|
|
|
|
2023-09-17 05:47:02 -04:00
|
|
|
/// A getter function which retrieves the cached SearchResulsts from the internal cache.
|
|
|
|
///
|
|
|
|
/// # Arguments
|
|
|
|
///
|
|
|
|
/// * `url` - It takes the search url as an argument which will be used as the key to fetch the
|
|
|
|
/// cached results from the cache.
|
|
|
|
///
|
|
|
|
/// # Error
|
|
|
|
///
|
|
|
|
/// Returns a `SearchResults` struct containing the search results from the cache if nothing
|
|
|
|
/// goes wrong otherwise returns a `CacheError`.
|
2023-11-28 01:17:35 -05:00
|
|
|
pub async fn cached_results(&self, url: &str) -> Result<SearchResults, Report<CacheError>> {
|
2023-09-09 12:17:29 -04:00
|
|
|
let mut mut_cache = self.cache.lock().await;
|
2023-11-28 01:17:35 -05:00
|
|
|
mut_cache.cached_results(url).await
|
2023-09-09 12:17:29 -04:00
|
|
|
}
|
|
|
|
|
2023-09-17 05:47:02 -04:00
|
|
|
/// A setter function which caches the results by using the `url` as the key and
|
2023-09-11 17:20:05 -04:00
|
|
|
/// `SearchResults` as the value.
|
2023-09-17 05:47:02 -04:00
|
|
|
///
|
|
|
|
/// # Arguments
|
|
|
|
///
|
|
|
|
/// * `search_results` - It takes the `SearchResults` as an argument which are results that
|
|
|
|
/// needs to be cached.
|
|
|
|
/// * `url` - It takes the search url as an argument which will be used as the key for storing
|
|
|
|
/// results in the cache.
|
|
|
|
///
|
|
|
|
/// # Error
|
|
|
|
///
|
|
|
|
/// Returns an unit type if the results are cached succesfully otherwise returns a `CacheError`
|
|
|
|
/// on a failure.
|
2023-09-09 12:17:29 -04:00
|
|
|
pub async fn cache_results(
|
|
|
|
&self,
|
2023-09-12 01:37:33 -04:00
|
|
|
search_results: &SearchResults,
|
2023-09-09 12:17:29 -04:00
|
|
|
url: &str,
|
2023-09-17 12:56:48 -04:00
|
|
|
) -> Result<(), Report<CacheError>> {
|
2023-09-09 12:17:29 -04:00
|
|
|
let mut mut_cache = self.cache.lock().await;
|
2023-09-11 17:20:05 -04:00
|
|
|
mut_cache.cache_results(search_results, url).await
|
2023-09-09 12:17:29 -04:00
|
|
|
}
|
2023-05-02 04:58:21 -04:00
|
|
|
}
|
2023-11-28 01:17:35 -05:00
|
|
|
|
|
|
|
/// A function to initialise the cache backend.
|
|
|
|
pub async fn create_cache(config: &Config) -> impl Cacher {
|
|
|
|
#[cfg(all(feature = "redis-cache", feature = "memory-cache"))]
|
|
|
|
return HybridCache::build(config).await;
|
|
|
|
|
|
|
|
#[cfg(all(feature = "memory-cache", not(feature = "redis-cache")))]
|
|
|
|
return InMemoryCache::build(config).await;
|
|
|
|
|
|
|
|
#[cfg(all(feature = "redis-cache", not(feature = "memory-cache")))]
|
|
|
|
return RedisCache::build(config).await;
|
|
|
|
|
|
|
|
#[cfg(not(any(feature = "memory-cache", feature = "redis-cache")))]
|
|
|
|
return DisabledCache::build(config).await;
|
|
|
|
}
|