improve search route

This commit is contained in:
Milim 2024-08-15 08:55:27 +02:00
parent 9a00f91ebc
commit 23799eeb9e
No known key found for this signature in database
4 changed files with 123 additions and 210 deletions

View file

@ -3,7 +3,7 @@
use figment::{providers::Serialized, Figment}; use figment::{providers::Serialized, Figment};
use serde::{Deserialize, Serialize}; use serde::{Deserialize, Serialize};
/// A named struct which stores the parsed config file options. /// Struct holding config Options
#[derive(Debug, Clone, Deserialize, Serialize)] #[derive(Debug, Clone, Deserialize, Serialize)]
pub struct Config { pub struct Config {
/// It stores the parsed port number option on which the server should launch. /// It stores the parsed port number option on which the server should launch.
@ -32,15 +32,7 @@ pub struct Config {
pub pool_idle_connection_timeout: u8, pub pool_idle_connection_timeout: u8,
} }
/// A named struct which stores, deserializes, serializes and groups the parsed config file options /// A struct holding style config
/// of theme and colorscheme names into the Style struct which derives the `Clone`, `Serialize`
/// and Deserialize traits where the `Clone` trait is derived for allowing the struct to be
/// cloned and passed to the server as a shared data between all routes except `/robots.txt` and
/// the `Serialize` trait has been derived for allowing the object to be serialized so that it
/// can be passed to handlebars template files and the `Deserialize` trait has been derived in
/// order to allow the deserializing the json back to struct in aggregate function in
/// aggregator.rs and create a new struct out of it and then serialize it back to json and pass
/// it to the template files.
#[derive(Default, Debug, Clone, Deserialize, Serialize)] #[derive(Default, Debug, Clone, Deserialize, Serialize)]
pub struct Style { pub struct Style {
/// It stores the parsed theme option used to set a theme for the website. /// It stores the parsed theme option used to set a theme for the website.

View file

@ -40,7 +40,7 @@ async fn main() {
.init(); .init();
log::info!( log::info!(
"started server on port {} and IP {}", "starting server on port {} and IP {}",
config.port, config.port,
config.binding_ip config.binding_ip
); );

View file

@ -11,7 +11,7 @@ use crate::config::Style;
pub struct SearchParams { pub struct SearchParams {
/// It stores the search parameter option `q` (or query in simple words) /// It stores the search parameter option `q` (or query in simple words)
/// of the search url. /// of the search url.
pub q: Option<String>, pub query: Option<String>,
/// It stores the search parameter `page` (or pageno in simple words) /// It stores the search parameter `page` (or pageno in simple words)
/// of the search url. /// of the search url.
pub page: Option<u32>, pub page: Option<u32>,

View file

@ -20,13 +20,13 @@ use tokio::join;
/// # Example /// # Example
/// ///
/// ```bash /// ```bash
/// curl "http://127.0.0.1:8080/search?q=sweden&page=1" /// wget "http://127.0.0.1:8080/search?q=sweden&page=1"
/// ``` /// ```
/// ///
/// Or /// Or
/// ///
/// ```bash /// ```bash
/// curl "http://127.0.0.1:8080/search?q=sweden" /// wget "http://127.0.0.1:8080/search?q=sweden"
/// ``` /// ```
#[get("/search")] #[get("/search")]
pub async fn search( pub async fn search(
@ -34,16 +34,16 @@ pub async fn search(
config: web::Data<Config>, config: web::Data<Config>,
cache: web::Data<Cache>, cache: web::Data<Cache>,
) -> Result<HttpResponse, Box<dyn std::error::Error>> { ) -> Result<HttpResponse, Box<dyn std::error::Error>> {
use std::sync::Arc;
let params = web::Query::<SearchParams>::from_query(req.query_string())?; let params = web::Query::<SearchParams>::from_query(req.query_string())?;
match &params.q {
Some(query) => { if !params.query.as_ref().is_some_and(|q| !q.trim().is_empty()) {
if query.trim().is_empty() {
return Ok(HttpResponse::TemporaryRedirect() return Ok(HttpResponse::TemporaryRedirect()
.insert_header(("location", "/")) .insert_header(("location", "/"))
.finish()); .finish());
} }
let query = params.query.as_ref().unwrap();
let cookie = req.cookie("appCookie"); let cookie = req.cookie("appCookie");
// Get search settings using the user's cookie or from the server's config // Get search settings using the user's cookie or from the server's config
@ -61,23 +61,21 @@ pub async fn search(
}); });
// Closure wrapping the results function capturing local references // Closure wrapping the results function capturing local references
let get_results = let get_results = |page| results(config.clone(), cache.clone(), query, page, &search_settings);
|page| results(config.clone(), cache.clone(), query, page, &search_settings);
// .max(1) keeps the 1-based page >= 1, so the zero-based page is >= 0 after the subtraction. // .max(1) keeps the 1-based page >= 1, so the zero-based page is >= 0 after the subtraction.
let page = params.page.unwrap_or(1).max(1) - 1; let page = params.page.unwrap_or(1).max(1) - 1;
let previous_page = page.saturating_sub(1); let previous_page = page.saturating_sub(1);
let next_page = page + 1; let next_page = page + 1;
let mut results = Arc::new((SearchResults::default(), String::default())); let mut results = (SearchResults::default(), String::default());
if page != previous_page { if page != previous_page {
let (previous_results, current_results, next_results) = join!( let (previous_results, current_results, next_results) = join!(
get_results(previous_page), get_results(previous_page),
get_results(page), get_results(page),
get_results(next_page) get_results(next_page)
); );
let (parsed_previous_results, parsed_next_results) = let (parsed_previous_results, parsed_next_results) = (previous_results?, next_results?);
(previous_results?, next_results?);
let (cache_keys, results_list) = ( let (cache_keys, results_list) = (
[ [
@ -92,23 +90,22 @@ pub async fn search(
], ],
); );
results = Arc::new(current_results?); results = current_results?;
tokio::spawn(async move { cache.cache_results(&results_list, &cache_keys) }); cache.cache_results(&results_list, &cache_keys);
} else { } else {
let (current_results, next_results) = let (current_results, next_results) = join!(get_results(page), get_results(page + 1));
join!(get_results(page), get_results(page + 1));
let parsed_next_results = next_results?; let parsed_next_results = next_results?;
results = Arc::new(current_results?); results = current_results?;
let (cache_keys, results_list) = ( let (cache_keys, results_list) = (
[results.1.clone(), parsed_next_results.1.clone()], [results.1.clone(), parsed_next_results.1.clone()],
[results.0.clone(), parsed_next_results.0], [results.0.clone(), parsed_next_results.0],
); );
tokio::spawn(async move { cache.cache_results(&results_list, &cache_keys) }); cache.cache_results(&results_list, &cache_keys);
} }
Ok(HttpResponse::Ok().content_type(ContentType::html()).body( Ok(HttpResponse::Ok().content_type(ContentType::html()).body(
@ -122,11 +119,6 @@ pub async fn search(
.0, .0,
)) ))
} }
None => Ok(HttpResponse::TemporaryRedirect()
.insert_header(("location", "/"))
.finish()),
}
}
/// Fetches the results for a query and page. It first checks the Redis cache; if that /// Fetches the results for a query and page. It first checks the Redis cache; if that
/// fails it gets proper results by requesting from the upstream search engines. /// fails it gets proper results by requesting from the upstream search engines.
@ -153,21 +145,19 @@ async fn results(
// eagerly parse cookie value to evaluate safe search level // eagerly parse cookie value to evaluate safe search level
let cache_key = format!( let cache_key = format!(
"http://{}:{}/search?q={}&page={}&engines={}", "search?q={}&page={}&engines={}",
config.binding_ip,
config.port,
query, query,
page, page,
search_settings.engines.join(",") search_settings.engines.join(",")
); );
// fetch the cached results json. // fetch the cached results json.
let cached_results = cache.cached_results(&cache_key); let response = cache.cached_results(&cache_key);
// check if fetched cache results was indeed fetched or it was an error and if so
// handle the data accordingly. if let Some(results) = response {
match cached_results { return Ok((results, cache_key));
Some(results) => Ok((results, cache_key)), }
None => {
// check if the cookie value is empty or not if it is empty then use the // check if the cookie value is empty or not if it is empty then use the
// default selected upstream search engines from the config file otherwise // default selected upstream search engines from the config file otherwise
// parse the non-empty cookie and grab the user selected engines from the // parse the non-empty cookie and grab the user selected engines from the
@ -201,72 +191,3 @@ async fn results(
cache.cache_results(&[results.clone()], &[cache_key.clone()]); cache.cache_results(&[results.clone()], &[cache_key.clone()]);
Ok((results, cache_key)) Ok((results, cache_key))
} }
}
}
#[cfg(test)]
mod tests {
use std::time::{SystemTime, UNIX_EPOCH};
/// A helper function which creates a random mock safe search level value.
///
/// # Returns
///
/// Returns an optional u8 value.
fn mock_safe_search_level_value() -> Option<u8> {
let nanos = SystemTime::now()
.duration_since(UNIX_EPOCH)
.unwrap_or_default()
.subsec_nanos() as f32;
let delay = ((nanos / 1_0000_0000 as f32).floor() as i8) - 1;
match delay {
-1 => None,
some_num => Some(if some_num > 4 { some_num - 4 } else { some_num } as u8),
}
}
#[test]
/// A test function to test whether the output of the branchless and branched code
/// for the code to choose the appropriate safe search level is same or not.
fn get_safesearch_level_branched_branchless_code_test() {
// Get mock values for the safe search level values for URL parameters, cookie
// and config.
let safe_search_level_from_url = mock_safe_search_level_value();
let cookie_safe_search_level = mock_safe_search_level_value().unwrap_or(0);
let config_safe_search_level = mock_safe_search_level_value().unwrap_or(0);
// Branched code
let safe_search_level_value_from_branched_code = match safe_search_level_from_url {
Some(safe_search_level_from_url_parsed) => {
if config_safe_search_level >= 3 {
config_safe_search_level
} else {
safe_search_level_from_url_parsed
}
}
None => {
if config_safe_search_level >= 3 {
config_safe_search_level
} else {
cookie_safe_search_level
}
}
};
// branchless code
let safe_search_level_value_from_branchless_code =
(u8::from(safe_search_level_from_url.is_some())
* ((u8::from(config_safe_search_level >= 3) * config_safe_search_level)
+ (u8::from(config_safe_search_level < 3)
* safe_search_level_from_url.unwrap_or(0))))
+ (u8::from(safe_search_level_from_url.is_none())
* ((u8::from(config_safe_search_level >= 3) * config_safe_search_level)
+ (u8::from(config_safe_search_level < 3) * cookie_safe_search_level)));
assert_eq!(
safe_search_level_value_from_branched_code,
safe_search_level_value_from_branchless_code
);
}
}