Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Add SearchMode fzf. #279

Merged
merged 5 commits into from
Mar 18, 2022
Merged
Show file tree
Hide file tree
Changes from 3 commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions Cargo.lock

Some generated files are not rendered by default. Learn more about how customized files appear on GitHub.

1 change: 1 addition & 0 deletions atuin-client/Cargo.toml
Original file line number Diff line number Diff line change
Expand Up @@ -47,3 +47,4 @@ sqlx = { version = "0.5", features = [
"sqlite",
] }
minspan = "0.1.1"
regex = "1.5.4"
220 changes: 150 additions & 70 deletions atuin-client/src/database.rs
Original file line number Diff line number Diff line change
Expand Up @@ -7,6 +7,7 @@ use chrono::Utc;

use eyre::Result;
use itertools::Itertools;
use regex::Regex;

use sqlx::sqlite::{
SqliteConnectOptions, SqliteJournalMode, SqlitePool, SqlitePoolOptions, SqliteRow,
Expand Down Expand Up @@ -286,27 +287,96 @@ impl Database for Sqlite {
let query = query.to_string().replace('*', "%"); // allow wildcard char
let limit = limit.map_or("".to_owned(), |l| format!("limit {}", l));

let query = match search_mode {
SearchMode::Prefix => query,
SearchMode::FullText => format!("%{}", query),
SearchMode::Fuzzy => query.split("").join("%"),
let (query_sql, query_params) = match search_mode {
SearchMode::Prefix => ("command like ?1".to_string(), vec![format!("{}%", query)]),
SearchMode::FullText => ("command like ?1".to_string(), vec![format!("%{}%", query)]),
SearchMode::Fuzzy => {
let split_regex = Regex::new(r" +").unwrap();
let terms: Vec<&str> = split_regex.split(query.as_str()).collect();
let num_terms = terms.len();
let mut query_sql = "".to_string();
let mut query_params = std::vec::Vec::with_capacity(num_terms);
let mut was_or = false;
for (i, query_part) in terms.into_iter().enumerate() {
// TODO smart case mode could be made configurable like in fzf
let (operator, glob) = if query_part.contains(char::is_uppercase) {
("glob", '*')
} else {
("like", '%')
};
let (is_inverse, query_part) = if query_part.starts_with('!') {
(true, query_part.strip_prefix('!').unwrap())
} else {
(false, query_part)
};
conradludgate marked this conversation as resolved.
Show resolved Hide resolved
match query_part {
"|" => {
if !was_or {
query_sql.push_str(" OR ");
was_or = true;
continue;
} else {
query_params.push(format!("{glob}|{glob}", glob = glob));
}
}
exact_prefix if query_part.starts_with('^') => query_params.push(format!(
"{term}{glob}",
term = exact_prefix.strip_prefix('^').unwrap(),
glob = glob
conradludgate marked this conversation as resolved.
Show resolved Hide resolved
)),
exact_suffix if query_part.ends_with('$') => query_params.push(format!(
"{glob}{term}",
term = exact_suffix.strip_suffix('$').unwrap(),
glob = glob
)),
exact if query_part.starts_with('\'') => query_params.push(format!(
"{glob}{term}{glob}",
term = exact.strip_prefix('\'').unwrap(),
glob = glob
)),
exact if is_inverse => query_params.push(format!(
"{glob}{term}{glob}",
term = exact,
glob = glob
)),
_ => {
query_params.push(query_part.split("").join(glob.to_string().as_str()))
}
}
if i > 0 && !was_or {
query_sql.push_str(" AND ");
}
if is_inverse {
query_sql.push_str("NOT ");
}
query_sql
.push_str(format!("command {} ?{}", operator, query_params.len()).as_str());
was_or = false;
}
(query_sql, query_params)
}
};

let res = sqlx::query(
format!(
"select * from history h
where command like ?1 || '%'
group by command
having max(timestamp)
order by timestamp desc {}",
limit.clone()
let res = query_params
.iter()
.fold(
sqlx::query(
format!(
"select * from history h
where {}
group by command
having max(timestamp)
order by timestamp desc {}",
query_sql.as_str(),
limit.clone()
)
.as_str(),
),
|query, query_param| query.bind(query_param),
)
.as_str(),
)
.bind(query)
.map(Self::query_history)
.fetch_all(&self.pool)
.await?;
.map(Self::query_history)
.fetch_all(&self.pool)
.await?;

Ok(ordering::reorder_fuzzy(search_mode, orig_query, res))
}
Expand All @@ -326,6 +396,31 @@ mod test {
use super::*;
use std::time::{Duration, Instant};

/// Runs `$db.search(None, $mode, $query)`, awaits it, unwraps the result and
/// asserts on what came back.
///
/// * Four-argument form: asserts that exactly `$expected` rows were returned.
/// * Five-argument form: additionally asserts that the returned commands,
///   in order, are equal to `$commands`.
///
/// On a count mismatch the failure message prints the query together with the
/// commands that were actually returned. The expansion contains `.await`, so
/// the macro has to be invoked from an async context.
macro_rules! assert_search_eq {
    // Count-only check.
    ($db:expr, $mode:expr, $query:expr, $expected:expr) => {
        let found = $db.search(None, $mode, $query).await.unwrap();
        assert_eq!(
            found.len(),
            $expected,
            "query \"{}\", commands: {:?}",
            $query,
            found
                .iter()
                .map(|entry| &entry.command)
                .collect::<Vec<&String>>()
        );
    };
    // Count check followed by an ordered comparison of the command strings.
    ($db:expr, $mode:expr, $query:expr, $expected:expr, $commands:expr) => {
        let found = $db.search(None, $mode, $query).await.unwrap();
        let found_commands: Vec<&String> = found.iter().map(|entry| &entry.command).collect();
        assert_eq!(
            found.len(),
            $expected,
            "query \"{}\", commands: {:?}",
            $query,
            found_commands
        );
        assert_eq!(found_commands, $commands);
    };
}

conradludgate marked this conversation as resolved.
Show resolved Hide resolved
async fn new_history_item(db: &mut impl Database, cmd: &str) -> Result<()> {
let history = History::new(
chrono::Utc::now(),
Expand All @@ -344,67 +439,57 @@ mod test {
let mut db = Sqlite::new("sqlite::memory:").await.unwrap();
new_history_item(&mut db, "ls /home/ellie").await.unwrap();

let mut results = db.search(None, SearchMode::Prefix, "ls").await.unwrap();
assert_eq!(results.len(), 1);

results = db.search(None, SearchMode::Prefix, "/home").await.unwrap();
assert_eq!(results.len(), 0);

results = db.search(None, SearchMode::Prefix, "ls ").await.unwrap();
assert_eq!(results.len(), 0);
assert_search_eq!(db, SearchMode::Prefix, "ls", 1);
assert_search_eq!(db, SearchMode::Prefix, "/home", 0);
assert_search_eq!(db, SearchMode::Prefix, "ls ", 0);
}

#[tokio::test(flavor = "multi_thread")]
async fn test_search_fulltext() {
let mut db = Sqlite::new("sqlite::memory:").await.unwrap();
new_history_item(&mut db, "ls /home/ellie").await.unwrap();

let mut results = db.search(None, SearchMode::FullText, "ls").await.unwrap();
assert_eq!(results.len(), 1);

results = db
.search(None, SearchMode::FullText, "/home")
.await
.unwrap();
assert_eq!(results.len(), 1);

results = db.search(None, SearchMode::FullText, "ls ").await.unwrap();
assert_eq!(results.len(), 0);
assert_search_eq!(db, SearchMode::FullText, "ls", 1);
assert_search_eq!(db, SearchMode::FullText, "/home", 1);
assert_search_eq!(db, SearchMode::FullText, "ls ", 0);
}

#[tokio::test(flavor = "multi_thread")]
async fn test_search_fuzzy() {
let mut db = Sqlite::new("sqlite::memory:").await.unwrap();
new_history_item(&mut db, "ls /home/ellie").await.unwrap();
new_history_item(&mut db, "ls /home/frank").await.unwrap();
new_history_item(&mut db, "cd /home/ellie").await.unwrap();
new_history_item(&mut db, "cd /home/Ellie").await.unwrap();
new_history_item(&mut db, "/home/ellie/.bin/rustup")
.await
.unwrap();

let mut results = db.search(None, SearchMode::Fuzzy, "ls /").await.unwrap();
assert_eq!(results.len(), 2);

results = db.search(None, SearchMode::Fuzzy, "l/h/").await.unwrap();
assert_eq!(results.len(), 2);

results = db.search(None, SearchMode::Fuzzy, "/h/e").await.unwrap();
assert_eq!(results.len(), 3);

results = db.search(None, SearchMode::Fuzzy, "/hmoe/").await.unwrap();
assert_eq!(results.len(), 0);

results = db
.search(None, SearchMode::Fuzzy, "ellie/home")
.await
.unwrap();
assert_eq!(results.len(), 0);

results = db.search(None, SearchMode::Fuzzy, "lsellie").await.unwrap();
assert_eq!(results.len(), 1);

results = db.search(None, SearchMode::Fuzzy, " ").await.unwrap();
assert_eq!(results.len(), 3);
assert_search_eq!(db, SearchMode::Fuzzy, "ls /", 3);
assert_search_eq!(db, SearchMode::Fuzzy, "ls/", 2);
assert_search_eq!(db, SearchMode::Fuzzy, "l/h/", 2);
assert_search_eq!(db, SearchMode::Fuzzy, "/h/e", 3);
assert_search_eq!(db, SearchMode::Fuzzy, "/hmoe/", 0);
assert_search_eq!(db, SearchMode::Fuzzy, "ellie/home", 0);
assert_search_eq!(db, SearchMode::Fuzzy, "lsellie", 1);
assert_search_eq!(db, SearchMode::Fuzzy, " ", 4);

// single term operators
assert_search_eq!(db, SearchMode::Fuzzy, "^ls", 2);
assert_search_eq!(db, SearchMode::Fuzzy, "'ls", 2);
assert_search_eq!(db, SearchMode::Fuzzy, "ellie$", 2);
assert_search_eq!(db, SearchMode::Fuzzy, "!^ls", 2);
assert_search_eq!(db, SearchMode::Fuzzy, "!ellie", 1);
assert_search_eq!(db, SearchMode::Fuzzy, "!ellie$", 2);

// multiple terms
assert_search_eq!(db, SearchMode::Fuzzy, "ls !ellie", 1);
assert_search_eq!(db, SearchMode::Fuzzy, "^ls !e$", 1);
assert_search_eq!(db, SearchMode::Fuzzy, "home !^ls", 2);
assert_search_eq!(db, SearchMode::Fuzzy, "'frank | 'rustup", 2);
assert_search_eq!(db, SearchMode::Fuzzy, "'frank | 'rustup 'ls", 1);

// case matching
assert_search_eq!(db, SearchMode::Fuzzy, "Ellie", 1);
}

#[tokio::test(flavor = "multi_thread")]
Expand All @@ -414,17 +499,12 @@ mod test {

new_history_item(&mut db, "curl").await.unwrap();
new_history_item(&mut db, "corburl").await.unwrap();
// if fuzzy reordering is on, it should come back in a more sensible order
let mut results = db.search(None, SearchMode::Fuzzy, "curl").await.unwrap();
assert_eq!(results.len(), 2);
let commands: Vec<&String> = results.iter().map(|a| &a.command).collect();
assert_eq!(commands, vec!["curl", "corburl"]);

results = db.search(None, SearchMode::Fuzzy, "xxxx").await.unwrap();
assert_eq!(results.len(), 0);
// if fuzzy reordering is on, it should come back in a more sensible order
assert_search_eq!(db, SearchMode::Fuzzy, "curl", 2, vec!["curl", "corburl"]);

results = db.search(None, SearchMode::Fuzzy, "").await.unwrap();
assert_eq!(results.len(), 2);
assert_search_eq!(db, SearchMode::Fuzzy, "xxxx", 0);
assert_search_eq!(db, SearchMode::Fuzzy, "", 2);
}

#[tokio::test(flavor = "multi_thread")]
Expand Down
1 change: 1 addition & 0 deletions atuin-client/src/ordering.rs
Original file line number Diff line number Diff line change
Expand Up @@ -17,6 +17,7 @@ where
let mut r = res.clone();
let qvec = &query.chars().collect();
r.sort_by_cached_key(|h| {
// TODO for fzf search we should sum up scores for each matched term
let (from, to) = match minspan::span(qvec, &(f(h).chars().collect())) {
Some(x) => x,
// this is a little unfortunate: when we are asked to match a query that is found nowhere,
Expand Down
26 changes: 25 additions & 1 deletion docs/config.md
Original file line number Diff line number Diff line change
Expand Up @@ -97,14 +97,38 @@ key = "~/.atuin-session"
### `search_mode`

Which search mode to use. Atuin supports "prefix", "fulltext" and "fuzzy" search
modes. The prefix search for "query\*", fulltext "\*query\*", and fuzzy "\*q\*u\*e\*r\*y\*"
modes. Prefix mode searches for "query\*", fulltext for "\*query\*", and fuzzy applies
the search syntax [described below](#fuzzy-search-syntax).

Defaults to "prefix"

```
search_mode = "fulltext"
```

#### `fuzzy` search syntax

The "fuzzy" search syntax is based on the
[fzf search syntax](https://github.com/junegunn/fzf#search-syntax).

| Token | Match type | Description |
| --------- | -------------------------- | ------------------------------------ |
| `sbtrkt` | fuzzy-match | Items that match `sbtrkt` |
| `'wild` | exact-match (quoted) | Items that include `wild` |
| `^music` | prefix-exact-match | Items that start with `music` |
| `.mp3$` | suffix-exact-match | Items that end with `.mp3` |
| `!fire` | inverse-exact-match | Items that do not include `fire` |
| `!^music` | inverse-prefix-exact-match | Items that do not start with `music` |
| `!.mp3$` | inverse-suffix-exact-match | Items that do not end with `.mp3` |

A term consisting of a single bar character (`|`) acts as an OR operator. For example, the following
query matches entries that start with `core` and end with either `go`, `rb`,
or `py`.

```
^core go$ | rb$ | py$
```

## Server config

`// TODO`