From 0cff65e5a86bfcacaa5ac318365d9b00c3d6ccbf Mon Sep 17 00:00:00 2001 From: RumovZ Date: Sun, 1 Nov 2020 17:24:08 +0100 Subject: [PATCH 01/20] Fix bugs and inconsistencies in the search parser --- rslib/src/search/parser.rs | 262 +++++++++++++++++++++++----------- rslib/src/search/sqlwriter.rs | 133 ++++++++--------- rslib/src/text.rs | 22 --- 3 files changed, 240 insertions(+), 177 deletions(-) diff --git a/rslib/src/search/parser.rs b/rslib/src/search/parser.rs index 6d3cd038c..44315af0d 100644 --- a/rslib/src/search/parser.rs +++ b/rslib/src/search/parser.rs @@ -9,16 +9,15 @@ use crate::{ use lazy_static::lazy_static; use nom::{ branch::alt, - bytes::complete::{escaped, is_not, tag, take_while1}, - character::complete::{anychar, char, one_of}, + bytes::complete::{escaped, is_not, tag}, + character::complete::{anychar, char, none_of, one_of}, combinator::{all_consuming, map, map_res}, - sequence::{delimited, preceded, tuple}, + sequence::{delimited, preceded, separated_pair}, {multi::many0, IResult}, }; -use regex::Regex; +use regex::{Captures, Regex}; use std::{borrow::Cow, num}; -// fixme: need to preserve \ when used twice in string struct ParseError {} @@ -42,6 +41,12 @@ impl From> for ParseError { type ParseResult = std::result::Result; +#[derive(Debug, PartialEq)] +pub(super) enum OptionalRe<'a> { + Text(Cow<'a, str>), + Re(Cow<'a, str>), +} + #[derive(Debug, PartialEq)] pub(super) enum Node<'a> { And, @@ -57,30 +62,30 @@ pub(super) enum SearchNode<'a> { UnqualifiedText(Cow<'a, str>), // foo:bar, where foo doesn't match a term below SingleField { - field: Cow<'a, str>, + field: OptionalRe<'a>, text: Cow<'a, str>, is_re: bool, }, AddedInDays(u32), EditedInDays(u32), - CardTemplate(TemplateKind), - Deck(Cow<'a, str>), + CardTemplate(TemplateKind<'a>), + Deck(String), DeckID(DeckID), NoteTypeID(NoteTypeID), - NoteType(Cow<'a, str>), + NoteType(OptionalRe<'a>), Rated { days: u32, ease: Option, }, - Tag(Cow<'a, str>), + Tag(OptionalRe<'a>), Duplicates { note_type_id: NoteTypeID, - text: String, + text: Cow<'a, str>, }, State(StateKind), Flag(u8), - NoteIDs(Cow<'a, str>), - CardIDs(Cow<'a, str>), + NoteIDs(&'a str), + CardIDs(&'a str), Property { operator: String, kind: PropertyKind, @@ -88,7 +93,7 @@ pub(super) enum SearchNode<'a> { WholeCollection, Regex(Cow<'a, str>), NoCombining(Cow<'a, str>), - WordBoundary(Cow<'a, str>), + WordBoundary(String), } #[derive(Debug, PartialEq)] @@ -113,9 +118,9 @@ pub(super) enum StateKind { } #[derive(Debug, PartialEq)] -pub(super) enum TemplateKind { +pub(super) enum TemplateKind<'a> { Ordinal(u16), - Name(String), + Name(OptionalRe<'a>), } /// Parse the input string into a list of nodes. @@ -127,7 +132,6 @@ pub(super) fn parse(input: &str) -> Result> { let (_, nodes) = all_consuming(group_inner)(input).map_err(|_e| AnkiError::SearchError(None))?; - Ok(nodes) } @@ -184,7 +188,7 @@ fn group_inner(input: &str) -> IResult<&str, Vec> { } fn whitespace0(s: &str) -> IResult<&str, Vec> { - many0(one_of(" \u{3000}"))(s) + many0(one_of(" \u{3000}\t\n"))(s) } /// Optional leading space, then a (negated) group or text @@ -205,32 +209,18 @@ fn text(s: &str) -> IResult<&str, Node> { /// Determine if text is a qualified search, and handle escaped chars. 
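+/// e.g. `deck:japanese` splits on the first unescaped ':' and is handled as a
+/// qualified search, while plain `japanese` becomes SearchNode::UnqualifiedText.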
fn search_node_for_text(s: &str) -> ParseResult { - let mut it = s.splitn(2, ':'); - let (head, tail) = ( - unescape_quotes(it.next().unwrap()), - it.next().map(unescape_quotes), - ); - - if let Some(tail) = tail { - search_node_for_text_with_argument(head, tail) + let (tail, head) = escaped(is_not(r":\"), '\\', anychar)(s)?; + if tail.is_empty() { + Ok(SearchNode::UnqualifiedText(unescape_to_glob(head)?)) } else { - Ok(SearchNode::UnqualifiedText(head)) + search_node_for_text_with_argument(head, &tail[1..]) } } -/// \" -> " -fn unescape_quotes(s: &str) -> Cow { - if s.find(r#"\""#).is_some() { - s.replace(r#"\""#, "\"").into() - } else { - s.into() - } -} - -/// Unquoted text, terminated by a space or ) +/// Unquoted text, terminated by whitespace or unescaped ", ( or ) fn unquoted_term(s: &str) -> IResult<&str, Node> { map_res( - take_while1(|c| c != ' ' && c != ')' && c != '"'), + escaped(is_not("\"() \u{3000}\\"), '\\', none_of(" \u{3000}")), |text: &str| -> ParseResult { Ok(if text.eq_ignore_ascii_case("or") { Node::Or @@ -261,52 +251,64 @@ fn quoted_term_inner(s: &str) -> IResult<&str, &str> { /// eg deck:"foo bar" - quotes must come after the : fn partially_quoted_term(s: &str) -> IResult<&str, Node> { - let term = take_while1(|c| c != ' ' && c != ')' && c != ':'); - let (s, (term, _, quoted_val)) = tuple((term, char(':'), quoted_term_str))(s)?; - let quoted_val = unescape_quotes(quoted_val); - - match search_node_for_text_with_argument(term.into(), quoted_val) { - Ok(search) => Ok((s, Node::Search(search))), - Err(_) => Err(nom::Err::Failure((s, nom::error::ErrorKind::NoneOf))), - } + map_res( + separated_pair( + escaped(is_not("\"(): \u{3000}\\"), '\\', none_of(": \u{3000}")), + char(':'), + quoted_term_str, + ), + |p| match search_node_for_text_with_argument(p.0, p.1) { + Ok(search) => Ok(Node::Search(search)), + Err(e) => Err(e), + }, + )(s) } /// Convert a colon-separated key/val pair into the relevant search type. 
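+/// e.g. "added:7" becomes SearchNode::AddedInDays(7); any key not matched
+/// below falls through to a single-field search on that key.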
fn search_node_for_text_with_argument<'a>( - key: Cow<'a, str>, - val: Cow<'a, str>, + key: &'a str, + val: &'a str, ) -> ParseResult> { Ok(match key.to_ascii_lowercase().as_str() { "added" => SearchNode::AddedInDays(val.parse()?), "edited" => SearchNode::EditedInDays(val.parse()?), - "deck" => SearchNode::Deck(val), - "note" => SearchNode::NoteType(val), - "tag" => SearchNode::Tag(val), + "deck" => SearchNode::Deck(unescape_to_enforced_re(val)?), + "note" => SearchNode::NoteType(unescape_to_re(val)?), + "tag" => SearchNode::Tag(parse_tag(val)?), "mid" => SearchNode::NoteTypeID(val.parse()?), "nid" => SearchNode::NoteIDs(check_id_list(val)?), "cid" => SearchNode::CardIDs(check_id_list(val)?), "did" => SearchNode::DeckID(val.parse()?), - "card" => parse_template(val.as_ref()), - "is" => parse_state(val.as_ref())?, - "flag" => parse_flag(val.as_ref())?, - "rated" => parse_rated(val.as_ref())?, - "dupe" => parse_dupes(val.as_ref())?, - "prop" => parse_prop(val.as_ref())?, - "re" => SearchNode::Regex(val), - "nc" => SearchNode::NoCombining(val), - "w" => SearchNode::WordBoundary(val), + "card" => parse_template(val)?, + "is" => parse_state(val)?, + "flag" => parse_flag(val)?, + "rated" => parse_rated(val)?, + "dupe" => parse_dupes(val)?, + "prop" => parse_prop(val)?, + "re" => SearchNode::Regex(unescape_quotes(val)), + "nc" => SearchNode::NoCombining(unescape_to_glob(val)?), + "w" => SearchNode::WordBoundary(unescape_to_enforced_re(val)?), // anything else is a field search - _ => parse_single_field(key.as_ref(), val.as_ref()), + _ => parse_single_field(key, val)?, }) } +/// Ensure the string doesn't contain whitespace and unescape. +fn parse_tag(s: &str) -> ParseResult { + if s.as_bytes().iter().any(u8::is_ascii_whitespace) { + Err(ParseError {}) + } else { + unescape_to_custom_re(s, r"\S") + } +} + /// ensure a list of ids contains only numbers and commas, returning unchanged if true /// used by nid: and cid: -fn check_id_list(s: Cow) -> ParseResult> { +fn check_id_list(s: &str) -> ParseResult<&str> { lazy_static! 
{ static ref RE: Regex = Regex::new(r"^(\d+,)*\d+$").unwrap(); } - if RE.is_match(s.as_ref()) { + if RE.is_match(s) { Ok(s) } else { Err(ParseError {}) @@ -360,13 +362,13 @@ fn parse_rated(val: &str) -> ParseResult> { } /// eg dupes:1231,hello -fn parse_dupes(val: &str) -> ParseResult> { +fn parse_dupes(val: &str) -> ParseResult { let mut it = val.splitn(2, ','); let mid: NoteTypeID = it.next().unwrap().parse()?; let text = it.next().ok_or(ParseError {})?; Ok(SearchNode::Duplicates { note_type_id: mid, - text: text.into(), + text: unescape_quotes(text), }) } @@ -411,27 +413,122 @@ fn parse_prop(val: &str) -> ParseResult> { }) } -fn parse_template(val: &str) -> SearchNode<'static> { - SearchNode::CardTemplate(match val.parse::() { +fn parse_template(val: &str) -> ParseResult { + Ok(SearchNode::CardTemplate(match val.parse::() { Ok(n) => TemplateKind::Ordinal(n.max(1) - 1), - Err(_) => TemplateKind::Name(val.into()), + Err(_) => TemplateKind::Name(unescape_to_re(val)?), + })) +} + +fn parse_single_field<'a>(key: &'a str, val: &'a str) -> ParseResult> { + Ok(if val.starts_with("re:") { + SearchNode::SingleField { + field: unescape_to_re(key)?, + text: unescape_quotes(&val[3..]), + is_re: true, + } + } else { + SearchNode::SingleField { + field: unescape_to_re(key)?, + text: unescape_to_glob(val)?, + is_re: false, + } }) } -fn parse_single_field(key: &str, mut val: &str) -> SearchNode<'static> { - let is_re = if val.starts_with("re:") { - val = val.trim_start_matches("re:"); - true +/// For strings without unescaped ", convert \" to " +fn unescape_quotes(s: &str) -> Cow { + if s.contains('"') { + s.replace(r#"\""#, "\"").into() } else { - false - }; - SearchNode::SingleField { - field: key.to_string().into(), - text: val.to_string().into(), - is_re, + s.into() } } +/// Check string for invalid escape sequences. +fn is_invalid_escape(txt: &str) -> bool { + // odd number of \s not followed by an escapable character + lazy_static! { + static ref RE: Regex = Regex::new(r#"(^|[^\\])(\\\\)*\\([^":*_()]|$)"#).unwrap(); + } + RE.is_match(txt) +} + +/// Handle escaped characters and convert Anki wildcards to SQL wildcards. +/// Return error if there is an undefined escape sequence. +fn unescape_to_glob(txt: &str) -> ParseResult> { + if is_invalid_escape(txt) { + Err(ParseError {}) + } else { + // escape sequences and unescaped special characters which need conversion + lazy_static! { + static ref RE: Regex = Regex::new(r"\\.|[*%]").unwrap(); + } + Ok(RE.replace_all(&txt, |caps: &Captures| { + match &caps[0] { + r"\\" => r"\\", + "\\\"" => "\"", + r"\:" => ":", + r"\*" => "*", + r"\_" => r"\_", + r"\(" => "(", + r"\)" => ")", + "*" => "%", + "%" => r"\%", + _ => unreachable!(), + } + })) + } +} + +/// Handle escaped characters and convert to regex if there are wildcards. +/// Return error if there is an undefined escape sequence. +fn unescape_to_re(txt: &str) -> ParseResult { + unescape_to_custom_re(txt, ".") +} + +/// Handle escaped characters and if there are wildcards, convert to a regex using the given wildcard. +/// Return error if there is an undefined escape sequence. +fn unescape_to_custom_re<'a>(txt: &'a str, wildcard: &str) -> ParseResult> { + if is_invalid_escape(txt) { + Err(ParseError {}) + } else { + lazy_static! 
{ + static ref WILDCARD: Regex = Regex::new(r"(^|[^\\])(\\\\)*[*_]").unwrap(); + static ref MAYBE_ESCAPED: Regex = Regex::new(r"\\?.").unwrap(); + static ref ESCAPED: Regex = Regex::new(r"\\(.)").unwrap(); + } + if WILDCARD.is_match(txt) { + Ok(OptionalRe::Re(MAYBE_ESCAPED.replace_all( + &txt, + |caps: &Captures| { + let s = &caps[0]; + match s { + r"\\" | r"\*" | r"\(" | r"\)" => s.to_string(), + "\\\"" => "\"".to_string(), + r"\:" => ":".to_string(), + r"*" => format!("{}*", wildcard), + "_" => wildcard.to_string(), + r"\_" => r"_".to_string(), + s => regex::escape(s), + } + }, + ))) + } else { + Ok(OptionalRe::Text(ESCAPED.replace_all(&txt, "$1"))) + } + } +} + +/// Handle escaped characters and convert to regex. +/// Return error if there is an undefined escape sequence. +fn unescape_to_enforced_re(txt: &str) -> ParseResult { + Ok(match unescape_to_re(txt)? { + OptionalRe::Text(s) => regex::escape(s.as_ref()), + OptionalRe::Re(s) => s.to_string(), + }) +} + #[cfg(test)] mod test { use super::*; @@ -440,6 +537,7 @@ mod test { fn parsing() -> Result<()> { use Node::*; use SearchNode::*; + use OptionalRe::*; assert_eq!(parse("")?, vec![Search(SearchNode::WholeCollection)]); assert_eq!(parse(" ")?, vec![Search(SearchNode::WholeCollection)]); @@ -478,7 +576,7 @@ mod test { Search(UnqualifiedText("world".into())), And, Search(SingleField { - field: "foo".into(), + field: Text("foo".into()), text: "bar baz".into(), is_re: false, }) @@ -491,7 +589,7 @@ mod test { assert_eq!( parse("foo:re:bar")?, vec![Search(SingleField { - field: "foo".into(), + field: Text("foo".into()), text: "bar".into(), is_re: true })] @@ -501,7 +599,7 @@ mod test { assert_eq!( parse(r#""field:va\"lue""#)?, vec![Search(SingleField { - field: "field".into(), + field: Text("foo".into()), text: "va\"lue".into(), is_re: false })] @@ -517,7 +615,7 @@ mod test { assert_eq!(parse("added:3")?, vec![Search(AddedInDays(3))]); assert_eq!( parse("card:front")?, - vec![Search(CardTemplate(TemplateKind::Name("front".into())))] + vec![Search(CardTemplate(TemplateKind::Name(Text("front".into()))))] ); assert_eq!( parse("card:3")?, diff --git a/rslib/src/search/sqlwriter.rs b/rslib/src/search/sqlwriter.rs index 611f3adce..9f17c555c 100644 --- a/rslib/src/search/sqlwriter.rs +++ b/rslib/src/search/sqlwriter.rs @@ -1,7 +1,7 @@ // Copyright: Ankitects Pty Ltd and contributors // License: GNU AGPL, version 3 or later; http://www.gnu.org/licenses/agpl.html -use super::parser::{Node, PropertyKind, SearchNode, StateKind, TemplateKind}; +use super::parser::{Node, PropertyKind, SearchNode, StateKind, OptionalRe, TemplateKind}; use crate::{ card::{CardQueue, CardType}, collection::Collection, @@ -9,13 +9,13 @@ use crate::{ err::Result, notes::field_checksum, notetype::NoteTypeID, - text::{matches_wildcard, text_to_re}, + text::text_to_re, text::{normalize_to_nfc, strip_html_preserving_image_filenames, without_combining}, timestamp::TimestampSecs, }; -use lazy_static::lazy_static; use regex::Regex; use std::{borrow::Cow, fmt::Write}; +use unicase::eq as uni_eq; pub(crate) struct SqlWriter<'a> { col: &'a mut Collection, @@ -119,7 +119,7 @@ impl SqlWriter<'_> { // note fields related SearchNode::UnqualifiedText(text) => self.write_unqualified(&self.norm_note(text)), SearchNode::SingleField { field, text, is_re } => { - self.write_single_field(field.as_ref(), &self.norm_note(text), *is_re)? + self.write_single_field(field, &self.norm_note(text), *is_re)? 
} SearchNode::Duplicates { note_type_id, text } => { self.write_dupes(*note_type_id, &self.norm_note(text)) @@ -131,14 +131,8 @@ impl SqlWriter<'_> { // other SearchNode::AddedInDays(days) => self.write_added(*days)?, SearchNode::EditedInDays(days) => self.write_edited(*days)?, - SearchNode::CardTemplate(template) => match template { - TemplateKind::Ordinal(_) => { - self.write_template(template)?; - } - TemplateKind::Name(name) => { - self.write_template(&TemplateKind::Name(norm(name).into()))?; - } - }, + // fixme: normalise in name case? + SearchNode::CardTemplate(template) => self.write_template(template)?, SearchNode::Deck(deck) => self.write_deck(&norm(deck))?, SearchNode::NoteTypeID(ntid) => { write!(self.sql, "n.mid = {}", ntid).unwrap(); @@ -146,9 +140,12 @@ impl SqlWriter<'_> { SearchNode::DeckID(did) => { write!(self.sql, "c.did = {}", did).unwrap(); } - SearchNode::NoteType(notetype) => self.write_note_type(&norm(notetype))?, + // fixme: normalise? + SearchNode::NoteType(notetype) => self.write_note_type(notetype)?, SearchNode::Rated { days, ease } => self.write_rated(*days, *ease)?, - SearchNode::Tag(tag) => self.write_tag(&norm(tag))?, + + // fixme: normalise? + SearchNode::Tag(tag) => self.write_tag(tag)?, SearchNode::State(state) => self.write_state(state)?, SearchNode::Flag(flag) => { write!(self.sql, "(c.flags & 7) == {}", flag).unwrap(); @@ -167,7 +164,7 @@ impl SqlWriter<'_> { fn write_unqualified(&mut self, text: &str) { // implicitly wrap in % - let text = format!("%{}%", convert_glob_char(text)); + let text = format!("%{}%", text); self.args.push(text); write!( self.sql, @@ -191,27 +188,27 @@ impl SqlWriter<'_> { .unwrap(); } - fn write_tag(&mut self, text: &str) -> Result<()> { + fn write_tag(&mut self, text: &OptionalRe) -> Result<()> { match text { - "none" => { - write!(self.sql, "n.tags = ''").unwrap(); - } - "*" | "%" => { - write!(self.sql, "true").unwrap(); - } - text => { - if let Some(re_glob) = glob_to_re(text) { - // text contains a wildcard - let re_glob = format!("(?i).* {} .*", re_glob); - write!(self.sql, "n.tags regexp ?").unwrap(); - self.args.push(re_glob); - } else if let Some(tag) = self.col.storage.preferred_tag_case(&text)? { + OptionalRe::Text(s) => { + if s == "none" { + write!(self.sql, "n.tags = ''").unwrap(); + } else if let Some(tag) = self.col.storage.preferred_tag_case(s)? 
{ write!(self.sql, "n.tags like ?").unwrap(); self.args.push(format!("% {} %", tag)); } else { write!(self.sql, "false").unwrap(); } } + OptionalRe::Re(s) => { + if s == "*" { + write!(self.sql, "true").unwrap(); + } else { + let re = format!("(?i).* {} .*", s); + write!(self.sql, "n.tags regexp ?").unwrap(); + self.args.push(re); + } + } } Ok(()) } @@ -340,45 +337,54 @@ impl SqlWriter<'_> { TemplateKind::Ordinal(n) => { write!(self.sql, "c.ord = {}", n).unwrap(); } - TemplateKind::Name(name) => { - if let Some(re) = glob_to_re(name) { - let re = format!("(?i){}", re); + TemplateKind::Name(name) => match name { + OptionalRe::Re(s) => { + let re = format!("(?i){}", s); self.sql.push_str( "(n.mid,c.ord) in (select ntid,ord from templates where name regexp ?)", ); self.args.push(re); - } else { + } + OptionalRe::Text(s) => { self.sql.push_str( "(n.mid,c.ord) in (select ntid,ord from templates where name = ?)", ); - self.args.push(name.to_string()); + self.args.push(s.to_string()); } - } + }, }; Ok(()) } - fn write_note_type(&mut self, nt_name: &str) -> Result<()> { - if let Some(re) = glob_to_re(nt_name) { - let re = format!("(?i){}", re); - self.sql - .push_str("n.mid in (select id from notetypes where name regexp ?)"); - self.args.push(re); - } else { - self.sql - .push_str("n.mid in (select id from notetypes where name = ?)"); - self.args.push(nt_name.to_string()); + fn write_note_type(&mut self, nt_name: &OptionalRe) -> Result<()> { + match nt_name { + OptionalRe::Re(s) => { + let re = format!("(?i){}", s); + self.sql + .push_str("n.mid in (select id from notetypes where name regexp ?)"); + self.args.push(re); + } + OptionalRe::Text(s) => { + self.sql + .push_str("n.mid in (select id from notetypes where name = ?)"); + self.args.push(s.to_string()); + } } Ok(()) } - fn write_single_field(&mut self, field_name: &str, val: &str, is_re: bool) -> Result<()> { + fn write_single_field( + &mut self, + field_name: &OptionalRe, + val: &str, + is_re: bool, + ) -> Result<()> { let note_types = self.col.get_all_notetypes()?; let mut field_map = vec![]; for nt in note_types.values() { for field in &nt.fields { - if matches_wildcard(&field.name, field_name) { + if matches_string_variant(&field.name, field_name) { field_map.push((nt.id, field.ord)); } } @@ -401,7 +407,7 @@ impl SqlWriter<'_> { } else { cmp = "like"; cmp_trailer = "escape '\\'"; - self.args.push(convert_glob_char(val).into()) + self.args.push(val.into()) } let arg_idx = self.args.len(); @@ -455,27 +461,16 @@ impl SqlWriter<'_> { } fn write_word_boundary(&mut self, word: &str) { - // fixme: need to escape in the no-glob case as well - let re = text_to_re(word); - self.write_regex(&format!(r"\b{}\b", re)) + self.write_regex(&format!(r"\b{}\b", word)) } } -/// Replace * with %, leaving \* alone. -fn convert_glob_char(val: &str) -> Cow { - lazy_static! { - static ref RE: Regex = Regex::new(r"(^|[^\\])\*").unwrap(); +/// True if the content of search is equal to text, folding case. +fn matches_string_variant(text: &str, search: &OptionalRe) -> bool { + match search { + OptionalRe::Re(s) => Regex::new(&format!("^(?i){}$", s)).unwrap().is_match(text), + OptionalRe::Text(s) => uni_eq(text, s), } - RE.replace_all(val, "${1}%") -} - -/// Convert a string with _, % or * characters into a regex. -/// If string contains no globbing characters, return None. 
-fn glob_to_re(glob: &str) -> Option { - if !glob.contains(|c| c == '_' || c == '*' || c == '%') { - return None; - } - Some(text_to_re(glob)) } #[derive(Debug, PartialEq, Clone, Copy)] @@ -803,12 +798,4 @@ mod test { RequiredTable::Notes ); } - - #[test] - fn convert_glob() { - assert_eq!(&convert_glob_char("foo*bar"), "foo%bar"); - assert_eq!(&convert_glob_char("*bar"), "%bar"); - assert_eq!(&convert_glob_char("\n*bar"), "\n%bar"); - assert_eq!(&convert_glob_char(r"\*bar"), r"\*bar"); - } } diff --git a/rslib/src/text.rs b/rslib/src/text.rs index 0793281c0..b24b838c9 100644 --- a/rslib/src/text.rs +++ b/rslib/src/text.rs @@ -5,7 +5,6 @@ use lazy_static::lazy_static; use regex::{Captures, Regex}; use std::borrow::Cow; use std::ptr; -use unicase::eq as uni_eq; use unicode_normalization::{ char::is_combining_mark, is_nfc, is_nfkd_quick, IsNormalized, UnicodeNormalization, }; @@ -240,17 +239,6 @@ pub(crate) fn ensure_string_in_nfc(s: &mut String) { } } -/// True if search is equal to text, folding case. -/// Supports '*' to match 0 or more characters. -pub(crate) fn matches_wildcard(text: &str, search: &str) -> bool { - if search.contains('*') { - let search = format!("^(?i){}$", regex::escape(search).replace(r"\*", ".*")); - Regex::new(&search).unwrap().is_match(text) - } else { - uni_eq(text, search) - } -} - /// Convert provided string to NFKD form and strip combining characters. pub(crate) fn without_combining(s: &str) -> Cow { // if the string is already normalized @@ -303,7 +291,6 @@ pub(crate) fn text_to_re(glob: &str) -> String { #[cfg(test)] mod test { - use super::matches_wildcard; use crate::text::without_combining; use crate::text::{ extract_av_tags, strip_av_tags, strip_html, strip_html_preserving_image_filenames, AVTag, @@ -351,15 +338,6 @@ mod test { ); } - #[test] - fn wildcard() { - assert_eq!(matches_wildcard("foo", "bar"), false); - assert_eq!(matches_wildcard("foo", "Foo"), true); - assert_eq!(matches_wildcard("foo", "F*"), true); - assert_eq!(matches_wildcard("foo", "F*oo"), true); - assert_eq!(matches_wildcard("foo", "b*"), false); - } - #[test] fn combining() { assert!(matches!(without_combining("test"), Cow::Borrowed(_))); From b186e61e549b8f0322fecee3aa97ebb246869ee4 Mon Sep 17 00:00:00 2001 From: RumovZ Date: Sat, 14 Nov 2020 18:28:24 +0100 Subject: [PATCH 02/20] Fix 'escaped' parser for empty string Fix a bug where 'escaped' parsers (nom) accepted the empty string by wrapping them in 'verify' parsers. 
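For illustration only (not part of the patch), a minimal standalone sketch of
the pattern, reusing the same nom combinators the parser already imports; the
exact behaviour of 'escaped' on empty input is assumed to match the nom
version used by this crate:

    use nom::{
        bytes::complete::{escaped, is_not},
        character::complete::anychar,
        combinator::verify,
        IResult,
    };

    /// Body of a quoted term: one or more chars, stopping at an unescaped '"'.
    fn quoted_term_inner(s: &str) -> IResult<&str, &str> {
        verify(escaped(is_not(r#""\"#), '\\', anychar), |s: &str| {
            !s.is_empty()
        })(s)
    }

    fn main() {
        // the empty string is rejected instead of matching zero characters
        assert!(quoted_term_inner("").is_err());
        let (rest, inner) = quoted_term_inner(r#"foo\"bar" baz"#).unwrap();
        assert_eq!(inner, r#"foo\"bar"#);
        assert_eq!(rest, r#"" baz"#);
    }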
--- rslib/src/search/parser.rs | 12 ++++++++++-- 1 file changed, 10 insertions(+), 2 deletions(-) diff --git a/rslib/src/search/parser.rs b/rslib/src/search/parser.rs index 44315af0d..37ff504f8 100644 --- a/rslib/src/search/parser.rs +++ b/rslib/src/search/parser.rs @@ -11,7 +11,7 @@ use nom::{ branch::alt, bytes::complete::{escaped, is_not, tag}, character::complete::{anychar, char, none_of, one_of}, - combinator::{all_consuming, map, map_res}, + combinator::{all_consuming, map, map_res, verify}, sequence::{delimited, preceded, separated_pair}, {multi::many0, IResult}, }; @@ -220,7 +220,10 @@ fn search_node_for_text(s: &str) -> ParseResult { /// Unquoted text, terminated by whitespace or unescaped ", ( or ) fn unquoted_term(s: &str) -> IResult<&str, Node> { map_res( + verify( escaped(is_not("\"() \u{3000}\\"), '\\', none_of(" \u{3000}")), + |s: &str| !s.is_empty(), + ), |text: &str| -> ParseResult { Ok(if text.eq_ignore_ascii_case("or") { Node::Or @@ -246,14 +249,19 @@ fn quoted_term_str(s: &str) -> IResult<&str, &str> { /// Quoted text, terminated by a non-escaped double quote fn quoted_term_inner(s: &str) -> IResult<&str, &str> { - escaped(is_not(r#""\"#), '\\', anychar)(s) + verify(escaped(is_not(r#""\"#), '\\', anychar), |s: &str| { + !s.is_empty() + })(s) } /// eg deck:"foo bar" - quotes must come after the : fn partially_quoted_term(s: &str) -> IResult<&str, Node> { map_res( separated_pair( + verify( escaped(is_not("\"(): \u{3000}\\"), '\\', none_of(": \u{3000}")), + |s: &str| !s.is_empty(), + ), char(':'), quoted_term_str, ), From 39499967285714ed30bf1ed9274b926a06583b49 Mon Sep 17 00:00:00 2001 From: RumovZ Date: Sat, 14 Nov 2020 18:32:41 +0100 Subject: [PATCH 03/20] For deck searches, unescape quotes only For now, revert to the old handling of deck names using text_to_re from text.rs and have parser.rs only unescape quotes. --- rslib/src/search/parser.rs | 4 ++-- rslib/src/search/sqlwriter.rs | 1 + 2 files changed, 3 insertions(+), 2 deletions(-) diff --git a/rslib/src/search/parser.rs b/rslib/src/search/parser.rs index 37ff504f8..54fb8c553 100644 --- a/rslib/src/search/parser.rs +++ b/rslib/src/search/parser.rs @@ -69,7 +69,7 @@ pub(super) enum SearchNode<'a> { AddedInDays(u32), EditedInDays(u32), CardTemplate(TemplateKind<'a>), - Deck(String), + Deck(Cow<'a, str>), DeckID(DeckID), NoteTypeID(NoteTypeID), NoteType(OptionalRe<'a>), @@ -280,7 +280,7 @@ fn search_node_for_text_with_argument<'a>( Ok(match key.to_ascii_lowercase().as_str() { "added" => SearchNode::AddedInDays(val.parse()?), "edited" => SearchNode::EditedInDays(val.parse()?), - "deck" => SearchNode::Deck(unescape_to_enforced_re(val)?), + "deck" => SearchNode::Deck(unescape_quotes(val)), "note" => SearchNode::NoteType(unescape_to_re(val)?), "tag" => SearchNode::Tag(parse_tag(val)?), "mid" => SearchNode::NoteTypeID(val.parse()?), diff --git a/rslib/src/search/sqlwriter.rs b/rslib/src/search/sqlwriter.rs index 9f17c555c..5ea422b04 100644 --- a/rslib/src/search/sqlwriter.rs +++ b/rslib/src/search/sqlwriter.rs @@ -319,6 +319,7 @@ impl SqlWriter<'_> { }; // convert to a regex that includes child decks + // fixme: use unescape_to_enforced_re from parser.rs? 
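+        // matches the deck itself or any child deck: name components are
+        // joined with \x1f in storage, hence the ($|\x1f) suffix below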
let re = text_to_re(&native_deck); self.args.push(format!("(?i)^{}($|\x1f)", re)); let arg_idx = self.args.len(); From 836977aac8cc2ac17d286eaa294fb8b5b9f52508 Mon Sep 17 00:00:00 2001 From: RumovZ Date: Sat, 14 Nov 2020 19:10:56 +0100 Subject: [PATCH 04/20] Fix whitespace in write_tag and parser/whitespac0 --- rslib/src/search/parser.rs | 2 +- rslib/src/search/sqlwriter.rs | 2 +- 2 files changed, 2 insertions(+), 2 deletions(-) diff --git a/rslib/src/search/parser.rs b/rslib/src/search/parser.rs index 54fb8c553..1123cd701 100644 --- a/rslib/src/search/parser.rs +++ b/rslib/src/search/parser.rs @@ -188,7 +188,7 @@ fn group_inner(input: &str) -> IResult<&str, Vec> { } fn whitespace0(s: &str) -> IResult<&str, Vec> { - many0(one_of(" \u{3000}\t\n"))(s) + many0(one_of(" \u{3000}"))(s) } /// Optional leading space, then a (negated) group or text diff --git a/rslib/src/search/sqlwriter.rs b/rslib/src/search/sqlwriter.rs index 5ea422b04..e062bab01 100644 --- a/rslib/src/search/sqlwriter.rs +++ b/rslib/src/search/sqlwriter.rs @@ -201,7 +201,7 @@ impl SqlWriter<'_> { } } OptionalRe::Re(s) => { - if s == "*" { + if s == r"\S*" { write!(self.sql, "true").unwrap(); } else { let re = format!("(?i).* {} .*", s); From 9e5348100366da5a5aea3bdaccd55933c20deeb2 Mon Sep 17 00:00:00 2001 From: RumovZ Date: Sat, 14 Nov 2020 19:13:09 +0100 Subject: [PATCH 05/20] Fix tests for new search parsing (and reformat) --- rslib/src/search/parser.rs | 50 ++++++++++++++++++----------------- rslib/src/search/sqlwriter.rs | 13 +++++---- 2 files changed, 32 insertions(+), 31 deletions(-) diff --git a/rslib/src/search/parser.rs b/rslib/src/search/parser.rs index 1123cd701..e4f4cdb93 100644 --- a/rslib/src/search/parser.rs +++ b/rslib/src/search/parser.rs @@ -18,7 +18,6 @@ use nom::{ use regex::{Captures, Regex}; use std::{borrow::Cow, num}; - struct ParseError {} impl From for ParseError { @@ -221,7 +220,7 @@ fn search_node_for_text(s: &str) -> ParseResult { fn unquoted_term(s: &str) -> IResult<&str, Node> { map_res( verify( - escaped(is_not("\"() \u{3000}\\"), '\\', none_of(" \u{3000}")), + escaped(is_not("\"() \u{3000}\\"), '\\', none_of(" \u{3000}")), |s: &str| !s.is_empty(), ), |text: &str| -> ParseResult { @@ -259,7 +258,7 @@ fn partially_quoted_term(s: &str) -> IResult<&str, Node> { map_res( separated_pair( verify( - escaped(is_not("\"(): \u{3000}\\"), '\\', none_of(": \u{3000}")), + escaped(is_not("\"(): \u{3000}\\"), '\\', none_of(": \u{3000}")), |s: &str| !s.is_empty(), ), char(':'), @@ -472,19 +471,17 @@ fn unescape_to_glob(txt: &str) -> ParseResult> { lazy_static! { static ref RE: Regex = Regex::new(r"\\.|[*%]").unwrap(); } - Ok(RE.replace_all(&txt, |caps: &Captures| { - match &caps[0] { - r"\\" => r"\\", - "\\\"" => "\"", - r"\:" => ":", - r"\*" => "*", - r"\_" => r"\_", - r"\(" => "(", - r"\)" => ")", - "*" => "%", - "%" => r"\%", - _ => unreachable!(), - } + Ok(RE.replace_all(&txt, |caps: &Captures| match &caps[0] { + r"\\" => r"\\", + "\\\"" => "\"", + r"\:" => ":", + r"\*" => "*", + r"\_" => r"\_", + r"\(" => "(", + r"\)" => ")", + "*" => "%", + "%" => r"\%", + _ => unreachable!(), })) } } @@ -512,12 +509,12 @@ fn unescape_to_custom_re<'a>(txt: &'a str, wildcard: &str) -> ParseResult