Package version:

Flexibly separates text into terms via a regular expression pattern. This analyzer is implemented using Apache Lucene.

/**
 * Analyzer that flexibly separates text into terms via a regular
 * expression pattern. Implemented using Apache Lucene.
 */
interface PatternAnalyzer {
    /** Regular expression flags. */
    flags?: (
        | "CANON_EQ"
        | "CASE_INSENSITIVE"
        | "COMMENTS"
        | "DOTALL"
        | "LITERAL"
        | "MULTILINE"
        | "UNICODE_CASE"
        | "UNIX_LINES")[];
    /** Whether terms should be lower-cased. Default value: true. */
    lowerCaseTerms?: boolean;
    /**
     * The name of the analyzer. It must only contain letters, digits, spaces,
     * dashes or underscores, can only start and end with alphanumeric
     * characters, and is limited to 128 characters.
     */
    name: string;
    /** Polymorphic discriminator; always this literal for a PatternAnalyzer. */
    odatatype: "#Microsoft.Azure.Search.PatternAnalyzer";
    /** Regular expression pattern to match token separators. Default value: `\W+`. */
    pattern?: string;
    /** A list of stopwords. */
    stopwords?: string[];
}

Properties

flags?: (
    | "CANON_EQ"
    | "CASE_INSENSITIVE"
    | "COMMENTS"
    | "DOTALL"
    | "LITERAL"
    | "MULTILINE"
    | "UNICODE_CASE"
    | "UNIX_LINES")[]

Regular expression flags. Possible values include: 'CANON_EQ', 'CASE_INSENSITIVE', 'COMMENTS', 'DOTALL', 'LITERAL', 'MULTILINE', 'UNICODE_CASE', 'UNIX_LINES'

lowerCaseTerms?: boolean

A value indicating whether terms should be lower-cased. Default value: true.

name: string

The name of the analyzer. It must only contain letters, digits, spaces, dashes or underscores, can only start and end with alphanumeric characters, and is limited to 128 characters.

odatatype: "#Microsoft.Azure.Search.PatternAnalyzer"

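Polymorphic discriminator that identifies the analyzer type. For a PatternAnalyzer it is always "#Microsoft.Azure.Search.PatternAnalyzer".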

pattern?: string

A regular expression pattern to match token separators. Default is an expression that matches one or more non-word characters. Default value: \W+.

stopwords?: string[]

A list of stopwords.