# -------------------------------------------------------------------------
# Copyright (c) Microsoft Corporation. All rights reserved.
# Licensed under the MIT License. See License.txt in the project root for
# license information.
# --------------------------------------------------------------------------
from typing import Any, Dict, Union, List, Optional, MutableMapping, Callable, cast
from typing_extensions import Self
from .._generated import _serialization
from ._edm import Collection, ComplexType, String
from .._generated.models import (
SearchField as _SearchField,
SearchIndex as _SearchIndex,
PatternTokenizer as _PatternTokenizer,
LexicalAnalyzerName,
VectorEncodingFormat,
SearchFieldDataType,
ScoringProfile,
CorsOptions,
SearchSuggester,
LexicalAnalyzer,
LexicalTokenizer,
TokenFilter,
CharFilter,
SimilarityAlgorithm,
SemanticSearch,
VectorSearch,
)
from ._models import (
pack_analyzer,
unpack_analyzer,
PatternTokenizer,
SearchResourceEncryptionKey,
)
# Names exported by a star-import of this module: only the three field factory
# helpers. The SearchField and SearchIndex classes defined in this file are
# not listed here.
__all__ = ("ComplexField", "SearchableField", "SimpleField")
class SearchField(_serialization.Model):
    # pylint: disable=too-many-instance-attributes
    """Represents a field in an index definition, which describes the name, data type, and search behavior of a field.

    All required parameters must be populated in order to send to Azure.

    :ivar name: The name of the field, which must be unique within the fields collection of the
     index or parent field. Required.
    :vartype name: str
    :ivar type: The data type of the field. Required. Known values are: "Edm.String", "Edm.Int32",
     "Edm.Int64", "Edm.Double", "Edm.Boolean", "Edm.DateTimeOffset", "Edm.GeographyPoint",
     "Edm.ComplexType", "Edm.Single", "Edm.Half", "Edm.Int16", "Edm.SByte", and "Edm.Byte".
    :vartype type: str or ~azure.search.documents.indexes.models.SearchFieldDataType
    :ivar key: A value indicating whether the field uniquely identifies documents in the index.
     Exactly one top-level field in each index must be chosen as the key field and it must be of
     type Edm.String. Key fields can be used to look up documents directly and update or delete
     specific documents. Default is false for simple fields and null for complex fields.
    :vartype key: bool
    :ivar hidden: A value indicating whether the field is kept out of search results. You can
     enable this option if you want to use a field (for example, margin) as a filter, sorting, or
     scoring mechanism but do not want the field to be visible to the end user. This property must
     be False for key fields. It is converted to the inverse of the generated model's
     ``retrievable`` property; when it is None, ``retrievable`` is left as None as well.
    :vartype hidden: bool
    :ivar stored: An immutable value indicating whether the field will be persisted separately on
     disk to be returned in a search result. You can disable this option if you don't plan to return
     the field contents in a search response to save on storage overhead. This can only be set
     during index creation and only for vector fields. This property cannot be changed for existing
     fields or set as false for new fields. If this property is set as false, the property
     'hidden' must be set to true. This property must be true or unset for key fields,
     for new fields, and for non-vector fields, and it must be null for complex fields. Disabling
     this property will reduce index storage requirements. The default is true for vector fields.
    :vartype stored: bool
    :ivar searchable: A value indicating whether the field is full-text searchable. This means it
     will undergo analysis such as word-breaking during indexing. If you set a searchable field to a
     value like "sunny day", internally it will be split into the individual tokens "sunny" and
     "day". This enables full-text searches for these terms. Fields of type Edm.String or
     Collection(Edm.String) are searchable by default. This property must be false for simple fields
     of other non-string data types, and it must be null for complex fields. Note: searchable fields
     consume extra space in your index since Azure Cognitive Search will store an additional
     tokenized version of the field value for full-text searches. If you want to save space in your
     index and you don't need a field to be included in searches, set searchable to false.
    :vartype searchable: bool
    :ivar filterable: A value indicating whether to enable the field to be referenced in $filter
     queries. filterable differs from searchable in how strings are handled. Fields of type
     Edm.String or Collection(Edm.String) that are filterable do not undergo word-breaking, so
     comparisons are for exact matches only. For example, if you set such a field f to "sunny day",
     $filter=f eq 'sunny' will find no matches, but $filter=f eq 'sunny day' will. This property
     must be null for complex fields. Default is true for simple fields and null for complex fields.
    :vartype filterable: bool
    :ivar sortable: A value indicating whether to enable the field to be referenced in $orderby
     expressions. By default Azure Cognitive Search sorts results by score, but in many experiences
     users will want to sort by fields in the documents. A simple field can be sortable only if it
     is single-valued (it has a single value in the scope of the parent document). Simple collection
     fields cannot be sortable, since they are multi-valued. Simple sub-fields of complex
     collections are also multi-valued, and therefore cannot be sortable. This is true whether it's
     an immediate parent field, or an ancestor field, that's the complex collection. Complex fields
     cannot be sortable and the sortable property must be null for such fields. The default for
     sortable is true for single-valued simple fields, false for multi-valued simple fields, and
     null for complex fields.
    :vartype sortable: bool
    :ivar facetable: A value indicating whether to enable the field to be referenced in facet
     queries. Typically used in a presentation of search results that includes hit count by category
     (for example, search for digital cameras and see hits by brand, by megapixels, by price, and so
     on). This property must be null for complex fields. Fields of type Edm.GeographyPoint or
     Collection(Edm.GeographyPoint) cannot be facetable. Default is true for all other simple
     fields.
    :vartype facetable: bool
    :ivar analyzer_name: The name of the analyzer to use for the field. This option can be used only
     with searchable fields and it can't be set together with either searchAnalyzer or
     indexAnalyzer. Once the analyzer is chosen, it cannot be changed for the field. Must be null
     for complex fields. Known values are: "ar.microsoft", "ar.lucene", "hy.lucene", "bn.microsoft",
     "eu.lucene", "bg.microsoft", "bg.lucene", "ca.microsoft", "ca.lucene", "zh-Hans.microsoft",
     "zh-Hans.lucene", "zh-Hant.microsoft", "zh-Hant.lucene", "hr.microsoft", "cs.microsoft",
     "cs.lucene", "da.microsoft", "da.lucene", "nl.microsoft", "nl.lucene", "en.microsoft",
     "en.lucene", "et.microsoft", "fi.microsoft", "fi.lucene", "fr.microsoft", "fr.lucene",
     "gl.lucene", "de.microsoft", "de.lucene", "el.microsoft", "el.lucene", "gu.microsoft",
     "he.microsoft", "hi.microsoft", "hi.lucene", "hu.microsoft", "hu.lucene", "is.microsoft",
     "id.microsoft", "id.lucene", "ga.lucene", "it.microsoft", "it.lucene", "ja.microsoft",
     "ja.lucene", "kn.microsoft", "ko.microsoft", "ko.lucene", "lv.microsoft", "lv.lucene",
     "lt.microsoft", "ml.microsoft", "ms.microsoft", "mr.microsoft", "nb.microsoft", "no.lucene",
     "fa.lucene", "pl.microsoft", "pl.lucene", "pt-BR.microsoft", "pt-BR.lucene", "pt-PT.microsoft",
     "pt-PT.lucene", "pa.microsoft", "ro.microsoft", "ro.lucene", "ru.microsoft", "ru.lucene",
     "sr-cyrillic.microsoft", "sr-latin.microsoft", "sk.microsoft", "sl.microsoft", "es.microsoft",
     "es.lucene", "sv.microsoft", "sv.lucene", "ta.microsoft", "te.microsoft", "th.microsoft",
     "th.lucene", "tr.microsoft", "tr.lucene", "uk.microsoft", "ur.microsoft", "vi.microsoft",
     "standard.lucene", "standardasciifolding.lucene", "keyword", "pattern", "simple", "stop", and
     "whitespace".
    :vartype analyzer_name: str or ~azure.search.documents.indexes.models.LexicalAnalyzerName
    :ivar search_analyzer_name: The name of the analyzer used at search time for the field. This option
     can be used only with searchable fields. It must be set together with indexAnalyzer and it
     cannot be set together with the analyzer option. This property cannot be set to the name of a
     language analyzer; use the analyzer property instead if you need a language analyzer. This
     analyzer can be updated on an existing field. Must be null for complex fields. Known values
     are: "ar.microsoft", "ar.lucene", "hy.lucene", "bn.microsoft", "eu.lucene", "bg.microsoft",
     "bg.lucene", "ca.microsoft", "ca.lucene", "zh-Hans.microsoft", "zh-Hans.lucene",
     "zh-Hant.microsoft", "zh-Hant.lucene", "hr.microsoft", "cs.microsoft", "cs.lucene",
     "da.microsoft", "da.lucene", "nl.microsoft", "nl.lucene", "en.microsoft", "en.lucene",
     "et.microsoft", "fi.microsoft", "fi.lucene", "fr.microsoft", "fr.lucene", "gl.lucene",
     "de.microsoft", "de.lucene", "el.microsoft", "el.lucene", "gu.microsoft", "he.microsoft",
     "hi.microsoft", "hi.lucene", "hu.microsoft", "hu.lucene", "is.microsoft", "id.microsoft",
     "id.lucene", "ga.lucene", "it.microsoft", "it.lucene", "ja.microsoft", "ja.lucene",
     "kn.microsoft", "ko.microsoft", "ko.lucene", "lv.microsoft", "lv.lucene", "lt.microsoft",
     "ml.microsoft", "ms.microsoft", "mr.microsoft", "nb.microsoft", "no.lucene", "fa.lucene",
     "pl.microsoft", "pl.lucene", "pt-BR.microsoft", "pt-BR.lucene", "pt-PT.microsoft",
     "pt-PT.lucene", "pa.microsoft", "ro.microsoft", "ro.lucene", "ru.microsoft", "ru.lucene",
     "sr-cyrillic.microsoft", "sr-latin.microsoft", "sk.microsoft", "sl.microsoft", "es.microsoft",
     "es.lucene", "sv.microsoft", "sv.lucene", "ta.microsoft", "te.microsoft", "th.microsoft",
     "th.lucene", "tr.microsoft", "tr.lucene", "uk.microsoft", "ur.microsoft", "vi.microsoft",
     "standard.lucene", "standardasciifolding.lucene", "keyword", "pattern", "simple", "stop", and
     "whitespace".
    :vartype search_analyzer_name: str or ~azure.search.documents.indexes.models.LexicalAnalyzerName
    :ivar index_analyzer_name: The name of the analyzer used at indexing time for the field. This option
     can be used only with searchable fields. It must be set together with searchAnalyzer and it
     cannot be set together with the analyzer option. This property cannot be set to the name of a
     language analyzer; use the analyzer property instead if you need a language analyzer. Once the
     analyzer is chosen, it cannot be changed for the field. Must be null for complex fields. Known
     values are: "ar.microsoft", "ar.lucene", "hy.lucene", "bn.microsoft", "eu.lucene",
     "bg.microsoft", "bg.lucene", "ca.microsoft", "ca.lucene", "zh-Hans.microsoft",
     "zh-Hans.lucene", "zh-Hant.microsoft", "zh-Hant.lucene", "hr.microsoft", "cs.microsoft",
     "cs.lucene", "da.microsoft", "da.lucene", "nl.microsoft", "nl.lucene", "en.microsoft",
     "en.lucene", "et.microsoft", "fi.microsoft", "fi.lucene", "fr.microsoft", "fr.lucene",
     "gl.lucene", "de.microsoft", "de.lucene", "el.microsoft", "el.lucene", "gu.microsoft",
     "he.microsoft", "hi.microsoft", "hi.lucene", "hu.microsoft", "hu.lucene", "is.microsoft",
     "id.microsoft", "id.lucene", "ga.lucene", "it.microsoft", "it.lucene", "ja.microsoft",
     "ja.lucene", "kn.microsoft", "ko.microsoft", "ko.lucene", "lv.microsoft", "lv.lucene",
     "lt.microsoft", "ml.microsoft", "ms.microsoft", "mr.microsoft", "nb.microsoft", "no.lucene",
     "fa.lucene", "pl.microsoft", "pl.lucene", "pt-BR.microsoft", "pt-BR.lucene", "pt-PT.microsoft",
     "pt-PT.lucene", "pa.microsoft", "ro.microsoft", "ro.lucene", "ru.microsoft", "ru.lucene",
     "sr-cyrillic.microsoft", "sr-latin.microsoft", "sk.microsoft", "sl.microsoft", "es.microsoft",
     "es.lucene", "sv.microsoft", "sv.lucene", "ta.microsoft", "te.microsoft", "th.microsoft",
     "th.lucene", "tr.microsoft", "tr.lucene", "uk.microsoft", "ur.microsoft", "vi.microsoft",
     "standard.lucene", "standardasciifolding.lucene", "keyword", "pattern", "simple", "stop", and
     "whitespace".
    :vartype index_analyzer_name: str or ~azure.search.documents.indexes.models.LexicalAnalyzerName
    :ivar vector_search_dimensions: The dimensionality of the vector field.
    :vartype vector_search_dimensions: int
    :ivar vector_search_profile_name: The name of the vector search profile that specifies the algorithm
     to use when searching the vector field.
    :vartype vector_search_profile_name: str
    :ivar synonym_map_names: A list of the names of synonym maps to associate with this field. This
     option can be used only with searchable fields. Currently only one synonym map per field is
     supported. Assigning a synonym map to a field ensures that query terms targeting that field are
     expanded at query-time using the rules in the synonym map. This attribute can be changed on
     existing fields. Must be null or an empty collection for complex fields.
    :vartype synonym_map_names: list[str]
    :ivar fields: A list of sub-fields if this is a field of type Edm.ComplexType or
     Collection(Edm.ComplexType). Must be null or empty for simple fields.
    :vartype fields: list[~azure.search.documents.indexes.models.SearchField]
    :ivar vector_encoding_format: The encoding format to interpret the field contents. Known
     value: "packedBit".
    :vartype vector_encoding_format: str or ~azure.search.documents.indexes.models.VectorEncodingFormat
    """

    def __init__(
        self,
        *,
        name: str,
        type: Union[str, SearchFieldDataType],
        key: Optional[bool] = None,
        hidden: Optional[bool] = None,
        stored: Optional[bool] = None,
        searchable: Optional[bool] = None,
        filterable: Optional[bool] = None,
        sortable: Optional[bool] = None,
        facetable: Optional[bool] = None,
        analyzer_name: Optional[Union[str, LexicalAnalyzerName]] = None,
        search_analyzer_name: Optional[Union[str, LexicalAnalyzerName]] = None,
        index_analyzer_name: Optional[Union[str, LexicalAnalyzerName]] = None,
        synonym_map_names: Optional[List[str]] = None,
        fields: Optional[List["SearchField"]] = None,
        vector_search_dimensions: Optional[int] = None,
        vector_search_profile_name: Optional[str] = None,
        vector_encoding_format: Optional[Union[str, VectorEncodingFormat]] = None,
        **kwargs: Any
    ) -> None:
        # Any extra keyword arguments are forwarded untouched to the base model.
        super().__init__(**kwargs)
        self.name = name
        self.type = type
        self.key = key
        self.hidden = hidden
        self.stored = stored
        self.searchable = searchable
        self.filterable = filterable
        self.sortable = sortable
        self.facetable = facetable
        self.analyzer_name = analyzer_name
        self.search_analyzer_name = search_analyzer_name
        self.index_analyzer_name = index_analyzer_name
        self.synonym_map_names = synonym_map_names
        self.fields = fields
        self.vector_search_dimensions = vector_search_dimensions
        self.vector_search_profile_name = vector_search_profile_name
        self.vector_encoding_format = vector_encoding_format

    def _to_generated(self) -> _SearchField:
        """Build the generated ``_SearchField`` model that mirrors this field.

        :returns: The generated model carrying this field's settings.
        :rtype: _SearchField
        """
        # pack_search_field is defined outside this class (not visible in this part of the
        # file); presumably it converts each sub-field to its generated form -- confirm.
        # An empty or missing sub-field list is sent as None.
        fields = [pack_search_field(x) for x in self.fields] if self.fields else None
        # The generated model exposes "retrievable", the inverse of "hidden". None is kept
        # as None so that an unset value is not turned into an explicit True/False.
        retrievable = not self.hidden if self.hidden is not None else None
        return _SearchField(
            name=self.name,
            type=self.type,
            key=self.key,
            retrievable=retrievable,
            stored=self.stored,
            searchable=self.searchable,
            filterable=self.filterable,
            sortable=self.sortable,
            facetable=self.facetable,
            analyzer=self.analyzer_name,
            search_analyzer=self.search_analyzer_name,
            index_analyzer=self.index_analyzer_name,
            synonym_maps=self.synonym_map_names,
            fields=fields,
            vector_search_dimensions=self.vector_search_dimensions,
            vector_search_profile_name=self.vector_search_profile_name,
            vector_encoding_format=self.vector_encoding_format,
        )

    @classmethod
    def _from_generated(cls, search_field) -> Optional[Self]:
        """Create an instance from a generated ``_SearchField`` model.

        :param search_field: The generated model to convert; a falsy value yields None.
        :returns: The converted field, or None when ``search_field`` is falsy.
        """
        if not search_field:
            return None
        # pylint:disable=protected-access
        # Sub-fields are converted recursively. They are always built as SearchField, and the
        # cast drops the Optional because each element comes from a non-empty list.
        fields = (
            [cast(SearchField, SearchField._from_generated(x)) for x in search_field.fields]
            if search_field.fields
            else None
        )
        # Inverse of the mapping in _to_generated: retrievable -> hidden, with None preserved.
        hidden = not search_field.retrievable if search_field.retrievable is not None else None
        return cls(
            name=search_field.name,
            type=search_field.type,
            key=search_field.key,
            hidden=hidden,
            stored=search_field.stored,
            searchable=search_field.searchable,
            filterable=search_field.filterable,
            sortable=search_field.sortable,
            facetable=search_field.facetable,
            analyzer_name=search_field.analyzer,
            search_analyzer_name=search_field.search_analyzer,
            index_analyzer_name=search_field.index_analyzer,
            synonym_map_names=search_field.synonym_maps,
            fields=fields,
            vector_search_dimensions=search_field.vector_search_dimensions,
            vector_search_profile_name=search_field.vector_search_profile_name,
            vector_encoding_format=search_field.vector_encoding_format,
        )

    def serialize(self, keep_readonly: bool = False, **kwargs: Any) -> MutableMapping[str, Any]:
        """Return the JSON that would be sent to server from this model.

        The field is first converted to its generated model, which performs the serialization.

        :param bool keep_readonly: If you want to serialize the readonly attributes
        :returns: A dict JSON compatible object
        :rtype: dict
        """
        return self._to_generated().serialize(keep_readonly=keep_readonly, **kwargs)

    @classmethod
    def deserialize(cls, data: Any, content_type: Optional[str] = None) -> Optional[Self]:  # type: ignore
        """Parse a str using the RestAPI syntax and return a SearchField instance.

        :param str data: A str using RestAPI structure. JSON by default.
        :param str content_type: JSON by default, set application/xml if XML.
        :returns: A SearchField instance
        :rtype: SearchField
        :raises: DeserializationError if something went wrong
        """
        return cls._from_generated(_SearchField.deserialize(data, content_type=content_type))

    def as_dict(
        self,
        keep_readonly: bool = True,
        key_transformer: Callable[[str, Dict[str, Any], Any], Any] = _serialization.attribute_transformer,
        **kwargs: Any
    ) -> MutableMapping[str, Any]:
        """Return a dict that can be serialized using json.dump.

        The field is first converted to its generated model, which builds the dict.

        :param bool keep_readonly: If you want to serialize the readonly attributes
        :param Callable key_transformer: A callable that will transform the key of the dict
        :returns: A dict JSON compatible object
        :rtype: dict
        """
        return self._to_generated().as_dict(  # type: ignore
            keep_readonly=keep_readonly, key_transformer=key_transformer, **kwargs
        )

    @classmethod
    def from_dict(  # type: ignore
        cls,
        data: Any,
        key_extractors: Optional[Callable[[str, Dict[str, Any], Any], Any]] = None,
        content_type: Optional[str] = None,
    ) -> Optional[Self]:
        """Parse a dict using given key extractor return a model.

        By default consider key
        extractors (rest_key_case_insensitive_extractor, attribute_key_case_insensitive_extractor
        and last_rest_key_case_insensitive_extractor)

        :param dict data: A dict using RestAPI structure
        :param Callable key_extractors: A callable that will extract a key from a dict
        :param str content_type: JSON by default, set application/xml if XML.
        :returns: A SearchField instance
        :rtype: SearchField
        :raises: DeserializationError if something went wrong
        """
        return cls._from_generated(
            _SearchField.from_dict(data, content_type=content_type, key_extractors=key_extractors)
        )
def SimpleField(
    *,
    name: str,
    type: str,
    key: bool = False,
    hidden: bool = False,
    filterable: bool = False,
    sortable: bool = False,
    facetable: bool = False,
    **kw  # pylint:disable=unused-argument
) -> SearchField:
    """Create a non-searchable simple field for an Azure Search index.

    The returned field always has ``searchable`` set to False; all other settings are taken
    from the keyword arguments. Additional keyword arguments are accepted and ignored.

    :keyword name: Required. The field name. It must be unique within the fields collection of
        the index or of the parent field.
    :paramtype name: str
    :keyword type: Required. The data type of the field, for example SearchFieldDataType.String,
        SearchFieldDataType.Int32, SearchFieldDataType.Int64, SearchFieldDataType.Double,
        SearchFieldDataType.Boolean, SearchFieldDataType.DateTimeOffset,
        SearchFieldDataType.GeographyPoint or SearchFieldDataType.ComplexType.
    :paramtype type: str
    :keyword key: Whether the field uniquely identifies documents in the index. Exactly one
        top-level field per index must be the key, and it must be of type
        SearchFieldDataType.String. Key fields can be used to look up documents directly and to
        update or delete specific documents. Default is False.
    :paramtype key: bool
    :keyword hidden: Set to True to keep the field out of search results, for instance when a
        field (such as margin) is only used for filtering, sorting, or scoring and should not be
        visible to the end user. Must be False for key fields. Can be changed on existing fields,
        and enabling it does not increase index storage requirements. Default is False.
    :paramtype hidden: bool
    :keyword filterable: Whether the field can be referenced in $filter queries. Unlike
        searchable fields, filterable fields of type SearchFieldDataType.String or
        Collection(SearchFieldDataType.String) do not undergo word-breaking, so comparisons are
        exact matches only: with a field f set to "sunny day", $filter=f eq 'sunny' finds no
        matches but $filter=f eq 'sunny day' does. Must be null for complex fields. Default is
        False.
    :paramtype filterable: bool
    :keyword sortable: Whether the field can be referenced in $orderby expressions. By default
        Azure Cognitive Search sorts results by score, but many experiences sort by document
        fields instead. A simple field can be sortable only if it is single-valued within the
        parent document. Simple collection fields, and simple sub-fields of a complex collection
        (whether the collection is the immediate parent or a more distant ancestor), are
        multi-valued and therefore cannot be sortable. Default is False.
    :paramtype sortable: bool
    :keyword facetable: Whether the field can be referenced in facet queries, typically to show
        hit counts by category (for example, digital cameras by brand, by megapixels, by price,
        and so on). Fields of type SearchFieldDataType.GeographyPoint or
        Collection(SearchFieldDataType.GeographyPoint) cannot be facetable. Default is False.
    :paramtype facetable: bool
    :return: The search field object.
    :rtype: SearchField
    """
    # A simple field is never full-text searchable, so that flag is fixed here.
    return SearchField(
        name=name,
        type=type,
        key=key,
        hidden=hidden,
        searchable=False,
        filterable=filterable,
        sortable=sortable,
        facetable=facetable,
    )
def SearchableField(
    *,
    name: str,
    collection: bool = False,
    key: bool = False,
    hidden: bool = False,
    searchable: bool = True,
    filterable: bool = False,
    sortable: bool = False,
    facetable: bool = False,
    analyzer_name: Optional[Union[str, LexicalAnalyzerName]] = None,
    search_analyzer_name: Optional[Union[str, LexicalAnalyzerName]] = None,
    index_analyzer_name: Optional[Union[str, LexicalAnalyzerName]] = None,
    synonym_map_names: Optional[List[str]] = None,
    **kw  # pylint:disable=unused-argument
) -> SearchField:
    """Create a searchable text field for an Azure Search index.

    The field type is a string, or a collection of strings when ``collection`` is True.
    Analyzer and synonym-map settings are only passed on when they are truthy. Additional
    keyword arguments are accepted and ignored.

    :keyword name: Required. The field name. It must be unique within the fields collection of
        the index or of the parent field.
    :paramtype name: str
    :keyword collection: Whether this search field is a collection (default False)
    :paramtype collection: bool
    :keyword key: Whether the field uniquely identifies documents in the index. Exactly one
        top-level field per index must be the key, and it must be of type
        SearchFieldDataType.String. Key fields can be used to look up documents directly and to
        update or delete specific documents. Default is False.
    :paramtype key: bool
    :keyword hidden: Set to True to keep the field out of search results, for instance when a
        field (such as margin) is only used for filtering, sorting, or scoring and should not be
        visible to the end user. Must be False for key fields. Can be changed on existing fields,
        and enabling it does not increase index storage requirements. Default is False.
    :paramtype hidden: bool
    :keyword searchable: Whether the field is full-text searchable, meaning it undergoes
        analysis such as word-breaking during indexing. A searchable field set to "sunny day" is
        split internally into the tokens "sunny" and "day", which enables full-text searches for
        those terms. Note: searchable fields consume extra space in the index because Azure
        Cognitive Search stores an additional tokenized version of the value. To save space when
        a field does not need to be included in searches, set searchable to false. Default is
        True.
    :paramtype searchable: bool
    :keyword filterable: Whether the field can be referenced in $filter queries. Unlike
        searchable fields, filterable fields do not undergo word-breaking, so comparisons are
        exact matches only: with a field f set to "sunny day", $filter=f eq 'sunny' finds no
        matches but $filter=f eq 'sunny day' does. Default is False.
    :paramtype filterable: bool
    :keyword sortable: Whether the field can be referenced in $orderby expressions. By default
        Azure Cognitive Search sorts results by score, but many experiences sort by document
        fields instead. Default is False.
    :paramtype sortable: bool
    :keyword facetable: Whether the field can be referenced in facet queries, typically to show
        hit counts by category (for example, digital cameras by brand, by megapixels, by price,
        and so on). Default is False.
    :paramtype facetable: bool
    :keyword analyzer_name: The name of the analyzer to use for the field. It can't be set
        together with either searchAnalyzer or indexAnalyzer. Once the analyzer is chosen, it
        cannot be changed for the field. Possible values include:
        'ar.microsoft', 'ar.lucene', 'hy.lucene', 'bn.microsoft', 'eu.lucene', 'bg.microsoft',
        'bg.lucene', 'ca.microsoft', 'ca.lucene', 'zh-Hans.microsoft', 'zh-Hans.lucene',
        'zh-Hant.microsoft', 'zh-Hant.lucene', 'hr.microsoft', 'cs.microsoft', 'cs.lucene',
        'da.microsoft', 'da.lucene', 'nl.microsoft', 'nl.lucene', 'en.microsoft', 'en.lucene',
        'et.microsoft', 'fi.microsoft', 'fi.lucene', 'fr.microsoft', 'fr.lucene', 'gl.lucene',
        'de.microsoft', 'de.lucene', 'el.microsoft', 'el.lucene', 'gu.microsoft', 'he.microsoft',
        'hi.microsoft', 'hi.lucene', 'hu.microsoft', 'hu.lucene', 'is.microsoft', 'id.microsoft',
        'id.lucene', 'ga.lucene', 'it.microsoft', 'it.lucene', 'ja.microsoft', 'ja.lucene',
        'kn.microsoft', 'ko.microsoft', 'ko.lucene', 'lv.microsoft', 'lv.lucene', 'lt.microsoft',
        'ml.microsoft', 'ms.microsoft', 'mr.microsoft', 'nb.microsoft', 'no.lucene', 'fa.lucene',
        'pl.microsoft', 'pl.lucene', 'pt-BR.microsoft', 'pt-BR.lucene', 'pt-PT.microsoft',
        'pt-PT.lucene', 'pa.microsoft', 'ro.microsoft', 'ro.lucene', 'ru.microsoft', 'ru.lucene',
        'sr-cyrillic.microsoft', 'sr-latin.microsoft', 'sk.microsoft', 'sl.microsoft',
        'es.microsoft', 'es.lucene', 'sv.microsoft', 'sv.lucene', 'ta.microsoft', 'te.microsoft',
        'th.microsoft', 'th.lucene', 'tr.microsoft', 'tr.lucene', 'uk.microsoft', 'ur.microsoft',
        'vi.microsoft', 'standard.lucene', 'standardasciifolding.lucene', 'keyword', 'pattern',
        'simple', 'stop', 'whitespace'.
    :paramtype analyzer_name: str or ~azure.search.documents.indexes.models.LexicalAnalyzerName
    :keyword search_analyzer_name: The name of the analyzer used at search time for the field.
        It must be set together with indexAnalyzer and it cannot be set together with the
        analyzer option. It cannot be set to the name of a language analyzer; use the analyzer
        property instead if you need a language analyzer. This analyzer can be updated on an
        existing field. Possible values include:
        'ar.microsoft', 'ar.lucene', 'hy.lucene', 'bn.microsoft', 'eu.lucene', 'bg.microsoft',
        'bg.lucene', 'ca.microsoft', 'ca.lucene', 'zh-Hans.microsoft', 'zh-Hans.lucene',
        'zh-Hant.microsoft', 'zh-Hant.lucene', 'hr.microsoft', 'cs.microsoft', 'cs.lucene',
        'da.microsoft', 'da.lucene', 'nl.microsoft', 'nl.lucene', 'en.microsoft', 'en.lucene',
        'et.microsoft', 'fi.microsoft', 'fi.lucene', 'fr.microsoft', 'fr.lucene', 'gl.lucene',
        'de.microsoft', 'de.lucene', 'el.microsoft', 'el.lucene', 'gu.microsoft', 'he.microsoft',
        'hi.microsoft', 'hi.lucene', 'hu.microsoft', 'hu.lucene', 'is.microsoft', 'id.microsoft',
        'id.lucene', 'ga.lucene', 'it.microsoft', 'it.lucene', 'ja.microsoft', 'ja.lucene',
        'kn.microsoft', 'ko.microsoft', 'ko.lucene', 'lv.microsoft', 'lv.lucene', 'lt.microsoft',
        'ml.microsoft', 'ms.microsoft', 'mr.microsoft', 'nb.microsoft', 'no.lucene', 'fa.lucene',
        'pl.microsoft', 'pl.lucene', 'pt-BR.microsoft', 'pt-BR.lucene', 'pt-PT.microsoft',
        'pt-PT.lucene', 'pa.microsoft', 'ro.microsoft', 'ro.lucene', 'ru.microsoft', 'ru.lucene',
        'sr-cyrillic.microsoft', 'sr-latin.microsoft', 'sk.microsoft', 'sl.microsoft',
        'es.microsoft', 'es.lucene', 'sv.microsoft', 'sv.lucene', 'ta.microsoft', 'te.microsoft',
        'th.microsoft', 'th.lucene', 'tr.microsoft', 'tr.lucene', 'uk.microsoft', 'ur.microsoft',
        'vi.microsoft', 'standard.lucene', 'standardasciifolding.lucene', 'keyword', 'pattern',
        'simple', 'stop', 'whitespace'.
    :paramtype search_analyzer_name: str or ~azure.search.documents.indexes.models.LexicalAnalyzerName
    :keyword index_analyzer_name: The name of the analyzer used at indexing time for the field.
        It must be set together with searchAnalyzer and it cannot be set together with the
        analyzer option. It cannot be set to the name of a language analyzer; use the analyzer
        property instead if you need a language analyzer. Once the analyzer is chosen, it cannot
        be changed for the field. Possible values include:
        'ar.microsoft', 'ar.lucene', 'hy.lucene', 'bn.microsoft', 'eu.lucene', 'bg.microsoft',
        'bg.lucene', 'ca.microsoft', 'ca.lucene', 'zh-Hans.microsoft', 'zh-Hans.lucene',
        'zh-Hant.microsoft', 'zh-Hant.lucene', 'hr.microsoft', 'cs.microsoft', 'cs.lucene',
        'da.microsoft', 'da.lucene', 'nl.microsoft', 'nl.lucene', 'en.microsoft', 'en.lucene',
        'et.microsoft', 'fi.microsoft', 'fi.lucene', 'fr.microsoft', 'fr.lucene', 'gl.lucene',
        'de.microsoft', 'de.lucene', 'el.microsoft', 'el.lucene', 'gu.microsoft', 'he.microsoft',
        'hi.microsoft', 'hi.lucene', 'hu.microsoft', 'hu.lucene', 'is.microsoft', 'id.microsoft',
        'id.lucene', 'ga.lucene', 'it.microsoft', 'it.lucene', 'ja.microsoft', 'ja.lucene',
        'kn.microsoft', 'ko.microsoft', 'ko.lucene', 'lv.microsoft', 'lv.lucene', 'lt.microsoft',
        'ml.microsoft', 'ms.microsoft', 'mr.microsoft', 'nb.microsoft', 'no.lucene', 'fa.lucene',
        'pl.microsoft', 'pl.lucene', 'pt-BR.microsoft', 'pt-BR.lucene', 'pt-PT.microsoft',
        'pt-PT.lucene', 'pa.microsoft', 'ro.microsoft', 'ro.lucene', 'ru.microsoft', 'ru.lucene',
        'sr-cyrillic.microsoft', 'sr-latin.microsoft', 'sk.microsoft', 'sl.microsoft',
        'es.microsoft', 'es.lucene', 'sv.microsoft', 'sv.lucene', 'ta.microsoft', 'te.microsoft',
        'th.microsoft', 'th.lucene', 'tr.microsoft', 'tr.lucene', 'uk.microsoft', 'ur.microsoft',
        'vi.microsoft', 'standard.lucene', 'standardasciifolding.lucene', 'keyword', 'pattern',
        'simple', 'stop', 'whitespace'.
    :paramtype index_analyzer_name: str or ~azure.search.documents.indexes.models.LexicalAnalyzerName
    :keyword synonym_map_names: A list of the names of synonym maps to associate with this
        field. Currently only one synonym map per field is supported. Assigning a synonym map to
        a field ensures that query terms targeting that field are expanded at query-time using
        the rules in the synonym map. This attribute can be changed on existing fields.
    :paramtype synonym_map_names: list[str]
    :return: The search field object.
    :rtype: SearchField
    """
    if collection:
        field_type = Collection(String)
    else:
        field_type = String

    # Settings that are only forwarded when truthy; a falsy value (None, "" or an empty list)
    # is left out so that SearchField falls back to its own default for that argument.
    optional_settings: Dict[str, Any] = {
        "analyzer_name": analyzer_name,
        "search_analyzer_name": search_analyzer_name,
        "index_analyzer_name": index_analyzer_name,
        "synonym_map_names": synonym_map_names,
    }
    provided = {setting: value for setting, value in optional_settings.items() if value}

    return SearchField(
        name=name,
        type=field_type,
        key=key,
        searchable=searchable,
        filterable=filterable,
        facetable=facetable,
        sortable=sortable,
        hidden=hidden,
        **provided,
    )
def ComplexField(
    *,
    name: str,
    collection: bool = False,
    fields: Optional[List[SearchField]] = None,
    **kw  # pylint:disable=unused-argument
) -> SearchField:
    """Create a complex field, or a collection of complex fields, for an Azure Search index.

    Only the name, type and sub-fields are set on the returned field. Additional keyword
    arguments are accepted and ignored.

    :keyword name: Required. The field name. It must be unique within the fields collection of
        the index or of the parent field.
    :paramtype name: str
    :keyword collection: Whether this complex field is a collection (default False)
    :paramtype collection: bool
    :keyword fields: A list of sub-fields
    :paramtype fields: list[~azure.search.documents.indexes.models.SearchField]
    :return: The search field object.
    :rtype: SearchField
    """
    if collection:
        field_type = Collection(ComplexType)
    else:
        field_type = ComplexType
    return SearchField(name=name, type=field_type, fields=fields)
[docs]class SearchIndex(_serialization.Model):
# pylint: disable=too-many-instance-attributes
"""Represents a search index definition, which describes the fields and search behavior of an index.
All required parameters must be populated in order to send to Azure.
:ivar name: Required. The name of the index.
:vartype name: str
:ivar fields: Required. The fields of the index.
:vartype fields: list[~azure.search.documents.indexes.models.SearchField]
:ivar scoring_profiles: The scoring profiles for the index.
:vartype scoring_profiles: list[~azure.search.documents.indexes.models.ScoringProfile]
:ivar default_scoring_profile: The name of the scoring profile to use if none is specified in
the query. If this property is not set and no scoring profile is specified in the query, then
default scoring (tf-idf) will be used.
:vartype default_scoring_profile: str
:ivar cors_options: Options to control Cross-Origin Resource Sharing (CORS) for the index.
:vartype cors_options: ~azure.search.documents.indexes.models.CorsOptions
:ivar suggesters: The suggesters for the index.
:vartype suggesters: list[~azure.search.documents.indexes.models.SearchSuggester]
:ivar analyzers: The analyzers for the index.
:vartype analyzers: list[~azure.search.documents.indexes.models.LexicalAnalyzer]
:ivar tokenizers: The tokenizers for the index.
:vartype tokenizers: list[~azure.search.documents.indexes.models.LexicalTokenizer]
:ivar token_filters: The token filters for the index.
:vartype token_filters: list[~azure.search.documents.indexes.models.TokenFilter]
:ivar char_filters: The character filters for the index.
:vartype char_filters: list[~azure.search.documents.indexes.models.CharFilter]
:ivar encryption_key: A description of an encryption key that you create in Azure Key Vault.
This key is used to provide an additional level of encryption-at-rest for your data when you
want full assurance that no one, not even Microsoft, can decrypt your data in Azure Cognitive
Search. Once you have encrypted your data, it will always remain encrypted. Azure Cognitive
Search will ignore attempts to set this property to null. You can change this property as
needed if you want to rotate your encryption key; Your data will be unaffected. Encryption with
customer-managed keys is not available for free search services, and is only available for paid
services created on or after January 1, 2019.
:vartype encryption_key: ~azure.search.documents.indexes.models.SearchResourceEncryptionKey
:ivar similarity: The type of similarity algorithm to be used when scoring and ranking the
documents matching a search query. The similarity algorithm can only be defined at index
creation time and cannot be modified on existing indexes. If null, the ClassicSimilarity
algorithm is used.
:vartype similarity: ~azure.search.documents.indexes.models.SimilarityAlgorithm
:ivar semantic_search: Defines parameters for a search index that influence semantic capabilities.
:vartype semantic_search: ~azure.search.documents.indexes.models.SemanticSearch
:ivar vector_search: Defines parameters for a search index that influence scoring in a vector space.
:vartype vector_search: ~azure.search.documents.indexes.models.VectorSearch
:ivar e_tag: The ETag of the index.
:vartype e_tag: str
"""
def __init__(
    self,
    *,
    name: str,
    fields: List[SearchField],
    scoring_profiles: Optional[List[ScoringProfile]] = None,
    default_scoring_profile: Optional[str] = None,
    cors_options: Optional[CorsOptions] = None,
    suggesters: Optional[List[SearchSuggester]] = None,
    analyzers: Optional[List[LexicalAnalyzer]] = None,
    tokenizers: Optional[List[LexicalTokenizer]] = None,
    token_filters: Optional[List[TokenFilter]] = None,
    char_filters: Optional[List[CharFilter]] = None,
    encryption_key: Optional[SearchResourceEncryptionKey] = None,
    similarity: Optional[SimilarityAlgorithm] = None,
    semantic_search: Optional[SemanticSearch] = None,
    vector_search: Optional[VectorSearch] = None,
    e_tag: Optional[str] = None,
    **kwargs: Any
) -> None:
    """Store the index definition on the instance.

    All arguments are keyword-only. ``name`` and ``fields`` are required; every
    other named argument defaults to ``None``. Each named argument is assigned,
    unmodified, to the attribute of the same name.

    :keyword name: The name of the index. Required.
    :paramtype name: str
    :keyword fields: The fields of the index. Required.
    :paramtype fields: list[SearchField]
    """
    # Any extra keyword arguments are handed to the parent class initializer.
    super().__init__(**kwargs)
    self.name = name
    self.fields = fields
    self.scoring_profiles = scoring_profiles
    self.default_scoring_profile = default_scoring_profile
    self.cors_options = cors_options
    self.suggesters = suggesters
    self.analyzers = analyzers
    self.tokenizers = tokenizers
    self.token_filters = token_filters
    self.char_filters = char_filters
    self.encryption_key = encryption_key
    self.similarity = similarity
    self.semantic_search = semantic_search
    self.vector_search = vector_search
    self.e_tag = e_tag
def _to_generated(self) -> _SearchIndex:
    """Build the generated ``_SearchIndex`` model equivalent to this index.

    Analyzers are converted with ``pack_analyzer`` and fields with
    ``pack_search_field``. ``PatternTokenizer`` entries and the encryption key are
    converted through their own ``_to_generated``; all remaining attributes are
    passed along unchanged.

    :returns: The generated model populated from this instance.
    :rtype: _SearchIndex
    """
    # Missing or empty analyzer/tokenizer lists are sent as None.
    packed_analyzers = (
        [pack_analyzer(analyzer) for analyzer in self.analyzers]  # type: ignore # mypy: ignore
        if self.analyzers
        else None
    )
    packed_tokenizers = (
        [
            # PatternTokenizer is the only tokenizer converted; others pass through.
            tokenizer._to_generated()  # pylint:disable=protected-access
            if isinstance(tokenizer, PatternTokenizer)
            else tokenizer
            for tokenizer in self.tokenizers
        ]
        if self.tokenizers
        else None
    )
    # Unlike the lists above, missing or empty fields become an empty list.
    packed_fields = [pack_search_field(field) for field in self.fields] if self.fields else []
    packed_encryption_key = (
        self.encryption_key._to_generated()  # pylint:disable=protected-access
        if self.encryption_key
        else None
    )
    return _SearchIndex(
        name=self.name,
        fields=packed_fields,
        scoring_profiles=self.scoring_profiles,
        default_scoring_profile=self.default_scoring_profile,
        cors_options=self.cors_options,
        suggesters=self.suggesters,
        analyzers=packed_analyzers,
        tokenizers=packed_tokenizers,
        token_filters=self.token_filters,
        char_filters=self.char_filters,
        encryption_key=packed_encryption_key,
        similarity=self.similarity,
        semantic_search=self.semantic_search,
        e_tag=self.e_tag,
        vector_search=self.vector_search,
    )
@classmethod
def _from_generated(cls, search_index) -> Optional[Self]:
    """Create an instance of this class from a generated ``_SearchIndex`` model.

    Analyzers are converted with ``unpack_analyzer``, ``_PatternTokenizer`` entries
    with ``PatternTokenizer._from_generated``, fields with
    ``SearchField._from_generated`` and the encryption key with
    ``SearchResourceEncryptionKey._from_generated``. All remaining attributes are
    copied unchanged.

    :param search_index: The generated index model to convert.
    :returns: The converted index, or None when ``search_index`` is falsy.
    """
    if not search_index:
        return None

    # Missing or empty analyzer/tokenizer lists are represented as None.
    unpacked_analyzers = (
        [unpack_analyzer(analyzer) for analyzer in search_index.analyzers]  # type: ignore
        if search_index.analyzers
        else None
    )
    unpacked_tokenizers = (
        [
            # _PatternTokenizer is the only tokenizer converted; others pass through.
            PatternTokenizer._from_generated(tokenizer)  # pylint:disable=protected-access
            if isinstance(tokenizer, _PatternTokenizer)
            else tokenizer
            for tokenizer in search_index.tokenizers
        ]
        if search_index.tokenizers
        else None
    )
    # Missing or empty fields become an empty list rather than None.
    unpacked_fields = (
        [
            cast(SearchField, SearchField._from_generated(field))  # pylint:disable=protected-access
            for field in search_index.fields
        ]
        if search_index.fields
        else []
    )
    # The key converter is called unconditionally, even when no key is set.
    unpacked_encryption_key = SearchResourceEncryptionKey._from_generated(  # pylint:disable=protected-access
        search_index.encryption_key
    )
    return cls(
        name=search_index.name,
        fields=unpacked_fields,
        scoring_profiles=search_index.scoring_profiles,
        default_scoring_profile=search_index.default_scoring_profile,
        cors_options=search_index.cors_options,
        suggesters=search_index.suggesters,
        analyzers=unpacked_analyzers,
        tokenizers=unpacked_tokenizers,
        token_filters=search_index.token_filters,
        char_filters=search_index.char_filters,
        encryption_key=unpacked_encryption_key,
        similarity=search_index.similarity,
        semantic_search=search_index.semantic_search,
        e_tag=search_index.e_tag,
        vector_search=search_index.vector_search,
    )
def serialize(self, keep_readonly: bool = False, **kwargs: Any) -> MutableMapping[str, Any]:
    """Return the JSON that would be sent to the server for this model.

    The index is first converted to its generated model, whose ``serialize``
    produces the result; additional keyword arguments are forwarded to it.

    :param bool keep_readonly: Whether to serialize the read-only attributes as well.
    :returns: A JSON-compatible dict.
    :rtype: dict
    """
    generated_index = self._to_generated()
    return generated_index.serialize(keep_readonly=keep_readonly, **kwargs)
@classmethod
def deserialize(cls, data: Any, content_type: Optional[str] = None) -> Optional[Self]:  # type: ignore
    """Parse a str in RestAPI syntax and return a SearchIndex instance.

    The data is parsed by the generated ``_SearchIndex.deserialize`` and the
    result is then converted with ``_from_generated``.

    :param str data: A str using RestAPI structure. JSON by default.
    :param str content_type: JSON by default, set application/xml if XML.
    :returns: A SearchIndex instance
    :rtype: SearchIndex
    :raises: DeserializationError if something went wrong
    """
    generated_index = _SearchIndex.deserialize(data, content_type=content_type)
    return cls._from_generated(generated_index)
def as_dict(
    self,
    keep_readonly: bool = True,
    key_transformer: Callable[[str, Dict[str, Any], Any], Any] = _serialization.attribute_transformer,
    **kwargs: Any
) -> MutableMapping[str, Any]:
    """Return a dict that can be serialized using json.dump.

    The index is first converted to its generated model, whose ``as_dict``
    produces the result; additional keyword arguments are forwarded to it.

    :param bool keep_readonly: Whether to include the read-only attributes.
    :param Callable key_transformer: A callable that transforms each key of the dict.
    :returns: A JSON-compatible dict.
    :rtype: dict
    """
    generated_index = self._to_generated()
    return generated_index.as_dict(
        keep_readonly=keep_readonly, key_transformer=key_transformer, **kwargs
    )  # type: ignore
@classmethod
def from_dict(  # type: ignore
    cls,
    data: Any,
    key_extractors: Optional[Callable[[str, Dict[str, Any], Any], Any]] = None,
    content_type: Optional[str] = None,
) -> Optional[Self]:
    """Parse a dict with the given key extractors and return a model.

    When no key extractors are given, the defaults considered are
    rest_key_case_insensitive_extractor, attribute_key_case_insensitive_extractor
    and last_rest_key_case_insensitive_extractor. The dict is parsed by the
    generated ``_SearchIndex.from_dict`` and the result is then converted with
    ``_from_generated``.

    :param dict data: A dict using RestAPI structure
    :param Callable key_extractors: A callable that will extract a key from a dict
    :param str content_type: JSON by default, set application/xml if XML.
    :returns: A SearchIndex instance
    :rtype: SearchIndex
    :raises: DeserializationError if something went wrong
    """
    generated_index = _SearchIndex.from_dict(
        data, content_type=content_type, key_extractors=key_extractors
    )
    return cls._from_generated(generated_index)
def pack_search_field(search_field: SearchField) -> _SearchField:
    """Convert a search field into the generated ``_SearchField`` model.

    A non-dict argument is converted through its own ``_to_generated`` method. A
    dict is read key by key: ``hidden`` is inverted into ``retrievable`` (left as
    ``None`` when absent), the ``*_name`` analyzer and synonym-map keys are mapped
    to the matching generated arguments, and nested ``fields`` are packed
    recursively.

    :param search_field: The field to convert, either a model exposing
        ``_to_generated`` or a dict describing the field.
    :type search_field: SearchField or dict
    :returns: The generated field model.
    :rtype: _SearchField
    :raises AssertionError: If a dict is given without a ``name`` or ``type`` value
        (only while assertions are enabled).
    """
    if not isinstance(search_field, dict):
        return search_field._to_generated()  # pylint:disable=protected-access

    name = search_field.get("name")
    assert name is not None  # Hint for mypy
    field_type = search_field.get("type")
    assert field_type is not None  # Hint for mypy

    # "hidden" is the inverse of "retrievable"; an unset flag is passed on as None.
    hidden = search_field.get("hidden")
    retrievable = None if hidden is None else not hidden

    # Sub-fields are packed recursively; a missing or empty list becomes None.
    sub_fields = search_field.get("fields")
    packed_sub_fields = [pack_search_field(sub_field) for sub_field in sub_fields] if sub_fields else None

    return _SearchField(
        name=name,
        type=field_type,
        key=search_field.get("key"),
        retrievable=retrievable,
        searchable=search_field.get("searchable"),
        filterable=search_field.get("filterable"),
        sortable=search_field.get("sortable"),
        facetable=search_field.get("facetable"),
        analyzer=search_field.get("analyzer_name"),
        search_analyzer=search_field.get("search_analyzer_name"),
        index_analyzer=search_field.get("index_analyzer_name"),
        synonym_maps=search_field.get("synonym_map_names"),
        fields=packed_sub_fields,
        vector_search_dimensions=search_field.get("vector_search_dimensions"),
        vector_search_profile_name=search_field.get("vector_search_profile_name"),
    )