diff --git a/arangodb-net-standard.Test/AnalyzerApi/AnalyzerApiClientTest.cs b/arangodb-net-standard.Test/AnalyzerApi/AnalyzerApiClientTest.cs index 073b55fd..ead677f7 100644 --- a/arangodb-net-standard.Test/AnalyzerApi/AnalyzerApiClientTest.cs +++ b/arangodb-net-standard.Test/AnalyzerApi/AnalyzerApiClientTest.cs @@ -47,14 +47,6 @@ public async Task PostAnalyzerAsync_ShouldSucceed() { Name = "text_sc", Type = "identity", - Properties = new AnalyzerProperties() - { - Accent = false, - Case = "lower", - Locale = "sc", - Stemming = false, - StopWords = new List() - }, Features = new List() { "frequency", @@ -78,15 +70,7 @@ public async Task PostAnalyzerAsync_ShouldThrow_WhenAnalyzerIsInvalid() new Analyzer() { Name = "text_sc", - Type = "collection", //...invalid analyzer type - Properties = new AnalyzerProperties() - { - Accent = false, - Case = "lower", - Locale = "sc", - Stemming = false, - StopWords = new List() - }, + Type = "collection", Features = new List() { "frequency", @@ -125,14 +109,6 @@ public async Task DeleteAnalyzerAsync_ShouldSucceed() { Name = name, Type = "identity", - Properties = new AnalyzerProperties() - { - Accent = false, - Case = "lower", - Locale = "mu", - Stemming = false, - StopWords = new List() - }, Features = new List() { "frequency", diff --git a/arangodb-net-standard/AnalyzerApi/AnalyzerApiClient.cs b/arangodb-net-standard/AnalyzerApi/AnalyzerApiClient.cs index ecb2558a..967410b3 100644 --- a/arangodb-net-standard/AnalyzerApi/AnalyzerApiClient.cs +++ b/arangodb-net-standard/AnalyzerApi/AnalyzerApiClient.cs @@ -72,10 +72,10 @@ public virtual async Task GetAllAnalyzersAsync(Cancella /// Creates a new Analyzer based on the provided definition /// POST /_api/analyzer /// - /// The properties of the new analyzer. + /// The definition of the new analyzer. /// A CancellationToken to observe while waiting for the task to complete or to cancel the task. /// - public virtual async Task PostAnalyzerAsync(Analyzer body, CancellationToken token = default) + public virtual async Task PostAnalyzerAsync(AnalyzerDefinition body, CancellationToken token = default) { if (body == null) { diff --git a/arangodb-net-standard/AnalyzerApi/IAnalyzerApiClient.cs b/arangodb-net-standard/AnalyzerApi/IAnalyzerApiClient.cs index c83bebab..7ee0a2fb 100644 --- a/arangodb-net-standard/AnalyzerApi/IAnalyzerApiClient.cs +++ b/arangodb-net-standard/AnalyzerApi/IAnalyzerApiClient.cs @@ -7,7 +7,7 @@ namespace ArangoDBNetStandard.AnalyzerApi /// /// Defines a client to access the ArangoDB Analyzer API. /// - internal interface IAnalyzerApiClient + public interface IAnalyzerApiClient { /// /// Fetch the list of available Analyzer definitions. @@ -21,10 +21,10 @@ internal interface IAnalyzerApiClient /// Creates a new Analyzer based on the provided definition /// POST /_api/analyzer /// - /// The properties of the new analyzer. + /// The definition of the new analyzer. /// A CancellationToken to observe while waiting for the task to complete or to cancel the task. /// - Task PostAnalyzerAsync(Analyzer body, CancellationToken token = default); + Task PostAnalyzerAsync(AnalyzerDefinition body, CancellationToken token = default); /// /// Fetches the definition of the specified analyzer. diff --git a/arangodb-net-standard/AnalyzerApi/Models/Analyzer.cs b/arangodb-net-standard/AnalyzerApi/Models/Analyzer.cs index b737e840..ff6f9ba3 100644 --- a/arangodb-net-standard/AnalyzerApi/Models/Analyzer.cs +++ b/arangodb-net-standard/AnalyzerApi/Models/Analyzer.cs @@ -5,42 +5,11 @@ namespace ArangoDBNetStandard.AnalyzerApi.Models /// /// Defines an Analyzer in the database /// - public class Analyzer + public class Analyzer: AnalyzerDefinition { /// - /// Name of the analyzer - /// For rules regarding analyzer names, see - /// https://www.arangodb.com/docs/stable/analyzers.html#analyzer-names + /// Properties of the analyzer /// - public string Name { get; set; } - - /// - /// Type of the analyzer - /// For valid analyzer types, see - /// https://www.arangodb.com/docs/stable/analyzers.html#analyzer-types - /// - public string Type { get; set; } - - /// - /// Properties of the analyzer - /// used to configure the specified type - /// - public AnalyzerProperties Properties { get; set; } - - /// - /// The set of features to set on - /// the Analyzer generated fields. - /// Determines what term matching - /// capabilities will be available. - /// Possible features: - /// frequency: how often a term is seen, required for PHRASE(). - /// norm: the field normalization factor. - /// position: sequentially increasing term position, - /// required for PHRASE(). If present then the - /// frequency feature is also required. - /// offset: 3.10 onwards. Enables search highlighting capabilities - /// for ArangoSearch Views. - /// - public List Features { get; set; } + public new AnalyzerProperties Properties { get; set; } } } \ No newline at end of file diff --git a/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinition.cs b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinition.cs new file mode 100644 index 00000000..4293fc56 --- /dev/null +++ b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinition.cs @@ -0,0 +1,47 @@ +using ArangoDBNetStandard.AnalyzerApi.Models.AnalyzerDefinitionProperties; +using System.Collections.Generic; + +namespace ArangoDBNetStandard.AnalyzerApi.Models +{ + /// + /// Defines an Analyzer in the database + /// + public class AnalyzerDefinition + { + /// + /// Name of the analyzer + /// For rules regarding analyzer names, see + /// https://www.arangodb.com/docs/stable/analyzers.html#analyzer-names + /// + public string Name { get; set; } + + /// + /// Type of the analyzer + /// For valid analyzer types, see + /// https://www.arangodb.com/docs/stable/analyzers.html#analyzer-types + /// + public string Type { get; set; } + + /// + /// Properties of the analyzer + /// used to configure the specified + /// + public AnalyzerDefinitionPropertiesBase Properties { get; set; } + + /// + /// The set of features to set on + /// the Analyzer generated fields. + /// Determines what term matching + /// capabilities will be available. + /// Possible features: + /// frequency: how often a term is seen, required for PHRASE(). + /// norm: the field normalization factor. + /// position: sequentially increasing term position, + /// required for PHRASE(). If present then the + /// frequency feature is also required. + /// offset: 3.10 onwards. Enables search highlighting capabilities + /// for ArangoSearch Views. + /// + public List Features { get; set; } + } +} \ No newline at end of file diff --git a/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/AQLAnalyzer.cs b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/AQLAnalyzer.cs new file mode 100644 index 00000000..a89f9f8c --- /dev/null +++ b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/AQLAnalyzer.cs @@ -0,0 +1,72 @@ +using System; + +namespace ArangoDBNetStandard.AnalyzerApi.Models.AnalyzerDefinitionProperties +{ + /// + /// Properties for AQL analyzer + /// + public class AQLAnalyzer : AnalyzerDefinitionPropertiesBase + { + /// + /// Convert emitted tokens to strings. (default) + /// + public const string ReturnTypeString = "string"; + + /// + /// Convert emitted tokens to numbers + /// + public const string ReturnTypeNumber = "number"; + + /// + /// Convert emitted tokens to booleans + /// + public const string ReturnTypeBool = "bool"; + + /// + /// AQL query to be executed + /// + public string QueryString { get; set; } + + /// + /// When true: set the position to 0 for all members + /// of the query result array. + /// When false: (default): set the position corresponding + /// to the index of the result array member + /// + public bool CollapsePositions { get; set; } + + /// + /// When true: (default): treat null like an empty string. + /// When false: discard nulls from View index. Can be used + /// for index filtering (i.e. make your query return null + /// for unwanted data). Note that empty results are always + /// discarded. + /// + public bool KeepNull { get; set; } + + /// + /// A number between 1 and 1000 (default = 1) that determines + /// the batch size for reading data from the query. In general, + /// a single token is expected to be returned. However, if the + /// query is expected to return many results, then increasing + /// trades memory for performance. + /// + public int BatchSize { get; set; } + + /// + /// Memory limit for query execution in bytes. + /// (default is 1048576 = 1Mb) + /// Maximum is 33554432U (32Mb) + /// + public int MemoryLimit { get; set; } + + /// + /// The Data type of the returned tokens. If the indicated + /// type does not match the actual type then an implicit + /// type conversion is applied. For possible values, see + /// , + /// and + /// + public string ReturnType { get; set; } + } +} diff --git a/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/AnalyzerPropertiesBase.cs b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/AnalyzerPropertiesBase.cs new file mode 100644 index 00000000..5f9f6b6a --- /dev/null +++ b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/AnalyzerPropertiesBase.cs @@ -0,0 +1,14 @@ +using System; +using System.Collections.Generic; +using System.Text; + +namespace ArangoDBNetStandard.AnalyzerApi.Models.AnalyzerDefinitionProperties +{ + /// + /// Base class for analyzer properties + /// + public class AnalyzerDefinitionPropertiesBase + { + + } +} diff --git a/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/ClassificationAnalyzer.cs b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/ClassificationAnalyzer.cs new file mode 100644 index 00000000..eb986923 --- /dev/null +++ b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/ClassificationAnalyzer.cs @@ -0,0 +1,33 @@ +using System; + +namespace ArangoDBNetStandard.AnalyzerApi.Models.AnalyzerDefinitionProperties +{ + /// + /// Properties for Classification analyzer. + /// (only available in the Enterprise Edition) + /// + public class ClassificationAnalyzer : AnalyzerDefinitionPropertiesBase + { + /// + /// Required. The on-disk path to the trained fastText + /// supervised model. Note: if you are running this in + /// an ArangoDB cluster, this model must exist on every + /// machine in the cluster. + /// + public string Model_Location { get; set; } + + /// + /// Optional. The number of class labels that will be + /// produced per input (default: 1). + /// + public int? Top_K { get; set; } + + /// + /// Optional. The probability threshold for which a + /// label will be assigned to an input. A fastText model + /// produces a probability per class label, and this is + /// what will be filtered (default: 0.99). + /// + public int? Threshold { get; set; } + } +} diff --git a/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/CollationAnalyzer.cs b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/CollationAnalyzer.cs new file mode 100644 index 00000000..ee172fd4 --- /dev/null +++ b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/CollationAnalyzer.cs @@ -0,0 +1,18 @@ +using System; + +namespace ArangoDBNetStandard.AnalyzerApi.Models.AnalyzerDefinitionProperties +{ + /// + /// Properties for Collation analyzer + /// + public class CollationAnalyzer : AnalyzerDefinitionPropertiesBase + { + /// + /// A locale in the format language, e.g. "de" or "en". + /// The locale is forwarded to the Snowball stemmer + /// without checks. An invalid locale does not prevent + /// the creation of the Analyzer. + /// + public string Locale { get; set; } + } +} diff --git a/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/DelimiterAnalyzer.cs b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/DelimiterAnalyzer.cs new file mode 100644 index 00000000..30fc84e3 --- /dev/null +++ b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/DelimiterAnalyzer.cs @@ -0,0 +1,15 @@ +using System; + +namespace ArangoDBNetStandard.AnalyzerApi.Models.AnalyzerDefinitionProperties +{ + /// + /// Properties for delimiter analyzer + /// + public class DelimiterAnalyzer : AnalyzerDefinitionPropertiesBase + { + /// + /// The delimiting character(s) + /// + public string Delimiter { get; set; } + } +} diff --git a/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/GeoJSONAnalyzer.cs b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/GeoJSONAnalyzer.cs new file mode 100644 index 00000000..7c5274b2 --- /dev/null +++ b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/GeoJSONAnalyzer.cs @@ -0,0 +1,41 @@ +using System; + +namespace ArangoDBNetStandard.AnalyzerApi.Models.AnalyzerDefinitionProperties +{ + /// + /// Properties for GeoJSON analyzer. + /// + public class GeoJSONAnalyzer : AnalyzerDefinitionPropertiesBase + { + /// + /// Index all GeoJSON geometry types (Point, Polygon etc.) + /// (default). + /// + public const string TypeShape = "shape"; + + /// + /// Compute and only index the centroid of the input + /// geometry + /// + public const string TypeCentroid = "centroid"; + + /// + /// Only index GeoJSON objects of type Point, ignore all + /// other geometry types + /// + public const string TypePoint = "point"; + + /// + /// Determines the type of indexing to use. + /// Possible values are , + /// and + /// + public string Type { get; set; } + + /// + /// Options for fine-tuning geo queries. + /// These options should generally remain unchanged. + /// + public GeoJSONAnalyzerOptions Options { get; set; } + } +} diff --git a/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/GeoPointAnalyzer.cs b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/GeoPointAnalyzer.cs new file mode 100644 index 00000000..2e903cef --- /dev/null +++ b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/GeoPointAnalyzer.cs @@ -0,0 +1,30 @@ +using System.Collections.Generic; + +namespace ArangoDBNetStandard.AnalyzerApi.Models.AnalyzerDefinitionProperties +{ + /// + /// Properties for GeoPoint analyzer. + /// + public class GeoPointAnalyzer : AnalyzerDefinitionPropertiesBase + { + /// + /// A list of strings that describes the attribute path + /// of the latitude value relative to the field for + /// which the Analyzer is defined in the View. + /// + public List Latitude { get; set; } + + /// + /// A list of strings that describes the attribute path + /// of the longitude value relative to the field for + /// which the Analyzer is defined in the View. + /// + public List Longitude { get; set; } + + /// + /// Options for fine-tuning geo queries. + /// These options should generally remain unchanged. + /// + public GeoJSONAnalyzerOptions Options { get; set; } + } +} diff --git a/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/IdentityAnalyzer.cs b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/IdentityAnalyzer.cs new file mode 100644 index 00000000..cf102993 --- /dev/null +++ b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/IdentityAnalyzer.cs @@ -0,0 +1,14 @@ +using System; +using System.Collections.Generic; +using System.Reflection; +using System.Text; + +namespace ArangoDBNetStandard.AnalyzerApi.Models.AnalyzerDefinitionProperties +{ + /// + /// Properties for Identity analyzer + /// + public class IdentityAnalyzer : AnalyzerDefinitionPropertiesBase + { + } +} diff --git a/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/MinhashAnalyzer.cs b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/MinhashAnalyzer.cs new file mode 100644 index 00000000..ec3153bd --- /dev/null +++ b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/MinhashAnalyzer.cs @@ -0,0 +1,25 @@ +using System; + +namespace ArangoDBNetStandard.AnalyzerApi.Models.AnalyzerDefinitionProperties +{ + /// + /// Properties for Minhash analyzer. + /// (only available in the Enterprise Edition) + /// + public class MinhashAnalyzer : AnalyzerDefinitionPropertiesBase + { + /// + /// An Analyzer object. + /// + public Analyzer Analyzer { get; set; } + + /// + /// The size of the MinHash signature. Must be greater or + /// equal to 1. The signature size defines the probalistic + /// error (err = rsqrt(numHashes)). For an error amount + /// that does not exceed 5% (0.05), + /// use a size of 1 / (0.05 * 0.05) = 400. + /// + public int NumHashes { get; set; } + } +} diff --git a/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/NearestNeighborsAnalyzer.cs b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/NearestNeighborsAnalyzer.cs new file mode 100644 index 00000000..de31e1fd --- /dev/null +++ b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/NearestNeighborsAnalyzer.cs @@ -0,0 +1,24 @@ +using System; + +namespace ArangoDBNetStandard.AnalyzerApi.Models.AnalyzerDefinitionProperties +{ + /// + /// Properties for nearest_neighbors analyzer. + /// + public class NearestNeighborsAnalyzer : AnalyzerDefinitionPropertiesBase + { + /// + /// Required. The on-disk path to the trained fastText + /// supervised model. Note: if you are running this in + /// an ArangoDB cluster, this model must exist on every + /// machine in the cluster. + /// + public string Model_Location { get; set; } + + /// + /// Optional. The number of class labels that will be + /// produced per input (default: 1). + /// + public int? Top_K { get; set; } + } +} diff --git a/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/NgramAnalyzer.cs b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/NgramAnalyzer.cs new file mode 100644 index 00000000..aa61800a --- /dev/null +++ b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/NgramAnalyzer.cs @@ -0,0 +1,60 @@ +using System; + +namespace ArangoDBNetStandard.AnalyzerApi.Models.AnalyzerDefinitionProperties +{ + /// + /// Properties for ngram analyzer + /// + public class NgramAnalyzer : AnalyzerDefinitionPropertiesBase + { + /// + /// One byte is considered as one character (default) + /// + public const string StreamTypeBinary = "binary"; + + /// + /// One Unicode codepoint is treated as one character + /// + public const string StreamTypeUTF8 = "utf8"; + + /// + /// Unsigned integer for the minimum n-gram length + /// + public int Min { get; set; } + + /// + /// Unsigned integer for the maximum n-gram length + /// + public int Max { get; set; } + + /// + /// When true: include the original value as well. + /// When false: produce the n-grams based on + /// and only. + /// + public bool PreserveOriginal { get; set; } + + /// + /// This value will be prepended to n-grams which + /// include the beginning of the input. Can be used + /// for matching prefixes. Choose a character or + /// sequence as marker which does not occur in the input. + /// + public string StartMarker { get; set; } + + /// + /// This value will be appended to n-grams which + /// include the end of the input. Can be used for + /// matching suffixes. Choose a character or sequence + /// as marker which does not occur in the input. + /// + public string EndMarker { get; set; } + + /// + /// Type of the input stream. + /// Possible values are + /// and + /// + public string StreamType { get; set; } + } +} diff --git a/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/NormAnalyzer.cs b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/NormAnalyzer.cs new file mode 100644 index 00000000..10ef2792 --- /dev/null +++ b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/NormAnalyzer.cs @@ -0,0 +1,48 @@ +using System; + +namespace ArangoDBNetStandard.AnalyzerApi.Models.AnalyzerDefinitionProperties +{ + /// + /// Properties for norm analyzer + /// + public class NormAnalyzer : AnalyzerDefinitionPropertiesBase + { + /// + /// Convert to all lower-case characters + /// + public const string CaseHandlingLower = "lower"; + + /// + /// Convert to all upper-case characters + /// + public const string CaseHandlingUpper = "upper"; + + /// + /// Do not change character case (default) + /// + public const string CaseHandlingNone = "none"; + + /// + /// A locale in the format language[_COUNTRY] + /// (square brackets denote optional parts), + /// e.g. "de" or "en_US". The locale is forwarded + /// to ICU without checks. An invalid locale does + /// not prevent the creation of the Analyzer. + /// + public string Locale { get; set; } + + /// + /// When true: preserves accented characters (default). + /// When false: converts accented characters to their + /// base characters. + /// + public bool? Accent { get; set; } + + /// + /// Determines how to handle character casing + /// Possible values are , + /// , and + /// + public string Case { get; set; } + } +} diff --git a/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/PipelineAnalyzer.cs b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/PipelineAnalyzer.cs new file mode 100644 index 00000000..0d1752ee --- /dev/null +++ b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/PipelineAnalyzer.cs @@ -0,0 +1,20 @@ +using System; +using System.Collections.Generic; + +namespace ArangoDBNetStandard.AnalyzerApi.Models.AnalyzerDefinitionProperties +{ + /// + /// Properties for Pipeline analyzer + /// + public class PipelineAnalyzer : AnalyzerDefinitionPropertiesBase + { + /// + /// An array of Analyzer objects to use for the pipeline. + /// Analyzers of types geopoint and geojson cannot be used + /// in pipelines and will make the creation fail. + /// These Analyzers require additional postprocessing and + /// can only be applied to document fields directly. + /// + public List Pipeline { get; set; } + } +} diff --git a/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/SegmentationAnalyzer.cs b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/SegmentationAnalyzer.cs new file mode 100644 index 00000000..f4b8c9f1 --- /dev/null +++ b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/SegmentationAnalyzer.cs @@ -0,0 +1,59 @@ +using System; + +namespace ArangoDBNetStandard.AnalyzerApi.Models.AnalyzerDefinitionProperties +{ + /// + /// Properties for Segmentation analyzer + /// + public class SegmentationAnalyzer : AnalyzerDefinitionPropertiesBase + { + /// + /// Convert to all lower-case characters + /// + public const string CaseHandlingLower = "lower"; + + /// + /// Convert to all upper-case characters + /// + public const string CaseHandlingUpper = "upper"; + + /// + /// Do not change character case (default) + /// + public const string CaseHandlingNone = "none"; + + /// + /// Return all tokens + /// + public const string BreakTypeAll = "all"; + + /// + /// Return tokens composed of alphanumeric characters only (default). + /// + public const string BreakTypeAlpha = "alpha"; + + /// + /// Return tokens composed of non-whitespace characters only. + /// Note that the list of whitespace characters does not include line breaks: + /// U+0009 Character Tabulation, U+0020 Space, U+0085 Next Line, + /// U+00A0 No-break Space, U+1680 Ogham Space Mark, U+2000 En Quad, + /// U+2028 Line Separator, U+202F Narrow No-break Space, + /// U+205F Medium Mathematical Space, and U+3000 Ideographic Space. + /// + public const string BreakTypeGraphic = "graphic"; + + /// + /// Determines how to break up the input text. + /// Possible values are , , + /// and + /// + public string Break { get; set; } + + /// + /// Determines how to handle character casing + /// Possible values are , + /// , and + /// + public string Case { get; set; } + } +} diff --git a/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/StemAnalyzer.cs b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/StemAnalyzer.cs new file mode 100644 index 00000000..42698a43 --- /dev/null +++ b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/StemAnalyzer.cs @@ -0,0 +1,18 @@ +using System; + +namespace ArangoDBNetStandard.AnalyzerApi.Models.AnalyzerDefinitionProperties +{ + /// + /// Properties for Stem analyzer + /// + public class StemAnalyzer : AnalyzerDefinitionPropertiesBase + { + /// + /// A locale in the format language, e.g. "de" or "en". + /// The locale is forwarded to the Snowball stemmer + /// without checks. An invalid locale does not prevent + /// the creation of the Analyzer. + /// + public string Locale { get; set; } + } +} diff --git a/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/StopwordsAnalyzer.cs b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/StopwordsAnalyzer.cs new file mode 100644 index 00000000..fb634a3c --- /dev/null +++ b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/StopwordsAnalyzer.cs @@ -0,0 +1,25 @@ +using System; +using System.Collections.Generic; + +namespace ArangoDBNetStandard.AnalyzerApi.Models.AnalyzerDefinitionProperties +{ + /// + /// Properties for Stopwords analyzer + /// + public class StopwordsAnalyzer : AnalyzerDefinitionPropertiesBase + { + /// + /// A list of strings that describe the tokens to be discarded. + /// The interpretation of each string depends on the value of + /// the property. + /// + public List Stopwords { get; set; } + + /// + /// If false (default), then each string in + /// is used verbatim. If true, then the strings need to be hex-encoded. + /// This allows for removing tokens that contain non-printable characters. + /// + public bool Hex { get; set; } + } +} diff --git a/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/TextAnalyzer.cs b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/TextAnalyzer.cs new file mode 100644 index 00000000..80e31304 --- /dev/null +++ b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerDefinitionProperties/TextAnalyzer.cs @@ -0,0 +1,98 @@ +using System; +using System.Collections.Generic; + +namespace ArangoDBNetStandard.AnalyzerApi.Models.AnalyzerDefinitionProperties +{ + /// + /// Properties for text analyzer + /// + public class TextAnalyzer:AnalyzerDefinitionPropertiesBase + { + /// + /// Convert to all lower-case characters + /// + public const string CaseHandlingLower = "lower"; + + /// + /// Convert to all upper-case characters + /// + public const string CaseHandlingUpper = "upper"; + + /// + /// Do not change character case (default) + /// + public const string CaseHandlingNone = "none"; + + /// + /// A locale in the format language[_COUNTRY] + /// (square brackets denote optional parts), + /// e.g. "de" or "en_US". The locale is forwarded + /// to ICU without checks. An invalid locale does + /// not prevent the creation of the Analyzer. + /// + public string Locale { get; set; } + + /// + /// When true: preserves accented characters (default). + /// When false: converts accented characters to their + /// base characters. + /// + public bool? Accent { get; set; } + + /// + /// Determines how to handle character casing + /// Possible values are , + /// , and + /// + public string Case { get; set; } + + /// + /// When true: apply stemming on returned words (default). + /// When false: leave the tokenized words as-is. + /// + public bool? Stemming { get; set; } + + /// + /// If present, then edge n-grams are generated for + /// each token (word). That is, the start of the + /// n-gram is anchored to the beginning of the token, + /// whereas the ngram Analyzer would produce all possible + /// substrings from a single input token (within the + /// defined length restrictions). Edge n-grams can be + /// used to cover word-based auto-completion queries + /// with an index, for which you should set the following + /// other options: = false, + /// = + /// and most importantly = false. + /// + public TextAnalyzerEdgeNgram EdgeNgram { get; set; } + + /// + /// A list of strings with words to omit from result. + /// Default: load words from . + /// To disable stop-word filtering provide an empty list. + /// If both and + /// are provided then both word sources are combined. + /// + public List Stopwords { get; set; } + + /// + /// A path with a language sub-directory (e.g. en for a locale en_US) + /// containing files with words to omit. Each word has to be on a + /// separate line. Everything after the first whitespace character + /// on a line will be ignored and can be used for comments. The files + /// can be named arbitrarily and have any file extension (or none). + /// Default: if no path is provided then the value of the environment + /// variable IRESEARCH_TEXT_STOPWORD_PATH is used to determine the path, + /// or if it is undefined then the current working directory is assumed. + /// If the stopwords attribute is provided then no stop-words are loaded + /// from files, unless an explicit is also provided. + /// Note that if the can not be accessed, + /// is missing language sub-directories or has no files for a language + /// required by an Analyzer, then the creation of a new Analyzer + /// is refused. If such an issue is discovered for an existing Analyzer + /// during startup then the server will abort with a fatal error. + /// + public string StopwordsPath { get; set; } + } +} diff --git a/arangodb-net-standard/AnalyzerApi/Models/AnalyzerProperties.cs b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerProperties.cs index 09dbb5fb..856d0764 100644 --- a/arangodb-net-standard/AnalyzerApi/Models/AnalyzerProperties.cs +++ b/arangodb-net-standard/AnalyzerApi/Models/AnalyzerProperties.cs @@ -1,10 +1,11 @@ -using System.Collections.Generic; +using System; +using System.Collections.Generic; +using System.Text; namespace ArangoDBNetStandard.AnalyzerApi.Models { /// - /// Properties of an Analyzer. - /// See https://www.arangodb.com/docs/stable/analyzers.html#analyzer-properties + /// All analyzer properties /// public class AnalyzerProperties { @@ -368,4 +369,4 @@ public class AnalyzerProperties /// public string StopwordsPath { get; set; } } -} \ No newline at end of file +} diff --git a/arangodb-net-standard/AnalyzerApi/Models/GeoJSONAnalyzerOptions.cs b/arangodb-net-standard/AnalyzerApi/Models/GeoJSONAnalyzerOptions.cs index 01d52f6d..ec8ac1d7 100644 --- a/arangodb-net-standard/AnalyzerApi/Models/GeoJSONAnalyzerOptions.cs +++ b/arangodb-net-standard/AnalyzerApi/Models/GeoJSONAnalyzerOptions.cs @@ -1,3 +1,5 @@ +using System; + namespace ArangoDBNetStandard.AnalyzerApi.Models { /// diff --git a/arangodb-net-standard/AnalyzerApi/Models/TextAnalyzerEdgeNgram.cs b/arangodb-net-standard/AnalyzerApi/Models/TextAnalyzerEdgeNgram.cs index 28a2cdb5..a0412fb6 100644 --- a/arangodb-net-standard/AnalyzerApi/Models/TextAnalyzerEdgeNgram.cs +++ b/arangodb-net-standard/AnalyzerApi/Models/TextAnalyzerEdgeNgram.cs @@ -1,5 +1,10 @@ -namespace ArangoDBNetStandard.AnalyzerApi.Models +using System; + +namespace ArangoDBNetStandard.AnalyzerApi.Models { + /// + /// + /// public class TextAnalyzerEdgeNgram { ///