diff --git a/admin.proto b/admin.proto index 987c6f7..12841a6 100755 --- a/admin.proto +++ b/admin.proto @@ -57,8 +57,10 @@ message Corpus { repeated Dimension custom_dimensions = 13; repeated FilterAttribute filter_attributes = 14; + } + // A custom dimension is additional numeric metadata that you want to affect // Vectara's scoring. For example, these could be "number of stars" ratings, // or other business metrics like a product's margins that you want to use @@ -120,6 +122,20 @@ message CreateCorpusResponse { Status status = 2; } +message UpdateCorpusRequest { + // Corpus id to update. + uint32 id = 1; + // Name to be updated. + optional string name = 2; + // Description to be updated. + optional string description = 3; +} + +message UpdateCorpusResponse { + // The Status of the update. + Status status = 1; +} + message DeleteCorpusRequest { option (grpc.gateway.protoc_gen_openapiv2.options.openapiv2_schema) = { json_schema: { required: [ "customerId", "corpusId" ] } @@ -205,6 +221,8 @@ message CorpusSize { int64 epoch_secs = 1; // The size of the corpus. + // This is the sum of the number of characters in the + // text and metadata of all documents in the corpus. uint64 size = 2; } @@ -224,6 +242,7 @@ message ReadCorpusRequest { bool read_custom_dimensions = 1004; // Set to true to read the filter attributes of the corpus. bool read_filter_attributes = 1005; + } message ReadCorpusResponse { @@ -249,6 +268,7 @@ message ReadCorpusResponse { repeated FilterAttribute filter_attribute = 6; // Status of the filter attributes. Status filter_attribute_status = 1006; + } // Information about the requested corpora. diff --git a/common.proto b/common.proto index c021314..4dfab22 100755 --- a/common.proto +++ b/common.proto @@ -96,3 +96,4 @@ message StorageQuota { // storage quota. 
int64 num_metadata_chars = 2; } + diff --git a/core_services.proto b/core_services.proto index 9cf7b38..0b92cda 100755 --- a/core_services.proto +++ b/core_services.proto @@ -22,6 +22,7 @@ message IndexCoreDocumentRequest { int64 corpus_id = 2; // The document being indexed. com.vectara.indexing.CoreDocument document = 3; + } message IndexCoreDocumentResponse { diff --git a/services.proto b/services.proto index 9f3447c..43bea94 100755 --- a/services.proto +++ b/services.proto @@ -31,6 +31,7 @@ message IndexDocumentRequest { int64 corpus_id = 2; // The Document to index. com.vectara.indexing.Document document = 3; + } message IndexDocumentResponse { @@ -104,6 +105,14 @@ service AdminService { }; } + rpc UpdateCorpus(com.vectara.admin.UpdateCorpusRequest) + returns (com.vectara.admin.UpdateCorpusResponse) { + option (google.api.http) = { + post: "/v1/update-corpus" + body: "*" + }; + } + rpc DeleteCorpus(com.vectara.admin.DeleteCorpusRequest) returns (com.vectara.admin.DeleteCorpusResponse){ option (google.api.http) = { post: "/v1/delete-corpus" diff --git a/serving.proto b/serving.proto index e2861bd..f9c5108 100755 --- a/serving.proto +++ b/serving.proto @@ -122,6 +122,10 @@ message SummarizationRequest { // Higher values penalize new tokens based on whether they appear in the text so far, // increasing the model's likelihood to talk about new topics. optional float presence_penalty = 20; + // This feature is in Beta. If specified, the LLM will make a best effort to sample deterministically, + // such that repeated requests with the same seed and parameters should return the same result. + // Note: the seed value is only used when temperature is set to 0. + optional uint32 seed = 25; } ModelParams model_params = 215; @@ -159,6 +163,8 @@ message QueryRequest { // chars_before is used for showing the end user the characters leading up // to the result snippet. This can help the end-user understand the // context of that result. Ignored if sentences_before is set. 
+ // Vectara will capture the full sentence that contains the captured characters, + // so that meaning is not lost to a truncated word or sentence. int32 chars_before = 5 [ (grpc.gateway.protoc_gen_openapiv2.options.openapiv2_field) = { example: "30" @@ -167,6 +173,8 @@ message QueryRequest { // chars_after is used for showing the end user the characters after the // result snippet. This can help the end-user understand the context of // that result. Ignored if sentences_before is set. + // Vectara will capture the full sentence that contains the captured characters, + // so that meaning is not lost to a truncated word or sentence. int32 chars_after = 10 [ (grpc.gateway.protoc_gen_openapiv2.options.openapiv2_field) = { example: "30" @@ -216,13 +224,17 @@ message QueryRequest { message RerankingConfig { // Which reranking model to use if reranking. Currently, the only IDs // available are: - // - 272725717, HuggingFace Open Source x-attentional reranker // - 272725718, Maximum Marginal Relevance Reranker + // - 272725719, Vectara Multilingual Reranker v1 uint32 reranker_id = 5; // Reranker-specific parameters. The numbering starts from 100, and moves // upwards in increments of 5. optional MMRConfig mmr_config = 100; + + // User function that will be executed on each search result. + // May return a double or null. If it returns null, the item is skipped. + optional string user_function = 105; } RerankingConfig reranking_config = 30; @@ -322,7 +334,6 @@ message Summary { repeated Status status = 1000; // Populated for streaming requests only. int32 future_id = 1010; - } // A document part that matched a query.