Table of Contents

Class GatewayTextEmbeddingRequestMetrics

Namespace
FoundationaLLM.Common.Models.Gateway
Assembly
FoundationaLLM.Common.dll

Provides metrics related to text embedding requests submitted by the FoundationaLLM Gateway.

public class GatewayTextEmbeddingRequestMetrics
Inheritance
GatewayTextEmbeddingRequestMetrics
Inherited Members
Extension Methods

Properties

AccountName

The name of the account used for text embedding.

[JsonPropertyName("account_name")]
public required string AccountName { get; set; }

Property Value

string

CurrentRequestTokenCount

The total number of tokens used in the current request.

[JsonPropertyName("current_request_token_count")]
public int CurrentRequestTokenCount { get; set; }

Property Value

int

CurrentTextChunkCount

The number of text chunks in the current request.

[JsonPropertyName("current_text_chunk_count")]
public int CurrentTextChunkCount { get; set; }

Property Value

int

Id

The unique identifier of the request.

[JsonPropertyName("id")]
public required string Id { get; set; }

Property Value

string

ModelName

The name of the embedding model used for text embedding.

[JsonPropertyName("model_name")]
public required string ModelName { get; set; }

Property Value

string

ModelVersion

The version of the embedding model used for text embedding.

[JsonPropertyName("model_version")]
public required string ModelVersion { get; set; }

Property Value

string

OperationsDetails

The details of the embedding operations from the text chunks. For each embedding operation ID, holds the list of positions of the text chunks from the current request.

[JsonPropertyName("operations_details")]
public Dictionary<string, List<int>> OperationsDetails { get; set; }

Property Value

Dictionary<string, List<int>>

RequestRateWindowRequestCount

The cumulative number of requests for the current request rate window. Includes all requests performed so far in the current request rate window.

[JsonPropertyName("request_rate_window_request_count")]
public int RequestRateWindowRequestCount { get; set; }

Property Value

int

RequestRateWindowStart

The start timestamp of the current request rate window.

[JsonPropertyName("request_rate_window_start")]
public DateTime RequestRateWindowStart { get; set; }

Property Value

DateTime

TokenRateWindowStart

The start timestamp of the current token rate window.

[JsonPropertyName("token_rate_window_start")]
public DateTime TokenRateWindowStart { get; set; }

Property Value

DateTime

TokenRateWindowTokenCount

The cumulative number of tokens for the current token rate window. Includes all tokens used so far in the current token rate window.

[JsonPropertyName("token_rate_window_token_count")]
public int TokenRateWindowTokenCount { get; set; }

Property Value

int