forked from microsoft/kernel-memory
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathOpenAITextEmbeddingGenerator.cs
69 lines (57 loc) · 2.23 KB
/
OpenAITextEmbeddingGenerator.cs
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
// Copyright (c) Microsoft. All rights reserved.
using System;
using System.Net.Http;
using System.Threading;
using System.Threading.Tasks;
using Microsoft.Extensions.Logging;
using Microsoft.KernelMemory.Diagnostics;
using Microsoft.SemanticKernel.AI.Embeddings;
using Microsoft.SemanticKernel.Connectors.OpenAI;
namespace Microsoft.KernelMemory.AI.OpenAI;
/// <summary>
/// <see cref="ITextEmbeddingGenerator"/> implementation that delegates embedding
/// generation to <see cref="OpenAITextEmbeddingGenerationService"/> and token
/// counting to an <see cref="ITextTokenizer"/>.
/// </summary>
public class OpenAITextEmbeddingGenerator : ITextEmbeddingGenerator
{
    private readonly ITextTokenizer _textTokenizer;
    private readonly OpenAITextEmbeddingGenerationService _client;
    private readonly ILogger<OpenAITextEmbeddingGenerator> _log;

    // NOTE(review): this overload and the ILogger-based one have the same shape
    // (config + three optional arguments). A call that omits the third argument,
    // or passes an untyped null for it, looks ambiguous to overload resolution.
    // Confirm against callers before changing either signature.

    /// <summary>
    /// Create a new instance, obtaining the logger from a logger factory.
    /// </summary>
    /// <param name="config">OpenAI settings (embedding model, API key, organization, max tokens).</param>
    /// <param name="textTokenizer">Tokenizer used by <see cref="CountTokens"/>. When null, a <see cref="DefaultGPTTokenizer"/> is used and a warning is logged.</param>
    /// <param name="loggerFactory">Factory used to create the logger. When null, the default logger is used.</param>
    /// <param name="httpClient">Optional HTTP client passed through to the OpenAI embedding service.</param>
    /// <exception cref="ArgumentNullException"><paramref name="config"/> is null.</exception>
    public OpenAITextEmbeddingGenerator(
        OpenAIConfig config,
        ITextTokenizer? textTokenizer = null,
        ILoggerFactory? loggerFactory = null,
        HttpClient? httpClient = null)
        : this(config, textTokenizer, loggerFactory?.CreateLogger<OpenAITextEmbeddingGenerator>(), httpClient)
    {
    }

    /// <summary>
    /// Create a new instance using the given logger.
    /// </summary>
    /// <param name="config">OpenAI settings (embedding model, API key, organization, max tokens).</param>
    /// <param name="textTokenizer">Tokenizer used by <see cref="CountTokens"/>. When null, a <see cref="DefaultGPTTokenizer"/> is used and a warning is logged.</param>
    /// <param name="log">Logger. When null, <see cref="DefaultLogger{T}"/> is used.</param>
    /// <param name="httpClient">Optional HTTP client passed through to the OpenAI embedding service.</param>
    /// <exception cref="ArgumentNullException"><paramref name="config"/> is null.</exception>
    public OpenAITextEmbeddingGenerator(
        OpenAIConfig config,
        ITextTokenizer? textTokenizer = null,
        ILogger<OpenAITextEmbeddingGenerator>? log = null,
        HttpClient? httpClient = null)
    {
        // Fail fast with a descriptive exception instead of a NullReferenceException
        // when the settings are read further down.
        if (config is null)
        {
            throw new ArgumentNullException(nameof(config));
        }

        this._log = log ?? DefaultLogger<OpenAITextEmbeddingGenerator>.Instance;

        if (textTokenizer == null)
        {
            // Named placeholder (not "{0}") so structured logging gets a meaningful property name.
            this._log.LogWarning(
                "Tokenizer not specified, will use {TokenizerName}. The token count might be incorrect, causing unexpected errors",
                nameof(DefaultGPTTokenizer));
            textTokenizer = new DefaultGPTTokenizer();
        }

        this._textTokenizer = textTokenizer;
        this.MaxTokens = config.EmbeddingModelMaxTokenTotal;

        this._client = new OpenAITextEmbeddingGenerationService(
            modelId: config.EmbeddingModel,
            apiKey: config.APIKey,
            organization: config.OrgId,
            httpClient: httpClient);
    }

    /// <inheritdoc/>
    public int MaxTokens { get; }

    /// <inheritdoc/>
    public int CountTokens(string text)
    {
        // Counting is delegated to the tokenizer chosen at construction time.
        return this._textTokenizer.CountTokens(text);
    }

    /// <inheritdoc/>
    public Task<Embedding> GenerateEmbeddingAsync(string text, CancellationToken cancellationToken = default)
    {
        // Pass-through to the OpenAI embedding service; the cancellation token is flowed as-is.
        return this._client.GenerateEmbeddingAsync(text, cancellationToken);
    }
}