MaIN.NET/src/MaIN.Core/Hub/Contexts/Interfaces/ChatContext/IChatConfigurationBuilder.cs at 729202d6f90a2eebe0d57968ffa3ba7884008262 · wisedev-code/MaIN.NET · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
using MaIN.Domain.Configuration;
using MaIN.Domain.Entities;
using MaIN.Domain.Entities.Tools;
using MaIN.Domain.Models;
using MaIN.Services.Services.Models;
using FileInfo = MaIN.Domain.Entities.FileInfo;

namespace MaIN.Core.Hub.Contexts.Interfaces.ChatContext;

public interface IChatConfigurationBuilder : IChatActions
{
    /// <summary>
    /// Sets the inference parameters for the chat session, allowing you to customize how the AI processes and generates
    /// responses based on specific parameters. Inference parameters can influence various aspects of the chat, such as response length,
    /// temperature, and other model-specific settings.
    /// </summary>
    /// <param name="inferenceParams">An <see cref="InferenceParams"/> object that holds the parameters for inference, such as Temperature,
    /// MaxTokens, TopP, etc. These parameters control the generation behavior of the chat.</param>
    /// <returns>The context instance implementing <see cref="IChatConfigurationBuilder"/> for method chaining.</returns>
    IChatConfigurationBuilder WithInferenceParams(InferenceParams inferenceParams);

    /// <summary>
    /// Attaches external tools/functions that the model can invoke during the conversation.
    /// </summary>
    /// <param name="toolsConfiguration"> A <see cref="ToolsConfiguration"/> - configuration defining available tools
    /// and their execution modes.</param>
    /// <returns>The context instance implementing <see cref="IChatConfigurationBuilder"/> for method chaining.</returns>
    IChatConfigurationBuilder WithTools(ToolsConfiguration toolsConfiguration);

    /// <summary>
    /// Sets the memory parameters for the chat session, allowing you to customize how the AI accesses and
    /// uses its memory for generating responses. Memory parameters influence aspects such as context size, memory search depth,
    /// and token allocation for responses.
    /// </summary>
    /// <param name="memoryParams">A <see cref="MemoryParams"/> object that holds the parameters for memory management, such as ContextSize,
    /// MaxMatchesCount, AnswerTokens, etc. These parameters control how the chat uses memory for response generation.</param>
    /// <returns>The context instance implementing <see cref="IChatConfigurationBuilder"/> for method chaining.</returns>
    IChatConfigurationBuilder WithMemoryParams(MemoryParams memoryParams);

    /// <summary>
    /// Configures the session to use Text-to-Speech for the model's responses.
    /// </summary>
    /// <param name="speechParams">A <see cref="TextToSpeechParams"/> - parameters for the voice synthesis.</param>
    /// <returns>The context instance implementing <see cref="IChatConfigurationBuilder"/> for method chaining.</returns>
    IChatConfigurationBuilder Speak(TextToSpeechParams speechParams);

    /// <summary>
    /// Defines backend that will be used for model inference
    /// </summary>
    /// <param name="backendType">The <see cref="BackendType"/> - an enum that defines which AI backend to use.</param>
    /// <returns>The context instance implementing <see cref="IChatConfigurationBuilder"/> for method chaining.</returns>
    IChatConfigurationBuilder WithBackend(BackendType backendType);

    /// <summary>
    /// Inserts a system message at the beginning of the chat. System messages are typically used for setting the context
    /// or providing instructions to the AI.
    /// </summary>
    /// <param name="systemPrompt">The system prompt content that provides instructions to the AI.</param>
    /// <returns>The context instance implementing <see cref="IChatConfigurationBuilder"/> for method chaining.</returns>
    IChatConfigurationBuilder WithSystemPrompt(string systemPrompt);

    /// <summary>
    /// Attaches files to the most recent message in the chat. Files are associated with the last message to provide additional context
    /// or media for the AI to process.
    /// </summary>
    /// <param name="file">A list of <see cref="FileStream"/> objects representing the files to attach.</param>
    /// <param name="preProcess">Include preprocessing of a document that can consume more time and resources
    /// but can also greatly improve the quality of inference</param>
    /// <returns>The context instance implementing <see cref="IChatConfigurationBuilder"/> for method chaining.</returns>
    IChatConfigurationBuilder WithFiles(List<FileStream> file, bool preProcess = false);

    /// <summary>
    /// Attaches files to the most recent message in the chat. Files are associated with the last message to provide additional context
    /// or media for the AI to process.
    /// </summary>
    /// <param name="file">A list of <see cref="FileInfo"/> objects representing the files to attach.</param>
    /// <param name="preProcess">Include preprocessing of a document that can consume more time and resources
    /// but can also greatly improve the quality of inference</param>
    /// <returns>The context instance implementing <see cref="IChatConfigurationBuilder"/> for method chaining.</returns>
    IChatConfigurationBuilder WithFiles(List<FileInfo> file, bool preProcess = false);

    /// <summary>
    /// Attaches a list of files to the most recent message in the chat by specifying their file paths.
    /// This method is an alternative to using FileInfo.
    /// </summary>
    /// <param name="file">A list of file paths to attach to the most recent message.</param>
    /// <param name="preProcess">Include preprocessing of a document that can consume more time and resources
    /// but can also greatly improve the quality of inference</param>
    /// <returns>The context instance implementing <see cref="IChatConfigurationBuilder"/> for method chaining.</returns>
    IChatConfigurationBuilder WithFiles(List<string> file, bool preProcess = false);

    /// <summary>
    /// Each time we run inference, we need to load the model into memory; this takes time and memory. This method allows us to save some
    /// more of GPU/RAM resources at the cost of time, because model weights are no longer cached
    /// </summary>
    /// <returns>The context instance implementing <see cref="IChatConfigurationBuilder"/> for method chaining.</returns>
    IChatConfigurationBuilder DisableCache();

    /// <summary>
    /// Completes the chat session by generating a response based on the messages so far. This method interacts with the underlying
    /// chat service to process the chat and generate a result.
    /// </summary>
    /// <param name="translate">A flag indicating whether the response should be translated. Default is false.</param>
    /// <param name="interactive">A flag indicating whether the chat session should be interactive. Default is false.</param>
    /// <param name="changeOfValue">An optional callback invoked whenever a new token or update is received during streaming.</param>
    /// <returns>A <see cref="ChatResult"/> object containing the result of the completed chat session.</returns>
    Task<ChatResult> CompleteAsync(bool translate = false, bool interactive = false, Func<LLMTokenValue?, Task>? changeOfValue = null, CancellationToken cancellationToken = default);
}