Unified Protobuf Definition and Container Development for Various Large Language Models
Overview:
The goal is to provide a flexible and standardized way of defining and representing connectors for different large language models (LLMs) in the Eclipse Graphene platform. Each LLM connector remains free to choose its own deployment framework, Python library, and other configuration parameters. The resulting LLM definitions/methods are then exposed through a single interface (a Docker container), from which users can seamlessly select the specific LLM that suits their application requirements.
LLMs
Initially, the project envisions supporting four such LLMs, for instance:
- OpenAI [https://openai.com/]
- Mistral [https://huggingface.co/mistralai]
- Llama 2 [https://huggingface.co/blog/llama2]
- OpenGPT-X [https://opengpt-x.de/en/]
Sample Protobuf Definition
A sample representation of the unified protobuf file is given below. Please note that the messages in the protobuf are incomplete; they serve only as examples for now.
Explanation: The user creates different pipelines to use different LLMs. All LLM containers expose the same unified LLM service. The core functionality lives in the DocGenerator, which calls instruct_llm() several times to generate the various parts of the document, such as UML diagrams, information from Wikipedia, and other related content (a client-side sketch after the protobuf below illustrates this flow).
syntax = "proto3";
message PromptInput {
string system = 0;
string user = 1;
string context = 2;
}
message LLMConfig {
double temperature = 0;
int maxlength = 1;
}
message LLMQuery {
LLMConfig config = 0;
PromptInput input = 1;
}
message LLMAnswer {
string text = 0;
}
service LLMService {
rpc instruct_llm(LLMQuery) returns(LLMAnswer);
rpc instruct_llm_stream (stream LLMQuery) returns (stream LLMAnswer);
}
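To make the intended usage concrete, the following is a minimal Python client sketch of how the DocGenerator could call instruct_llm(). It assumes the protobuf above has been compiled with grpcio-tools into modules named llm_pb2 and llm_pb2_grpc and that an LLM container is reachable at localhost:50051; these module names, the prompts, and the address are illustrative placeholders, not part of the specification.

import grpc

import llm_pb2        # generated from the protobuf above (assumed module name)
import llm_pb2_grpc   # generated gRPC stubs (assumed module name)


def generate_section(stub, system_prompt, user_prompt, context=""):
    """Send one instruction to the selected LLM and return its text answer."""
    query = llm_pb2.LLMQuery(
        config=llm_pb2.LLMConfig(temperature=0.2, maxlength=1024),
        input=llm_pb2.PromptInput(system=system_prompt, user=user_prompt, context=context),
    )
    answer = stub.instruct_llm(query)
    return answer.text


if __name__ == "__main__":
    # The address is a placeholder; in Graphene it would come from the pipeline configuration.
    with grpc.insecure_channel("localhost:50051") as channel:
        stub = llm_pb2_grpc.LLMServiceStub(channel)
        # The DocGenerator calls instruct_llm() once per section of the document.
        uml_text = generate_section(stub, "You are a UML assistant.", "Generate a UML class diagram description.")
        wiki_text = generate_section(stub, "You are a research assistant.", "Summarize relevant background from Wikipedia.")
        print(uml_text, wiki_text, sep="\n\n")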

Streaming in gRPC:
rpc instruct_llm_stream (stream LLMQuery) returns (stream LLMAnswer);
In addition to the unary call, the interface is also required to support streaming in gRPC. The client (DocGenerator) establishes a streaming connection to the server and can then continuously send LLMQuery messages containing user questions over that connection. The server (LLM) continuously receives user questions from the stream.
The server processes each question using the same instruct_llm logic and streams back the corresponding answers. This allows for a dynamic and interactive session in which the server can respond to a user's questions as they arrive. The streaming nature of the RPC method enables a continuous exchange of questions and answers, making it suitable for use cases such as real-time Q&A, user feedback loops, or any scenario that requires ongoing interaction.
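As a rough sketch of the client side of such a session, assuming the same generated modules llm_pb2 and llm_pb2_grpc and a placeholder server address, the bidirectional stream can be driven with a Python generator:

import grpc

import llm_pb2        # assumed name of the generated message module
import llm_pb2_grpc   # assumed name of the generated stub module


def question_stream(questions):
    """Yield one LLMQuery per user question; gRPC sends them over the open stream."""
    for question in questions:
        yield llm_pb2.LLMQuery(
            config=llm_pb2.LLMConfig(temperature=0.7, maxlength=512),
            input=llm_pb2.PromptInput(system="You are a helpful assistant.", user=question),
        )


if __name__ == "__main__":
    questions = ["What is Eclipse Graphene?", "How does gRPC streaming work?"]
    with grpc.insecure_channel("localhost:50051") as channel:
        stub = llm_pb2_grpc.LLMServiceStub(channel)
        # Each LLMAnswer is consumed as soon as the server produces it.
        for answer in stub.instruct_llm_stream(question_stream(questions)):
            print(answer.text)

Because the responses are iterated as they arrive, answers can be displayed incrementally instead of waiting for the whole session to finish.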
Tasks
- Define and develop a protobuf message structure that encapsulates the core details of each LLM.
- Create a standard Python interface using the above top-level protobuf message (a minimal server-side sketch follows this list).
- Test the implementation with a simple application that allows users to choose the type of LLM on the fly.
- Containerize the implementation and onboard it to the Graphene platform.
- For LLMs that require GPU access, investigate and implement the configurations needed to ensure compatibility with GPU resources.
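As an illustrative sketch of such a standard Python interface (again assuming the generated modules llm_pb2 and llm_pb2_grpc; the LLM_BACKEND variable, the EchoBackend class, and the complete() method are hypothetical names used only for this example), a unified servicer could dispatch all calls to a pluggable backend:

import os
from concurrent import futures

import grpc

import llm_pb2
import llm_pb2_grpc


class LLMServicer(llm_pb2_grpc.LLMServiceServicer):
    """Unified servicer; the concrete backend is chosen at container start-up."""

    def __init__(self, backend):
        # `backend` is any object exposing complete(system, user, context, config) -> str;
        # concrete wrappers for OpenAI, Mistral, Llama 2, OpenGPT-X would implement it.
        self.backend = backend

    def instruct_llm(self, request, context):
        text = self.backend.complete(
            system=request.input.system,
            user=request.input.user,
            context=request.input.context,
            config=request.config,
        )
        return llm_pb2.LLMAnswer(text=text)

    def instruct_llm_stream(self, request_iterator, context):
        for request in request_iterator:
            yield self.instruct_llm(request, context)


class EchoBackend:
    """Stand-in backend used for testing the interface without any real model."""

    def complete(self, system, user, context, config):
        return f"[echo] {user}"


def serve():
    # LLM_BACKEND is a hypothetical environment variable used to pick the model wrapper.
    backend_name = os.environ.get("LLM_BACKEND", "echo")
    backend = EchoBackend()  # a real deployment would map backend_name to a wrapper class
    server = grpc.server(futures.ThreadPoolExecutor(max_workers=4))
    llm_pb2_grpc.add_LLMServiceServicer_to_server(LLMServicer(backend), server)
    server.add_insecure_port("[::]:50051")
    server.start()
    server.wait_for_termination()


if __name__ == "__main__":
    serve()

In the containerized version, the actual backend wrappers (OpenAI, Mistral, Llama 2, OpenGPT-X) would be selected at start-up via configuration, so the same gRPC surface serves any of them.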
Future Development:
- Refinement/Improvement of Protobuf Definitions: Complete the protobuf definitions to include the full specifications for the various LLMs.
- Expansion of LLMs: Support additional LLMs with their unique capabilities and configurations.