-
Notifications
You must be signed in to change notification settings - Fork 5
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
- Loading branch information
Showing
13 changed files
with
790 additions
and
0 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,29 @@ | ||
package models | ||
|
||
import ( | ||
"encoding/json" | ||
"fmt" | ||
"strings" | ||
) | ||
|
||
// CombineMessages combines the content of multiple messages into a single string | ||
func CombineMessages(messages []Message) string { | ||
var builder strings.Builder | ||
for _, message := range messages { | ||
builder.WriteString(message.Content) | ||
builder.WriteString("\n") | ||
} | ||
return builder.String() | ||
} | ||
|
||
// ExtractMessageRequest extracts a MessageRequest from a request body | ||
func ExtractMessageRequest(body []byte) (*MessageRequest, error) { | ||
if len(body) == 0 { | ||
return nil, fmt.Errorf("request body is empty") | ||
} | ||
var request MessageRequest | ||
if err := json.Unmarshal(body, &request); err != nil { | ||
return nil, fmt.Errorf("failed to unmarshal request body: %w", err) | ||
} | ||
return &request, nil | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,140 @@ | ||
package models | ||
|
||
import ( | ||
"fmt" | ||
"strings" | ||
|
||
"github.com/pkoukk/tiktoken-go" | ||
"github.com/rs/zerolog" | ||
"github.com/rs/zerolog/log" | ||
) | ||
|
||
const (
	// Model-type identifiers; compared case-insensitively in
	// modelTypeToEncoding.
	ChatGPT string = "chatgpt"
	Claude  string = "claude"
	Gemini  string = "gemini"

	// all Claude models (including Claude 3 family - Haiku, Sonnet, and Opus)
	// use the same "cl100k_base" encoding for tokenization
	ClaudeDefaultEncoding  = "cl100k_base"
	GeminiDefaultEncoding  = "cl100k_base"
	ChatGPTDefaultEncoding = "cl100k_base"
)
|
||
// ModelI abstracts a tokenizing model: it exposes an identifier plus token
// counting for plain text and for a JSON-encoded LLM message body.
type ModelI interface {
	GetID() string
	CountTokensOfText(string) (int, error)
	CountTokensOfLLMMessage([]byte) (int, error)
}
|
||
// Message represents a single message in the conversation.
type Message struct {
	Role    string `json:"role"`    // e.g. "system" or "user"; optional
	Content string `json:"content"` // the text that gets tokenized
}
|
||
// MessageRequest represents the request body for creating a message.
type MessageRequest struct {
	Model    string    `json:"model"`    // target model name
	Messages []Message `json:"messages"` // conversation messages to tokenize
}
|
||
// Model resolves and caches a tiktoken encoder from a model name, a model
// type, or an explicit encoding name (see Init for the resolution order).
type Model struct {
	modelName string // model name (can consist wildcard to specify range): gpt-4o-*, gpt-3.5-turbo
	modelType string // model family: ChatGPT, Claude, or Gemini (case-insensitive)
	encoding  string // explicit tiktoken encoding name, e.g. "cl100k_base"
	encoder   *tiktoken.Tiktoken // Cache the encoder for performance
	logger    zerolog.Logger
}
|
||
// NewModel creates a new Model | ||
func NewModel() *Model { | ||
return &Model{ | ||
logger: log.With().Str("component", "ai-model").Logger(), | ||
} | ||
} | ||
|
||
func (m *Model) Init() error { | ||
var err error | ||
if m.encoding != "" { | ||
m.encoder, err = tiktoken.GetEncoding(m.encoding) | ||
} else if m.modelName != "" { | ||
m.encoder, err = tiktoken.EncodingForModel(m.modelName) | ||
if err != nil { | ||
log.Warn().Err(err).Msgf("Failed to get encoder for model %s, using model type", m.modelName) | ||
m.modelType = m.modelName | ||
m.encoder, err = tiktoken.GetEncoding(m.modelTypeToEncoding()) | ||
} | ||
} else if m.modelType != "" { | ||
m.encoder, err = tiktoken.GetEncoding(m.modelTypeToEncoding()) | ||
} else { | ||
err = fmt.Errorf("no model name or type specified") | ||
} | ||
|
||
return err | ||
} | ||
|
||
// WithName sets the model name (e.g. "gpt-4o") and returns m for chaining.
func (m *Model) WithName(name string) *Model {
	m.modelName = name
	return m
}
|
||
// WithType sets the model type (ChatGPT, Claude, or Gemini) and returns m
// for chaining.
func (m *Model) WithType(modelType string) *Model {
	m.modelType = modelType
	return m
}
|
||
// WithEncoding sets an explicit tiktoken encoding name (e.g. "cl100k_base")
// and returns m for chaining.
func (m *Model) WithEncoding(encoding string) *Model {
	m.encoding = encoding
	return m
}
|
||
func (m *Model) GetID() string { | ||
if m.modelName != "" { | ||
return m.modelName | ||
} | ||
if m.modelType != "" { | ||
return string(m.modelType) | ||
} | ||
return m.encoding | ||
} | ||
|
||
func (m *Model) CountTokensOfLLMMessage(body []byte) (int, error) { | ||
request, err := ExtractMessageRequest(body) | ||
if err != nil { | ||
return 0, err | ||
} | ||
|
||
// Combine all message contents to form the full prompt | ||
prompt := CombineMessages(request.Messages) | ||
|
||
return m.CountTokensOfText(prompt) | ||
} | ||
|
||
func (m *Model) CountTokensOfText(text string) (int, error) { | ||
if m.encoder == nil { | ||
return 0, fmt.Errorf("encoder not initialized") | ||
} | ||
|
||
tokens := m.encoder.Encode(text, nil, nil) | ||
tokenCount := len(tokens) | ||
return tokenCount, nil | ||
} | ||
|
||
func (m *Model) modelTypeToEncoding() string { | ||
if m.modelType == "" { | ||
m.logger.Warn().Msg("Model type not set, using default encoding") | ||
return ChatGPTDefaultEncoding | ||
} | ||
switch strings.ToLower(m.modelType) { | ||
case ChatGPT: | ||
return ChatGPTDefaultEncoding | ||
case Claude: | ||
return ClaudeDefaultEncoding | ||
case Gemini: | ||
return GeminiDefaultEncoding | ||
default: | ||
m.logger.Error().Msgf("Model type %v not supported, using default encoding", m.modelType) | ||
return ChatGPTDefaultEncoding | ||
} | ||
} |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,93 @@ | ||
package ai | ||
|
||
import ( | ||
"lunar/toolkit-core/ai/models" | ||
|
||
"github.com/rs/zerolog/log" | ||
) | ||
|
||
// Tokenizer counts tokens via an underlying models.ModelI implementation.
type Tokenizer struct {
	model models.ModelI
}
|
||
func NewTokenizer(modelName, modelType, encoding string) (*Tokenizer, error) { | ||
log.Trace(). | ||
Msgf("Creating tokenizer: model %v, type %v, encoding %v", modelName, modelType, encoding) | ||
model := models.NewModel().WithName(modelName).WithType(modelType).WithEncoding(encoding) | ||
err := model.Init() | ||
if err != nil { | ||
log.Error().Err(err).Msgf("Error initializing model %v", modelName) | ||
return nil, err | ||
} | ||
return &Tokenizer{model: model}, nil | ||
} | ||
|
||
func NewTokenizerFromModel(modelName string) (*Tokenizer, error) { | ||
log.Trace().Msgf("Creating tokenizer for model %v", modelName) | ||
model := models.NewModel().WithName(modelName) | ||
err := model.Init() | ||
if err != nil { | ||
log.Error().Err(err).Msgf("Error initializing model %v", modelName) | ||
return nil, err | ||
} | ||
return &Tokenizer{model: model}, nil | ||
} | ||
|
||
func NewTokenizerFromModelType(modelType string) (*Tokenizer, error) { | ||
log.Trace().Msgf("Creating tokenizer for model %v", modelType) | ||
model := models.NewModel().WithType(modelType) | ||
err := model.Init() | ||
if err != nil { | ||
log.Error().Err(err).Msgf("Error initializing model %v", modelType) | ||
return nil, err | ||
} | ||
return &Tokenizer{model: model}, nil | ||
} | ||
|
||
func NewTokenizerFromEncoding(encoding string) (*Tokenizer, error) { | ||
log.Trace().Msgf("Creating tokenizer for encoding %v", encoding) | ||
model := models.NewModel().WithEncoding(encoding) | ||
err := model.Init() | ||
if err != nil { | ||
log.Error().Err(err).Msgf("Error initializing model %v", encoding) | ||
return nil, err | ||
} | ||
return &Tokenizer{model: model}, nil | ||
} | ||
|
||
// CountTokensOfLLMMessage counts the number of tokens in the given body | ||
// LLM message is structured as a JSON object like this: | ||
// | ||
// { | ||
// "messages": [ | ||
// { | ||
// "role": "system", | ||
// "content": "You are a helpful assistant." | ||
// }, | ||
// { | ||
// "role": "user", | ||
// "content": "Explain how airplanes fly." | ||
// } | ||
// ] | ||
// } | ||
// | ||
// The content of each message is tokenized and counted. | ||
// role field is optional and can be omitted. | ||
func (t *Tokenizer) CountTokensOfLLMMessage(body []byte) (int, error) { | ||
tokens, err := t.model.CountTokensOfLLMMessage(body) | ||
if err != nil { | ||
log.Error().Err(err).Msgf("Error counting LLM tokens for model %v", t.model.GetID()) | ||
return 0, err | ||
} | ||
return tokens, err | ||
} | ||
|
||
// CountTokensOfText counts the number of tokens in the given text | ||
func (t *Tokenizer) CountTokensOfText(text string) (int, error) { | ||
tokens, err := t.model.CountTokensOfText(text) | ||
if err != nil { | ||
log.Error().Err(err).Msgf("Error counting LLM tokens of message for model %v", t.model.GetID()) | ||
return 0, err | ||
} | ||
return tokens, err | ||
} |
Oops, something went wrong.