Class: RubyLLM::SemanticCache::Scoped

Inherits:

Object

Object
RubyLLM::SemanticCache::Scoped

show all

Defined in: lib/ruby_llm/semantic_cache/scoped.rb

Overview

Scoped cache wrapper for multi-tenant scenarios. Each scoped instance maintains its own stores for true isolation.

Examples:

support = RubyLLM::SemanticCache::Scoped.new(namespace: "support")
sales = RubyLLM::SemanticCache::Scoped.new(namespace: "sales")

support.store(query: "How to reset password?", response: "...")
sales.store(query: "What is the price?", response: "...")

Defined Under Namespace

Classes: ScopedConfig

Instance Attribute Summary collapse

#namespace ⇒ Object readonly

Returns the value of attribute namespace.

Instance Method Summary collapse

Constructor Details

#initialize(namespace:) ⇒ `Scoped`

Returns a new instance of Scoped.

# File 'lib/ruby_llm/semantic_cache/scoped.rb', line 18

# Builds a scoped cache bound to +namespace+.
#
# Both store references start out as nil and both counters start at zero.
#
# @param namespace [Object] identifier of the scope this instance serves
def initialize(namespace:)
  @namespace = namespace
  @vector_store = @cache_store = nil
  @hits = @misses = 0
end

Instance Attribute Details

#namespace ⇒ `Object` (readonly)

Returns the value of attribute namespace.



16
17
18

# File 'lib/ruby_llm/semantic_cache/scoped.rb', line 16

# Reader for the namespace this scoped cache was constructed with.
#
# @return [Object] the value stored in @namespace by the constructor
def namespace
  @namespace
end

Instance Method Details

#clear! ⇒ `Object`

# File 'lib/ruby_llm/semantic_cache/scoped.rb', line 119

# Empties the vector store and the cache store, then zeroes the
# hit and miss counters.
#
# @return [Integer] 0, the value of the final counter assignment
def clear!
  vector_store.clear!
  cache_store.clear!
  @hits = @misses = 0
end

#delete(query, threshold: nil) ⇒ `Object`

# File 'lib/ruby_llm/semantic_cache/scoped.rb', line 89

# Removes the single closest cached entry for +query+, provided its
# similarity reaches the threshold.
#
# @param query [Object] text handed to the embedding generator
# @param threshold [Numeric, nil] minimum similarity; defaults to
#   config.similarity_threshold when nil
# @return [Boolean] true when the entry was removed from both stores,
#   false when nothing matched closely enough
def delete(query, threshold: nil)
  cutoff = threshold || config.similarity_threshold
  vector = embedding_generator.generate(query)
  nearest = vector_store.search(vector, limit: 1).first

  return false unless nearest && nearest[:similarity] >= cutoff

  entry_id = nearest[:id]
  vector_store.delete(entry_id)
  cache_store.delete(entry_id)
  true
end

#exists?(query, threshold: nil) ⇒ `Boolean`

Returns:

(Boolean)

# File 'lib/ruby_llm/semantic_cache/scoped.rb', line 82

# Reports whether the vector store holds a match for +query+ whose
# similarity reaches the threshold. Only the vector store is consulted.
#
# @param query [Object] text handed to the embedding generator
# @param threshold [Numeric, nil] minimum similarity; defaults to
#   config.similarity_threshold when nil
# @return [Boolean]
def exists?(query, threshold: nil)
  cutoff = threshold || config.similarity_threshold
  vector = embedding_generator.generate(query)
  candidates = vector_store.search(vector, limit: 1)

  return false unless candidates.any?

  candidates.first[:similarity] >= cutoff
end

#fetch(query, threshold: nil, ttl: nil, &block) ⇒ `Object`

Raises:

(ArgumentError)

# File 'lib/ruby_llm/semantic_cache/scoped.rb', line 26

# Returns the cached response for a sufficiently similar query, or runs the
# block, stores its result, and returns it.
#
# A lookup is counted as a hit only when the cache store still returns the
# payload for the matched id. If the vector store has a match but the cache
# store returns nothing for it, the call is counted as a single miss (rather
# than as both a hit and a miss) and the block is executed.
#
# @param query [Object] text handed to the embedding generator
# @param threshold [Numeric, nil] minimum similarity; defaults to
#   config.similarity_threshold when nil
# @param ttl [Object, nil] expiry passed to #store on a miss; defaults to
#   config.ttl_seconds when nil
# @yieldreturn [Object] the fresh response to cache on a miss
# @return [Object] the deserialized cached response, or the block's result
# @raise [ArgumentError] when no block is given
def fetch(query, threshold: nil, ttl: nil, &block)
  raise ArgumentError, "Block required" unless block_given?

  threshold ||= config.similarity_threshold
  ttl ||= config.ttl_seconds

  embedding = embedding_generator.generate(query)
  best = vector_store.search(embedding, limit: 1).first

  if best && best[:similarity] >= threshold
    entry_data = cache_store.get(best[:id])
    if entry_data
      # Count the hit only once the payload is confirmed to exist.
      @hits += 1
      return Serializer.deserialize(entry_data[:response])
    end
  end

  @misses += 1
  response = block.call

  # Reuse the embedding computed above so the query is embedded only once.
  store(query: query, response: response, embedding: embedding, ttl: ttl)
  response
end

#invalidate(query, threshold: nil, limit: 100) ⇒ `Object`

# File 'lib/ruby_llm/semantic_cache/scoped.rb', line 102

# Removes every cached entry, among the closest +limit+ matches for
# +query+, whose similarity reaches the threshold.
#
# @param query [Object] text handed to the embedding generator
# @param threshold [Numeric, nil] minimum similarity; defaults to
#   config.similarity_threshold when nil
# @param limit [Integer] maximum number of matches requested from the
#   vector store
# @return [Integer] number of entries removed
def invalidate(query, threshold: nil, limit: 100)
  cutoff = threshold || config.similarity_threshold
  vector = embedding_generator.generate(query)
  candidates = vector_store.search(vector, limit: limit)

  # The block both removes qualifying entries and tells +count+ whether
  # the candidate was removed.
  candidates.count do |candidate|
    next false unless candidate[:similarity] >= cutoff

    entry_id = candidate[:id]
    vector_store.delete(entry_id)
    cache_store.delete(entry_id)
    true
  end
end

#search(query, limit: 5) ⇒ `Object`

# File 'lib/ruby_llm/semantic_cache/scoped.rb', line 65

# Looks up the closest matches for +query+ and returns the ones whose
# payload the cache store still returns. Matches with no payload are skipped.
#
# @param query [Object] text handed to the embedding generator
# @param limit [Integer] maximum number of matches requested from the
#   vector store
# @return [Array<Hash>] hashes with :query, :response (deserialized),
#   :similarity and :metadata keys
def search(query, limit: 5)
  vector = embedding_generator.generate(query)

  vector_store.search(vector, limit: limit).filter_map do |hit|
    stored = cache_store.get(hit[:id])

    stored && {
      query: stored[:query],
      response: Serializer.deserialize(stored[:response]),
      similarity: hit[:similarity],
      metadata: stored[:metadata]
    }
  end
end

#stats ⇒ `Object`

# File 'lib/ruby_llm/semantic_cache/scoped.rb', line 126

# Snapshot of this scope's counters and current cache size.
#
# @return [Hash] with :hits, :misses, :hit_rate and :entries keys
def stats
  summary = { hits: @hits, misses: @misses }
  summary[:hit_rate] = hit_rate
  summary[:entries] = cache_store.size
  summary
end

#store(query:, response:, embedding: nil, metadata: {}, ttl: nil) ⇒ `Object`

# File 'lib/ruby_llm/semantic_cache/scoped.rb', line 48

# Persists a query/response pair: the embedding goes to the vector store
# and the entry hash goes to the cache store, both keyed by the entry id.
#
# @param query [Object] the query being cached
# @param response [Object] the response; serialized before being stored
# @param embedding [Object, nil] precomputed embedding; generated from
#   +query+ when nil
# @param metadata [Hash] extra data attached to the entry
# @param ttl [Object, nil] expiry for the cache store; defaults to
#   config.ttl_seconds when nil
# @return [Entry] the entry that was stored
def store(query:, response:, embedding: nil, metadata: {}, ttl: nil)
  vector = embedding || embedding_generator.generate(query)
  expiry = ttl || config.ttl_seconds

  record = Entry.new(
    query: query,
    response: Serializer.serialize(response),
    embedding: vector,
    metadata: metadata
  )

  record.tap do |saved|
    vector_store.add(saved.id, vector)
    cache_store.set(saved.id, saved.to_h, ttl: expiry)
  end
end

#wrap(chat, threshold: nil, ttl: nil, on_cache_hit: nil, max_messages: nil) ⇒ `Object`

# File 'lib/ruby_llm/semantic_cache/scoped.rb', line 135

# Wraps +chat+ in a ScopedMiddleware that is handed this scoped instance,
# with every option forwarded as given.
#
# @param chat [Object] the chat object to wrap
# @param threshold [Object, nil] forwarded to the middleware
# @param ttl [Object, nil] forwarded to the middleware
# @param on_cache_hit [Object, nil] forwarded to the middleware
# @param max_messages [Object, nil] forwarded to the middleware
# @return [ScopedMiddleware]
def wrap(chat, threshold: nil, ttl: nil, on_cache_hit: nil, max_messages: nil)
  options = {
    threshold: threshold,
    ttl: ttl,
    on_cache_hit: on_cache_hit,
    max_messages: max_messages
  }

  ScopedMiddleware.new(self, chat, **options)
end

Class: RubyLLM::SemanticCache::Scoped

Overview

Examples:

Defined Under Namespace

Instance Attribute Summary collapse

Instance Method Summary collapse

Constructor Details

#initialize(namespace:) ⇒ Scoped

Instance Attribute Details

#namespace ⇒ Object (readonly)

Instance Method Details

#clear! ⇒ Object

#delete(query, threshold: nil) ⇒ Object

#exists?(query, threshold: nil) ⇒ Boolean

#fetch(query, threshold: nil, ttl: nil, &block) ⇒ Object

#invalidate(query, threshold: nil, limit: 100) ⇒ Object

#search(query, limit: 5) ⇒ Object

#stats ⇒ Object

#store(query:, response:, embedding: nil, metadata: {}, ttl: nil) ⇒ Object

#wrap(chat, threshold: nil, ttl: nil, on_cache_hit: nil, max_messages: nil) ⇒ Object