Module: Kumi::Core::IR::ExecutionEngine::Profiler

Defined in:: lib/kumi/core/ir/execution_engine/profiler.rb

Class Method Summary collapse

.averaged_analysis(top: 20) ⇒ Object

Multi-run averaged analysis.
.cache_overhead_analysis ⇒ Object

Identify potential cache overhead operations.
.compact_attrs(h) ⇒ Object
.cpu_t0 ⇒ Object

CPU time start (process + thread).
.emit_summary! ⇒ Object
.enabled? ⇒ Boolean
.finalize! ⇒ Object
.init_persistent! ⇒ Object
.memory_snapshot(label, extra: {}) ⇒ Object

Memory snapshot with GC statistics.
.op_key(decl, idx, tag, op) ⇒ Object

Stable textual key for “match ops one by one”.
.ops_enabled? ⇒ Boolean
.persistent? ⇒ Boolean
.phase(name, tags = {}) ⇒ Object

Phase timing for coarse-grained operations.
.read_rss_mb ⇒ Object
.record!(decl:, idx:, tag:, op:, t0:, cpu_t0: nil, rows: nil, note: nil) ⇒ Object

Per-op record with both wall time and CPU time (with sampling support).
.reset!(meta: {}) ⇒ Object
.sample_rate ⇒ Object
.set_schema_name(name) ⇒ Object
.stream(obj) ⇒ Object
.summary(top: 20) ⇒ Object
.t0 ⇒ Object

monotonic start time.

Class Method Details

.averaged_analysis(top: 20) ⇒ `Object`

Multi-run averaged analysis

# File 'lib/kumi/core/ir/execution_engine/profiler.rb', line 208

def averaged_analysis(top: 20)
  return {} unless enabled? && @aggregated_stats&.any?

  # Convert aggregated stats to averaged metrics
  averaged = @aggregated_stats.map do |op_key, stats|
    num_runs = stats[:runs].size
    avg_wall_ms = stats[:total_ms] / stats[:count]
    avg_cpu_ms = stats[:total_cpu_ms] / stats[:count]
    total_wall_ms = stats[:total_ms]
    total_cpu_ms = stats[:total_cpu_ms]

    {
      op_key: op_key,
      decl: stats[:decl],
      idx: stats[:idx],
      tag: stats[:tag],
      runs: num_runs,
      total_calls: stats[:count],
      calls_per_run: stats[:count] / num_runs.to_f,
      avg_wall_ms: avg_wall_ms.round(4),
      avg_cpu_ms: avg_cpu_ms.round(4),
      total_wall_ms: total_wall_ms.round(3),
      total_cpu_ms: total_cpu_ms.round(3),
      cpu_efficiency: total_wall_ms > 0 ? (total_cpu_ms / total_wall_ms * 100).round(1) : 100,
      rows_total: stats[:rows],
      note: stats[:note]
    }
  end.sort_by { |s| -s[:total_wall_ms] }.first(top)

  {
    meta: @meta || {},
    total_runs: @aggregated_stats.values.map { |s| s[:runs].size }.max || 0,
    averaged_ops: averaged,
    total_operations: @aggregated_stats.size
  }
end

.cache_overhead_analysis ⇒ `Object`

Identify potential cache overhead operations

# File 'lib/kumi/core/ir/execution_engine/profiler.rb', line 246

def cache_overhead_analysis
  return {} unless enabled? && @aggregated_stats&.any?

  # Look for operations that might be cache-related
  cache_ops = @aggregated_stats.select do |op_key, stats|
    op_key.include?("ref") || op_key.include?("load_input") || stats[:note]&.include?("cache")
  end

  cache_analysis = cache_ops.map do |op_key, stats|
    stats[:runs].size
    avg_wall_ms = stats[:total_ms] / stats[:count]

    {
      op_key: op_key,
      decl: stats[:decl],
      tag: stats[:tag],
      avg_time_ms: avg_wall_ms.round(4),
      total_time_ms: stats[:total_ms].round(3),
      call_count: stats[:count],
      overhead_per_call: avg_wall_ms.round(6)
    }
  end.sort_by { |s| -s[:total_time_ms] }

  {
    cache_operations: cache_analysis,
    total_cache_time: cache_analysis.sum { |op| op[:total_time_ms] }.round(3)
  }
end

.compact_attrs(h) ⇒ `Object`

# File 'lib/kumi/core/ir/execution_engine/profiler.rb', line 318

def compact_attrs(h)
  return {} unless h

  h.transform_values do |v|
    case v
    when Array, Hash, Symbol, String, Numeric, TrueClass, FalseClass, NilClass then v
    else v.to_s
    end
  end
end

.cpu_t0 ⇒ `Object`

CPU time start (process + thread)



91
92
93

# File 'lib/kumi/core/ir/execution_engine/profiler.rb', line 91

def cpu_t0
  Process.clock_gettime(Process::CLOCK_PROCESS_CPUTIME_ID)
end

.emit_summary! ⇒ `Object`

# File 'lib/kumi/core/ir/execution_engine/profiler.rb', line 275

def emit_summary!
  return unless enabled?

  stream({ ts: Time.now.utc.iso8601(3), kind: "summary", data: summary })
end

.enabled? ⇒ `Boolean`

Returns:

(Boolean)

14	# File 'lib/kumi/core/ir/execution_engine/profiler.rb', line 14 def enabled? = ENV["KUMI_PROFILE"] == "1"

.finalize! ⇒ `Object`

# File 'lib/kumi/core/ir/execution_engine/profiler.rb', line 288

def finalize!
  return unless enabled?

  # Emit final aggregated summary
  if @aggregated_stats&.any?
    stream({
             ts: Time.now.utc.iso8601(3),
             kind: "final_summary",
             data: averaged_analysis
           })
  end

  # Emit cache analysis if available
  cache_analysis = cache_overhead_analysis
  return unless cache_analysis[:cache_operations]&.any?

  stream({
           ts: Time.now.utc.iso8601(3),
           kind: "cache_analysis",
           data: cache_analysis
         })
end

.init_persistent! ⇒ `Object`

# File 'lib/kumi/core/ir/execution_engine/profiler.rb', line 281

def init_persistent!
  return unless enabled? && persistent?

  @persistent_initialized = false
  reset!
end

.memory_snapshot(label, extra: {}) ⇒ `Object`

Memory snapshot with GC statistics

# File 'lib/kumi/core/ir/execution_engine/profiler.rb', line 117

def memory_snapshot(label, extra: {})
  return unless enabled?

  s = GC.stat
  stream({
           ts: Time.now.utc.iso8601(3),
           kind: "mem",
           label: label,
           heap_live: s[:heap_live_slots],
           old_objects: s[:old_objects],
           minor_gc: s[:minor_gc_count],
           major_gc: s[:major_gc_count],
           rss_mb: read_rss_mb,
           run: @run_id,
           **extra
         })
end

.op_key(decl, idx, tag, op) ⇒ `Object`

Stable textual key for “match ops one by one”

# File 'lib/kumi/core/ir/execution_engine/profiler.rb', line 312

def op_key(decl, idx, tag, op)
  attrs = compact_attrs(op.attrs)
  args  = op.args
  "#{decl}@#{idx}:#{tag}|#{attrs.keys.sort_by(&:to_s).map { |k| "#{k}=#{attrs[k].inspect}" }.join(',')}|args=#{args.inspect}"
end

.ops_enabled? ⇒ `Boolean`

Returns:

(Boolean)

15	# File 'lib/kumi/core/ir/execution_engine/profiler.rb', line 15 def ops_enabled? = ENV.fetch("KUMI_PROFILE_OPS", "1") == "1"

.persistent? ⇒ `Boolean`

Returns:

(Boolean)

17	# File 'lib/kumi/core/ir/execution_engine/profiler.rb', line 17 def persistent? = ENV["KUMI_PROFILE_PERSISTENT"] == "1"

.phase(name, tags = {}) ⇒ `Object`

Phase timing for coarse-grained operations

# File 'lib/kumi/core/ir/execution_engine/profiler.rb', line 96

def phase(name, tags = {})
  return yield unless enabled?

  p0 = t0
  c0 = cpu_t0
  result = yield
  wall_ms = (t0 - p0) * 1000.0
  cpu_ms = (cpu_t0 - c0) * 1000.0
  stream({
           ts: Time.now.utc.iso8601(3),
           kind: "phase",
           name: name,
           wall_ms: wall_ms.round(3),
           cpu_ms: cpu_ms.round(3),
           tags: tags,
           run: @run_id
         })
  result
end

.read_rss_mb ⇒ `Object`

# File 'lib/kumi/core/ir/execution_engine/profiler.rb', line 135

def read_rss_mb
  (File.read("/proc/#{$$}/status")[/VmRSS:\s+(\d+)\skB/, 1].to_i / 1024.0).round(2)
rescue StandardError
  nil
end

.record!(decl:, idx:, tag:, op:, t0:, cpu_t0: nil, rows: nil, note: nil) ⇒ `Object`

Per-op record with both wall time and CPU time (with sampling support)

# File 'lib/kumi/core/ir/execution_engine/profiler.rb', line 142

def record!(decl:, idx:, tag:, op:, t0:, cpu_t0: nil, rows: nil, note: nil)
  return unless enabled? && ops_enabled?

  @op_seq += 1
  return unless sample_rate <= 1 || (@op_seq % sample_rate).zero?

  wall_ms = ((Process.clock_gettime(Process::CLOCK_MONOTONIC) - t0) * 1000.0)
  cpu_ms = cpu_t0 ? ((Process.clock_gettime(Process::CLOCK_PROCESS_CPUTIME_ID) - cpu_t0) * 1000.0) : wall_ms

  ev = {
    ts: Time.now.utc.iso8601(3),
    run: @run_id,
    schema: @schema_name, # schema identifier for multi-schema differentiation
    decl: decl, # decl name (string/symbol)
    i: idx, # op index
    tag: tag, # op tag (symbol)
    wall_ms: wall_ms.round(4),
    cpu_ms: cpu_ms.round(4),
    rows: rows,
    note: note,
    key: op_key(decl, idx, tag, op), # stable key for grep/diff
    attrs: compact_attrs(op.attrs)
  }

  # Aggregate stats for multi-run averaging
  op_key = "#{decl}@#{idx}:#{tag}"
  agg = @aggregated_stats[op_key]
  agg[:count] += 1
  agg[:total_ms] += wall_ms
  agg[:total_cpu_ms] += cpu_ms
  agg[:rows] += rows || 0
  agg[:runs] << @run_id
  agg[:decl] = decl
  agg[:tag] = tag
  agg[:idx] = idx
  agg[:note] = note if note

  (@events ||= []) << ev
  stream(ev) if ENV["KUMI_PROFILE_STREAM"] == "1"
  ev
end

.reset!(meta: {}) ⇒ `Object`

# File 'lib/kumi/core/ir/execution_engine/profiler.rb', line 43

def reset!(meta: {})
  set_schema_name(meta[:schema_name]) if meta[:schema_name]
  return unless enabled?

  # In persistent mode, don't reset aggregated stats or increment run_id
  # This allows profiling across multiple schema creations
  if persistent?
    @events = []
    @meta = (@meta || {}).merge(meta)
    @schema_name = meta[:schema_name] if meta[:schema_name]
    @file = ENV["KUMI_PROFILE_FILE"] || "tmp/profile.jsonl"
    @run_id ||= 1
    @op_seq ||= 0
    @aggregated_stats ||= Hash.new { |h, k| h[k] = { count: 0, total_ms: 0.0, total_cpu_ms: 0.0, rows: 0, runs: Set.new } }

    # Only truncate on very first reset in persistent mode
    if ENV["KUMI_PROFILE_TRUNCATE"] == "1" && !@persistent_initialized
      FileUtils.mkdir_p(File.dirname(@file))
      File.write(@file, "")
      @aggregated_stats.clear
      @persistent_initialized = true
    end
  else
    # Original behavior: full reset each time
    @events = []
    @meta   = meta
    @schema_name = meta[:schema_name]
    @file   = ENV["KUMI_PROFILE_FILE"] || "tmp/profile.jsonl"
    @run_id = (@run_id || 0) + 1
    @op_seq = 0
    @aggregated_stats ||= Hash.new do |h, k|
      h[k] = { count: 0, total_ms: 0.0, total_cpu_ms: 0.0, rows: 0, runs: Set.new }
    end

    if ENV["KUMI_PROFILE_TRUNCATE"] == "1"
      FileUtils.mkdir_p(File.dirname(@file))
      File.write(@file, "")
      @aggregated_stats.clear
    end
  end
end

.sample_rate ⇒ `Object`

16	# File 'lib/kumi/core/ir/execution_engine/profiler.rb', line 16 def sample_rate = ENV["KUMI_PROFILE_SAMPLE"]&.to_i \|\| 1

.set_schema_name(name) ⇒ `Object`

# File 'lib/kumi/core/ir/execution_engine/profiler.rb', line 19

def set_schema_name(name)
  @schema_name = name

  # Ensure profiler is initialized in persistent mode
  return if @initialized

  @events = []
  @meta = {}
  @file = ENV["KUMI_PROFILE_FILE"] || "tmp/profile.jsonl"
  @run_id ||= 1
  @op_seq ||= 0
  @aggregated_stats ||= Hash.new { |h, k| h[k] = { count: 0, total_ms: 0.0, total_cpu_ms: 0.0, rows: 0, runs: Set.new } }

  # Truncate file if needed
  if ENV["KUMI_PROFILE_TRUNCATE"] == "1" && !@persistent_initialized
    FileUtils.mkdir_p(File.dirname(@file))
    File.write(@file, "")
    @aggregated_stats.clear
    @persistent_initialized = true
  end

  @initialized = true
end

.stream(obj) ⇒ `Object`

# File 'lib/kumi/core/ir/execution_engine/profiler.rb', line 329

def stream(obj)
  return unless @file

  FileUtils.mkdir_p(File.dirname(@file))
  File.open(@file, "a") { |f| f.puts(obj.to_json) }
end

.summary(top: 20) ⇒ `Object`

# File 'lib/kumi/core/ir/execution_engine/profiler.rb', line 184

def summary(top: 20)
  return {} unless enabled?

  # Current run summary (legacy format)
  current_agg = Hash.new { |h, k| h[k] = { count: 0, ms: 0.0, rows: 0 } }
  (@events || []).each do |e|
    k = [e[:decl], e[:tag]]
    a = current_agg[k]
    a[:count] += 1
    a[:ms]    += e[:wall_ms] || e[:ms] || 0
    a[:rows]  += e[:rows] || 0
  end
  current_ranked = current_agg.map do |(decl, tag), v|
    { decl: decl, tag: tag, count: v[:count], ms: v[:ms].round(3), rows: v[:rows],
      rps: v[:rows] > 0 ? (v[:rows] / v[:ms]).round(1) : nil }
  end.sort_by { |h| -h[:ms] }.first(top)

  { meta: @meta || {}, top: current_ranked,
    total_ms: (@events || []).sum { |e| e[:wall_ms] || e[:ms] || 0 }.round(3),
    op_count: (@events || []).size,
    run_id: @run_id }
end

.t0 ⇒ `Object`

monotonic start time



86
87
88

# File 'lib/kumi/core/ir/execution_engine/profiler.rb', line 86

def t0
  Process.clock_gettime(Process::CLOCK_MONOTONIC)
end

Module: Kumi::Core::IR::ExecutionEngine::Profiler

Class Method Summary collapse

Class Method Details

.averaged_analysis(top: 20) ⇒ Object

.cache_overhead_analysis ⇒ Object

.compact_attrs(h) ⇒ Object

.cpu_t0 ⇒ Object

.emit_summary! ⇒ Object

.enabled? ⇒ Boolean

.finalize! ⇒ Object

.init_persistent! ⇒ Object

.memory_snapshot(label, extra: {}) ⇒ Object

.op_key(decl, idx, tag, op) ⇒ Object

.ops_enabled? ⇒ Boolean

.persistent? ⇒ Boolean

.phase(name, tags = {}) ⇒ Object

.read_rss_mb ⇒ Object

.record!(decl:, idx:, tag:, op:, t0:, cpu_t0: nil, rows: nil, note: nil) ⇒ Object

.reset!(meta: {}) ⇒ Object

.sample_rate ⇒ Object

.set_schema_name(name) ⇒ Object

.stream(obj) ⇒ Object

.summary(top: 20) ⇒ Object

.t0 ⇒ Object

.averaged_analysis(top: 20) ⇒ `Object`

.cache_overhead_analysis ⇒ `Object`

.compact_attrs(h) ⇒ `Object`

.cpu_t0 ⇒ `Object`

.emit_summary! ⇒ `Object`

.enabled? ⇒ `Boolean`

.finalize! ⇒ `Object`

.init_persistent! ⇒ `Object`

.memory_snapshot(label, extra: {}) ⇒ `Object`

.op_key(decl, idx, tag, op) ⇒ `Object`

.ops_enabled? ⇒ `Boolean`

.persistent? ⇒ `Boolean`

.phase(name, tags = {}) ⇒ `Object`

.read_rss_mb ⇒ `Object`

.record!(decl:, idx:, tag:, op:, t0:, cpu_t0: nil, rows: nil, note: nil) ⇒ `Object`

.reset!(meta: {}) ⇒ `Object`

.sample_rate ⇒ `Object`

.set_schema_name(name) ⇒ `Object`

.stream(obj) ⇒ `Object`

.summary(top: 20) ⇒ `Object`

.t0 ⇒ `Object`