lqb
/
nginx-ui
зеркало из https://github.com/0xJacky/nginx-ui.git


			
				
					
						
						
							123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364
							package searcher

import (
	"crypto/md5"
	"encoding/hex"
	"encoding/json"
	"fmt"
	"sort"
	"strconv"
	"time"

	"github.com/0xJacky/Nginx-UI/internal/nginx_log/utils"
	"github.com/dgraph-io/ristretto/v2"
)

// OptimizedSearchCache caches search results in a Ristretto cache.
// Entries are keyed by the string produced by GenerateOptimizedKey and hold
// pointers to SearchResult values.
type OptimizedSearchCache struct {
	// cache is the underlying Ristretto store; NewOptimizedSearchCache sets it.
	cache *ristretto.Cache[string, *SearchResult]
}

// NewOptimizedSearchCache builds a search cache backed by Ristretto.
//
// maxSize is used as the cache's MaxCost, and ten times maxSize as the number
// of frequency counters. Metrics collection is switched on so GetStats has
// data to report.
//
// The function panics if Ristretto rejects the configuration.
func NewOptimizedSearchCache(maxSize int64) *OptimizedSearchCache {
	cfg := &ristretto.Config[string, *SearchResult]{
		NumCounters: maxSize * 10, // frequency counters: 10x the cost budget
		MaxCost:     maxSize,      // total cost the cache may hold
		BufferItems: 64,           // keys per Get buffer
		Metrics:     true,         // needed by GetStats
	}

	store, err := ristretto.NewCache(cfg)
	if err != nil {
		panic(fmt.Sprintf("failed to create cache: %v", err))
	}

	return &OptimizedSearchCache{cache: store}
}

// GenerateOptimizedKey derives the cache key for a search request.
//
// Every request field listed in the key data below contributes to the key.
// Slice filters are copied (the request is never mutated), sorted, and, except
// for Fields, de-duplicated, so the order in which a caller lists filter
// values does not change the key.
//
// Optional numeric bounds are rendered as text ("" when absent). This matters
// for the float bounds: encoding/json refuses NaN and ±Inf, and a failed
// marshal must never degrade into a key that ignores the filters, because two
// different searches would then share one cache entry.
//
// The result is normally the hex MD5 digest (32 characters) of the JSON
// encoding of the normalized key data.
func (osc *OptimizedSearchCache) GenerateOptimizedKey(req *SearchRequest) string {
	// sortedStrings returns a sorted copy of src, optionally without duplicates.
	// Empty input yields nil so that nil and empty filters produce the same key.
	sortedStrings := func(src []string, dedup bool) []string {
		if len(src) == 0 {
			return nil
		}
		res := make([]string, 0, len(src))
		if dedup {
			seen := make(map[string]struct{}, len(src))
			for _, s := range src {
				if _, dup := seen[s]; dup {
					continue
				}
				seen[s] = struct{}{}
				res = append(res, s)
			}
		} else {
			res = append(res, src...)
		}
		sort.Strings(res)
		return res
	}

	// sortedInts returns a sorted copy of src (nil for empty input).
	sortedInts := func(src []int) []int {
		if len(src) == 0 {
			return nil
		}
		res := append([]int(nil), src...)
		sort.Ints(res)
		return res
	}

	// optInt and optFloat render optional bounds as text. A set bound never
	// renders as "", so "absent" and "present" cannot be confused.
	optInt := func(p *int64) string {
		if p == nil {
			return ""
		}
		return strconv.FormatInt(*p, 10)
	}
	optFloat := func(p *float64) string {
		if p == nil {
			return ""
		}
		// 'g' with precision -1 is the shortest text that round-trips the
		// value; it also handles NaN and ±Inf.
		return strconv.FormatFloat(*p, 'g', -1, 64)
	}

	keyData := struct {
		Query          string   `json:"query"`
		Limit          int      `json:"limit"`
		Offset         int      `json:"offset"`
		SortBy         string   `json:"sort_by"`
		SortOrder      string   `json:"sort_order"`
		StartTime      string   `json:"start_time"`
		EndTime        string   `json:"end_time"`
		UseMainLogPath bool     `json:"use_main_log_path"`
		LogPaths       []string `json:"log_paths"`
		Fields         []string `json:"fields"`
		IPAddresses    []string `json:"ip_addresses"`
		StatusCodes    []int    `json:"status_codes"`
		Methods        []string `json:"methods"`
		Paths          []string `json:"paths"`
		UserAgents     []string `json:"user_agents"`
		Referers       []string `json:"referers"`
		Countries      []string `json:"countries"`
		Browsers       []string `json:"browsers"`
		OSs            []string `json:"operating_systems"`
		Devices        []string `json:"devices"`
		MinBytes       string   `json:"min_bytes"`
		MaxBytes       string   `json:"max_bytes"`
		MinReqTime     string   `json:"min_request_time"`
		MaxReqTime     string   `json:"max_request_time"`
		IncludeFacets  bool     `json:"include_facets"`
		IncludeStats   bool     `json:"include_stats"`
		FacetFields    []string `json:"facet_fields"`
		FacetSize      int      `json:"facet_size"`
		UseCache       bool     `json:"use_cache"`
	}{
		Query:          req.Query,
		Limit:          req.Limit,
		Offset:         req.Offset,
		SortBy:         req.SortBy,
		SortOrder:      req.SortOrder,
		StartTime:      optInt(req.StartTime),
		EndTime:        optInt(req.EndTime),
		UseMainLogPath: req.UseMainLogPath,
		LogPaths:       sortedStrings(req.LogPaths, true),
		Fields:         sortedStrings(req.Fields, false),
		IPAddresses:    sortedStrings(req.IPAddresses, true),
		StatusCodes:    sortedInts(req.StatusCodes),
		Methods:        sortedStrings(req.Methods, true),
		Paths:          sortedStrings(req.Paths, true),
		UserAgents:     sortedStrings(req.UserAgents, true),
		Referers:       sortedStrings(req.Referers, true),
		Countries:      sortedStrings(req.Countries, true),
		Browsers:       sortedStrings(req.Browsers, true),
		OSs:            sortedStrings(req.OSs, true),
		Devices:        sortedStrings(req.Devices, true),
		MinBytes:       optInt(req.MinBytes),
		MaxBytes:       optInt(req.MaxBytes),
		MinReqTime:     optFloat(req.MinReqTime),
		MaxReqTime:     optFloat(req.MaxReqTime),
		IncludeFacets:  req.IncludeFacets,
		IncludeStats:   req.IncludeStats,
		FacetFields:    sortedStrings(req.FacetFields, true),
		FacetSize:      req.FacetSize,
		UseCache:       req.UseCache,
	}

	jsonData, err := json.Marshal(keyData)
	if err != nil {
		// Defensive only: keyData holds nothing but strings, ints, bools and
		// slices of those, which encoding/json does not reject. Should it ever
		// fail, render the complete key data in Go syntax (strings quoted, so
		// the text is unambiguous) rather than a subset of the fields.
		return utils.BytesToStringUnsafe(fmt.Appendf(nil, "%#v", keyData))
	}

	// MD5 is used purely to get a compact, fixed-length key.
	hash := md5.Sum(jsonData)
	return hex.EncodeToString(hash[:])
}

// Get looks up the cached result for req.
//
// On a hit it returns a shallow copy of the stored result with FromCache set
// to true, so the stored entry itself is not flagged. It returns nil on a
// miss.
//
// Like Clear, Get tolerates a nil receiver or an uninitialised cache; those
// cases, a nil request, and a stored nil value are all reported as a miss
// instead of panicking.
func (osc *OptimizedSearchCache) Get(req *SearchRequest) *SearchResult {
	if osc == nil || osc.cache == nil || req == nil {
		return nil
	}

	result, found := osc.cache.Get(osc.GenerateOptimizedKey(req))
	if !found || result == nil {
		return nil
	}

	// Copy before flagging so the cached value keeps FromCache as stored.
	cachedResult := *result
	cachedResult.FromCache = true
	return &cachedResult
}

// Put stores result under the key derived from req, with the given TTL.
//
// The entry's cost is 1 plus one unit per ten hits, so large result sets use
// more of the cache's cost budget than small ones.
//
// Put is a no-op when the receiver, the underlying cache, req or result is
// nil; there is nothing meaningful to store in any of those cases.
func (osc *OptimizedSearchCache) Put(req *SearchRequest, result *SearchResult, ttl time.Duration) {
	if osc == nil || osc.cache == nil || req == nil || result == nil {
		return
	}

	key := osc.GenerateOptimizedKey(req)

	// len() is never negative, so the cost is always at least 1.
	cost := int64(1 + len(result.Hits)/10)

	osc.cache.SetWithTTL(key, result, cost, ttl)
	// Wait for the value to pass through the cache's buffers so that a Get
	// issued right after Put can see it.
	osc.cache.Wait()
}

// Clear drops every cached entry. It is safe to call on a nil receiver or
// before the underlying cache has been set; both are no-ops.
func (osc *OptimizedSearchCache) Clear() {
	if osc == nil || osc.cache == nil {
		return
	}
	osc.cache.Clear()
}

// GetStats reports a snapshot of the cache's metrics.
//
// Size and Cost are derived values: keys added minus keys evicted, and cost
// added minus cost evicted. Capacity is the cache's MaxCost.
func (osc *OptimizedSearchCache) GetStats() *CacheStats {
	m := osc.cache.Metrics
	added, evicted := m.KeysAdded(), m.KeysEvicted()

	stats := new(CacheStats)
	stats.Size = int(added - evicted)
	stats.Capacity = int(osc.cache.MaxCost())
	stats.HitCount = int64(m.Hits())
	stats.MissCount = int64(m.Misses())
	stats.HitRate = m.Ratio()
	stats.Evictions = int64(evicted)
	stats.Additions = int64(added)
	stats.Updates = int64(m.KeysUpdated())
	stats.Cost = int64(m.CostAdded() - m.CostEvicted())
	return stats
}

// CacheStats is the snapshot of cache metrics returned by
// OptimizedSearchCache.GetStats. All counters come from the underlying
// cache's metrics; Size and Cost are computed as "added minus evicted".
type CacheStats struct {
	Size      int     `json:"size"`       // Keys added minus keys evicted
	Capacity  int     `json:"capacity"`   // Maximum cost the cache may hold
	HitCount  int64   `json:"hit_count"`  // Number of cache hits
	MissCount int64   `json:"miss_count"` // Number of cache misses
	HitRate   float64 `json:"hit_rate"`   // Hit ratio as reported by the cache metrics
	Evictions int64   `json:"evictions"`  // Number of evicted keys
	Additions int64   `json:"additions"`  // Number of keys added
	Updates   int64   `json:"updates"`    // Number of keys updated
	Cost      int64   `json:"cost"`       // Cost added minus cost evicted
}

// WarmupCache pre-loads the given query/result pairs into the cache.
//
// Each complete pair is stored under the key derived from its request, with a
// fixed cost of 1 and no TTL. Pairs missing a request or a result are skipped:
// without a request there is no key, and without a result there is nothing to
// store. The call returns once the cache has processed the writes.
//
// WarmupCache is a no-op on a nil receiver or an uninitialised cache.
func (osc *OptimizedSearchCache) WarmupCache(queries []WarmupQuery) {
	if osc == nil || osc.cache == nil {
		return
	}

	for _, query := range queries {
		if query.Request == nil || query.Result == nil {
			continue
		}
		osc.cache.Set(osc.GenerateOptimizedKey(query.Request), query.Result, 1) // Use cost of 1 for warmup
	}

	// Wait for cache operations to complete
	osc.cache.Wait()
}

// WarmupQuery pairs a search request with the result to cache for it.
// It is the input element type of OptimizedSearchCache.WarmupCache.
type WarmupQuery struct {
	Request *SearchRequest `json:"request"` // request the cache key is derived from
	Result  *SearchResult  `json:"result"`  // result to store; WarmupCache stores nothing when this is nil
}

// Close shuts down the underlying cache and frees its resources.
//
// Like Clear, it is a no-op on a nil receiver or an uninitialised cache, so a
// deferred Close never panics on a cache that was not set up.
func (osc *OptimizedSearchCache) Close() {
	if osc == nil || osc.cache == nil {
		return
	}
	osc.cache.Close()
}

// FastKeyGenerator builds plain-text cache keys into a reusable byte buffer.
//
// GenerateKey resets and rewrites the buffer on every call without any
// locking, so a single generator must not be used from several goroutines at
// once without external synchronisation.
type FastKeyGenerator struct {
	buffer []byte // scratch space reused between GenerateKey calls
}

// NewFastKeyGenerator returns a generator whose scratch buffer starts empty
// with room for 256 bytes.
func NewFastKeyGenerator() *FastKeyGenerator {
	gen := new(FastKeyGenerator)
	gen.buffer = make([]byte, 0, 256)
	return gen
}

// GenerateKey renders a plain-text key for req into the generator's reusable
// buffer and returns it as a string.
//
// The key has the form
//
//	q:<query>|l:<limit>|o:<offset>|s:<sort_by>|so:<sort_order>
//
// followed by "|st:<start>" and "|et:<end>" when those times are set, and by
// "|sc:<code>,<code>,..." when status codes are given (in request order).
// No other request field is included.
func (fkg *FastKeyGenerator) GenerateKey(req *SearchRequest) string {
	// Start from the existing backing array; only the final string conversion
	// is guaranteed to allocate.
	buf := fkg.buffer[:0]

	buf = append(buf, "q:"...)
	buf = append(buf, req.Query...)
	buf = append(buf, "|l:"...)
	buf = strconv.AppendInt(buf, int64(req.Limit), 10)
	buf = append(buf, "|o:"...)
	buf = strconv.AppendInt(buf, int64(req.Offset), 10)
	buf = append(buf, "|s:"...)
	buf = append(buf, req.SortBy...)
	buf = append(buf, "|so:"...)
	buf = append(buf, req.SortOrder...)

	// Optional time range.
	if start := req.StartTime; start != nil {
		buf = append(buf, "|st:"...)
		buf = strconv.AppendInt(buf, *start, 10)
	}
	if end := req.EndTime; end != nil {
		buf = append(buf, "|et:"...)
		buf = strconv.AppendInt(buf, *end, 10)
	}

	// Status codes as a comma-separated list.
	if codes := req.StatusCodes; len(codes) > 0 {
		buf = append(buf, "|sc:"...)
		buf = strconv.AppendInt(buf, int64(codes[0]), 10)
		for _, code := range codes[1:] {
			buf = append(buf, ',')
			buf = strconv.AppendInt(buf, int64(code), 10)
		}
	}

	// Keep the (possibly grown) buffer for the next call.
	fkg.buffer = buf
	return string(buf)
}

// CacheMiddleware wraps an OptimizedSearchCache with an on/off switch and a
// default TTL, exposing a get-or-compute helper (GetOrSet).
type CacheMiddleware struct {
	cache      *OptimizedSearchCache // backing cache used by GetOrSet
	keyGen     *FastKeyGenerator     // created by NewCacheMiddleware; not used by the methods in this file
	enabled    bool                  // when false, GetOrSet bypasses the cache; plain bool, no locking
	defaultTTL time.Duration         // TTL applied to results stored by GetOrSet
}

// NewCacheMiddleware returns a middleware around cache that starts out
// enabled and stores results with defaultTTL. It also allocates a fresh
// FastKeyGenerator for the middleware.
func NewCacheMiddleware(cache *OptimizedSearchCache, defaultTTL time.Duration) *CacheMiddleware {
	mw := new(CacheMiddleware)
	mw.cache = cache
	mw.keyGen = NewFastKeyGenerator()
	mw.enabled = true
	mw.defaultTTL = defaultTTL
	return mw
}

// Enable turns caching on by setting the flag that GetOrSet checks before it
// consults the cache.
func (cm *CacheMiddleware) Enable() {
	cm.enabled = true
}

// Disable turns caching off: while disabled, GetOrSet calls the supplied
// function directly and neither reads from nor writes to the cache.
// Entries already cached are left in place.
func (cm *CacheMiddleware) Disable() {
	cm.enabled = false
}

// IsEnabled reports whether caching is currently switched on.
func (cm *CacheMiddleware) IsEnabled() bool {
	return cm.enabled
}

// GetOrSet returns the cached result for req, or runs fn and caches what it
// returns.
//
//   - When caching is unavailable (the middleware is nil, disabled, or has no
//     backing cache) fn is called directly and its outcome is returned as is.
//   - On a cache hit fn is not called.
//   - On a miss fn is called; an error is returned to the caller with a nil
//     result and nothing is cached. A non-nil result is stored with the
//     middleware's default TTL before being returned.
func (cm *CacheMiddleware) GetOrSet(req *SearchRequest, fn func() (*SearchResult, error)) (*SearchResult, error) {
	// No usable cache: behave as a plain pass-through rather than panicking.
	if cm == nil || !cm.enabled || cm.cache == nil {
		return fn()
	}

	// Try cache first
	if cached := cm.cache.Get(req); cached != nil {
		return cached, nil
	}

	// Execute function
	result, err := fn()
	if err != nil {
		return nil, err
	}

	// Cache successful result
	if result != nil {
		cm.cache.Put(req, result, cm.defaultTTL)
	}

	return result, nil
}