internal/llmapp/check.go - oscar - Git at Google

 // Copyright 2024 The Go Authors. All rights reserved.
 // Use of this source code is governed by a BSD-style
 // license that can be found in the LICENSE file.

 package llmapp

 import (
 	"context"
 	"fmt"
 	"log/slog"

 	"golang.org/x/oscar/internal/llm"
 	"golang.org/x/oscar/internal/storage"
 )

 // NewWithChecker is like [New], but it configures the Client to use
 // the given checker to check the inputs to and outputs of the LLM against
 // safety policies.
 //
 // When any of the Overview functions are called, the prompts and outputs of the LLM
 // will be checked for safety violations.
 //
 // If the checker is nil, [NewWithChecker] is identical to [New].
 func NewWithChecker(lg *slog.Logger, g llm.ContentGenerator, checker llm.PolicyChecker, db storage.DB) *Client {
 	return &Client{slog: lg, g: g, checker: checker, db: db}
 }

 // EvaluatePolicy invokes the policy checker on the given prompts and LLM output and
 // wraps its results as a [*PolicyEvaluation].
 func (c *Client) EvaluatePolicy(ctx context.Context, prompts []llm.Part, output string) *PolicyEvaluation {
 	if c.checker == nil {
 		return nil
 	}
 	pe := &PolicyEvaluation{}
 	for _, p := range prompts {
 		switch v := p.(type) {
 		case llm.Text:
 			r := c.checkPolicy(ctx, string(v), nil)
 			if len(r.Violations) > 0 {
 				pe.Violative = true
 			}
 			pe.PromptResults = append(pe.PromptResults, r)
 		default:
 			// Other types are not supported for checks yet.
 			err := fmt.Errorf("llmapp: can't check policy for prompt part (unsupported type %T", v)
 			pe.PromptResults = append(pe.PromptResults, &PolicyResult{Text: "unknown", Error: err})
 		}
 	}
 	r := c.checkPolicy(ctx, output, prompts)
 	if len(r.Violations) > 0 {
 		pe.Violative = true
 	}
 	pe.OutputResults = r
 	return pe
 }

 // checkPolicy invokes the policy checker on the given text (with optional prompts)
 // and returns its (possibly cached) results.
 func (c *Client) checkPolicy(ctx context.Context, text string, prompts []llm.Part) *PolicyResult {
 	policies := c.checker.Policies()
 	k, h := c.keyAndHashCheckText(policies, text, prompts)

 	c.db.Lock(string(k))
 	defer c.db.Unlock(string(k))

 	r := load[responseCheckText](c, k)
 	cached := r != nil

 	if !cached { // cache miss
 		prs, err := c.checker.CheckText(ctx, text, prompts...)
 		if err != nil {
 			// don't cache errors
 			return &PolicyResult{Text: text, Error: fmt.Errorf("llmapp: error while checking for policy violations: %w", err)}
 		}
 		r = &responseCheckText{
 			Name:      c.checker.Name(),
 			InputHash: h,
 			Response:  prs,
 		}
 		c.db.Set(k, storage.JSON(r))
 	}

 	c.slog.Info("llmapp: found policy results", "text", text, "prompts", prompts, "results", toStrings(r.Response), "cached", cached)
 	if vs := violations(r.Response); len(vs) > 0 {
 		c.slog.Warn("llmapp: found policy violations for LLM output", "text", text, "prompts", prompts, "violations", toStrings(vs), "cached", cached)
 		return &PolicyResult{Text: text, Results: r.Response, Violations: vs, Cached: cached}
 	}
 	return &PolicyResult{Text: text, Results: r.Response, Cached: cached}
 }

 func toStrings(prs []*llm.PolicyResult) []string {
 	var ss []string
 	for _, pr := range prs {
 		ss = append(ss, pr.String())
 	}
 	return ss
 }

 // violations returns the policies in prs that are in violation.
 func violations(prs []*llm.PolicyResult) []*llm.PolicyResult {
 	var vs []*llm.PolicyResult
 	for _, pr := range prs {
 		if pr.IsViolative() {
 			vs = append(vs, pr)
 		}
 	}
 	return vs
 }
	// Copyright 2024 The Go Authors. All rights reserved.
	// Use of this source code is governed by a BSD-style
	// license that can be found in the LICENSE file.

	package llmapp

	import (
	"context"
	"fmt"
	"log/slog"

	"golang.org/x/oscar/internal/llm"
	"golang.org/x/oscar/internal/storage"
	)

	// NewWithChecker is like [New], but it configures the Client to use
	// the given checker to check the inputs to and outputs of the LLM against
	// safety policies.
	//
	// When any of the Overview functions are called, the prompts and outputs of the LLM
	// will be checked for safety violations.
	//
	// If the checker is nil, [NewWithChecker] is identical to [New].
	func NewWithChecker(lg slog.Logger, g llm.ContentGenerator, checker llm.PolicyChecker, db storage.DB) Client {
	return &Client{slog: lg, g: g, checker: checker, db: db}
	}

	// EvaluatePolicy invokes the policy checker on the given prompts and LLM output and
	// wraps its results as a [*PolicyEvaluation].
	func (c Client) EvaluatePolicy(ctx context.Context, prompts []llm.Part, output string) PolicyEvaluation {
	if c.checker == nil {
	return nil
	}
	pe := &PolicyEvaluation{}
	for _, p := range prompts {
	switch v := p.(type) {
	case llm.Text:
	r := c.checkPolicy(ctx, string(v), nil)
	if len(r.Violations) > 0 {
	pe.Violative = true
	}
	pe.PromptResults = append(pe.PromptResults, r)
	default:
	// Other types are not supported for checks yet.
	err := fmt.Errorf("llmapp: can't check policy for prompt part (unsupported type %T", v)
	pe.PromptResults = append(pe.PromptResults, &PolicyResult{Text: "unknown", Error: err})
	}
	}
	r := c.checkPolicy(ctx, output, prompts)
	if len(r.Violations) > 0 {
	pe.Violative = true
	}
	pe.OutputResults = r
	return pe
	}

	// checkPolicy invokes the policy checker on the given text (with optional prompts)
	// and returns its (possibly cached) results.
	func (c Client) checkPolicy(ctx context.Context, text string, prompts []llm.Part) PolicyResult {
	policies := c.checker.Policies()
	k, h := c.keyAndHashCheckText(policies, text, prompts)

	c.db.Lock(string(k))
	defer c.db.Unlock(string(k))

	r := load[responseCheckText](c, k)
	cached := r != nil

	if !cached { // cache miss
	prs, err := c.checker.CheckText(ctx, text, prompts...)
	if err != nil {
	// don't cache errors
	return &PolicyResult{Text: text, Error: fmt.Errorf("llmapp: error while checking for policy violations: %w", err)}
	}
	r = &responseCheckText{
	Name: c.checker.Name(),
	InputHash: h,
	Response: prs,
	}
	c.db.Set(k, storage.JSON(r))
	}

	c.slog.Info("llmapp: found policy results", "text", text, "prompts", prompts, "results", toStrings(r.Response), "cached", cached)
	if vs := violations(r.Response); len(vs) > 0 {
	c.slog.Warn("llmapp: found policy violations for LLM output", "text", text, "prompts", prompts, "violations", toStrings(vs), "cached", cached)
	return &PolicyResult{Text: text, Results: r.Response, Violations: vs, Cached: cached}
	}
	return &PolicyResult{Text: text, Results: r.Response, Cached: cached}
	}

	func toStrings(prs []*llm.PolicyResult) []string {
	var ss []string
	for _, pr := range prs {
	ss = append(ss, pr.String())
	}
	return ss
	}

	// violations returns the policies in prs that are in violation.
	func violations(prs []llm.PolicyResult) []llm.PolicyResult {
	var vs []*llm.PolicyResult
	for _, pr := range prs {
	if pr.IsViolative() {
	vs = append(vs, pr)
	}
	}
	return vs
	}