config package

Version: v0.7.2
Published: Aug 28, 2025 License: MPL-2.0 Imports: 19 Imported by: 0

Documentation

Overview

Package config contains the data models representing the structure of configuration and task definition files for the MindTrial application. It provides configuration management and handles loading and validation of application settings, provider configurations, and task definitions from YAML files.

Constants

const (
	// OPENAI identifies the OpenAI provider.
	OPENAI string = "openai"
	// GOOGLE identifies the Google AI provider.
	GOOGLE string = "google"
	// ANTHROPIC identifies the Anthropic provider.
	ANTHROPIC string = "anthropic"
	// DEEPSEEK identifies the Deepseek provider.
	DEEPSEEK string = "deepseek"
	// MISTRALAI identifies the Mistral AI provider.
	MISTRALAI string = "mistralai"
	// XAI identifies the xAI provider.
	XAI string = "xai"
)

Variables

var (
	// ErrInvalidTaskProperty indicates invalid task definition.
	ErrInvalidTaskProperty = errors.New("invalid task property")
	// ErrInvalidURI indicates that the specified URI is invalid or not supported.
	ErrInvalidURI = errors.New("invalid URI")
	// ErrDownloadFile indicates that a remote file could not be downloaded.
	ErrDownloadFile = errors.New("failed to download remote file")
	// ErrAccessFile indicates that a local file could not be accessed.
	ErrAccessFile = errors.New("file is not accessible")
)
var ErrInvalidConfigProperty = errors.New("invalid configuration property")

ErrInvalidConfigProperty indicates invalid configuration.

Functions

func CleanIfNotBlank

func CleanIfNotBlank(filePath string) string

CleanIfNotBlank cleans the given file path if it is not blank. Returns the original path if it is blank.

func IsNotBlank

func IsNotBlank(value string) bool

IsNotBlank returns true if the given string contains non-whitespace characters.

func MakeAbs

func MakeAbs(baseDirPath string, filePath string) string

MakeAbs converts a relative file path to an absolute path using the given base directory. Returns the original path if it is already absolute or blank.
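
The three helpers above can be sketched with the standard library. The bodies below are illustrative reimplementations of the documented behavior, not the package's actual source; in particular, the use of filepath.Clean and filepath.Join is an assumption.

```go
package main

import (
	"fmt"
	"path/filepath"
	"strings"
)

// isNotBlank reports whether s contains any non-whitespace character.
func isNotBlank(s string) bool {
	return strings.TrimSpace(s) != ""
}

// cleanIfNotBlank cleans the path unless it is blank.
func cleanIfNotBlank(filePath string) string {
	if !isNotBlank(filePath) {
		return filePath
	}
	return filepath.Clean(filePath)
}

// makeAbs joins a relative path onto baseDirPath; absolute or blank paths pass through.
func makeAbs(baseDirPath, filePath string) string {
	if !isNotBlank(filePath) || filepath.IsAbs(filePath) {
		return filePath
	}
	return filepath.Join(baseDirPath, filePath)
}

func main() {
	fmt.Println(isNotBlank("  ")) // false
	fmt.Println(makeAbs("/etc/mindtrial", "tasks.yaml"))
}
```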

func OnceWithContext

func OnceWithContext[S any, T any](f func(context.Context, *S) (T, error)) func(context.Context, *S) (T, error)

OnceWithContext returns a function that invokes f only once regardless of the supplied context. The first call's context is used for execution, and subsequent calls simply return the cached result. This is similar to sync.OnceValues but specifically for functions that need a context.

func ResolveFileNamePattern

func ResolveFileNamePattern(pattern string, timeRef time.Time) string

ResolveFileNamePattern takes a filename pattern containing time placeholders and returns a string with the placeholders replaced by values from the given time reference. Supported placeholders: {{.Year}}, {{.Month}}, {{.Day}}, {{.Hour}}, {{.Minute}}, {{.Second}}. Returns the original pattern if it cannot be resolved.

func ResolveFlagOverride

func ResolveFlagOverride(override *bool, parentValue bool) bool

ResolveFlagOverride returns the override value if it is not nil; otherwise it returns the parent value.

Types

type AnthropicClientConfig

type AnthropicClientConfig struct {
	// APIKey is the API key for the Anthropic generative models provider.
	APIKey string `yaml:"api-key" validate:"required"`
	// RequestTimeout specifies the timeout for API requests.
	RequestTimeout *time.Duration `yaml:"request-timeout" validate:"omitempty"`
}

AnthropicClientConfig represents Anthropic provider settings.

type AnthropicModelParams

type AnthropicModelParams struct {
	// MaxTokens controls the maximum number of tokens available to the model for generating a response.
	// This includes the thinking budget for reasoning models.
	MaxTokens *int64 `yaml:"max-tokens" validate:"omitempty,min=0"`

	// ThinkingBudgetTokens specifies the number of tokens the model can use for its internal reasoning process.
	// It must be at least 1024 and less than `MaxTokens`.
	// If set, this enables enhanced reasoning capabilities for the model.
	ThinkingBudgetTokens *int64 `yaml:"thinking-budget-tokens" validate:"omitempty,min=1024,ltfield=MaxTokens"`

	// Temperature controls the randomness or "creativity" of responses.
	// Values range from 0.0 to 1.0, with lower values making the output more focused.
	// The default value is 1.0.
	// It is generally recommended to alter this or `TopP` but not both.
	Temperature *float64 `yaml:"temperature" validate:"omitempty,min=0,max=1"`

	// TopP controls diversity via nucleus sampling.
	// Values range from 0.0 to 1.0, with lower values making the output more focused.
	// You usually only need to use `Temperature`.
	TopP *float64 `yaml:"top-p" validate:"omitempty,min=0,max=1"`

	// TopK limits response tokens to top K options for each token position.
	// Higher values allow more diverse outputs by considering more token options.
	// You usually only need to use `Temperature`.
	TopK *int64 `yaml:"top-k" validate:"omitempty,min=0"`
}

AnthropicModelParams represents Anthropic model-specific settings.

type AppConfig

type AppConfig struct {
	// LogFile specifies path to the log file.
	LogFile string `yaml:"log-file" validate:"omitempty,filepath"`

	// OutputDir specifies directory where results will be saved.
	OutputDir string `yaml:"output-dir" validate:"required"`

	// OutputBaseName specifies base filename for result files.
	OutputBaseName string `yaml:"output-basename" validate:"omitempty,filepath"`

	// TaskSource specifies path to the task definitions file.
	TaskSource string `yaml:"task-source" validate:"required,filepath"`

	// Providers lists configurations for AI providers whose models will be used
	// to execute tasks during the trial run.
	Providers []ProviderConfig `yaml:"providers" validate:"required,dive"`

	// Judges lists LLM configurations for semantic evaluation of open-ended task responses.
	Judges []JudgeConfig `yaml:"judges" validate:"omitempty,unique=Name,dive"`
}

AppConfig defines application-wide settings.
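
A hypothetical configuration file assembled from the yaml tags above. The key names come from the struct tags; the top-level `config` key follows the Config wrapper type. The API key and model identifier are placeholders, not values from this package:

```yaml
config:
  log-file: mindtrial.log
  output-dir: ./results
  output-basename: "results-{{.Year}}-{{.Month}}-{{.Day}}"
  task-source: tasks.yaml
  providers:
    - name: openai
      client-config:
        api-key: your-api-key
      runs:
        - name: default run
          model: example-model-id
```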

func (AppConfig) GetJudgesWithEnabledRuns added in v0.5.0

func (ac AppConfig) GetJudgesWithEnabledRuns() []JudgeConfig

GetJudgesWithEnabledRuns returns judges with their enabled run variant configurations. Run variant configurations are resolved using GetRunsResolved before filtering. Any disabled run variant configurations are excluded from the results. Judges with no enabled run variant configurations are excluded from the returned list.

func (AppConfig) GetProvidersWithEnabledRuns

func (ac AppConfig) GetProvidersWithEnabledRuns() []ProviderConfig

GetProvidersWithEnabledRuns returns providers with their enabled run configurations. Run configurations are resolved using GetRunsResolved before filtering. Any disabled run configurations are excluded from the results. Providers with no enabled run configurations are excluded from the returned list.

type ClientConfig

type ClientConfig interface{}

ClientConfig is a marker interface for provider-specific configurations.

type Config

type Config struct {
	// Config contains application-wide settings.
	Config AppConfig `yaml:"config" validate:"required"`
}

Config represents the top-level configuration structure.

func LoadConfigFromFile

func LoadConfigFromFile(ctx context.Context, path string) (*Config, error)

LoadConfigFromFile reads and validates application configuration from the specified file path. Returns error if the file cannot be read or contains invalid configuration.

type DeepseekClientConfig

type DeepseekClientConfig struct {
	// APIKey is the API key for the Deepseek generative models provider.
	APIKey string `yaml:"api-key" validate:"required"`
	// RequestTimeout specifies the timeout for API requests.
	RequestTimeout *time.Duration `yaml:"request-timeout" validate:"omitempty"`
}

DeepseekClientConfig represents Deepseek provider settings.

type DeepseekModelParams

type DeepseekModelParams struct {
	// Temperature controls the randomness or "creativity" of the model's outputs.
	// Values range from 0.0 to 2.0, with lower values making the output more focused.
	// The default value is 1.0.
	// Recommended values by use case:
	// - 0.0: Coding / Math (best for precise, deterministic outputs)
	// - 1.0: Data Cleaning / Data Analysis
	// - 1.3: General Conversation / Translation
	// - 1.5: Creative Writing / Poetry (more varied and creative outputs)
	Temperature *float32 `yaml:"temperature" validate:"omitempty,min=0,max=2"`

	// TopP controls diversity via nucleus sampling.
	// Values range from 0.0 to 1.0, with lower values making the output more focused.
	// You usually only need to use `Temperature`.
	TopP *float32 `yaml:"top-p" validate:"omitempty,min=0,max=1"`

	// PresencePenalty penalizes new tokens based on whether they appear in the text so far.
	// Values range from -2.0 to 2.0, with positive values encouraging the model to use new tokens,
	// increasing the model's likelihood to talk about new topics.
	// The default value is 0.0.
	PresencePenalty *float32 `yaml:"presence-penalty" validate:"omitempty,min=-2,max=2"`

	// FrequencyPenalty penalizes new tokens based on their frequency in the text so far.
	// Values range from -2.0 to 2.0, with positive values encouraging the model to use less frequent tokens,
	// decreasing the model's likelihood to repeat the same line verbatim.
	// The default value is 0.0.
	FrequencyPenalty *float32 `yaml:"frequency-penalty" validate:"omitempty,min=-2,max=2"`
}

DeepseekModelParams represents Deepseek model-specific settings.

type GoogleAIClientConfig

type GoogleAIClientConfig struct {
	// APIKey is the API key for the Google AI generative models provider.
	APIKey string `yaml:"api-key" validate:"required"`
}

GoogleAIClientConfig represents Google AI provider settings.

type GoogleAIModelParams

type GoogleAIModelParams struct {
	// TextResponseFormat indicates whether to use plain-text response format
	// for compatibility with models that do not support JSON.
	TextResponseFormat bool `yaml:"text-response-format" validate:"omitempty"`

	// Temperature controls the randomness or "creativity" of the model's outputs.
	// Values range from 0.0 to 2.0, with lower values making the output more focused and deterministic.
	// The default value is typically around 1.0.
	Temperature *float32 `yaml:"temperature" validate:"omitempty,min=0,max=2"`

	// TopP controls diversity via nucleus sampling.
	// Values range from 0.0 to 1.0, with lower values making the output more focused.
	// The default value is typically around 1.0.
	TopP *float32 `yaml:"top-p" validate:"omitempty,min=0,max=1"`

	// TopK limits response tokens to top K options for each token position.
	// Higher values allow more diverse outputs by considering more token options.
	TopK *int32 `yaml:"top-k" validate:"omitempty,min=0"`
}

GoogleAIModelParams represents Google AI model-specific settings.

type JudgeConfig added in v0.5.0

type JudgeConfig struct {
	// Name is the unique identifier for this judge configuration.
	Name string `yaml:"name" validate:"required"`

	// Provider encapsulates the provider configuration for the judge.
	Provider ProviderConfig `yaml:"provider" validate:"required"`
}

JudgeConfig defines configuration for an LLM judge used for semantic evaluation of complex open-ended task responses. Judges analyze the meaning and quality of answers rather than performing exact text matching, enabling evaluation of subjective or creative tasks where multiple valid interpretations exist.

func (JudgeConfig) Resolve added in v0.5.0

func (jc JudgeConfig) Resolve(excludeDisabledRuns bool) JudgeConfig

Resolve returns a copy of the judge configuration with run variants resolved. If excludeDisabledRuns is true, only enabled run variants are included.

type JudgeSelector added in v0.5.0

type JudgeSelector struct {
	// Enabled determines whether judge evaluation is enabled.
	Enabled *bool `yaml:"enabled" validate:"omitempty"`

	// Name specifies the name of the judge configuration to use.
	Name *string `yaml:"name" validate:"omitempty"`

	// Variant specifies the run variant name from the judge's provider configuration.
	Variant *string `yaml:"variant" validate:"omitempty"`
}

JudgeSelector defines settings for using a judge in validation.

func (JudgeSelector) GetName added in v0.5.0

func (js JudgeSelector) GetName() (name string)

GetName returns the judge name, or empty string if not set.

func (JudgeSelector) GetVariant added in v0.5.0

func (js JudgeSelector) GetVariant() (variant string)

GetVariant returns the judge run variant, or empty string if not set.

func (JudgeSelector) IsEnabled added in v0.5.0

func (js JudgeSelector) IsEnabled() bool

IsEnabled returns whether judge evaluation is enabled.

func (JudgeSelector) MergeWith added in v0.5.0

func (these JudgeSelector) MergeWith(other JudgeSelector) JudgeSelector

MergeWith merges this judge configuration with another and returns the result. The provided other values override these values if set.

type MistralAIClientConfig added in v0.4.0

type MistralAIClientConfig struct {
	// APIKey is the API key for the Mistral AI generative models provider.
	APIKey string `yaml:"api-key" validate:"required"`
}

MistralAIClientConfig represents Mistral AI provider settings.

type MistralAIModelParams added in v0.4.0

type MistralAIModelParams struct {
	// Temperature controls the randomness or "creativity" of the model's outputs.
	// Values range from 0.0 to 1.5, with lower values making the output more focused and deterministic.
	// The default value varies depending on the model.
	// It is generally recommended to alter this or `TopP` but not both.
	Temperature *float32 `yaml:"temperature" validate:"omitempty,min=0,max=1.5"`

	// TopP controls diversity via nucleus sampling.
	// Values range from 0.0 to 1.0, with lower values making the output more focused.
	// The default value is 1.0.
	// It is generally recommended to alter this or `Temperature` but not both.
	TopP *float32 `yaml:"top-p" validate:"omitempty,min=0,max=1"`

	// MaxTokens controls the maximum number of tokens to generate in the completion.
	// The token count of the prompt plus max_tokens cannot exceed the model's context length.
	MaxTokens *int32 `yaml:"max-tokens" validate:"omitempty,min=0"`

	// PresencePenalty penalizes new tokens based on whether they appear in the text so far.
	// Values range from -2.0 to 2.0, with positive values encouraging the model to use new tokens,
	// increasing the model's likelihood to talk about new topics.
	// The default value is 0.0.
	PresencePenalty *float32 `yaml:"presence-penalty" validate:"omitempty,min=-2,max=2"`

	// FrequencyPenalty penalizes new tokens based on their frequency in the text so far.
	// Values range from -2.0 to 2.0, with positive values encouraging the model to use less frequent tokens,
	// decreasing the model's likelihood to repeat the same line verbatim.
	// The default value is 0.0.
	FrequencyPenalty *float32 `yaml:"frequency-penalty" validate:"omitempty,min=-2,max=2"`

	// RandomSeed provides the seed to use for random sampling.
	// If set, requests will generate deterministic results.
	RandomSeed *int32 `yaml:"random-seed" validate:"omitempty"`

	// PromptMode sets the prompt mode for the request.
	// When set to "reasoning", a system prompt will be used to instruct the model to reason if supported.
	PromptMode *string `yaml:"prompt-mode" validate:"omitempty,oneof=reasoning"`

	// SafePrompt controls whether to inject a safety prompt before all conversations.
	SafePrompt *bool `yaml:"safe-prompt" validate:"omitempty"`
}

MistralAIModelParams represents Mistral AI model-specific settings.

type ModelParams

type ModelParams interface{}

ModelParams is a marker interface for model-specific parameters.

type OpenAIClientConfig

type OpenAIClientConfig struct {
	// APIKey is the API key for the OpenAI provider.
	APIKey string `yaml:"api-key" validate:"required"`
}

OpenAIClientConfig represents OpenAI provider settings.

type OpenAIModelParams

type OpenAIModelParams struct {
	// ReasoningEffort controls effort level on reasoning for reasoning models.
	// Valid values are: "low", "medium", "high".
	ReasoningEffort *string `yaml:"reasoning-effort" validate:"omitempty,oneof=low medium high"`

	// TextResponseFormat indicates whether to use plain-text response format
	// for compatibility with models that do not support JSON.
	TextResponseFormat bool `yaml:"text-response-format" validate:"omitempty"`

	// Temperature controls the randomness or "creativity" of the model's outputs.
	// Values range from 0.0 to 2.0, with lower values making the output more focused and deterministic.
	// The default value is 1.0.
	// It is generally recommended to alter this or `TopP` but not both.
	Temperature *float32 `yaml:"temperature" validate:"omitempty,min=0,max=2"`

	// TopP controls diversity via nucleus sampling.
	// Values range from 0.0 to 1.0, with lower values making the output more focused.
	// The default value is 1.0.
	// It is generally recommended to alter this or `Temperature` but not both.
	TopP *float32 `yaml:"top-p" validate:"omitempty,min=0,max=1"`

	// PresencePenalty penalizes new tokens based on whether they appear in the text so far.
	// Values range from -2.0 to 2.0, with positive values encouraging the model to use new tokens,
	// increasing the model's likelihood to talk about new topics.
	// The default value is 0.0.
	PresencePenalty *float32 `yaml:"presence-penalty" validate:"omitempty,min=-2,max=2"`

	// FrequencyPenalty penalizes new tokens based on their frequency in the text so far.
	// Values range from -2.0 to 2.0, with positive values encouraging the model to use less frequent tokens,
	// decreasing the model's likelihood to repeat the same line verbatim.
	// The default value is 0.0.
	FrequencyPenalty *float32 `yaml:"frequency-penalty" validate:"omitempty,min=-2,max=2"`
}

OpenAIModelParams represents OpenAI model-specific settings.

type ProviderConfig

type ProviderConfig struct {
	// Name specifies unique identifier of the provider.
	Name string `yaml:"name" validate:"required,oneof=openai google anthropic deepseek mistralai xai"`

	// ClientConfig holds provider-specific client settings.
	ClientConfig ClientConfig `yaml:"client-config" validate:"required"`

	// Runs lists run configurations for this provider.
	Runs []RunConfig `yaml:"runs" validate:"required,unique=Name,dive"`

	// Disabled indicates if all runs should be disabled by default.
	Disabled bool `yaml:"disabled" validate:"omitempty"`

	// RetryPolicy specifies default retry behavior for all runs in this provider.
	RetryPolicy RetryPolicy `yaml:"retry-policy" validate:"omitempty"`
}

ProviderConfig defines settings for an AI provider.
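
A hypothetical provider entry showing provider-level defaults and per-run overrides, built from the yaml tags above. The model identifiers are placeholders, and the model-parameters keys follow the AnthropicModelParams tags:

```yaml
providers:
  - name: anthropic
    client-config:
      api-key: your-api-key
    disabled: false
    retry-policy:
      max-retry-attempts: 2
      initial-delay-seconds: 5
    runs:
      - name: baseline
        model: example-model-id
        max-requests-per-minute: 50
      - name: with thinking
        model: example-model-id
        disabled: true
        model-parameters:
          max-tokens: 16384
          thinking-budget-tokens: 4096
```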

func (ProviderConfig) GetRunsResolved added in v0.4.0

func (pc ProviderConfig) GetRunsResolved() []RunConfig

GetRunsResolved returns runs with retry policies and disabled flags resolved. If RunConfig.RetryPolicy is nil, the parent ProviderConfig.RetryPolicy value is used instead. If RunConfig.Disabled is nil, the parent ProviderConfig.Disabled value is used instead.
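
The fallback rule can be sketched with minimal stand-in types; only the fields needed for resolution are modeled, and the bodies are illustrative rather than the package's actual source:

```go
package main

import "fmt"

type retryPolicy struct{ MaxRetryAttempts uint }

type runConfig struct {
	Name        string
	Disabled    *bool
	RetryPolicy *retryPolicy
}

type providerConfig struct {
	Disabled    bool
	RetryPolicy retryPolicy
	Runs        []runConfig
}

// getRunsResolved sketches the documented fallback: nil run-level settings
// inherit the provider-level values.
func (pc providerConfig) getRunsResolved() []runConfig {
	resolved := make([]runConfig, len(pc.Runs))
	for i, run := range pc.Runs {
		if run.Disabled == nil {
			d := pc.Disabled
			run.Disabled = &d
		}
		if run.RetryPolicy == nil {
			rp := pc.RetryPolicy
			run.RetryPolicy = &rp
		}
		resolved[i] = run
	}
	return resolved
}

func main() {
	off := true
	pc := providerConfig{
		RetryPolicy: retryPolicy{MaxRetryAttempts: 3},
		Runs: []runConfig{
			{Name: "inherits"},
			{Name: "overrides", Disabled: &off},
		},
	}
	for _, r := range pc.getRunsResolved() {
		fmt.Println(r.Name, *r.Disabled, r.RetryPolicy.MaxRetryAttempts)
	}
}
```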

func (ProviderConfig) Resolve added in v0.5.0

func (pc ProviderConfig) Resolve(excludeDisabledRuns bool) ProviderConfig

Resolve returns a copy of the provider configuration with runs resolved. If excludeDisabledRuns is true, only enabled runs are included.

func (*ProviderConfig) UnmarshalYAML

func (pc *ProviderConfig) UnmarshalYAML(value *yaml.Node) error

UnmarshalYAML implements custom YAML unmarshaling for ProviderConfig. It handles provider-specific client configuration based on provider name.

type RetryPolicy added in v0.4.0

type RetryPolicy struct {
	// MaxRetryAttempts specifies the maximum number of retry attempts.
	// A value of 0 means no retry attempts will be made.
	MaxRetryAttempts uint `yaml:"max-retry-attempts" validate:"omitempty,min=0"`

	// InitialDelaySeconds specifies the initial delay in seconds before the first retry attempt.
	InitialDelaySeconds int `yaml:"initial-delay-seconds" validate:"omitempty,gt=0"`
}

RetryPolicy defines retry behavior on transient errors.

type RunConfig

type RunConfig struct {
	// Name is a display-friendly identifier shown in results.
	Name string `yaml:"name" validate:"required"`

	// Model specifies the target model's identifier.
	Model string `yaml:"model" validate:"required"`

	// MaxRequestsPerMinute limits the number of API requests per minute sent to this specific model.
	// A value of 0 means no rate limiting will be applied.
	MaxRequestsPerMinute int `yaml:"max-requests-per-minute" validate:"omitempty,numeric,min=0"`

	// Disabled indicates if this run configuration should be skipped.
	// If set, overrides the parent ProviderConfig.Disabled value.
	Disabled *bool `yaml:"disabled" validate:"omitempty"`

	// ModelParams holds any model-specific configuration parameters.
	ModelParams ModelParams `yaml:"model-parameters" validate:"omitempty"`

	// RetryPolicy specifies retry behavior on transient errors.
	// If set, overrides the parent ProviderConfig.RetryPolicy value.
	RetryPolicy *RetryPolicy `yaml:"retry-policy" validate:"omitempty"`
}

RunConfig defines settings for a single run configuration.

type Task

type Task struct {
	// Name is a display-friendly identifier shown in results.
	Name string `yaml:"name" validate:"required"`

	// Prompt that will be sent to the AI model.
	Prompt string `yaml:"prompt" validate:"required"`

	// ResponseResultFormat specifies how the AI should format the final answer to the prompt.
	ResponseResultFormat string `yaml:"response-result-format" validate:"required"`

	// ExpectedResult is the set of accepted valid answers for the prompt.
	// All values must follow the ResponseResultFormat precisely.
	// Only one needs to match for the response to be considered correct.
	ExpectedResult utils.StringSet `yaml:"expected-result" validate:"required"`

	// Disabled indicates whether this specific task should be skipped.
	// If set, overrides the global TaskConfig.Disabled value.
	Disabled *bool `yaml:"disabled" validate:"omitempty"`

	// ValidationRules are validation settings for this specific task.
	// If set, overrides the global TaskConfig.ValidationRules values.
	ValidationRules *ValidationRules `yaml:"validation-rules" validate:"omitempty"`

	// Files is a list of files to be included with the prompt.
	// This is primarily used for images but can support other file types
	// depending on the provider's capabilities.
	Files []TaskFile `yaml:"files" validate:"omitempty,unique=Name,dive"`
}

Task defines a single test case to be executed by AI models.
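
A hypothetical task definitions file built from the yaml tags above. The file path and answers are placeholders, and representing the utils.StringSet expected-result as a YAML list is an assumption:

```yaml
task-config:
  disabled: false
  validation-rules:
    case-sensitive: false
    trim-lines: true
  tasks:
    - name: Capital of France
      prompt: What is the capital of France?
      response-result-format: a single word
      expected-result:
        - Paris
      files:
        - name: map
          uri: ./files/europe.png
          type: image/png
```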

func (*Task) SetBaseFilePath

func (t *Task) SetBaseFilePath(basePath string) error

SetBaseFilePath sets the base path for all local files in the task. The resolved paths are validated to ensure they are accessible.

type TaskConfig

type TaskConfig struct {
	// Tasks is a list of tasks to be executed.
	Tasks []Task `yaml:"tasks" validate:"required,unique=Name,dive"`

	// Disabled indicates whether all tasks should be disabled by default.
	// Individual tasks can override this setting.
	Disabled bool `yaml:"disabled" validate:"omitempty"`

	// ValidationRules are default validation settings for all tasks.
	// Individual tasks can override these settings.
	ValidationRules ValidationRules `yaml:"validation-rules" validate:"omitempty"`
}

TaskConfig represents task definitions and global settings.

func (TaskConfig) GetEnabledTasks

func (o TaskConfig) GetEnabledTasks() []Task

GetEnabledTasks returns a filtered list of tasks that are not disabled. If Task.Disabled is nil, the global TaskConfig.Disabled value is used instead.

type TaskFile

type TaskFile struct {
	// Name is a unique identifier for the file, used to reference it in prompts.
	Name string `yaml:"name" validate:"required"`

	// URI is the path or URL to the file.
	URI URI `yaml:"uri" validate:"required"`

	// Type is the MIME type of the file.
	// If not provided, it will be inferred from the file extension or content.
	Type string `yaml:"type" validate:"omitempty"`
	// contains filtered or unexported fields
}

TaskFile represents a file to be included with a task.

func (*TaskFile) Base64

func (f *TaskFile) Base64(ctx context.Context) (string, error)

Base64 returns the base64-encoded file content, loading it on demand.

func (*TaskFile) Content

func (f *TaskFile) Content(ctx context.Context) ([]byte, error)

Content returns the raw file content, loading it on demand.

func (*TaskFile) GetDataURL

func (f *TaskFile) GetDataURL(ctx context.Context) (string, error)

GetDataURL returns a complete data URL for the file (e.g., "data:image/png;base64,...").
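
The shape of such a data URL can be sketched directly from the example in the doc comment; this helper is illustrative, not the method's actual implementation:

```go
package main

import (
	"encoding/base64"
	"fmt"
)

// dataURL builds "data:<mime>;base64,<payload>" from a MIME type and raw content.
func dataURL(mimeType string, content []byte) string {
	return fmt.Sprintf("data:%s;base64,%s", mimeType, base64.StdEncoding.EncodeToString(content))
}

func main() {
	fmt.Println(dataURL("text/plain", []byte("hi"))) // data:text/plain;base64,aGk=
}
```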

func (*TaskFile) SetBasePath

func (f *TaskFile) SetBasePath(basePath string)

SetBasePath sets the base path used to resolve relative local paths.

func (*TaskFile) TypeValue

func (f *TaskFile) TypeValue(ctx context.Context) (string, error)

TypeValue returns the MIME type, inferring it if not set, loading content if needed.

func (*TaskFile) UnmarshalYAML

func (f *TaskFile) UnmarshalYAML(value *yaml.Node) error

UnmarshalYAML implements custom YAML unmarshaling for TaskFile.

func (*TaskFile) Validate

func (f *TaskFile) Validate() error

Validate checks if a local file exists, is accessible, and is not a directory. Remote files are not validated as they will be checked when accessed.

type Tasks

type Tasks struct {
	// TaskConfig contains all task definitions and settings.
	TaskConfig TaskConfig `yaml:"task-config" validate:"required"`
}

Tasks represents the top-level task configuration structure.

func LoadTasksFromFile

func LoadTasksFromFile(ctx context.Context, path string) (*Tasks, error)

LoadTasksFromFile reads and validates task definitions from the specified file path. Returns error if the file cannot be read or contains invalid task definitions.

type URI

type URI struct {
	// contains filtered or unexported fields
}

URI represents a parsed URI/URL that can be used to reference a file.

func (URI) IsLocalFile

func (u URI) IsLocalFile() bool

IsLocalFile checks if the URI references a local file.

func (URI) IsRemoteFile

func (u URI) IsRemoteFile() bool

IsRemoteFile checks if the URI references a remote file.

func (URI) MarshalYAML

func (u URI) MarshalYAML() (interface{}, error)

MarshalYAML implements custom YAML marshaling for URI.

func (*URI) Parse

func (u *URI) Parse(raw string) (err error)

Parse parses a raw URI string into a structured URI object. It validates that the URI scheme is supported.

func (URI) Path

func (u URI) Path(basePath string) string

Path returns the filesystem path for local URIs. For relative local paths, it uses the provided basePath to create an absolute path.

func (URI) String

func (u URI) String() string

String returns the original raw URI string.

func (URI) URL

func (u URI) URL() *url.URL

URL returns the parsed URL.

func (*URI) UnmarshalYAML

func (u *URI) UnmarshalYAML(value *yaml.Node) error

UnmarshalYAML implements custom YAML unmarshaling for URI.

type ValidationRules added in v0.3.0

type ValidationRules struct {
	// CaseSensitive determines whether string comparison should be case-sensitive.
	CaseSensitive *bool `yaml:"case-sensitive" validate:"omitempty"`

	// IgnoreWhitespace determines whether all whitespace should be ignored during comparison.
	// When true, all whitespace characters (spaces, tabs, newlines) are removed before comparison.
	IgnoreWhitespace *bool `yaml:"ignore-whitespace" validate:"omitempty"`

	// TrimLines determines whether to trim leading and trailing whitespace of each line
	// before comparison.
	TrimLines *bool `yaml:"trim-lines" validate:"omitempty"`

	// Judge specifies the judge configuration to use for evaluation.
	// When enabled, an LLM will be used to evaluate the correctness of the response
	// instead of simple string matching.
	Judge JudgeSelector `yaml:"judge" validate:"omitempty"`
}

ValidationRules represents task validation rules. It controls how model responses should be validated against expected results.
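
One way the documented rules could combine during comparison is sketched below; the order in which the normalization steps are applied is an assumption:

```go
package main

import (
	"fmt"
	"strings"
)

type validationRules struct {
	CaseSensitive    bool
	IgnoreWhitespace bool
	TrimLines        bool
}

// normalize applies the configured rules to a string before comparison.
func (vr validationRules) normalize(s string) string {
	if vr.TrimLines {
		lines := strings.Split(s, "\n")
		for i, line := range lines {
			lines[i] = strings.TrimSpace(line)
		}
		s = strings.Join(lines, "\n")
	}
	if vr.IgnoreWhitespace {
		// Remove every whitespace character, including newlines.
		s = strings.Join(strings.Fields(s), "")
	}
	if !vr.CaseSensitive {
		s = strings.ToLower(s)
	}
	return s
}

// matches reports whether the response equals the expected result after normalization.
func (vr validationRules) matches(response, expected string) bool {
	return vr.normalize(response) == vr.normalize(expected)
}

func main() {
	vr := validationRules{IgnoreWhitespace: true}
	fmt.Println(vr.matches("  PARIS ", "Paris")) // true
}
```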

func (ValidationRules) IsCaseSensitive added in v0.3.0

func (vr ValidationRules) IsCaseSensitive() bool

IsCaseSensitive returns whether validation should be case sensitive.

func (ValidationRules) IsIgnoreWhitespace added in v0.3.0

func (vr ValidationRules) IsIgnoreWhitespace() bool

IsIgnoreWhitespace returns whether whitespace should be ignored during validation.

func (ValidationRules) IsTrimLines added in v0.6.1

func (vr ValidationRules) IsTrimLines() bool

IsTrimLines returns whether each line should be trimmed before validation.

func (ValidationRules) MergeWith added in v0.3.0

func (these ValidationRules) MergeWith(other *ValidationRules) ValidationRules

MergeWith merges these validation rules with other rules and returns the result. The provided other values override these values if set.

func (ValidationRules) UseJudge added in v0.5.0

func (vr ValidationRules) UseJudge() bool

UseJudge returns whether judge evaluation is enabled.

type XAIClientConfig added in v0.7.2

type XAIClientConfig struct {
	// APIKey is the API key for the xAI provider.
	APIKey string `yaml:"api-key" validate:"required"`
}

XAIClientConfig represents xAI provider settings.

type XAIModelParams added in v0.7.2

type XAIModelParams struct {
	// Temperature controls the randomness or "creativity" of the model's outputs.
	// Notes: Higher values (e.g. 0.8) make outputs more random; lower values
	// (e.g. 0.2) make outputs more focused and deterministic.
	// Valid range: 0.0 to 2.0. Default: 1.0.
	Temperature *float32 `yaml:"temperature" validate:"omitempty,min=0,max=2"`

	// TopP controls diversity via nucleus sampling (probability mass cutoff).
	// Notes: Use either Temperature or TopP, not both, for sampling control.
	// Valid range: (0.0, 1.0]. Default: 1.0.
	TopP *float32 `yaml:"top-p" validate:"omitempty,min=0,max=1"`

	// MaxCompletionTokens controls the maximum number of tokens to generate in the completion.
	MaxCompletionTokens *int32 `yaml:"max-completion-tokens" validate:"omitempty,min=0"`

	// PresencePenalty penalizes new tokens based on whether they appear in the text so far.
	// Notes: Positive values encourage the model to introduce new topics.
	// Valid range: -2.0 to 2.0. Default: 0.0.
	PresencePenalty *float32 `yaml:"presence-penalty" validate:"omitempty,min=-2,max=2"`

	// FrequencyPenalty penalizes new tokens based on their frequency in the text so far.
	// Notes: Positive values discourage repetition.
	// Valid range: -2.0 to 2.0. Default: 0.0.
	FrequencyPenalty *float32 `yaml:"frequency-penalty" validate:"omitempty,min=-2,max=2"`

	// ReasoningEffort constrains how much "reasoning" budget to spend for reasoning-capable models.
	// Notes: Not all reasoning models support this option.
	// Valid values: "low", "high".
	ReasoningEffort *string `yaml:"reasoning-effort" validate:"omitempty,oneof=low high"`

	// Seed requests deterministic sampling when possible.
	// Determinism is not guaranteed: xAI makes a best effort to return
	// repeatable outputs for identical inputs when `seed` and other parameters are the same.
	Seed *int32 `yaml:"seed" validate:"omitempty"`
}

XAIModelParams represents xAI model-specific settings.
