Mistral AI · Schema

Hyperparameters

Properties

Name Type Description
training_steps integer Number of training steps
learning_rate number Learning rate for training
weight_decay number Weight decay regularization
warmup_fraction number Fraction of steps for learning rate warmup
epochs number Number of training epochs
seq_len integer Maximum sequence length
View JSON Schema on GitHub

JSON Schema

mistral-hyperparameters-schema.json Raw ↑
{
  "$schema": "https://json-schema.org/draft/2020-12/schema",
  "$id": "mistral-hyperparameters-schema.json",
  "title": "Hyperparameters",
  "description": "Hyperparameters that control a Mistral AI training run. All properties are optional.",
  "type": "object",
  "properties": {
    "training_steps": {
      "type": "integer",
      "minimum": 1,
      "description": "Number of training steps"
    },
    "learning_rate": {
      "type": "number",
      "minimum": 0,
      "description": "Learning rate for training"
    },
    "weight_decay": {
      "type": "number",
      "minimum": 0,
      "description": "Weight decay regularization"
    },
    "warmup_fraction": {
      "type": "number",
      "minimum": 0,
      "maximum": 1,
      "description": "Fraction of steps for learning rate warmup"
    },
    "epochs": {
      "type": "number",
      "minimum": 0,
      "description": "Number of training epochs"
    },
    "seq_len": {
      "type": "integer",
      "minimum": 1,
      "description": "Maximum sequence length"
    }
  }
}