llm-arch-research/experiments/llm_only/configs/gpt_generate.json
Sergey Penkovsky 3e4815fcc6 refactor(experiments): migrate to universal runner + config structure, remove legacy scripts
- add universal runner run_llm_experiment.py with JSON-config driven LLM training / generation
- add configs for gpt, gpt2, llama (training/generation)
- remove individual train/generate scripts for each model
- update README with simple how-to for experiments block

BREAKING CHANGE: all llm_only experiments now run only through run_llm_experiment.py; legacy scripts removed
2025-10-14 11:57:23 +03:00


{
  "bpe_tokenizer": "checkpoints/bpe_tokenizer.json",
  "test_prompts": [
    "The neural network",
    "Transformer architecture",
    "GPT models are"
  ],
  "model_config_path": "checkpoints/gpt-bpe/config.json",
  "model_weights": "checkpoints/gpt-bpe/model.pt",
  "generation": {
    "max_new_tokens": 40,
    "temperature": 0.8,
    "do_sample": true,
    "top_k": null,
    "top_p": null
  },
  "log_path": "checkpoints/llm_only_generation_logs.json"
}
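As a rough illustration, a runner like run_llm_experiment.py might parse this config along the following lines. This is a hedged sketch, not the actual runner code: the function name `load_generation_config` and the convention of dropping `null` sampling filters are assumptions, while the field names (`test_prompts`, `generation`, etc.) match the JSON above.

```python
import json

def load_generation_config(path):
    """Read the experiment config and return (prompts, generation kwargs).

    Hypothetical helper: mirrors the JSON layout shown above, but the
    actual loading logic in run_llm_experiment.py may differ.
    """
    with open(path, "r", encoding="utf-8") as f:
        cfg = json.load(f)
    gen = cfg["generation"]
    # Drop null sampling filters (top_k / top_p here) so a generator
    # can fall back to plain temperature sampling.
    gen_kwargs = {k: v for k, v in gen.items() if v is not None}
    return cfg["test_prompts"], gen_kwargs
```

With the config above, this would yield the three test prompts and `{"max_new_tokens": 40, "temperature": 0.8, "do_sample": True}`, since `top_k` and `top_p` are `null`.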