{
    // VS Code debug launch configurations for the MiniMind training and test scripts.
    // This file is JSON-with-comments (JSONC). Keep every `//` comment on its own
    // physical line: a line comment runs to the end of the line, so collapsing the
    // file onto one line silently disables everything after the first comment.
    // NOTE(review): newer releases of the Python Debugger extension prefer
    // "type": "debugpy" over "type": "python" — confirm before switching.
    "version": "0.2.0",
    "configurations": [
        {
            // Runs the pretraining script directly (no launcher) with the
            // workspace's .venv interpreter.
            "name": "MiniMind Training (Direct Python)",
            "type": "python",
            "request": "launch",
            "program": "${workspaceFolder}/train_pretrain_accelerate.py",
            // Full pretraining argument set, currently disabled. While this block
            // stays commented out the script is started with no command-line
            // arguments at all.
            // "args": [
            //     "--out_dir", "out",
            //     "--epochs", "3",
            //     "--embedding_epoch", "2",
            //     "--batch_size", "128",
            //     "--learning_rate", "8e-5",
            //     "--dtype", "bfloat16",
            //     "--use_swanlab",
            //     "--swanlab_project", "MiniMind-Pretrain",
            //     "--num_workers", "1",
            //     "--accumulation_steps", "16",
            //     "--grad_clip", "0.5",
            //     "--warmup_iters", "0",
            //     "--log_interval", "1",
            //     "--save_interval", "10000",
            //     "--dim", "512",
            //     "--n_layers", "8",
            //     "--max_seq_len", "512",
            //     "--data_path", "./dataset/stable/merged_pretrain.jsonl",
            //     "--profile",
            //     "--profile_interval", "10",
            //     "--use_flash_attn",
            //     "--knowledge_num", "1048576",
            //     "--knowledge_length", "32",
            //     "--database_init_path", "./dataset/stable/sentence_trex_data.json",
            //     "--fast_clustering",
            //     "--cluster_cache_path", "./cache/cluster_tokens_single.pt",
            //     "--memory_monitor_interval", "10",
            //     "--model_type", "model",
            //     "--model_size", "538"
            // ],
            "env": {
                // Expose only GPU 0 to the process.
                "CUDA_VISIBLE_DEVICES": "0",
                // Verbose NCCL logging.
                "NCCL_DEBUG": "INFO",
                // Enable Python's faulthandler so hard crashes dump a traceback.
                "PYTHONFAULTHANDLER": "1"
            },
            "cwd": "${workspaceFolder}",
            "console": "integratedTerminal",
            // false: allow stepping into library code, not only workspace code.
            "justMyCode": false,
            "stopOnEntry": false,
            "python": "${workspaceFolder}/.venv/bin/python"
        },
        {
            // Same script as above, with a short explicit argument list
            // (1 epoch, batch size 32, "model_original").
            "name": "MiniMind Training (Direct Python - Simple)",
            "type": "python",
            "request": "launch",
            "program": "${workspaceFolder}/train_pretrain_accelerate.py",
            "args": [
                "--epochs", "1",
                "--batch_size", "32",
                "--learning_rate", "1e-4",
                "--log_interval", "10",
                "--profile_interval", "2",
                "--model_type", "model_original"
            ],
            "env": {
                "CUDA_VISIBLE_DEVICES": "0"
            },
            "cwd": "${workspaceFolder}",
            "console": "integratedTerminal",
            "justMyCode": false,
            "stopOnEntry": false,
            "python": "${workspaceFolder}/.venv/bin/python"
        },
        {
            // Runs test.py with the workspace's .venv interpreter.
            "name": "MiniMind Test (Direct Python)",
            "type": "python",
            "request": "launch",
            "program": "${workspaceFolder}/test.py",
            "env": {
                "CUDA_VISIBLE_DEVICES": "0"
            },
            "cwd": "${workspaceFolder}",
            "console": "integratedTerminal",
            "justMyCode": false,
            "python": "${workspaceFolder}/.venv/bin/python"
        },
        {
            // Starts the training script through the Accelerate launcher module
            // instead of running it directly.
            "name": "MiniMind Training Debug (Accelerate)",
            "type": "python",
            "request": "launch",
            "module": "accelerate.commands.launch",
            "args": [
                // Launcher options come before the script path ...
                "--num_processes=1",
                "--mixed_precision=bf16",
                "${workspaceFolder}/train_pretrain_accelerate.py",
                // ... and everything after the script path is passed to the script.
                "--epochs", "1",
                "--batch_size", "32",
                "--learning_rate", "1e-4",
                "--log_interval", "10",
                "--profile_interval", "2",
                "--model_type", "model_original"
            ],
            "env": {
                "CUDA_VISIBLE_DEVICES": "0"
            },
            "cwd": "${workspaceFolder}",
            "console": "integratedTerminal",
            "justMyCode": false,
            "stopOnEntry": false,
            "python": "${workspaceFolder}/.venv/bin/python"
        },
        {
            // Runs test.py like "MiniMind Test (Direct Python)", but without a
            // "python" key, so the interpreter is not pinned to .venv here
            // (presumably the interpreter selected in VS Code is used — confirm).
            "name": "MiniMind Test Only",
            "type": "python",
            "request": "launch",
            "program": "${workspaceFolder}/test.py",
            "env": {
                "CUDA_VISIBLE_DEVICES": "0"
            },
            "cwd": "${workspaceFolder}",
            "console": "integratedTerminal",
            "justMyCode": false
        }
    ]
}