diff --git a/training/train_opt.m b/training/train_opt.m index a6180c0..7afc60d 100644 --- a/training/train_opt.m +++ b/training/train_opt.m @@ -18,7 +18,7 @@ #import #define CKPT_PATH "ane_stories110M_ckpt.bin" -#define MODEL_PATH "../../assets/models/stories110M.bin" +#define MODEL_PATH_DEFAULT "stories110M.bin" #define DATA_PATH "tinystories_data00.bin" // ===== Pre-allocated capture buffers per layer (Phase 1) ===== @@ -346,14 +346,20 @@ int main(int argc, char *argv[]) { int adam_t = 0, start_step = 0; // Parse args + const char *model_path = MODEL_PATH_DEFAULT; bool do_resume = false; bool use_metal = false; // default off: Metal dW contends with ANE for memory bandwidth + int pos = 0; for (int i=1; i