|
25 | 25 | "<div style=\"display: flex; align-items: center; justify-content: left; padding: 5px; height: 40px; background: linear-gradient(90deg, #7873f5 0%, #ff6ec4 100%); border-radius: 8px; box-shadow: 0 2px 8px rgba(0,0,0,0.12); font-size: 1.5em; font-weight: bold; color: #fff;\">\n", |
26 | 26 | " Step 3: Be More Cost-Effective With Distillation\n", |
27 | 27 | "</div>\n", |
28 | | - "<br/>\n", |
29 | | - "<div style=\"display: flex; align-items: center; justify-content: left; padding: 5px; height: 40px; background: linear-gradient(90deg, #7873f5 0%, #ff6ec4 100%); border-radius: 8px; box-shadow: 0 2px 8px rgba(0,0,0,0.12); font-size: 1.5em; font-weight: bold; color: #fff;\">\n", |
30 | | - " Step 4: Be More Precise with RAFT\n", |
31 | | - "</div>" |
| 28 | + "<br/>" |
32 | 29 | ] |
33 | 30 | }, |
34 | 31 | { |
|
280 | 277 | "name": "stdout", |
281 | 278 | "output_type": "stream", |
282 | 279 | "text": [ |
283 | | - "Training file ID: file-47d965f45742443885faad50263a0e8c\n", |
284 | | - "Validation file ID: file-12c4f25aa14941bb9762c0d574ad4133\n" |
| 280 | + "Training file ID: file-f0e95ad0245146f986e1cb8e9a82373b\n", |
| 281 | + "Validation file ID: file-8b8c2dc873bb43d9aefdfc3b2168fe0c\n" |
285 | 282 | ] |
286 | 283 | } |
287 | 284 | ], |
|
314 | 311 | }, |
315 | 312 | { |
316 | 313 | "cell_type": "code", |
317 | | - "execution_count": 8, |
| 314 | + "execution_count": 7, |
318 | 315 | "id": "86ddf91d", |
319 | 316 | "metadata": {}, |
320 | 317 | "outputs": [ |
321 | 318 | { |
322 | 319 | "name": "stdout", |
323 | 320 | "output_type": "stream", |
324 | 321 | "text": [ |
325 | | - "Job ID: ftjob-45902437a97e4bdf8f2333bc1ebdee99\n", |
326 | | - "Status: ftjob-45902437a97e4bdf8f2333bc1ebdee99\n", |
| 322 | + "Job ID: ftjob-a66c2404eccb417b9070e9f95a3a96e2\n", |
| 323 | + "Status: ftjob-a66c2404eccb417b9070e9f95a3a96e2\n", |
327 | 324 | "{\n", |
328 | | - " \"id\": \"ftjob-45902437a97e4bdf8f2333bc1ebdee99\",\n", |
329 | | - " \"created_at\": 1758111681,\n", |
| 325 | + " \"id\": \"ftjob-a66c2404eccb417b9070e9f95a3a96e2\",\n", |
| 326 | + " \"created_at\": 1758295013,\n", |
330 | 327 | " \"error\": null,\n", |
331 | 328 | " \"fine_tuned_model\": null,\n", |
332 | 329 | " \"finished_at\": null,\n", |
|
342 | 339 | " \"seed\": 105,\n", |
343 | 340 | " \"status\": \"pending\",\n", |
344 | 341 | " \"trained_tokens\": null,\n", |
345 | | - " \"training_file\": \"file-47d965f45742443885faad50263a0e8c\",\n", |
346 | | - " \"validation_file\": \"file-12c4f25aa14941bb9762c0d574ad4133\",\n", |
347 | | - " \"estimated_finish\": 1758112761,\n", |
| 342 | + " \"training_file\": \"file-f0e95ad0245146f986e1cb8e9a82373b\",\n", |
| 343 | + " \"validation_file\": \"file-8b8c2dc873bb43d9aefdfc3b2168fe0c\",\n", |
| 344 | + " \"estimated_finish\": 1758299439,\n", |
348 | 345 | " \"integrations\": null,\n", |
349 | 346 | " \"metadata\": null,\n", |
350 | 347 | " \"method\": null\n", |
|
385 | 382 | }, |
386 | 383 | { |
387 | 384 | "cell_type": "code", |
388 | | - "execution_count": 9, |
| 385 | + "execution_count": 8, |
389 | 386 | "id": "f024bb0f", |
390 | 387 | "metadata": {}, |
391 | 388 | "outputs": [ |
392 | 389 | { |
393 | 390 | "name": "stdout", |
394 | 391 | "output_type": "stream", |
395 | 392 | "text": [ |
396 | | - "Fine-tuning job ftjob-45902437a97e4bdf8f2333bc1ebdee99 finished with status: succeeded\n", |
| 393 | + "Fine-tuning job ftjob-a66c2404eccb417b9070e9f95a3a96e2 finished with status: succeeded\n", |
397 | 394 | "Checking other fine-tune jobs for this resource.\n", |
398 | | - "Found 6 fine-tune jobs.\n" |
| 395 | + "Found 20 fine-tune jobs.\n" |
399 | 396 | ] |
400 | 397 | } |
401 | 398 | ], |
|
443 | 440 | }, |
444 | 441 | { |
445 | 442 | "cell_type": "code", |
446 | | - "execution_count": 10, |
| 443 | + "execution_count": 9, |
447 | 444 | "id": "ebe8fa88", |
448 | 445 | "metadata": {}, |
449 | 446 | "outputs": [ |
|
454 | 451 | "{\n", |
455 | 452 | " \"data\": [\n", |
456 | 453 | " {\n", |
457 | | - " \"id\": \"ftevent-b2270bc1c1554cf88360314d6b27cffd\",\n", |
458 | | - " \"created_at\": 1758117577,\n", |
| 454 | + " \"id\": \"ftevent-0fcbb3e59a174be0bf017c7aa891db8a\",\n", |
| 455 | + " \"created_at\": 1758299162,\n", |
459 | 456 | " \"level\": \"info\",\n", |
460 | 457 | " \"message\": \"Training tokens billed: 8000\",\n", |
461 | 458 | " \"object\": \"fine_tuning.job.event\",\n", |
462 | 459 | " \"data\": null,\n", |
463 | 460 | " \"type\": \"message\"\n", |
464 | 461 | " },\n", |
465 | 462 | " {\n", |
466 | | - " \"id\": \"ftevent-36487722ede245c38bfd312c7ffba4dc\",\n", |
467 | | - " \"created_at\": 1758117577,\n", |
| 463 | + " \"id\": \"ftevent-1daf0625537546ad8fd76f42c31273ba\",\n", |
| 464 | + " \"created_at\": 1758299162,\n", |
468 | 465 | " \"level\": \"info\",\n", |
469 | | - " \"message\": \"Model Evaluation Passed.\",\n", |
| 466 | + " \"message\": \"Completed results file: file-0dda62edd87e4ef7bfa1108b19f345ba\",\n", |
470 | 467 | " \"object\": \"fine_tuning.job.event\",\n", |
471 | 468 | " \"data\": null,\n", |
472 | 469 | " \"type\": \"message\"\n", |
473 | 470 | " },\n", |
474 | 471 | " {\n", |
475 | | - " \"id\": \"ftevent-ffd856eb590342cb9df5b22e554d6a59\",\n", |
476 | | - " \"created_at\": 1758117577,\n", |
| 472 | + " \"id\": \"ftevent-22e8ed38c97440818ac46e7b6e76d15e\",\n", |
| 473 | + " \"created_at\": 1758299161,\n", |
477 | 474 | " \"level\": \"info\",\n", |
478 | | - " \"message\": \"Completed results file: file-876704e7e1ae4c399e8fe08ab856e2b2\",\n", |
| 475 | + " \"message\": \"Model Evaluation Passed.\",\n", |
479 | 476 | " \"object\": \"fine_tuning.job.event\",\n", |
480 | 477 | " \"data\": null,\n", |
481 | 478 | " \"type\": \"message\"\n", |
482 | 479 | " },\n", |
483 | 480 | " {\n", |
484 | | - " \"id\": \"ftevent-427347ddecbf4755be54acb559284b97\",\n", |
485 | | - " \"created_at\": 1758117551,\n", |
| 481 | + " \"id\": \"ftevent-17c825a4e5344dcc8e38fb2679d216c8\",\n", |
| 482 | + " \"created_at\": 1758299116,\n", |
486 | 483 | " \"level\": \"info\",\n", |
487 | 484 | " \"message\": \"Job succeeded.\",\n", |
488 | 485 | " \"object\": \"fine_tuning.job.event\",\n", |
489 | 486 | " \"data\": null,\n", |
490 | 487 | " \"type\": \"message\"\n", |
491 | 488 | " },\n", |
492 | 489 | " {\n", |
493 | | - " \"id\": \"ftevent-808ddf5ee2d72d3808ddf5ee2d72d380\",\n", |
494 | | - " \"created_at\": 1758115747,\n", |
| 490 | + " \"id\": \"ftevent-808ddf794d36042808ddf794d3604280\",\n", |
| 491 | + " \"created_at\": 1758297273,\n", |
495 | 492 | " \"level\": \"info\",\n", |
496 | 493 | " \"message\": \"Step 120: training loss=1.0537992715835571\",\n", |
497 | 494 | " \"object\": \"fine_tuning.job.event\",\n", |
|
507 | 504 | " \"type\": \"metrics\"\n", |
508 | 505 | " },\n", |
509 | 506 | " {\n", |
510 | | - " \"id\": \"ftevent-808ddf5ee277cf2808ddf5ee277cf280\",\n", |
511 | | - " \"created_at\": 1758115737,\n", |
| 507 | + " \"id\": \"ftevent-808ddf794cd6a61808ddf794cd6a6180\",\n", |
| 508 | + " \"created_at\": 1758297263,\n", |
512 | 509 | " \"level\": \"info\",\n", |
513 | 510 | " \"message\": \"Step 110: training loss=0.992326557636261\",\n", |
514 | 511 | " \"object\": \"fine_tuning.job.event\",\n", |
|
522 | 519 | " \"type\": \"metrics\"\n", |
523 | 520 | " },\n", |
524 | 521 | " {\n", |
525 | | - " \"id\": \"ftevent-808ddf5ee218711808ddf5ee21871180\",\n", |
526 | | - " \"created_at\": 1758115727,\n", |
| 522 | + " \"id\": \"ftevent-808ddf794c77480808ddf794c7748080\",\n", |
| 523 | + " \"created_at\": 1758297253,\n", |
527 | 524 | " \"level\": \"info\",\n", |
528 | 525 | " \"message\": \"Step 100: training loss=0.8933090567588806\",\n", |
529 | 526 | " \"object\": \"fine_tuning.job.event\",\n", |
|
537 | 534 | " \"type\": \"metrics\"\n", |
538 | 535 | " },\n", |
539 | 536 | " {\n", |
540 | | - " \"id\": \"ftevent-808ddf5ee1b9130808ddf5ee1b913080\",\n", |
541 | | - " \"created_at\": 1758115717,\n", |
| 537 | + " \"id\": \"ftevent-808ddf794c17e9f808ddf794c17e9f80\",\n", |
| 538 | + " \"created_at\": 1758297243,\n", |
542 | 539 | " \"level\": \"info\",\n", |
543 | 540 | " \"message\": \"Step 90: training loss=1.266113042831421\",\n", |
544 | 541 | " \"object\": \"fine_tuning.job.event\",\n", |
|
552 | 549 | " \"type\": \"metrics\"\n", |
553 | 550 | " },\n", |
554 | 551 | " {\n", |
555 | | - " \"id\": \"ftevent-808ddf5ee159b4f808ddf5ee159b4f80\",\n", |
556 | | - " \"created_at\": 1758115707,\n", |
| 552 | + " \"id\": \"ftevent-808ddf794bb88be808ddf794bb88be80\",\n", |
| 553 | + " \"created_at\": 1758297233,\n", |
557 | 554 | " \"level\": \"info\",\n", |
558 | 555 | " \"message\": \"Step 80: training loss=1.271457314491272\",\n", |
559 | 556 | " \"object\": \"fine_tuning.job.event\",\n", |
|
569 | 566 | " \"type\": \"metrics\"\n", |
570 | 567 | " },\n", |
571 | 568 | " {\n", |
572 | | - " \"id\": \"ftevent-808ddf5ee0fa56e808ddf5ee0fa56e80\",\n", |
573 | | - " \"created_at\": 1758115697,\n", |
| 569 | + " \"id\": \"ftevent-808ddf794b592dd808ddf794b592dd80\",\n", |
| 570 | + " \"created_at\": 1758297223,\n", |
574 | 571 | " \"level\": \"info\",\n", |
575 | 572 | " \"message\": \"Step 70: training loss=1.4114105701446533\",\n", |
576 | 573 | " \"object\": \"fine_tuning.job.event\",\n", |
|
613 | 610 | }, |
614 | 611 | { |
615 | 612 | "cell_type": "code", |
616 | | - "execution_count": 11, |
| 613 | + "execution_count": 10, |
617 | 614 | "id": "7088ebaf", |
618 | 615 | "metadata": {}, |
619 | 616 | "outputs": [ |
|
624 | 621 | "{\n", |
625 | 622 | " \"data\": [\n", |
626 | 623 | " {\n", |
627 | | - " \"id\": \"ftchkpt-350ee1713844412a9b9ea482995d91df\",\n", |
628 | | - " \"created_at\": 1758116262,\n", |
629 | | - " \"fine_tuned_model_checkpoint\": \"gpt-4.1-2025-04-14.ft-45902437a97e4bdf8f2333bc1ebdee99\",\n", |
630 | | - " \"fine_tuning_job_id\": \"ftjob-45902437a97e4bdf8f2333bc1ebdee99\",\n", |
| 624 | + " \"id\": \"ftchkpt-bc8362a9b01b446b9277f91d20b7464f\",\n", |
| 625 | + " \"created_at\": 1758297823,\n", |
| 626 | + " \"fine_tuned_model_checkpoint\": \"gpt-4.1-2025-04-14.ft-a66c2404eccb417b9070e9f95a3a96e2\",\n", |
| 627 | + " \"fine_tuning_job_id\": \"ftjob-a66c2404eccb417b9070e9f95a3a96e2\",\n", |
631 | 628 | " \"metrics\": {\n", |
632 | 629 | " \"full_valid_loss\": 1.2260964284301274,\n", |
633 | 630 | " \"full_valid_mean_token_accuracy\": 0.6798418972332015,\n", |
|
641 | 638 | " \"step_number\": 120\n", |
642 | 639 | " },\n", |
643 | 640 | " {\n", |
644 | | - " \"id\": \"ftchkpt-fb1f94a8c9674839965703faea640c27\",\n", |
645 | | - " \"created_at\": 1758116072,\n", |
646 | | - " \"fine_tuned_model_checkpoint\": \"gpt-4.1-2025-04-14.ft-45902437a97e4bdf8f2333bc1ebdee99:ckpt-step-80\",\n", |
647 | | - " \"fine_tuning_job_id\": \"ftjob-45902437a97e4bdf8f2333bc1ebdee99\",\n", |
| 641 | + " \"id\": \"ftchkpt-47b40e0ca68b48efa4527c904db9590d\",\n", |
| 642 | + " \"created_at\": 1758297635,\n", |
| 643 | + " \"fine_tuned_model_checkpoint\": \"gpt-4.1-2025-04-14.ft-a66c2404eccb417b9070e9f95a3a96e2:ckpt-step-80\",\n", |
| 644 | + " \"fine_tuning_job_id\": \"ftjob-a66c2404eccb417b9070e9f95a3a96e2\",\n", |
648 | 645 | " \"metrics\": {\n", |
649 | 646 | " \"full_valid_loss\": 1.2668834354566492,\n", |
650 | 647 | " \"full_valid_mean_token_accuracy\": 0.6482213438735178,\n", |
|
658 | 655 | " \"step_number\": 80\n", |
659 | 656 | " },\n", |
660 | 657 | " {\n", |
661 | | - " \"id\": \"ftchkpt-94685b61cf314c508538a4aa5a5c9bb7\",\n", |
662 | | - " \"created_at\": 1758115882,\n", |
663 | | - " \"fine_tuned_model_checkpoint\": \"gpt-4.1-2025-04-14.ft-45902437a97e4bdf8f2333bc1ebdee99:ckpt-step-40\",\n", |
664 | | - " \"fine_tuning_job_id\": \"ftjob-45902437a97e4bdf8f2333bc1ebdee99\",\n", |
| 658 | + " \"id\": \"ftchkpt-434282d99454403d89b0f410a3c75522\",\n", |
| 659 | + " \"created_at\": 1758297443,\n", |
| 660 | + " \"fine_tuned_model_checkpoint\": \"gpt-4.1-2025-04-14.ft-a66c2404eccb417b9070e9f95a3a96e2:ckpt-step-40\",\n", |
| 661 | + " \"fine_tuning_job_id\": \"ftjob-a66c2404eccb417b9070e9f95a3a96e2\",\n", |
665 | 662 | " \"metrics\": {\n", |
666 | 663 | " \"full_valid_loss\": 1.781834651358985,\n", |
667 | 664 | " \"full_valid_mean_token_accuracy\": 0.5612648221343873,\n", |
|
704 | 701 | }, |
705 | 702 | { |
706 | 703 | "cell_type": "code", |
707 | | - "execution_count": 12, |
| 704 | + "execution_count": 11, |
708 | 705 | "id": "4a77c5b8", |
709 | 706 | "metadata": {}, |
710 | 707 | "outputs": [ |
|
713 | 710 | "output_type": "stream", |
714 | 711 | "text": [ |
715 | 712 | "{\n", |
716 | | - " \"id\": \"ftjob-45902437a97e4bdf8f2333bc1ebdee99\",\n", |
717 | | - " \"created_at\": 1758111681,\n", |
| 713 | + " \"id\": \"ftjob-a66c2404eccb417b9070e9f95a3a96e2\",\n", |
| 714 | + " \"created_at\": 1758295013,\n", |
718 | 715 | " \"error\": null,\n", |
719 | | - " \"fine_tuned_model\": \"gpt-4.1-2025-04-14.ft-45902437a97e4bdf8f2333bc1ebdee99\",\n", |
720 | | - " \"finished_at\": 1758117577,\n", |
| 716 | + " \"fine_tuned_model\": \"gpt-4.1-2025-04-14.ft-a66c2404eccb417b9070e9f95a3a96e2\",\n", |
| 717 | + " \"finished_at\": 1758299162,\n", |
721 | 718 | " \"hyperparameters\": {\n", |
722 | 719 | " \"batch_size\": 1,\n", |
723 | 720 | " \"learning_rate_multiplier\": 2.0,\n", |
|
727 | 724 | " \"object\": \"fine_tuning.job\",\n", |
728 | 725 | " \"organization_id\": null,\n", |
729 | 726 | " \"result_files\": [\n", |
730 | | - " \"file-876704e7e1ae4c399e8fe08ab856e2b2\"\n", |
| 727 | + " \"file-0dda62edd87e4ef7bfa1108b19f345ba\"\n", |
731 | 728 | " ],\n", |
732 | 729 | " \"seed\": 105,\n", |
733 | 730 | " \"status\": \"succeeded\",\n", |
734 | 731 | " \"trained_tokens\": 10440,\n", |
735 | | - " \"training_file\": \"file-47d965f45742443885faad50263a0e8c\",\n", |
736 | | - " \"validation_file\": \"file-12c4f25aa14941bb9762c0d574ad4133\",\n", |
737 | | - " \"estimated_finish\": 1758115220,\n", |
| 732 | + " \"training_file\": \"file-f0e95ad0245146f986e1cb8e9a82373b\",\n", |
| 733 | + " \"validation_file\": \"file-8b8c2dc873bb43d9aefdfc3b2168fe0c\",\n", |
| 734 | + " \"estimated_finish\": 1758296743,\n", |
738 | 735 | " \"integrations\": null,\n", |
739 | 736 | " \"metadata\": null,\n", |
740 | 737 | " \"method\": null\n", |
|
0 commit comments