3v324v23 committed on
Commit
161f12d
·
1 Parent(s): 04cfe37

initial training

Browse files
Files changed (1) hide show
  1. training/training.ipynb +212 -2
training/training.ipynb CHANGED
@@ -460,7 +460,7 @@
460
  },
461
  {
462
  "cell_type": "code",
463
- "execution_count": null,
464
  "id": "9b76b385",
465
  "metadata": {},
466
  "outputs": [
@@ -490,7 +490,217 @@
490
  "name": "stderr",
491
  "output_type": "stream",
492
  "text": [
493
- "Epoch 2/15: 4%|▍ | 12/274 [01:44<37:59, 8.70s/it, accuracy=71.6, loss=0.743]"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
494
  ]
495
  }
496
  ],
 
460
  },
461
  {
462
  "cell_type": "code",
463
+ "execution_count": 23,
464
  "id": "9b76b385",
465
  "metadata": {},
466
  "outputs": [
 
490
  "name": "stderr",
491
  "output_type": "stream",
492
  "text": [
493
+ "Epoch 2/15: 100%|██████████| 274/274 [41:55<00:00, 9.18s/it, accuracy=73.7, loss=0.706]\n"
494
+ ]
495
+ },
496
+ {
497
+ "name": "stdout",
498
+ "output_type": "stream",
499
+ "text": [
500
+ "Epoch 2/15\n",
501
+ "Train Loss: 0.7060 | Train Accuracy: 73.68%\n"
502
+ ]
503
+ },
504
+ {
505
+ "name": "stderr",
506
+ "output_type": "stream",
507
+ "text": [
508
+ "Epoch 3/15: 100%|██████████| 274/274 [42:13<00:00, 9.25s/it, accuracy=75.8, loss=0.666]\n"
509
+ ]
510
+ },
511
+ {
512
+ "name": "stdout",
513
+ "output_type": "stream",
514
+ "text": [
515
+ "Epoch 3/15\n",
516
+ "Train Loss: 0.6662 | Train Accuracy: 75.79%\n"
517
+ ]
518
+ },
519
+ {
520
+ "name": "stderr",
521
+ "output_type": "stream",
522
+ "text": [
523
+ "Epoch 4/15: 100%|██████████| 274/274 [39:27<00:00, 8.64s/it, accuracy=76.9, loss=0.636]\n"
524
+ ]
525
+ },
526
+ {
527
+ "name": "stdout",
528
+ "output_type": "stream",
529
+ "text": [
530
+ "Epoch 4/15\n",
531
+ "Train Loss: 0.6361 | Train Accuracy: 76.89%\n"
532
+ ]
533
+ },
534
+ {
535
+ "name": "stderr",
536
+ "output_type": "stream",
537
+ "text": [
538
+ "Epoch 5/15: 100%|██████████| 274/274 [41:08<00:00, 9.01s/it, accuracy=77.7, loss=0.628]\n"
539
+ ]
540
+ },
541
+ {
542
+ "name": "stdout",
543
+ "output_type": "stream",
544
+ "text": [
545
+ "Epoch 5/15\n",
546
+ "Train Loss: 0.6281 | Train Accuracy: 77.70%\n"
547
+ ]
548
+ },
549
+ {
550
+ "name": "stderr",
551
+ "output_type": "stream",
552
+ "text": [
553
+ "Epoch 6/15: 100%|██████████| 274/274 [41:22<00:00, 9.06s/it, accuracy=80.3, loss=0.547]\n"
554
+ ]
555
+ },
556
+ {
557
+ "name": "stdout",
558
+ "output_type": "stream",
559
+ "text": [
560
+ "Epoch 6/15\n",
561
+ "Train Loss: 0.5466 | Train Accuracy: 80.31%\n"
562
+ ]
563
+ },
564
+ {
565
+ "name": "stderr",
566
+ "output_type": "stream",
567
+ "text": [
568
+ "Epoch 7/15: 100%|██████████| 274/274 [40:05<00:00, 8.78s/it, accuracy=81.5, loss=0.512]\n"
569
+ ]
570
+ },
571
+ {
572
+ "name": "stdout",
573
+ "output_type": "stream",
574
+ "text": [
575
+ "Epoch 7/15\n",
576
+ "Train Loss: 0.5121 | Train Accuracy: 81.48%\n"
577
+ ]
578
+ },
579
+ {
580
+ "name": "stderr",
581
+ "output_type": "stream",
582
+ "text": [
583
+ "Epoch 8/15: 100%|██████████| 274/274 [41:18<00:00, 9.05s/it, accuracy=82.5, loss=0.488]\n"
584
+ ]
585
+ },
586
+ {
587
+ "name": "stdout",
588
+ "output_type": "stream",
589
+ "text": [
590
+ "Epoch 8/15\n",
591
+ "Train Loss: 0.4880 | Train Accuracy: 82.49%\n"
592
+ ]
593
+ },
594
+ {
595
+ "name": "stderr",
596
+ "output_type": "stream",
597
+ "text": [
598
+ "Epoch 9/15: 100%|██████████| 274/274 [42:20<00:00, 9.27s/it, accuracy=82.7, loss=0.473]\n"
599
+ ]
600
+ },
601
+ {
602
+ "name": "stdout",
603
+ "output_type": "stream",
604
+ "text": [
605
+ "Epoch 9/15\n",
606
+ "Train Loss: 0.4732 | Train Accuracy: 82.66%\n"
607
+ ]
608
+ },
609
+ {
610
+ "name": "stderr",
611
+ "output_type": "stream",
612
+ "text": [
613
+ "Epoch 10/15: 100%|██████████| 274/274 [40:16<00:00, 8.82s/it, accuracy=83.2, loss=0.465]\n"
614
+ ]
615
+ },
616
+ {
617
+ "name": "stdout",
618
+ "output_type": "stream",
619
+ "text": [
620
+ "Epoch 10/15\n",
621
+ "Train Loss: 0.4646 | Train Accuracy: 83.17%\n"
622
+ ]
623
+ },
624
+ {
625
+ "name": "stderr",
626
+ "output_type": "stream",
627
+ "text": [
628
+ "Epoch 11/15: 100%|██████████| 274/274 [39:24<00:00, 8.63s/it, accuracy=85, loss=0.433] \n"
629
+ ]
630
+ },
631
+ {
632
+ "name": "stdout",
633
+ "output_type": "stream",
634
+ "text": [
635
+ "Epoch 11/15\n",
636
+ "Train Loss: 0.4328 | Train Accuracy: 85.01%\n"
637
+ ]
638
+ },
639
+ {
640
+ "name": "stderr",
641
+ "output_type": "stream",
642
+ "text": [
643
+ "Epoch 12/15: 100%|██████████| 274/274 [39:36<00:00, 8.67s/it, accuracy=84.3, loss=0.438]\n"
644
+ ]
645
+ },
646
+ {
647
+ "name": "stdout",
648
+ "output_type": "stream",
649
+ "text": [
650
+ "Epoch 12/15\n",
651
+ "Train Loss: 0.4381 | Train Accuracy: 84.26%\n"
652
+ ]
653
+ },
654
+ {
655
+ "name": "stderr",
656
+ "output_type": "stream",
657
+ "text": [
658
+ "Epoch 13/15: 100%|██████████| 274/274 [38:42<00:00, 8.48s/it, accuracy=84.9, loss=0.427]\n"
659
+ ]
660
+ },
661
+ {
662
+ "name": "stdout",
663
+ "output_type": "stream",
664
+ "text": [
665
+ "Epoch 13/15\n",
666
+ "Train Loss: 0.4268 | Train Accuracy: 84.93%\n"
667
+ ]
668
+ },
669
+ {
670
+ "name": "stderr",
671
+ "output_type": "stream",
672
+ "text": [
673
+ "Epoch 14/15: 100%|██████████| 274/274 [39:57<00:00, 8.75s/it, accuracy=84.5, loss=0.429]\n"
674
+ ]
675
+ },
676
+ {
677
+ "name": "stdout",
678
+ "output_type": "stream",
679
+ "text": [
680
+ "Epoch 14/15\n",
681
+ "Train Loss: 0.4288 | Train Accuracy: 84.50%\n"
682
+ ]
683
+ },
684
+ {
685
+ "name": "stderr",
686
+ "output_type": "stream",
687
+ "text": [
688
+ "Epoch 15/15: 100%|██████████| 274/274 [43:25<00:00, 9.51s/it, accuracy=84.6, loss=0.43] "
689
+ ]
690
+ },
691
+ {
692
+ "name": "stdout",
693
+ "output_type": "stream",
694
+ "text": [
695
+ "Epoch 15/15\n",
696
+ "Train Loss: 0.4299 | Train Accuracy: 84.61%\n"
697
+ ]
698
+ },
699
+ {
700
+ "name": "stderr",
701
+ "output_type": "stream",
702
+ "text": [
703
+ "\n"
704
  ]
705
  }
706
  ],