{ "best_metric": 3.5546064376831055, "best_model_checkpoint": "//amltff6de91c1707b018e950147da959e142/projects/sca-xiaoke-v3/amlt-results/7300230113.98638-a536a63f-7921-4c0f-a350-97817c95c30d/checkpoint-90000", "epoch": 82.64462809917356, "global_step": 100000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "_prepare_inputs_in_ms": 27.127794979605824, "compute_loss_in_ms": 1811.1886270344257, "epoch": 0.0, "learning_rate/full": 0.0, "loss": 7.5531, "step": 1, "training_step_in_ms": 2240.9718980197795 }, { "epoch": 0.0, "eval_visual_genome-region_descriptions_v1.2.0-test_loss": 7.401121139526367, "eval_visual_genome-region_descriptions_v1.2.0-test_meteor": 0.029569745772319803, "eval_visual_genome-region_descriptions_v1.2.0-test_runtime": 83.1742, "eval_visual_genome-region_descriptions_v1.2.0-test_samples_per_second": 9.618, "eval_visual_genome-region_descriptions_v1.2.0-test_steps_per_second": 0.301, "step": 1 }, { "_prepare_inputs_in_ms": 9.555798228632284, "compute_loss_in_ms": 536.5458341809833, "epoch": 0.83, "learning_rate/full": 0.0003999392508508148, "loss": 4.3937, "step": 1000, "training_step_in_ms": 946.2872614599979 }, { "_prepare_inputs_in_ms": 9.661823262518737, "compute_loss_in_ms": 537.3916240136023, "epoch": 1.65, "learning_rate/full": 0.00039968541343111914, "loss": 4.0494, "step": 2000, "training_step_in_ms": 955.0557815724169 }, { "_prepare_inputs_in_ms": 9.627924977685325, "compute_loss_in_ms": 537.9465775624267, "epoch": 2.48, "learning_rate/full": 0.0003992346658781257, "loss": 3.9791, "step": 3000, "training_step_in_ms": 958.343352012278 }, { "_prepare_inputs_in_ms": 9.754187489685137, "compute_loss_in_ms": 538.0461517369258, "epoch": 3.31, "learning_rate/full": 0.0003985858034191765, "loss": 3.9371, "step": 4000, "training_step_in_ms": 961.1277512954548 }, { "_prepare_inputs_in_ms": 9.712934053619392, "compute_loss_in_ms": 537.9799637984834, "epoch": 4.13, "learning_rate/full": 0.0003977411181848781, "loss": 3.9065, "step": 5000, "training_step_in_ms": 954.7033457334619 }, { "epoch": 4.13, "eval_visual_genome-region_descriptions_v1.2.0-test_loss": 3.763737201690674, "eval_visual_genome-region_descriptions_v1.2.0-test_meteor": 0.23929773235608354, "eval_visual_genome-region_descriptions_v1.2.0-test_runtime": 102.1516, "eval_visual_genome-region_descriptions_v1.2.0-test_samples_per_second": 7.831, "eval_visual_genome-region_descriptions_v1.2.0-test_steps_per_second": 0.245, "step": 5000 }, { "_prepare_inputs_in_ms": 9.484028106941501, "compute_loss_in_ms": 535.8051792999613, "epoch": 4.96, "learning_rate/full": 0.0003966997561999938, "loss": 3.8844, "step": 6000, "training_step_in_ms": 946.6810292407754 }, { "_prepare_inputs_in_ms": 9.555567614093889, "compute_loss_in_ms": 537.8309749438195, "epoch": 5.79, "learning_rate/full": 0.000395466162801616, "loss": 3.8646, "step": 7000, "training_step_in_ms": 956.3491519849049 }, { "_prepare_inputs_in_ms": 9.571906232624315, "compute_loss_in_ms": 535.8670682059601, "epoch": 6.61, "learning_rate/full": 0.0003940366164283571, "loss": 3.8482, "step": 8000, "training_step_in_ms": 955.7397421186324 }, { "_prepare_inputs_in_ms": 9.494116805610247, "compute_loss_in_ms": 535.7246166499099, "epoch": 7.44, "learning_rate/full": 0.0003924165284571268, "loss": 3.8329, "step": 9000, "training_step_in_ms": 956.2797198233311 }, { "_prepare_inputs_in_ms": 9.442963820649311, "compute_loss_in_ms": 535.982440788066, "epoch": 8.26, "learning_rate/full": 0.00039060426098193074, "loss": 3.8234, "step": 10000, "training_step_in_ms": 960.6822794212494 }, { "epoch": 8.26, "eval_visual_genome-region_descriptions_v1.2.0-test_loss": 3.69438099861145, "eval_visual_genome-region_descriptions_v1.2.0-test_meteor": 0.24724186480974675, "eval_visual_genome-region_descriptions_v1.2.0-test_runtime": 99.2464, "eval_visual_genome-region_descriptions_v1.2.0-test_samples_per_second": 8.061, "eval_visual_genome-region_descriptions_v1.2.0-test_steps_per_second": 0.252, "step": 10000 }, { "_prepare_inputs_in_ms": 9.298451105870942, "compute_loss_in_ms": 533.8574210923398, "epoch": 9.09, "learning_rate/full": 0.00038860732494287416, "loss": 3.8075, "step": 11000, "training_step_in_ms": 953.7077538485173 }, { "_prepare_inputs_in_ms": 9.43831800215412, "compute_loss_in_ms": 534.8986968573299, "epoch": 9.92, "learning_rate/full": 0.0003864196958913291, "loss": 3.8011, "step": 12000, "training_step_in_ms": 952.7247995454236 }, { "_prepare_inputs_in_ms": 9.553659793222323, "compute_loss_in_ms": 535.9662136517582, "epoch": 10.74, "learning_rate/full": 0.0003840498188962311, "loss": 3.7873, "step": 13000, "training_step_in_ms": 957.1981301900814 }, { "_prepare_inputs_in_ms": 9.344144803879317, "compute_loss_in_ms": 535.5388605375774, "epoch": 11.57, "learning_rate/full": 0.0003814979428002389, "loss": 3.7786, "step": 14000, "training_step_in_ms": 959.83031323459 }, { "_prepare_inputs_in_ms": 9.39019125822233, "compute_loss_in_ms": 536.7152543000993, "epoch": 12.4, "learning_rate/full": 0.00037876659104596076, "loss": 3.7703, "step": 15000, "training_step_in_ms": 961.1087728133425 }, { "epoch": 12.4, "eval_visual_genome-region_descriptions_v1.2.0-test_loss": 3.6609387397766113, "eval_visual_genome-region_descriptions_v1.2.0-test_meteor": 0.2538100106775413, "eval_visual_genome-region_descriptions_v1.2.0-test_runtime": 103.2498, "eval_visual_genome-region_descriptions_v1.2.0-test_samples_per_second": 7.748, "eval_visual_genome-region_descriptions_v1.2.0-test_steps_per_second": 0.242, "step": 15000 }, { "_prepare_inputs_in_ms": 9.56299589696999, "compute_loss_in_ms": 535.2517742190976, "epoch": 13.22, "learning_rate/full": 0.00037585846455191155, "loss": 3.7622, "step": 16000, "training_step_in_ms": 952.1916261643055 }, { "_prepare_inputs_in_ms": 9.559556159831118, "compute_loss_in_ms": 535.5560795084457, "epoch": 14.05, "learning_rate/full": 0.00037277643904168816, "loss": 3.7606, "step": 17000, "training_step_in_ms": 957.2516361214803 }, { "_prepare_inputs_in_ms": 9.455631462449674, "compute_loss_in_ms": 535.3892399296165, "epoch": 14.88, "learning_rate/full": 0.0003695235622002878, "loss": 3.749, "step": 18000, "training_step_in_ms": 953.2538345798966 }, { "_prepare_inputs_in_ms": 9.365507787151728, "compute_loss_in_ms": 535.8022946891142, "epoch": 15.7, "learning_rate/full": 0.00036609954385629034, "loss": 3.7464, "step": 19000, "training_step_in_ms": 959.837038420781 }, { "_prepare_inputs_in_ms": 9.457632376637775, "compute_loss_in_ms": 535.8551492407569, "epoch": 16.53, "learning_rate/full": 0.00036251461734986354, "loss": 3.7357, "step": 20000, "training_step_in_ms": 960.2882608400541 }, { "epoch": 16.53, "eval_visual_genome-region_descriptions_v1.2.0-test_loss": 3.6332855224609375, "eval_visual_genome-region_descriptions_v1.2.0-test_meteor": 0.26106709230289454, "eval_visual_genome-region_descriptions_v1.2.0-test_runtime": 103.6434, "eval_visual_genome-region_descriptions_v1.2.0-test_samples_per_second": 7.719, "eval_visual_genome-region_descriptions_v1.2.0-test_steps_per_second": 0.241, "step": 20000 }, { "_prepare_inputs_in_ms": 9.350896289958278, "compute_loss_in_ms": 534.3410268089501, "epoch": 17.36, "learning_rate/full": 0.0003587689869947874, "loss": 3.7335, "step": 21000, "training_step_in_ms": 951.9007690685103 }, { "_prepare_inputs_in_ms": 9.444510843255557, "compute_loss_in_ms": 536.0995619180612, "epoch": 18.18, "learning_rate/full": 0.0003548663566868928, "loss": 3.726, "step": 22000, "training_step_in_ms": 959.7129821323324 }, { "_prepare_inputs_in_ms": 9.432463558274321, "compute_loss_in_ms": 535.7645625439472, "epoch": 19.01, "learning_rate/full": 0.00035081058557264036, "loss": 3.7237, "step": 23000, "training_step_in_ms": 963.4282936626696 }, { "_prepare_inputs_in_ms": 9.293582127720583, "compute_loss_in_ms": 535.7767343233572, "epoch": 19.83, "learning_rate/full": 0.00034660568423297317, "loss": 3.7142, "step": 24000, "training_step_in_ms": 953.5687257153331 }, { "_prepare_inputs_in_ms": 9.35004804620985, "compute_loss_in_ms": 537.011823366629, "epoch": 20.66, "learning_rate/full": 0.00034225581071742215, "loss": 3.7071, "step": 25000, "training_step_in_ms": 957.869783453003 }, { "epoch": 20.66, "eval_visual_genome-region_descriptions_v1.2.0-test_loss": 3.6175005435943604, "eval_visual_genome-region_descriptions_v1.2.0-test_meteor": 0.26405073790614886, "eval_visual_genome-region_descriptions_v1.2.0-test_runtime": 104.9682, "eval_visual_genome-region_descriptions_v1.2.0-test_samples_per_second": 7.621, "eval_visual_genome-region_descriptions_v1.2.0-test_steps_per_second": 0.238, "step": 25000 }, { "_prepare_inputs_in_ms": 9.984895624163583, "compute_loss_in_ms": 534.7242227215902, "epoch": 21.49, "learning_rate/full": 0.0003377607023892813, "loss": 3.7083, "step": 26000, "training_step_in_ms": 955.9584859979805 }, { "_prepare_inputs_in_ms": 10.137336196319666, "compute_loss_in_ms": 535.9911008346826, "epoch": 22.31, "learning_rate/full": 0.00033313379374801615, "loss": 3.7022, "step": 27000, "training_step_in_ms": 965.8537974991486 }, { "_prepare_inputs_in_ms": 10.160301688476466, "compute_loss_in_ms": 536.8555397295277, "epoch": 23.14, "learning_rate/full": 0.0003283704069974003, "loss": 3.7009, "step": 28000, "training_step_in_ms": 961.128851325775 }, { "_prepare_inputs_in_ms": 10.110118357348256, "compute_loss_in_ms": 536.1848762420123, "epoch": 23.97, "learning_rate/full": 0.0003234847784387827, "loss": 3.6952, "step": 29000, "training_step_in_ms": 951.6901445918484 }, { "_prepare_inputs_in_ms": 10.067090163414832, "compute_loss_in_ms": 535.8437895118841, "epoch": 24.79, "learning_rate/full": 0.0003184770409925566, "loss": 3.6897, "step": 30000, "training_step_in_ms": 964.9359193513519 }, { "epoch": 24.79, "eval_visual_genome-region_descriptions_v1.2.0-test_loss": 3.603607416152954, "eval_visual_genome-region_descriptions_v1.2.0-test_meteor": 0.26295626788132803, "eval_visual_genome-region_descriptions_v1.2.0-test_runtime": 101.4282, "eval_visual_genome-region_descriptions_v1.2.0-test_samples_per_second": 7.887, "eval_visual_genome-region_descriptions_v1.2.0-test_steps_per_second": 0.246, "step": 30000 }, { "_prepare_inputs_in_ms": 10.085794753678961, "compute_loss_in_ms": 535.1409671568545, "epoch": 25.62, "learning_rate/full": 0.00031335214659900727, "loss": 3.6866, "step": 31000, "training_step_in_ms": 961.3275795525988 }, { "_prepare_inputs_in_ms": 10.185186771384906, "compute_loss_in_ms": 536.1119842829066, "epoch": 26.45, "learning_rate/full": 0.0003081098663889108, "loss": 3.6829, "step": 32000, "training_step_in_ms": 963.5977011280484 }, { "_prepare_inputs_in_ms": 10.249891238170676, "compute_loss_in_ms": 535.0950576688629, "epoch": 27.27, "learning_rate/full": 0.0003027712689775676, "loss": 3.6771, "step": 33000, "training_step_in_ms": 955.397748134099 }, { "_prepare_inputs_in_ms": 10.17424620629754, "compute_loss_in_ms": 534.6862363539985, "epoch": 28.1, "learning_rate/full": 0.0002973202486383942, "loss": 3.672, "step": 34000, "training_step_in_ms": 958.4871930885711 }, { "_prepare_inputs_in_ms": 10.059338139777537, "compute_loss_in_ms": 535.8044806576218, "epoch": 28.93, "learning_rate/full": 0.000291778393459607, "loss": 3.6714, "step": 35000, "training_step_in_ms": 956.3396593880607 }, { "epoch": 28.93, "eval_visual_genome-region_descriptions_v1.2.0-test_loss": 3.590414524078369, "eval_visual_genome-region_descriptions_v1.2.0-test_meteor": 0.26513770557999966, "eval_visual_genome-region_descriptions_v1.2.0-test_runtime": 104.3253, "eval_visual_genome-region_descriptions_v1.2.0-test_samples_per_second": 7.668, "eval_visual_genome-region_descriptions_v1.2.0-test_steps_per_second": 0.24, "step": 35000 }, { "_prepare_inputs_in_ms": 10.062245466610099, "compute_loss_in_ms": 534.5042656344594, "epoch": 29.75, "learning_rate/full": 0.0002861457824996332, "loss": 3.6645, "step": 36000, "training_step_in_ms": 959.2977655951399 }, { "_prepare_inputs_in_ms": 10.064813164470252, "compute_loss_in_ms": 536.1598941528937, "epoch": 30.58, "learning_rate/full": 0.00028042798560981287, "loss": 3.6574, "step": 37000, "training_step_in_ms": 956.0697433989844 }, { "_prepare_inputs_in_ms": 10.116965677938424, "compute_loss_in_ms": 536.2070164434845, "epoch": 31.4, "learning_rate/full": 0.0002746248158102387, "loss": 3.6578, "step": 38000, "training_step_in_ms": 956.2041009759996 }, { "_prepare_inputs_in_ms": 10.094019736570772, "compute_loss_in_ms": 535.4710150305182, "epoch": 32.23, "learning_rate/full": 0.0002687536169947349, "loss": 3.6524, "step": 39000, "training_step_in_ms": 959.96617779386 }, { "_prepare_inputs_in_ms": 10.109433323028497, "compute_loss_in_ms": 535.6941579723498, "epoch": 33.06, "learning_rate/full": 0.0002628144306280816, "loss": 3.6524, "step": 40000, "training_step_in_ms": 961.5450095872511 }, { "epoch": 33.06, "eval_visual_genome-region_descriptions_v1.2.0-test_loss": 3.580965280532837, "eval_visual_genome-region_descriptions_v1.2.0-test_meteor": 0.2693198298047019, "eval_visual_genome-region_descriptions_v1.2.0-test_runtime": 99.8174, "eval_visual_genome-region_descriptions_v1.2.0-test_samples_per_second": 8.015, "eval_visual_genome-region_descriptions_v1.2.0-test_steps_per_second": 0.25, "step": 40000 }, { "_prepare_inputs_in_ms": 10.042415707621997, "compute_loss_in_ms": 535.0675269728526, "epoch": 33.88, "learning_rate/full": 0.000256813129721104, "loss": 3.6463, "step": 41000, "training_step_in_ms": 951.0752835389576 }, { "_prepare_inputs_in_ms": 10.117303489823826, "compute_loss_in_ms": 535.5392771296902, "epoch": 34.71, "learning_rate/full": 0.00025076173835033525, "loss": 3.6408, "step": 42000, "training_step_in_ms": 959.7704490462202 }, { "_prepare_inputs_in_ms": 10.175786619714927, "compute_loss_in_ms": 536.3846810262767, "epoch": 35.54, "learning_rate/full": 0.0002446479775734085, "loss": 3.6381, "step": 43000, "training_step_in_ms": 963.5900993177202 }, { "_prepare_inputs_in_ms": 10.058058980386704, "compute_loss_in_ms": 535.5972880260088, "epoch": 36.36, "learning_rate/full": 0.00023849615593840492, "loss": 3.6361, "step": 44000, "training_step_in_ms": 966.5910823547165 }, { "_prepare_inputs_in_ms": 10.140807795512956, "compute_loss_in_ms": 535.745742837491, "epoch": 37.19, "learning_rate/full": 0.00023230626707893625, "loss": 3.6344, "step": 45000, "training_step_in_ms": 960.7837667464628 }, { "epoch": 37.19, "eval_visual_genome-region_descriptions_v1.2.0-test_loss": 3.575321912765503, "eval_visual_genome-region_descriptions_v1.2.0-test_meteor": 0.2694013022299941, "eval_visual_genome-region_descriptions_v1.2.0-test_runtime": 103.7207, "eval_visual_genome-region_descriptions_v1.2.0-test_samples_per_second": 7.713, "eval_visual_genome-region_descriptions_v1.2.0-test_steps_per_second": 0.241, "step": 45000 }, { "_prepare_inputs_in_ms": 10.123616369532012, "compute_loss_in_ms": 534.5586088547134, "epoch": 38.02, "learning_rate/full": 0.00022608443191494596, "loss": 3.6259, "step": 46000, "training_step_in_ms": 954.3300566331018 }, { "_prepare_inputs_in_ms": 10.126525112020317, "compute_loss_in_ms": 536.6205943481764, "epoch": 38.84, "learning_rate/full": 0.0002198305382138328, "loss": 3.6279, "step": 47000, "training_step_in_ms": 953.759260071849 }, { "_prepare_inputs_in_ms": 10.257417954970151, "compute_loss_in_ms": 535.2681058159797, "epoch": 39.67, "learning_rate/full": 0.00021356327694485794, "loss": 3.6213, "step": 48000, "training_step_in_ms": 962.4967881785124 }, { "_prepare_inputs_in_ms": 10.271113389520906, "compute_loss_in_ms": 535.4450263003819, "epoch": 40.5, "learning_rate/full": 0.0002072826035235433, "loss": 3.6186, "step": 49000, "training_step_in_ms": 961.3730522751575 }, { "_prepare_inputs_in_ms": 10.129716445459053, "compute_loss_in_ms": 536.4764073403785, "epoch": 41.32, "learning_rate/full": 0.00020099472864285533, "loss": 3.6137, "step": 50000, "training_step_in_ms": 960.2726457127137 }, { "epoch": 41.32, "eval_visual_genome-region_descriptions_v1.2.0-test_loss": 3.5703847408294678, "eval_visual_genome-region_descriptions_v1.2.0-test_meteor": 0.2688142864806811, "eval_visual_genome-region_descriptions_v1.2.0-test_runtime": 100.2164, "eval_visual_genome-region_descriptions_v1.2.0-test_samples_per_second": 7.983, "eval_visual_genome-region_descriptions_v1.2.0-test_steps_per_second": 0.249, "step": 50000 }, { "_prepare_inputs_in_ms": 10.502501730693549, "compute_loss_in_ms": 535.0548804986756, "epoch": 42.15, "learning_rate/full": 0.0001947058701169798, "loss": 3.6106, "step": 51000, "training_step_in_ms": 958.0683015501127 }, { "_prepare_inputs_in_ms": 10.785648202290758, "compute_loss_in_ms": 536.7012275556335, "epoch": 42.98, "learning_rate/full": 0.0001884222467327876, "loss": 3.6073, "step": 52000, "training_step_in_ms": 951.947691895999 }, { "_prepare_inputs_in_ms": 10.585681669297628, "compute_loss_in_ms": 535.5102476192405, "epoch": 43.8, "learning_rate/full": 0.00018214380145695523, "loss": 3.6024, "step": 53000, "training_step_in_ms": 962.6988452640362 }, { "_prepare_inputs_in_ms": 10.68288057774771, "compute_loss_in_ms": 535.9786380403675, "epoch": 44.63, "learning_rate/full": 0.00017588929863586686, "loss": 3.6046, "step": 54000, "training_step_in_ms": 966.1844932027161 }, { "_prepare_inputs_in_ms": 10.645952994469553, "compute_loss_in_ms": 535.4971501872642, "epoch": 45.45, "learning_rate/full": 0.00016965863787013347, "loss": 3.5954, "step": 55000, "training_step_in_ms": 966.1277901912108 }, { "epoch": 45.45, "eval_visual_genome-region_descriptions_v1.2.0-test_loss": 3.5649678707122803, "eval_visual_genome-region_descriptions_v1.2.0-test_meteor": 0.27166900209048683, "eval_visual_genome-region_descriptions_v1.2.0-test_runtime": 102.2773, "eval_visual_genome-region_descriptions_v1.2.0-test_samples_per_second": 7.822, "eval_visual_genome-region_descriptions_v1.2.0-test_steps_per_second": 0.244, "step": 55000 }, { "_prepare_inputs_in_ms": 10.577075158859172, "compute_loss_in_ms": 534.4740462127374, "epoch": 46.28, "learning_rate/full": 0.00016345179061642948, "loss": 3.5963, "step": 56000, "training_step_in_ms": 961.5655309080612 }, { "_prepare_inputs_in_ms": 10.732970108627342, "compute_loss_in_ms": 537.2660472553689, "epoch": 47.11, "learning_rate/full": 0.0001572873072366209, "loss": 3.597, "step": 57000, "training_step_in_ms": 964.5027116436977 }, { "_prepare_inputs_in_ms": 10.73382615565788, "compute_loss_in_ms": 538.1741794921691, "epoch": 47.93, "learning_rate/full": 0.0001511650606366491, "loss": 3.5895, "step": 58000, "training_step_in_ms": 949.1175830988213 }, { "_prepare_inputs_in_ms": 10.706503831432201, "compute_loss_in_ms": 536.7453673920827, "epoch": 48.76, "learning_rate/full": 0.0001450911048478807, "loss": 3.5876, "step": 59000, "training_step_in_ms": 968.0035566822626 }, { "_prepare_inputs_in_ms": 10.903483389178291, "compute_loss_in_ms": 537.1148272417486, "epoch": 49.59, "learning_rate/full": 0.00013906544966141887, "loss": 3.5819, "step": 60000, "training_step_in_ms": 964.3682058413979 }, { "epoch": 49.59, "eval_visual_genome-region_descriptions_v1.2.0-test_loss": 3.5601305961608887, "eval_visual_genome-region_descriptions_v1.2.0-test_meteor": 0.27116285100803245, "eval_visual_genome-region_descriptions_v1.2.0-test_runtime": 101.8706, "eval_visual_genome-region_descriptions_v1.2.0-test_samples_per_second": 7.853, "eval_visual_genome-region_descriptions_v1.2.0-test_steps_per_second": 0.245, "step": 60000 }, { "_prepare_inputs_in_ms": 10.826663774233765, "compute_loss_in_ms": 535.5709582263371, "epoch": 50.41, "learning_rate/full": 0.00013310610391163933, "loss": 3.5762, "step": 61000, "training_step_in_ms": 957.2617566076806 }, { "_prepare_inputs_in_ms": 10.595198371564038, "compute_loss_in_ms": 536.0367681181524, "epoch": 51.24, "learning_rate/full": 0.0001272129067134662, "loss": 3.5751, "step": 62000, "training_step_in_ms": 959.1705903129186 }, { "_prepare_inputs_in_ms": 10.456255728611723, "compute_loss_in_ms": 536.2733452994144, "epoch": 52.07, "learning_rate/full": 0.00012139747473708569, "loss": 3.5774, "step": 63000, "training_step_in_ms": 955.730251706671 }, { "_prepare_inputs_in_ms": 10.639551113941707, "compute_loss_in_ms": 535.7200796955731, "epoch": 52.89, "learning_rate/full": 0.00011564819693413189, "loss": 3.568, "step": 64000, "training_step_in_ms": 951.6928666429594 }, { "_prepare_inputs_in_ms": 10.60645360336639, "compute_loss_in_ms": 535.3036272318568, "epoch": 53.72, "learning_rate/full": 0.00010998812020655949, "loss": 3.5703, "step": 65000, "training_step_in_ms": 963.1167565376963 }, { "epoch": 53.72, "eval_visual_genome-region_descriptions_v1.2.0-test_loss": 3.5590660572052, "eval_visual_genome-region_descriptions_v1.2.0-test_meteor": 0.2733920686032914, "eval_visual_genome-region_descriptions_v1.2.0-test_runtime": 99.9831, "eval_visual_genome-region_descriptions_v1.2.0-test_samples_per_second": 8.001, "eval_visual_genome-region_descriptions_v1.2.0-test_steps_per_second": 0.25, "step": 65000 }, { "_prepare_inputs_in_ms": 10.624523456094831, "compute_loss_in_ms": 534.0653136165347, "epoch": 54.55, "learning_rate/full": 0.00010441152222708468, "loss": 3.5693, "step": 66000, "training_step_in_ms": 955.8435329974163 }, { "_prepare_inputs_in_ms": 10.65835806389805, "compute_loss_in_ms": 536.2088124424918, "epoch": 55.37, "learning_rate/full": 9.893506973588506e-05, "loss": 3.5599, "step": 67000, "training_step_in_ms": 957.1059285002993 }, { "_prepare_inputs_in_ms": 10.751230709021911, "compute_loss_in_ms": 536.6291307259817, "epoch": 56.2, "learning_rate/full": 9.355322604944605e-05, "loss": 3.5668, "step": 68000, "training_step_in_ms": 959.1418899303535 }, { "_prepare_inputs_in_ms": 10.653449523961172, "compute_loss_in_ms": 536.7383008667966, "epoch": 57.02, "learning_rate/full": 8.829252005938348e-05, "loss": 3.5592, "step": 69000, "training_step_in_ms": 955.6575022591278 }, { "_prepare_inputs_in_ms": 10.65822267276235, "compute_loss_in_ms": 535.9257607464679, "epoch": 57.85, "learning_rate/full": 8.312650768346744e-05, "loss": 3.5575, "step": 70000, "training_step_in_ms": 951.2662082569441 }, { "epoch": 57.85, "eval_visual_genome-region_descriptions_v1.2.0-test_loss": 3.5556719303131104, "eval_visual_genome-region_descriptions_v1.2.0-test_meteor": 0.2734467694599133, "eval_visual_genome-region_descriptions_v1.2.0-test_runtime": 104.2955, "eval_visual_genome-region_descriptions_v1.2.0-test_samples_per_second": 7.671, "eval_visual_genome-region_descriptions_v1.2.0-test_steps_per_second": 0.24, "step": 70000 }, { "_prepare_inputs_in_ms": 10.608355628053953, "compute_loss_in_ms": 534.1021929110866, "epoch": 58.68, "learning_rate/full": 7.80762980438341e-05, "loss": 3.5556, "step": 71000, "training_step_in_ms": 948.2094520897372 }, { "_prepare_inputs_in_ms": 10.676257735467516, "compute_loss_in_ms": 536.0682506592711, "epoch": 59.5, "learning_rate/full": 7.315176250595717e-05, "loss": 3.5537, "step": 72000, "training_step_in_ms": 954.8686325427843 }, { "_prepare_inputs_in_ms": 10.610922348219901, "compute_loss_in_ms": 536.3908133659279, "epoch": 60.33, "learning_rate/full": 6.835266183844516e-05, "loss": 3.5479, "step": 73000, "training_step_in_ms": 954.1712517963024 }, { "_prepare_inputs_in_ms": 10.579945259494707, "compute_loss_in_ms": 534.4352571795462, "epoch": 61.16, "learning_rate/full": 6.368374166947542e-05, "loss": 3.5467, "step": 74000, "training_step_in_ms": 953.0113322847756 }, { "_prepare_inputs_in_ms": 10.577161580207758, "compute_loss_in_ms": 536.7000861178385, "epoch": 61.98, "learning_rate/full": 5.914514927911328e-05, "loss": 3.5466, "step": 75000, "training_step_in_ms": 950.8998943779152 }, { "epoch": 61.98, "eval_visual_genome-region_descriptions_v1.2.0-test_loss": 3.5562994480133057, "eval_visual_genome-region_descriptions_v1.2.0-test_meteor": 0.27468764903823617, "eval_visual_genome-region_descriptions_v1.2.0-test_runtime": 102.8368, "eval_visual_genome-region_descriptions_v1.2.0-test_samples_per_second": 7.779, "eval_visual_genome-region_descriptions_v1.2.0-test_steps_per_second": 0.243, "step": 75000 }, { "_prepare_inputs_in_ms": 10.397925437655209, "compute_loss_in_ms": 535.1076509790728, "epoch": 62.81, "learning_rate/full": 5.475477712440255e-05, "loss": 3.5454, "step": 76000, "training_step_in_ms": 949.9264260384953 }, { "_prepare_inputs_in_ms": 10.516429967130534, "compute_loss_in_ms": 537.9902690803865, "epoch": 63.64, "learning_rate/full": 5.0499380128392283e-05, "loss": 3.5418, "step": 77000, "training_step_in_ms": 963.6520826652413 }, { "_prepare_inputs_in_ms": 10.470940343337134, "compute_loss_in_ms": 536.5116302901879, "epoch": 64.46, "learning_rate/full": 4.639614598504125e-05, "loss": 3.5397, "step": 78000, "training_step_in_ms": 957.950764612644 }, { "_prepare_inputs_in_ms": 10.59993867285084, "compute_loss_in_ms": 537.1390544432215, "epoch": 65.29, "learning_rate/full": 4.244480421242036e-05, "loss": 3.5388, "step": 79000, "training_step_in_ms": 961.8771279493812 }, { "_prepare_inputs_in_ms": 10.679984404356219, "compute_loss_in_ms": 536.696684517432, "epoch": 66.12, "learning_rate/full": 3.8649262125702656e-05, "loss": 3.5329, "step": 80000, "training_step_in_ms": 957.4748168167425 }, { "epoch": 66.12, "eval_visual_genome-region_descriptions_v1.2.0-test_loss": 3.556597948074341, "eval_visual_genome-region_descriptions_v1.2.0-test_meteor": 0.2742539533100543, "eval_visual_genome-region_descriptions_v1.2.0-test_runtime": 100.6419, "eval_visual_genome-region_descriptions_v1.2.0-test_samples_per_second": 7.949, "eval_visual_genome-region_descriptions_v1.2.0-test_steps_per_second": 0.248, "step": 80000 }, { "_prepare_inputs_in_ms": 10.708052520753771, "compute_loss_in_ms": 535.2645241598366, "epoch": 66.94, "learning_rate/full": 3.500971449864994e-05, "loss": 3.5345, "step": 81000, "training_step_in_ms": 948.9210075238952 }, { "_prepare_inputs_in_ms": 10.605949840741232, "compute_loss_in_ms": 535.3940441570012, "epoch": 67.77, "learning_rate/full": 3.153703882232173e-05, "loss": 3.5346, "step": 82000, "training_step_in_ms": 957.2232636878034 }, { "_prepare_inputs_in_ms": 10.527875950676389, "compute_loss_in_ms": 535.3903734084452, "epoch": 68.6, "learning_rate/full": 2.823094906089525e-05, "loss": 3.5362, "step": 83000, "training_step_in_ms": 960.9660885017365 }, { "_prepare_inputs_in_ms": 10.645452778204344, "compute_loss_in_ms": 535.3771834741347, "epoch": 69.42, "learning_rate/full": 2.509166124130553e-05, "loss": 3.5284, "step": 84000, "training_step_in_ms": 959.7084383748006 }, { "_prepare_inputs_in_ms": 10.593148670741357, "compute_loss_in_ms": 534.9863913216395, "epoch": 70.25, "learning_rate/full": 2.212855773155269e-05, "loss": 3.5273, "step": 85000, "training_step_in_ms": 970.6172955055954 }, { "epoch": 70.25, "eval_visual_genome-region_descriptions_v1.2.0-test_loss": 3.555929660797119, "eval_visual_genome-region_descriptions_v1.2.0-test_meteor": 0.2741459251366367, "eval_visual_genome-region_descriptions_v1.2.0-test_runtime": 104.7737, "eval_visual_genome-region_descriptions_v1.2.0-test_samples_per_second": 7.636, "eval_visual_genome-region_descriptions_v1.2.0-test_steps_per_second": 0.239, "step": 85000 }, { "_prepare_inputs_in_ms": 10.723522963888216, "compute_loss_in_ms": 534.6476732452866, "epoch": 71.07, "learning_rate/full": 1.9341343786710864e-05, "loss": 3.5266, "step": 86000, "training_step_in_ms": 961.9524979006965 }, { "_prepare_inputs_in_ms": 10.785187994129956, "compute_loss_in_ms": 536.4809199275915, "epoch": 71.9, "learning_rate/full": 1.6732775565058435e-05, "loss": 3.5253, "step": 87000, "training_step_in_ms": 950.8976757206256 }, { "_prepare_inputs_in_ms": 10.603952513309196, "compute_loss_in_ms": 535.7741147053894, "epoch": 72.73, "learning_rate/full": 1.4305432569654864e-05, "loss": 3.524, "step": 88000, "training_step_in_ms": 959.2451942999614 }, { "_prepare_inputs_in_ms": 10.706391342449933, "compute_loss_in_ms": 536.408079084591, "epoch": 73.55, "learning_rate/full": 1.2059561887499037e-05, "loss": 3.5265, "step": 89000, "training_step_in_ms": 973.4634857769124 }, { "_prepare_inputs_in_ms": 10.6856812821934, "compute_loss_in_ms": 537.2633295034757, "epoch": 74.38, "learning_rate/full": 1.0003841866378549e-05, "loss": 3.5218, "step": 90000, "training_step_in_ms": 966.5726283045951 }, { "epoch": 74.38, "eval_visual_genome-region_descriptions_v1.2.0-test_loss": 3.5546064376831055, "eval_visual_genome-region_descriptions_v1.2.0-test_meteor": 0.27359656588473774, "eval_visual_genome-region_descriptions_v1.2.0-test_runtime": 104.0763, "eval_visual_genome-region_descriptions_v1.2.0-test_samples_per_second": 7.687, "eval_visual_genome-region_descriptions_v1.2.0-test_steps_per_second": 0.24, "step": 90000 }, { "_prepare_inputs_in_ms": 10.64931857888019, "compute_loss_in_ms": 535.808490979718, "epoch": 75.21, "learning_rate/full": 8.132070715440754e-06, "loss": 3.5219, "step": 91000, "training_step_in_ms": 957.4841072742129 }, { "_prepare_inputs_in_ms": 10.87383456970565, "compute_loss_in_ms": 537.6603767276974, "epoch": 76.03, "learning_rate/full": 6.453582116869461e-06, "loss": 3.5235, "step": 92000, "training_step_in_ms": 954.7427223158302 }, { "_prepare_inputs_in_ms": 10.69017239450477, "compute_loss_in_ms": 537.0892604731489, "epoch": 76.86, "learning_rate/full": 4.964706300643118e-06, "loss": 3.5189, "step": 93000, "training_step_in_ms": 950.3190122217638 }, { "_prepare_inputs_in_ms": 10.618111693882383, "compute_loss_in_ms": 535.7142543839291, "epoch": 77.69, "learning_rate/full": 3.6686926578696213e-06, "loss": 3.5235, "step": 94000, "training_step_in_ms": 958.8555470507126 }, { "_prepare_inputs_in_ms": 10.73988960427232, "compute_loss_in_ms": 536.3263423398603, "epoch": 78.51, "learning_rate/full": 2.5658174353882404e-06, "loss": 3.5215, "step": 95000, "training_step_in_ms": 964.6057669939473 }, { "epoch": 78.51, "eval_visual_genome-region_descriptions_v1.2.0-test_loss": 3.5548150539398193, "eval_visual_genome-region_descriptions_v1.2.0-test_meteor": 0.27406488207696067, "eval_visual_genome-region_descriptions_v1.2.0-test_runtime": 104.9846, "eval_visual_genome-region_descriptions_v1.2.0-test_samples_per_second": 7.62, "eval_visual_genome-region_descriptions_v1.2.0-test_steps_per_second": 0.238, "step": 95000 }, { "_prepare_inputs_in_ms": 10.761066970824286, "compute_loss_in_ms": 535.5862640386913, "epoch": 79.34, "learning_rate/full": 1.6593767888209988e-06, "loss": 3.5201, "step": 96000, "training_step_in_ms": 953.487945659901 }, { "_prepare_inputs_in_ms": 10.744887009612285, "compute_loss_in_ms": 536.8042176247109, "epoch": 80.17, "learning_rate/full": 9.484543083217335e-07, "loss": 3.5242, "step": 97000, "training_step_in_ms": 955.935797311482 }, { "_prepare_inputs_in_ms": 10.609967146418057, "compute_loss_in_ms": 536.5163776981644, "epoch": 80.99, "learning_rate/full": 4.3558991431862373e-07, "loss": 3.5217, "step": 98000, "training_step_in_ms": 951.0243763268227 }, { "_prepare_inputs_in_ms": 10.550453630159609, "compute_loss_in_ms": 535.8989973879652, "epoch": 81.82, "learning_rate/full": 1.1945383759244255e-07, "loss": 3.523, "step": 99000, "training_step_in_ms": 959.1436755338218 }, { "_prepare_inputs_in_ms": 10.565008323756047, "compute_loss_in_ms": 536.139583913493, "epoch": 82.64, "learning_rate/full": 9.51678964100644e-10, "loss": 3.523, "step": 100000, "training_step_in_ms": 958.2332628678996 }, { "epoch": 82.64, "eval_visual_genome-region_descriptions_v1.2.0-test_loss": 3.554699182510376, "eval_visual_genome-region_descriptions_v1.2.0-test_meteor": 0.2739906528866304, "eval_visual_genome-region_descriptions_v1.2.0-test_runtime": 105.8588, "eval_visual_genome-region_descriptions_v1.2.0-test_samples_per_second": 7.557, "eval_visual_genome-region_descriptions_v1.2.0-test_steps_per_second": 0.236, "step": 100000 } ], "max_steps": 100000, "num_train_epochs": 83, "total_flos": 1.7305644974792963e+23, "trial_name": null, "trial_params": null }