epoch:0training loss:tensor(21.8620, grad_fn=<MseLossBackward>)test loss:tensor(19.6877, grad_fn=<MseLossBackward>)
epoch:10training loss:tensor(6.4311, grad_fn=<MseLossBackward>)test loss:tensor(5.1118, grad_fn=<MseLossBackward>)
epoch:20training loss:tensor(1.8502, grad_fn=<MseLossBackward>)test loss:tensor(1.3755, grad_fn=<MseLossBackward>)
epoch:30training loss:tensor(0.5939, grad_fn=<MseLossBackward>)test loss:tensor(0.5410, grad_fn=<MseLossBackward>)
epoch:40training loss:tensor(0.5125, grad_fn=<MseLossBackward>)test loss:tensor(0.5418, grad_fn=<MseLossBackward>)
epoch:50training loss:tensor(0.4310, grad_fn=<MseLossBackward>)test loss:tensor(0.4055, grad_fn=<MseLossBackward>)
epoch:60training loss:tensor(0.2948, grad_fn=<MseLossBackward>)test loss:tensor(0.2869, grad_fn=<MseLossBackward>)
epoch:70training loss:tensor(0.2303, grad_fn=<MseLossBackward>)test loss:tensor(0.2224, grad_fn=<MseLossBackward>)
epoch:80training loss:tensor(0.1678, grad_fn=<MseLossBackward>)test loss:tensor(0.1665, grad_fn=<MseLossBackward>)
epoch:90training loss:tensor(0.1272, grad_fn=<MseLossBackward>)test loss:tensor(0.1284, grad_fn=<MseLossBackward>)
epoch:100training loss:tensor(0.1007, grad_fn=<MseLossBackward>)test loss:tensor(0.1034, grad_fn=<MseLossBackward>)
epoch:110training loss:tensor(0.0824, grad_fn=<MseLossBackward>)test loss:tensor(0.0858, grad_fn=<MseLossBackward>)
epoch:120training loss:tensor(0.0675, grad_fn=<MseLossBackward>)test loss:tensor(0.0712, grad_fn=<MseLossBackward>)
epoch:130training loss:tensor(0.0555, grad_fn=<MseLossBackward>)test loss:tensor(0.0595, grad_fn=<MseLossBackward>)
epoch:140training loss:tensor(0.0464, grad_fn=<MseLossBackward>)test loss:tensor(0.0504, grad_fn=<MseLossBackward>)
epoch:150training loss:tensor(0.0394, grad_fn=<MseLossBackward>)test loss:tensor(0.0435, grad_fn=<MseLossBackward>)
epoch:160training loss:tensor(0.0343, grad_fn=<MseLossBackward>)test loss:tensor(0.0385, grad_fn=<MseLossBackward>)
epoch:170training loss:tensor(0.0304, grad_fn=<MseLossBackward>)test loss:tensor(0.0347, grad_fn=<MseLossBackward>)
epoch:180training loss:tensor(0.0273, grad_fn=<MseLossBackward>)test loss:tensor(0.0315, grad_fn=<MseLossBackward>)
epoch:190training loss:tensor(0.0246, grad_fn=<MseLossBackward>)test loss:tensor(0.0288, grad_fn=<MseLossBackward>)
epoch:200training loss:tensor(0.0224, grad_fn=<MseLossBackward>)test loss:tensor(0.0265, grad_fn=<MseLossBackward>)
epoch:210training loss:tensor(0.0204, grad_fn=<MseLossBackward>)test loss:tensor(0.0245, grad_fn=<MseLossBackward>)
epoch:220training loss:tensor(0.0188, grad_fn=<MseLossBackward>)test loss:tensor(0.0228, grad_fn=<MseLossBackward>)
epoch:230training loss:tensor(0.0173, grad_fn=<MseLossBackward>)test loss:tensor(0.0213, grad_fn=<MseLossBackward>)
epoch:240training loss:tensor(0.0161, grad_fn=<MseLossBackward>)test loss:tensor(0.0200, grad_fn=<MseLossBackward>)
epoch:250training loss:tensor(0.0150, grad_fn=<MseLossBackward>)test loss:tensor(0.0189, grad_fn=<MseLossBackward>)
epoch:260training loss:tensor(0.0141, grad_fn=<MseLossBackward>)test loss:tensor(0.0179, grad_fn=<MseLossBackward>)
epoch:270training loss:tensor(0.0133, grad_fn=<MseLossBackward>)test loss:tensor(0.0170, grad_fn=<MseLossBackward>)
epoch:280training loss:tensor(0.0125, grad_fn=<MseLossBackward>)test loss:tensor(0.0162, grad_fn=<MseLossBackward>)
epoch:290training loss:tensor(0.0118, grad_fn=<MseLossBackward>)test loss:tensor(0.0155, grad_fn=<MseLossBackward>)
epoch:300training loss:tensor(0.0112, grad_fn=<MseLossBackward>)test loss:tensor(0.0148, grad_fn=<MseLossBackward>)
epoch:310training loss:tensor(0.0106, grad_fn=<MseLossBackward>)test loss:tensor(0.0142, grad_fn=<MseLossBackward>)
epoch:320training loss:tensor(0.0100, grad_fn=<MseLossBackward>)test loss:tensor(0.0136, grad_fn=<MseLossBackward>)
epoch:330training loss:tensor(0.0095, grad_fn=<MseLossBackward>)test loss:tensor(0.0131, grad_fn=<MseLossBackward>)
epoch:340training loss:tensor(0.0090, grad_fn=<MseLossBackward>)test loss:tensor(0.0125, grad_fn=<MseLossBackward>)
epoch:350training loss:tensor(0.0086, grad_fn=<MseLossBackward>)test loss:tensor(0.0121, grad_fn=<MseLossBackward>)
epoch:360training loss:tensor(0.0081, grad_fn=<MseLossBackward>)test loss:tensor(0.0117, grad_fn=<MseLossBackward>)
epoch:370training loss:tensor(0.0077, grad_fn=<MseLossBackward>)test loss:tensor(0.0112, grad_fn=<MseLossBackward>)
epoch:380training loss:tensor(0.0073, grad_fn=<MseLossBackward>)test loss:tensor(0.0108, grad_fn=<MseLossBackward>)
epoch:390training loss:tensor(0.0070, grad_fn=<MseLossBackward>)test loss:tensor(0.0105, grad_fn=<MseLossBackward>)
epoch:400training loss:tensor(0.0066, grad_fn=<MseLossBackward>)test loss:tensor(0.0101, grad_fn=<MseLossBackward>)
epoch:410training loss:tensor(0.0063, grad_fn=<MseLossBackward>)test loss:tensor(0.0098, grad_fn=<MseLossBackward>)
epoch:420training loss:tensor(0.0060, grad_fn=<MseLossBackward>)test loss:tensor(0.0095, grad_fn=<MseLossBackward>)
epoch:430training loss:tensor(0.0058, grad_fn=<MseLossBackward>)test loss:tensor(0.0092, grad_fn=<MseLossBackward>)
epoch:440training loss:tensor(0.0055, grad_fn=<MseLossBackward>)test loss:tensor(0.0089, grad_fn=<MseLossBackward>)
epoch:450training loss:tensor(0.0053, grad_fn=<MseLossBackward>)test loss:tensor(0.0086, grad_fn=<MseLossBackward>)
epoch:460training loss:tensor(0.0051, grad_fn=<MseLossBackward>)test loss:tensor(0.0084, grad_fn=<MseLossBackward>)
epoch:470training loss:tensor(0.0049, grad_fn=<MseLossBackward>)test loss:tensor(0.0082, grad_fn=<MseLossBackward>)
epoch:480training loss:tensor(0.0048, grad_fn=<MseLossBackward>)test loss:tensor(0.0082, grad_fn=<MseLossBackward>)
epoch:490training loss:tensor(0.0044, grad_fn=<MseLossBackward>)test loss:tensor(0.0077, grad_fn=<MseLossBackward>)
epoch:500training loss:tensor(0.0043, grad_fn=<MseLossBackward>)test loss:tensor(0.0076, grad_fn=<MseLossBackward>)
epoch:510training loss:tensor(0.0041, grad_fn=<MseLossBackward>)test loss:tensor(0.0073, grad_fn=<MseLossBackward>)
epoch:520training loss:tensor(0.0058, grad_fn=<MseLossBackward>)test loss:tensor(0.0088, grad_fn=<MseLossBackward>)
epoch:530training loss:tensor(0.0039, grad_fn=<MseLossBackward>)test loss:tensor(0.0074, grad_fn=<MseLossBackward>)
epoch:540training loss:tensor(0.0038, grad_fn=<MseLossBackward>)test loss:tensor(0.0068, grad_fn=<MseLossBackward>)
epoch:550training loss:tensor(0.0035, grad_fn=<MseLossBackward>)test loss:tensor(0.0067, grad_fn=<MseLossBackward>)
epoch:560training loss:tensor(0.0045, grad_fn=<MseLossBackward>)test loss:tensor(0.0081, grad_fn=<MseLossBackward>)
epoch:570training loss:tensor(0.0045, grad_fn=<MseLossBackward>)test loss:tensor(0.0079, grad_fn=<MseLossBackward>)
epoch:580training loss:tensor(0.0038, grad_fn=<MseLossBackward>)test loss:tensor(0.0066, grad_fn=<MseLossBackward>)
epoch:590training loss:tensor(0.0039, grad_fn=<MseLossBackward>)test loss:tensor(0.0070, grad_fn=<MseLossBackward>)
epoch:600training loss:tensor(0.0032, grad_fn=<MseLossBackward>)test loss:tensor(0.0063, grad_fn=<MseLossBackward>)
epoch:610training loss:tensor(0.0080, grad_fn=<MseLossBackward>)test loss:tensor(0.0119, grad_fn=<MseLossBackward>)
epoch:620training loss:tensor(0.0028, grad_fn=<MseLossBackward>)test loss:tensor(0.0063, grad_fn=<MseLossBackward>)
epoch:630training loss:tensor(0.0033, grad_fn=<MseLossBackward>)test loss:tensor(0.0058, grad_fn=<MseLossBackward>)
epoch:640training loss:tensor(0.0028, grad_fn=<MseLossBackward>)test loss:tensor(0.0060, grad_fn=<MseLossBackward>)
epoch:650training loss:tensor(0.0026, grad_fn=<MseLossBackward>)test loss:tensor(0.0056, grad_fn=<MseLossBackward>)
epoch:660training loss:tensor(0.0093, grad_fn=<MseLossBackward>)test loss:tensor(0.0141, grad_fn=<MseLossBackward>)
epoch:670training loss:tensor(0.0031, grad_fn=<MseLossBackward>)test loss:tensor(0.0080, grad_fn=<MseLossBackward>)
epoch:680training loss:tensor(0.0032, grad_fn=<MseLossBackward>)test loss:tensor(0.0067, grad_fn=<MseLossBackward>)
epoch:690training loss:tensor(0.0026, grad_fn=<MseLossBackward>)test loss:tensor(0.0058, grad_fn=<MseLossBackward>)
epoch:700training loss:tensor(0.0025, grad_fn=<MseLossBackward>)test loss:tensor(0.0053, grad_fn=<MseLossBackward>)
epoch:710training loss:tensor(0.0027, grad_fn=<MseLossBackward>)test loss:tensor(0.0058, grad_fn=<MseLossBackward>)
epoch:720training loss:tensor(0.0058, grad_fn=<MseLossBackward>)test loss:tensor(0.0074, grad_fn=<MseLossBackward>)
epoch:730training loss:tensor(0.0025, grad_fn=<MseLossBackward>)test loss:tensor(0.0051, grad_fn=<MseLossBackward>)
epoch:740training loss:tensor(0.0021, grad_fn=<MseLossBackward>)test loss:tensor(0.0050, grad_fn=<MseLossBackward>)
epoch:750training loss:tensor(0.0041, grad_fn=<MseLossBackward>)test loss:tensor(0.0070, grad_fn=<MseLossBackward>)
epoch:760training loss:tensor(0.0023, grad_fn=<MseLossBackward>)test loss:tensor(0.0056, grad_fn=<MseLossBackward>)
epoch:770training loss:tensor(0.0033, grad_fn=<MseLossBackward>)test loss:tensor(0.0052, grad_fn=<MseLossBackward>)
epoch:780training loss:tensor(0.0021, grad_fn=<MseLossBackward>)test loss:tensor(0.0049, grad_fn=<MseLossBackward>)
epoch:790training loss:tensor(0.0025, grad_fn=<MseLossBackward>)test loss:tensor(0.0052, grad_fn=<MseLossBackward>)
epoch:800training loss:tensor(0.0026, grad_fn=<MseLossBackward>)test loss:tensor(0.0061, grad_fn=<MseLossBackward>)
epoch:810training loss:tensor(0.0051, grad_fn=<MseLossBackward>)test loss:tensor(0.0093, grad_fn=<MseLossBackward>)
epoch:820training loss:tensor(0.0035, grad_fn=<MseLossBackward>)test loss:tensor(0.0064, grad_fn=<MseLossBackward>)
epoch:830training loss:tensor(0.0025, grad_fn=<MseLossBackward>)test loss:tensor(0.0054, grad_fn=<MseLossBackward>)
epoch:840training loss:tensor(0.0017, grad_fn=<MseLossBackward>)test loss:tensor(0.0047, grad_fn=<MseLossBackward>)
epoch:850training loss:tensor(0.0017, grad_fn=<MseLossBackward>)test loss:tensor(0.0046, grad_fn=<MseLossBackward>)
epoch:860training loss:tensor(0.0053, grad_fn=<MseLossBackward>)test loss:tensor(0.0107, grad_fn=<MseLossBackward>)
epoch:870training loss:tensor(0.0022, grad_fn=<MseLossBackward>)test loss:tensor(0.0048, grad_fn=<MseLossBackward>)
epoch:880training loss:tensor(0.0016, grad_fn=<MseLossBackward>)test loss:tensor(0.0052, grad_fn=<MseLossBackward>)
epoch:890training loss:tensor(0.0016, grad_fn=<MseLossBackward>)test loss:tensor(0.0047, grad_fn=<MseLossBackward>)
epoch:900training loss:tensor(0.0019, grad_fn=<MseLossBackward>)test loss:tensor(0.0046, grad_fn=<MseLossBackward>)
epoch:910training loss:tensor(0.0020, grad_fn=<MseLossBackward>)test loss:tensor(0.0049, grad_fn=<MseLossBackward>)
epoch:920training loss:tensor(0.0051, grad_fn=<MseLossBackward>)test loss:tensor(0.0078, grad_fn=<MseLossBackward>)
epoch:930training loss:tensor(0.0031, grad_fn=<MseLossBackward>)test loss:tensor(0.0053, grad_fn=<MseLossBackward>)
epoch:940training loss:tensor(0.0027, grad_fn=<MseLossBackward>)test loss:tensor(0.0053, grad_fn=<MseLossBackward>)
epoch:950training loss:tensor(0.0020, grad_fn=<MseLossBackward>)test loss:tensor(0.0052, grad_fn=<MseLossBackward>)
epoch:960training loss:tensor(0.0014, grad_fn=<MseLossBackward>)test loss:tensor(0.0054, grad_fn=<MseLossBackward>)
epoch:970training loss:tensor(0.0022, grad_fn=<MseLossBackward>)test loss:tensor(0.0043, grad_fn=<MseLossBackward>)
epoch:980training loss:tensor(0.0019, grad_fn=<MseLossBackward>)test loss:tensor(0.0049, grad_fn=<MseLossBackward>)
epoch:990training loss:tensor(0.0019, grad_fn=<MseLossBackward>)test loss:tensor(0.0048, grad_fn=<MseLossBackward>)
