{"id":8443,"date":"2019-11-05T12:06:44","date_gmt":"2019-11-05T03:06:44","guid":{"rendered":"http:\/\/www.gisdeveloper.co.kr\/?p=8443"},"modified":"2020-05-28T09:59:45","modified_gmt":"2020-05-28T00:59:45","slug":"%eb%94%a5%eb%9f%ac%eb%8b%9d-%ed%95%99%ec%8a%b5%eb%a0%a5-%ed%96%a5%ec%83%81%ec%9d%84-%ec%9c%84%ed%95%b4-%ea%b3%a0%eb%a0%a4%ed%95%a0-%ec%82%ac%ed%95%ad%eb%93%a4","status":"publish","type":"post","link":"http:\/\/www.gisdeveloper.co.kr\/?p=8443","title":{"rendered":"\ub525\ub7ec\ub2dd \ud559\uc2b5 \ud5a5\uc0c1\uc744 \uc704\ud55c \uace0\ub824 \uc0ac\ud56d\ub4e4"},"content":{"rendered":"<h3>1. \uac00\uc911\uce58 \uac10\uc18c(Weight Decay)\ub97c \ud1b5\ud55c \uac00\uc911\uce58 \uc815\ud615\ud654(Weight Regularization)<\/h3>\n<p>\uc190\uc2e4\ud568\uc218\uc5d0 \uc5b4\ub5a4 \uc81c\uc57d \uc870\uac74\uc744 \uc801\uc6a9\ud574 \uc624\ubc84\ud53c\ud305\uc744 \ucd5c\uc18c\ud654\ud558\ub294 \ubc29\ubc95\uc73c\ub85c L1 \uc815\ud615\ud654\uc640 L2 \uc815\ud615\ud654\uac00 \uc788\uc2b5\ub2c8\ub2e4. \uc624\ubc84\ud53c\ud305\uc740 \ud2b9\uc815 \uac00\uc911\uce58\uac12\uc774 \ucee4\uc9c8\uc218\ub85d \ubc1c\uc0dd\ud560 \uac00\ub2a5\uc131\uc774 \ub192\uc544\uc9c0\ubbc0\ub85c \uc774\ub97c \ud574\uc18c\ud558\uae30 \uc704\ud574 \ud2b9\uc815\uac12\uc744 \uc190\uc2e4\ud568\uc218\uc5d0 \ub354\ud574\uc8fc\ub294 \uac83\uc774 \uc815\ud615\ud654 \uc911 \uac00\uc911\uce58 \uac10\uc18c(Weight Decay)\uc774\uba70, \ub354\ud574\uc8fc\ub294 \ud2b9\uc815\uac12\uc744 \uacb0\uc815\ud558\ub294 \uac83\uc774 L1 \uc815\ud615\ud654\uc640 L2 \uc815\ud615\ud654\uc785\ub2c8\ub2e4. \ud30c\uc774\ud1a0\uce58\uc5d0\uc11c \uc774 Weight Decay\ub294 \ub2e4\uc74c \ucf54\ub4dc\ucc98\ub7fc \uc801\uc6a9\ud560 \uc218 \uc788\uc2b5\ub2c8\ub2e4.<\/p>\n<pre class=\"EnlighterJSRAW\" data-enlighter-language=\"python\">\r\noptimizer = torch.optim.SGD(model.parameters(), lr=learning_rate, weight_decay=0.1)\r\n<\/pre>\n<p>\uacb0\uacfc\uc801\uc73c\ub85c weight_decay\uc758 \uac12\uc774 \ucee4\uc9c8\uc218\ub85d \uac00\uc911\uce58 \uac12\uc774 \uc791\uc5b4\uc9c0\uac8c \ub418\uace0, \uc624\ubc84\ud53c\ud305 \ud604\uc0c1\uc744 \ud574\uc18c\ud560 \uc218 \uc788\uc9c0\ub9cc, weight_decay \uac12\uc744 \ub108\ubb34 \ud06c\uac8c \ud558\uba74 \uc5b8\ub354\ud53c\ud305 \ud604\uc0c1\uc774 \ubc1c\uc0dd\ud558\ubbc0\ub85c \uc801\ub2f9\ud55c \uac12\uc744 \uc0ac\uc6a9\ud574\uc57c \ud569\ub2c8\ub2e4.<\/p>\n<h3>2. \ub370\uc774\ud130 \uc99d\uac15(Data Augmentation)<\/h3>\n<p>\ud6c8\ub828 \ub370\uc774\ud130\ub97c \uc54c\uace0\ub9ac\uc998\uc5d0 \uc758\ud574 \uadf8 \uc218\ub97c \ub298\ub9ac\ub294 \ubc29\ubc95\uc73c\ub85c, \uc624\ubc84\ud53c\ud305 \ud574\uc18c\ub294 \ubb3c\ub860 \ud6c8\ub828 \ubc0f \ud14c\uc2a4\ud2b8 \ub370\uc774\ud130\uc5d0 \ub300\ud55c \uc815\ud655\ub3c4\ub97c \ub192\uc77c \uc218 \uc788\ub294 \ubc29\ubc95\uc785\ub2c8\ub2e4. \ub2e4\uc74c \ucf54\ub4dc\uc758 \uc608\ucc98\ub7fc \ub370\uc774\ud130\uc14b\uc5d0 \ub300\ud55c transform \uc778\uc790\uc5d0 \uc9c0\uc815\ud558\uc5ec \uc801\uc6a9\ud560 \uc218 \uc788\uc2b5\ub2c8\ub2e4.<\/p>\n<pre class=\"EnlighterJSRAW\" data-enlighter-language=\"python\">\r\nmnist_train = dset.MNIST(\r\n    '.\/', \r\n    train=True, \r\n    transform = transforms.Compose([\r\n        transforms.Resize(34),                        # \uc6d0\ub798 28x28\uc778 \uc774\ubbf8\uc9c0\ub97c 34x34\ub85c \ub298\ub9bd\ub2c8\ub2e4.\r\n        transforms.CenterCrop(28),                    # \uc911\uc559 28x28\ub97c \ubf51\uc544\ub0c5\ub2c8\ub2e4.\r\n        transforms.RandomHorizontalFlip(),            # \ub79c\ub364\ud558\uac8c \uc88c\uc6b0\ubc18\uc804 \ud569\ub2c8\ub2e4.\r\n        transforms.Lambda(lambda x: x.rotate(90)),    # \ub78c\ub2e4\ud568\uc218\ub97c \uc774\uc6a9\ud574 90\ub3c4 \ud68c\uc804\ud574\uc90d\ub2c8\ub2e4.\r\n        transforms.ToTensor(),                        # \uc774\ubbf8\uc9c0\ub97c \ud150\uc11c\ub85c \ubcc0\ud615\ud569\ub2c8\ub2e4.\r\n    ]),\r\n    target_transform=None,\r\n    download=True\r\n)\r\n<\/pre>\n<h3>3. \uac00\uc911\uce58 \ucd08\uae30\ud654(Weight Initialization)<\/h3>\n<p>\uc2e0\uacbd\ub9dd\uc774 \uae4a\uc5b4\uc9c8 \uc218\ub85d \uac01 \uc2e0\uacbd\ub9dd\uc758 \uac00\uc911\uce58\uac12\ub4e4\uc758 \ubd84\ud3ec\uac00 \ud55c\ucabd\uc73c\ub85c \uc3e0\ub9ac\uac70\ub098, \ud2b9\uc815 \uac12 \ubd80\ubd84\uc73c\ub85c \uc2ec\ud558\uac8c \ubaa8\uc77c \uc218 \uc788\ub294 \ud604\uc0c1\uc774 \ubc1c\uc0dd\ud569\ub2c8\ub2e4. \uc774\ub7f0 \ud604\uc0c1\uc774 \ubc1c\uc0dd\ud558\uba74 \uae30\uc6b8\uae30 \uc18c\uc2e4(Gradient Vanishing)\uc774 \ubc1c\uc0dd\ud560 \uc218 \uc788\uace0, \uc2e0\uacbd\ub9dd\uc758 \ud45c\ud604\ub825\uc5d0 \uc81c\ud55c\uc774 \uc0dd\uaca8 \uc2e0\uacbd\ub9dd\uc744 \uae4a\uac8c \uad6c\uc131\ud558\ub294 \uc758\ubbf8\uac00 \uc0ac\ub77c\uc9d1\ub2c8\ub2e4. \uc774\ub97c \uc704\ud574 \ud559\uc2b5\ud558\uae30 \uc804\uc5d0 \uac00\uc911\uce58\ub97c \uc801\ub2f9\ud558\uac8c \ucd08\uae30\ud558\ub294 \uac83\uc774 \ud544\uc694\ud569\ub2c8\ub2e4. \uc544\ub798\uc758 \ucf54\ub4dc\ub294 \ud30c\uc774\ud1a0\uce58\uc5d0\uc11c \ud754\ud788\ud558\uac8c \uac00\uc911\uce58\ub97c \ucd08\uae30\ud558\ub294 \ucf54\ub4dc\uc758 \uc608\uc785\ub2c8\ub2e4.<\/p>\n<pre class=\"EnlighterJSRAW\" data-enlighter-language=\"python\">\r\nclass aDNN(nn.Module):\r\n    def __init__(self):\r\n        super(aDNN,self).__init__()\r\n        self.layer = nn.Sequential(\r\n            # ...\r\n        )             \r\n        \r\n        for m in self.modules():\r\n            if isinstance(m, nn.Conv2d):\r\n                '''\r\n                m.weight.data.normal_(0.0, 0.1)     # \uac00\uc911\uce58\ub97c \ud3c9\uade0 0, \ud3b8\ucc28 0.1\ub85c \ucd08\uae30\ud654\r\n                m.bias.data.fill_(0)                # \ud3b8\ucc28\ub97c 0\uc73c\ub85c \ucd08\uae30\ud654\r\n                '''\r\n\r\n                '''\r\n                init.xavier_normal(m.weight.data)   # Xavier Initialization\r\n                m.bias.data.fill_(0)                # \ud3b8\ucc28\ub97c 0\uc73c\ub85c \ucd08\uae30\ud654 \r\n                '''\r\n\r\n                '''                \r\n                init.kaiming_normal_(m.weight.data) # Kaming He Initialization\r\n                m.bias.data.fill_(0)                # \ud3b8\ucc28\ub97c 0\uc73c\ub85c \ucd08\uae30\ud654 \r\n                '''\r\n            elif isinstance(m, nn.Linear):\r\n                # \uc704\uc758 \ucf54\ub4dc\uc640 \uc720\uc0ac\ud568\r\n<\/pre>\n<p>Xavier \ucd08\uae30\ud654\ub294 \ud65c\uc131\ud654\ud568\uc218\uac00 Sigmoid\ub098 Tanh\uc77c\ub54c \uc801\ub2f9\ud558\uba70, Kaming He \ucd08\uae30\ud654\ub294 \ud65c\uc131\ud654 \ud568\uc218\uac00 ReLU\uc77c\ub54c \uc801\ub2f9\ud569\ub2c8\ub2e4.<\/p>\n<h3>4. \ud559\uc2b5\ub960 \uc2a4\ucf00\uc974\ub7ec(Learning Rate Scheduler)<\/h3>\n<p>\ud559\uc2b5\uc774 \uc9c4\ud589\ub418\uba74\uc11c \ud559\uc2b5\ub960\uc744 \uadf8 \uc0c1\ud669\uc5d0 \ub9de\uac8c \uac00\ubcc0\uc801\uc73c\ub85c \uc801\ub2f9\ud558\uac8c \ubcc0\uacbd\ub420 \uc218 \uc788\ub2e4\uba74 \ub354 \ub0ae\uc740 \uc190\uc2e4\uac12\uc744 \uc5bb\uc744 \uc218 \uc788\uc2b5\ub2c8\ub2e4. \uc774\ub97c \uc704\ud574 \ud559\uc2b5\ub960\uc744 \uc2a4\ucf00\uc974\uc774 \ud544\uc694\ud569\ub2c8\ub2e4. \uc774\uc640 \uad00\ub828\ub41c \ucf54\ub4dc\ub294 \ub2e4\uc74c\uacfc \uac19\uc2b5\ub2c8\ub2e4.<\/p>\n<pre class=\"EnlighterJSRAW\" data-enlighter-language=\"python\">\r\n# \ud559\uc2b5\ub960 \uc2a4\ucf00\uc904\ub7ec\ub294 \uc635\ud2f0\ub9c8\uc774\uc838\ub97c \ud1b5\ud574 \uc801\uc6a9\ub41c\ub2e4.\r\noptimizer = torch.optim.SGD(model.parameters(), lr=0.01)\r\n\r\n# \uc9c0\uc815\ud55c \uc2a4\ud15d \ub2e8\uc704\ub85c \ud559\uc2b5\ub960\uc5d0 \uac10\ub9c8\ub97c \uacf1\ud574 \ud559\uc2b5\ub960\uc744 \uac10\uc18c\uc2dc\ud0a4\ub294 \ubc29\uc2dd\r\nscheduler = lr_scheduler.StepLR(optimizer, step_size=1, gamma= 0.99)       \r\n\r\n# \uc9c0\uc815\ud55c \uc2a4\ud15d \uc9c0\uc810(\uc608\uc2dc\uc5d0\uc11c\ub294 10,20,40)\ub9c8\ub2e4 \ud559\uc2b5\ub960\uc5d0 \uac10\ub9c8\ub97c \uacf1\ud574\uc918\uc11c \uac10\uc18c\uc2dc\ud0a4\ub294 \ubc29\uc2dd\r\nscheduler = lr_scheduler.MultiStepLR(optimizer, milestones=[10,20,40], gamma= 0.1)  \r\n\r\n# \ub9e4 epoch\ub9c8\ub2e4 \ud559\uc2b5\ub960\uc5d0 \uac10\ub9c8\ub97c \uacf1\ud574\uc90c\uc73c\ub85c\uc368 \uac10\uc18c\uc2dc\ud0a4\ub294 \ubc29\uc2dd\r\nscheduler = lr_scheduler.ExponentialLR(optimizer, gamma= 0.99)                             \r\n\r\n# \uc6d0\ud558\ub294 \uc5d0\ud3ed\ub9c8\ub2e4, \uc774\uc804 \ud559\uc2b5\ub960 \ub300\ube44 \ubcc0\uacbd\ud3ed\uc5d0 \ub530\ub77c \ud559\uc2b5\ub960\uc744 \uac10\uc18c\uc2dc\ucf1c\uc8fc\ub294 \ubc29\uc2dd\r\nscheduler = lr_scheduler.ReduceLROnPlateau(optimizer,threshold=1,patience=1,mode='min')\r\n<\/pre>\n<p>\uc704\uc758 \uc2a4\ucf00\uc904\ub7ec\ub97c \ud559\uc2b5\uc5d0 \uc801\uc6a9\ud560\ub54c \uc0ac\uc6a9\ubc29\ubc95\uc740 \ub098\ub258\ub294\ub370, StepLR, MultiStepLR, ExponentialLR\uc758 \uacbd\uc6b0\ub294 \uc544\ub798 \ucf54\ub4dc\ub97c \ucc38\uace0\ud558\uae30 \ubc14\ub78d\ub2c8\ub2e4.<\/p>\n<pre class=\"EnlighterJSRAW\" data-enlighter-language=\"python\">\r\nfor i in range(num_epoch):\r\n    scheduler.step() # !!\r\n\r\n    optimizer.zero_grad()\r\n    output = model.forward( .. )\r\n    loss = loss( .. )\r\n    loss.backward()\r\n    optimizer.step()\r\n<\/pre>\n<p>ReduceLRONPlateau\uc758 \uacbd\uc6b0\ub294 \uc544\ub798 \ucf54\ub4dc\ub97c \ucc38\uace0\ud558\uae30 \ubc14\ub78d\ub2c8\ub2e4.<\/p>\n<pre class=\"EnlighterJSRAW\" data-enlighter-language=\"python\">\r\nfor i in range(num_epoch):\r\n    optimizer.zero_grad()\r\n    output = model.forward( .. )\r\n    loss = loss( .. )\r\n    loss.backward()\r\n    optimizer.step()\r\n    \r\n    scheduler.step(loss) # !!  \r\n<\/pre>\n<h3>5. \ud559\uc2b5 \ub370\uc774\ud130\uc758 \uc815\uaddc\ud654(Data Normalization)<\/h3>\n<p>\uc785\ub825\ub418\ub294 \ub370\uc774\ud130\uc5d0 \ub300\ud574\uc11c \uacf5\uac04\uc0c1 \ubd84\ud3ec\ub97c \uc815\uaddc\ud654\uc2dc\ucf1c\uc8fc\uac8c \ub418\uba74, \ub354 \ub192\uc740 \uc815\ud655\ub3c4\ub97c \uc5bb\uc744 \uc218 \uc788\uac8c \ub429\ub2c8\ub2e4. \uc815\uaddc\ud654\uc758 \ubc29\ubc95\uc740 \uc804\uccb4 \ub370\uc774\ud130\uc5d0 \ub300\ud55c \ud3c9\uade0\uacfc \ud45c\uc900\ud3b8\ucc28\ub97c \uc774\uc6a9\ud558\ub294\ub370, \ub370\uc774\ud130\uc5d0 \ub300\ud574\uc11c \ud3c9\uade0\uc744 \ube7c\uace0 \ud45c\uc900\ud3b8\ucc28\ub85c \ub098\ub220\uc90d\ub2c8\ub2e4. \uc774\ub97c \uc704\ud55c \ucf54\ub4dc\uc758 \uc608\ub294 \uc544\ub798\uc640 \uac19\uc2b5\ub2c8\ub2e4.<\/p>\n<pre class=\"EnlighterJSRAW\" data-enlighter-language=\"python\">\r\nmnist_train = dset.MNIST(\r\n    \".\/\", \r\n    train=True, \r\n    transform=transforms.Compose([\r\n        transforms.ToTensor(),\r\n        transforms.Normalize(mean=(0.1307,), std=(0.3081,))\r\n    ]),\r\n    download=True\r\n)\r\n\r\nmnist_test = dset.MNIST(\r\n    \".\/\", \r\n    train=False, \r\n    transform=transforms.Compose([\r\n        transforms.ToTensor(),\r\n        transforms.Normalize(mean=(0.1307,), std=(0.3081,))\r\n    ]),\r\n    download=True)\r\n<\/pre>\n<p>\ub370\uc774\ud130\uc5d0 \ub300\ud55c \ud3c9\uade0 \ubc0f \ud45c\uc900\ud3b8\ucc28\ub97c \uc5bb\ub294 \uac83\uc740 \uc544\ub798\uc758 \uae00\uc744 \ucc38\uace0\ud558\uae30 \ubc14\ub78d\ub2c8\ub2e4.<\/p>\n<blockquote class=\"wp-embedded-content\" data-secret=\"30L1TeCKz9\"><p><a href=\"http:\/\/www.gisdeveloper.co.kr\/?p=8168\">\uc774\ubbf8\uc9c0 Dataset\uc5d0 \ub300\ud55c \ud3c9\uade0\uacfc \ud45c\uc900\ud3b8\ucc28 \uad6c\ud558\uae30<\/a><\/p><\/blockquote>\n<p><iframe loading=\"lazy\" class=\"wp-embedded-content\" sandbox=\"allow-scripts\" security=\"restricted\" style=\"position: absolute; clip: rect(1px, 1px, 1px, 1px);\" title=\"&#8220;\uc774\ubbf8\uc9c0 Dataset\uc5d0 \ub300\ud55c \ud3c9\uade0\uacfc \ud45c\uc900\ud3b8\ucc28 \uad6c\ud558\uae30&#8221; &#8212; GIS Developer\" src=\"http:\/\/www.gisdeveloper.co.kr\/?p=8168&#038;embed=true#?secret=VRmDXRWlk0#?secret=30L1TeCKz9\" data-secret=\"30L1TeCKz9\" width=\"525\" height=\"296\" frameborder=\"0\" marginwidth=\"0\" marginheight=\"0\" scrolling=\"no\"><\/iframe><\/p>\n<h3>6. \ub2e4\uc591\ud55c \uacbd\uc0ac\ud558\uac15\ubc95(Gradient Descent Variants)<\/h3>\n<p>\ucd5c\uc18c\uc758 \uc190\uc2e4\uac12\uc744 \ucc3e\uae30 \uc704\ud574 \uc190\uc2e4\ud568\uc218\uc758 \ubbf8\ubd84\uc73c\ub85c \uad6c\ud55c \uae30\uc6b8\uae30\ub97c \ub530\ub77c \uc774\ub3d9\ud558\uac8c \ub418\ub294\ub370, \uc774\ub3d9\ud558\ub294 \ubc29\uc2dd\uc5d0 \ub300\ud55c \uc120\ud0dd\uc5d0 \ub300\ud55c \uac83\uc785\ub2c8\ub2e4. SGD \ubc29\uc2dd, Adam \ubc29\uc2dd \ub4f1\uc774 \uc874\uc7ac\ud558\ub294\ub370 \uadf8\uc911 Adam\uc5d0 \ub300\ud55c \ud30c\uc774\ud1a0\uce58\uc758 \ucf54\ub4dc\ub294 \ub2e4\uc74c\uacfc \uac19\uc2b5\ub2c8\ub2e4.<\/p>\n<pre class=\"EnlighterJSRAW\" data-enlighter-language=\"python\">\r\noptimizer = torch.optim.Adam(model.parameters(), lr=learning_rate)\r\n<\/pre>\n<p>SGD\uc640 Adam \uc774\uc678\uc5d0\ub3c4 Momentum \ubc29\uc2dd\uacfc AdaGrad \ubc29\uc2dd\uc758 \uc788\uc73c\uba70, Adam\uc774 Momentum \ubc29\uc2dd\uacfc AdaGrad \ubc29\uc2dd\uc758 \uc7a5\uc810\uc744 \ud63c\ud569\ud55c \uac83\uc785\ub2c8\ub2e4.<\/p>\n<h3>7. \ubc30\uce58 \uc815\uaddc\ud654(Batch Normalization)<\/h3>\n<p>\uac01 \uc2e0\uacbd\ub9dd\uc758 \ud65c\uc131\ud654 \uac12 \ubd84\ud3ec\uac00 \uc801\ub2f9\ud788 \ud37c\uc9c0\ub3c4\ub85d \uac1c\uc120\ud558\uc5ec \uc6d0\ud560\ud55c \ud559\uc2b5\uc774 \uc9c4\ud589\ub418\ub3c4\ub85d \ub3d5\ub294 \uae30\ubc95\uc785\ub2c8\ub2e4. \ud559\uc2b5\uc18d\ub3c4\uac00 \ube68\ub77c\uc9c0\uace0, \uc55e\uc11c \uc5b8\uae09\ud55c \uac00\uc911\uce58 \ucd08\uae30\uac12 \uc124\uc815\uc5d0 \uc2e0\uacbd\uc4f8 \ud544\uc694\uac00 \uc5c6\uac8c \ub429\ub2c8\ub2e4. \ub610\ud558\ub294 \uc624\ubc84\ud53c\ud305\uc744 \uc5b5\uc81c\ud558\uac8c \ub418\uc5b4 \uac00\uc911\uce58 \uac10\uc18c \uae30\ubc95\uc774\ub098 \ub4dc\ub86d\uc544\uc6c3 \uae30\ubc95\uc758 \ud544\uc694\uc131\uc774 \uac10\uc18c\ud569\ub2c8\ub2e4. \uc774 \ubc30\uce58 \uc815\uaddc\ud654\ub294 \ubc30\uce58 \ub2e8\uc704\ub85c \uc785\ub825\ub418\ub294 \ub370\uc774\ud130\uc758 \uc5f0\uc0b0 \uacb0\uacfc\ub97c \ub2e4\uc2dc \uacb0\uacfc\uc758 \ud3c9\uade0\uacfc \ubd84\uc120\uc774 1\uc774 \ub418\ub3c4\ub85d \uc7ac\uac00\uacf5\ud569\ub2c8\ub2e4. \uadf8\ub9ac\uace0 \ub610 \ub2e4\uc2dc \ud2b9\uc815 \uac12\uc744 \uacf1\ud558\uace0 \ub610 \ub2e4\ub978 \ud2b9\uc815\uac12\uc744 \ub354\ud558\ub294 \uac04\ub2e8\ud55c Scaling \ubc0f Shifting \ucc98\ub9ac\uac00 \uc774\ub8e8\uc5b4\uc9d1\ub2c8\ub2e4. Scaling \ubc0f Shifting \ucc98\ub9ac\ub97c \uc704\ud55c 2\uac1c\uc758 \uac12\uc740 \ud559\uc2b5\uc744 \ud1b5\ud574 \uc0b0\ucd9c\ub429\ub2c8\ub2e4.<\/p>\n<p>\uc544\ub798\uc758 \ucf54\ub4dc\ub294 \ubc30\uce58 \uc815\uaddc\ud654\uc5d0 \ub300\ud55c \uc608\uc81c \ucf54\ub4dc\uc785\ub2c8\ub2e4.<\/p>\n<pre class=\"EnlighterJSRAW\" data-enlighter-language=\"python\">\r\nclass CNN(nn.Module):\r\n    def __init__(self):\r\n        super(CNN,self).__init__()\r\n        self.layer = nn.Sequential(\r\n            nn.Conv2d(1, 16, 3, padding=1),\r\n            nn.BatchNorm2d(16),\r\n            nn.ReLU(),\r\n            nn.Conv2d(16, 32, 3,padding=1),\r\n            nn.BatchNorm2d(32),\r\n            nn.ReLU(),\r\n            nn.MaxPool2d(2, 2),           \r\n            nn.Conv2d(32, 64, 3,padding=1),\r\n            nn.BatchNorm2d(64),\r\n            nn.ReLU(),\r\n            nn.MaxPool2d(2, 2)        \r\n        )\r\n        self.fc_layer = nn.Sequential(\r\n            nn.Linear(64*7*7, 128),\r\n            nn.BatchNorm1d(128),\r\n            nn.ReLU(),\r\n            nn.Linear(128, 64),\r\n            nn.BatchNorm1d(64),\r\n            nn.ReLU(),            \r\n            nn.Linear(64, 10),\r\n        )       \r\n\r\n    def forward(self,x):\r\n        out = self.layer(x)\r\n        out = out.view(batch_size, -1)\r\n        out = self.fc_layer(out)\r\n        return out\r\n<\/pre>\n<p>\ud559\uc2b5\uc774 \ub05d\ub098\uace0 \ud3c9\uac00 \uc2dc\uc5d0\ub294 \ubc18\ub4dc\uc2dc \uc544\ub798\uc758 \ucf54\ub4dc \ud638\ucd9c\uc774 \uc120\ud589\ub418\uc5b4\uc57c \ud569\ub2c8\ub2e4.<\/p>\n<pre class=\"EnlighterJSRAW\" data-enlighter-language=\"python\">\r\nmodel.eval()\r\n<\/pre>\n<h3>8. \ub4dc\ub86d\uc544\uc6c3(Drop Out)<\/h3>\n<p>\uc774 \uae30\ubc95\uc774 \uc801\uc6a9\ub418\uba74 \ud6c8\ub828 \ub370\uc774\ud130\uc5d0 \ub300\ud55c \uc815\ud655\ub3c4\uac00 \ub5a8\uc5b4\uc9c0\uc9c0\ub9cc \uc624\ubc84\ud53c\ud305\uc744 \uc5b5\uc81c\ud558\uae30 \uc704\ud55c \uae30\ubc95\uc785\ub2c8\ub2e4. \uc989, \ud2b9\uc815 \ud655\ub960\ub85c \uc2e0\uacbd\ub9dd\uc758 \ub274\ub7f0\uc744 \ube44\ud65c\uc131\ud654\uc2dc\ucf1c \uc5f0\uc0b0\uc5d0\uc11c \uc81c\uc678\uc2dc\ud0a4\ub294 \ubc29\uc2dd\uc785\ub2c8\ub2e4. \ub4dc\ub86d\uc544\uc6c3\uc5d0 \ub300\ud55c \ucf54\ub4dc \uc608\ub294 \ub2e4\uc74c\uacfc \uac19\uc2b5\ub2c8\ub2e4.<\/p>\n<pre class=\"EnlighterJSRAW\" data-enlighter-language=\"python\">\r\nlayer = nn.Sequential(\r\n     nn.Conv2d(1,16,3,padding=1),\r\n     nn.ReLU(),\r\n    nn.Dropout2d(0.2),\r\n    nn.Conv2d(16,32,3,padding=1),\r\n    nn.ReLU(),\r\n    nn.Dropout2d(0.2),\r\n    nn.MaxPool2d(2,2),\r\n    nn.Conv2d(32,64,3,padding=1),\r\n    nn.ReLU(),\r\n    nn.Dropout2d(0.2),\r\n    nn.MaxPool2d(2,2)\r\n)\r\n<\/pre>\n<p>\ud559\uc2b5\uc774 \ub05d\ub098\uace0 \ud3c9\uac00 \uc2dc\uc5d0\ub294 \ubc18\ub4dc\uc2dc \uc544\ub798\uc758 \ucf54\ub4dc \ud638\ucd9c\uc774 \uc120\ud589\ub418\uc5b4\uc57c \ud569\ub2c8\ub2e4.<\/p>\n<pre class=\"EnlighterJSRAW\" data-enlighter-language=\"python\">\r\nmodel.eval()\r\n<\/pre>\n","protected":false},"excerpt":{"rendered":"<p>1. \uac00\uc911\uce58 \uac10\uc18c(Weight Decay)\ub97c \ud1b5\ud55c \uac00\uc911\uce58 \uc815\ud615\ud654(Weight Regularization) \uc190\uc2e4\ud568\uc218\uc5d0 \uc5b4\ub5a4 \uc81c\uc57d \uc870\uac74\uc744 \uc801\uc6a9\ud574 \uc624\ubc84\ud53c\ud305\uc744 \ucd5c\uc18c\ud654\ud558\ub294 \ubc29\ubc95\uc73c\ub85c L1 \uc815\ud615\ud654\uc640 L2 \uc815\ud615\ud654\uac00 \uc788\uc2b5\ub2c8\ub2e4. \uc624\ubc84\ud53c\ud305\uc740 \ud2b9\uc815 \uac00\uc911\uce58\uac12\uc774 \ucee4\uc9c8\uc218\ub85d \ubc1c\uc0dd\ud560 \uac00\ub2a5\uc131\uc774 \ub192\uc544\uc9c0\ubbc0\ub85c \uc774\ub97c \ud574\uc18c\ud558\uae30 \uc704\ud574 \ud2b9\uc815\uac12\uc744 \uc190\uc2e4\ud568\uc218\uc5d0 \ub354\ud574\uc8fc\ub294 \uac83\uc774 \uc815\ud615\ud654 \uc911 \uac00\uc911\uce58 \uac10\uc18c(Weight Decay)\uc774\uba70, \ub354\ud574\uc8fc\ub294 \ud2b9\uc815\uac12\uc744 \uacb0\uc815\ud558\ub294 \uac83\uc774 L1 \uc815\ud615\ud654\uc640 L2 \uc815\ud615\ud654\uc785\ub2c8\ub2e4. \ud30c\uc774\ud1a0\uce58\uc5d0\uc11c \uc774 Weight Decay\ub294 \ub2e4\uc74c \ucf54\ub4dc\ucc98\ub7fc \uc801\uc6a9\ud560 &hellip; <\/p>\n<p class=\"link-more\"><a href=\"http:\/\/www.gisdeveloper.co.kr\/?p=8443\" class=\"more-link\">\ub354 \ubcf4\uae30<span class=\"screen-reader-text\"> &#8220;\ub525\ub7ec\ub2dd \ud559\uc2b5 \ud5a5\uc0c1\uc744 \uc704\ud55c \uace0\ub824 \uc0ac\ud56d\ub4e4&#8221;<\/span><\/a><\/p>\n","protected":false},"author":1,"featured_media":0,"comment_status":"open","ping_status":"open","sticky":false,"template":"","format":"standard","meta":{"footnotes":""},"categories":[131,132],"tags":[],"class_list":["post-8443","post","type-post","status-publish","format-standard","hentry","category-python","category-deep-machine-learning"],"_links":{"self":[{"href":"http:\/\/www.gisdeveloper.co.kr\/index.php?rest_route=\/wp\/v2\/posts\/8443","targetHints":{"allow":["GET"]}}],"collection":[{"href":"http:\/\/www.gisdeveloper.co.kr\/index.php?rest_route=\/wp\/v2\/posts"}],"about":[{"href":"http:\/\/www.gisdeveloper.co.kr\/index.php?rest_route=\/wp\/v2\/types\/post"}],"author":[{"embeddable":true,"href":"http:\/\/www.gisdeveloper.co.kr\/index.php?rest_route=\/wp\/v2\/users\/1"}],"replies":[{"embeddable":true,"href":"http:\/\/www.gisdeveloper.co.kr\/index.php?rest_route=%2Fwp%2Fv2%2Fcomments&post=8443"}],"version-history":[{"count":21,"href":"http:\/\/www.gisdeveloper.co.kr\/index.php?rest_route=\/wp\/v2\/posts\/8443\/revisions"}],"predecessor-version":[{"id":9355,"href":"http:\/\/www.gisdeveloper.co.kr\/index.php?rest_route=\/wp\/v2\/posts\/8443\/revisions\/9355"}],"wp:attachment":[{"href":"http:\/\/www.gisdeveloper.co.kr\/index.php?rest_route=%2Fwp%2Fv2%2Fmedia&parent=8443"}],"wp:term":[{"taxonomy":"category","embeddable":true,"href":"http:\/\/www.gisdeveloper.co.kr\/index.php?rest_route=%2Fwp%2Fv2%2Fcategories&post=8443"},{"taxonomy":"post_tag","embeddable":true,"href":"http:\/\/www.gisdeveloper.co.kr\/index.php?rest_route=%2Fwp%2Fv2%2Ftags&post=8443"}],"curies":[{"name":"wp","href":"https:\/\/api.w.org\/{rel}","templated":true}]}}