10月, 2018 | 個人用メモ帳

2018年10月7日2018年10月7日

PyTorch の動作確認をしてみた（７）

1. 環境は、Windows 10 Home (64bit) 上で行った。

2. Anaconda3 (64bit) – Spyder上で、動作確認を行った。

3. python のバージョンは、python 3.6.5 である。

4. pytorch のバージョンは、pytorch 0.4.1 である。

5. GPU は, NVIDIA社の GeForce GTX 1050 である。

6. CPU は, Intel社の Core(TM) i7-7700HQ である。

今回確認した内容は、現場で使える! PyTorch開発入門深層学習モデルの作成とアプリケーションへの実装 (AI & TECHNOLOGY) の 4.2.2 CNNの構築と学習(P.067 – P.071) である。
前回に引き続き, Fashion-MNIST を使った, CNN の画像分類について, 少し動作確認を行った.
前回の課題として, 書籍上には, 正誤判定の結果に関する, 具体的な情報が未記載だったので, 今回は, 実際に, 画像を出力させるようにプログラムを書き換えて確認することになった.

※プログラムの詳細は、書籍を参考(P.067 – P.071)にして下さい。

■Fashion-MNISTの学習(正誤判定の画像出力版).

# -*- coding: utf-8 -*-
# tqdm を 下記コマンドで, install.
# conda install -c conda-forge tqdm
# 1. library import.
from __future__ import print_function
import torch
import torchvision
from torchvision.datasets import FashionMNIST
from torchvision import transforms
from torch.utils.data import DataLoader
import os, time
from torch import nn, optim
from tqdm import tqdm
import numpy as np
import matplotlib.pyplot as plt

# 2. declare functions.
# 2-1. display image function.
def imshow(inp, title=None,
           mean=(0.485, 0.456, 0.406), std=(0.229, 0.224, 0.225)):
    """Draw a channel-first image tensor on the current matplotlib axes.

    The tensor is copied to host memory, rearranged from (C, H, W) to
    (H, W, C), de-normalized as ``std * inp + mean`` and clipped to [0, 1]
    before it is passed to ``plt.imshow``.

    Args:
        inp: 3-D image tensor laid out as (C, H, W), for example the result
            of ``torchvision.utils.make_grid``.
        title: Optional axes title; no title is set when ``None``.
        mean: Per-channel offset added after scaling.
        std: Per-channel scale applied before ``mean`` is added.

    Note:
        The default ``mean``/``std`` only reproduce the original pixel values
        when the data was normalized with the same numbers.
        NOTE(review): if the dataset transform does not normalize, call this
        with ``mean=0, std=1`` - confirm against the transform in use.
    """
    # detach() + cpu() make tensors that track gradients or live on a GPU
    # convertible; for a plain CPU tensor they change nothing.
    img = inp.detach().cpu().numpy().transpose((1, 2, 0))
    img = np.asarray(std) * img + np.asarray(mean)
    img = np.clip(img, 0, 1)
    plt.axis('off')
    plt.imshow(img)
    if title is not None:
        plt.title(title)

# 2-2. A layer that flattens a Tensor of shape (N, C, H, W) to (N, C * H * W).
# required to pass the output of convolution layer to MLP.
class FlattenLayer(nn.Module):
    """Collapse every dimension after the first into a single one."""

    def forward(self, x):
        """Return ``x`` viewed as (x.size(0), -1)."""
        leading = x.size(0)
        return x.view(leading, -1)

～(略)～

# 2-4. eval helper function.
def eval_net(net, data_loader, device="cpu"):
    # invalidate Dropout and BatchNorm.
～(略)～
    # a = [1, 2, 3, 4, 5]
    # b = [1, 3, 4, 3, 5]
    # c = [i for i, j in zip(a, b) if i == j]
    # print(c) # [1, 5]
    # [index, i, j] は, 誤検知画像のindex, 正解ラベル, 予測ラベル の意味.
    correct, wrong = [], []
    for index, (i, j) in enumerate(zip(ys, ypreds)):
        if i == j:
            correct.append([index, i, j])
        else:
            wrong.append([index, i, j])
    return acc.item(), correct, wrong
    

～(略)～

# 2-5. train net helper function.
def train_net(net, train_loader, test_loader, optimizer_cls=optim.Adam, 
              loss_fn=nn.CrossEntropyLoss(), n_iter=10, device="cpu"):
    train_losses, train_acc, val_acc = [], [], []
    optimizer = optimizer_cls(net.parameters())
    correct_list, wrong_list = [], []
～(略)～
        e = eval_net(net, test_loader, device)
        val_acc.append(e[0])
        if epoch + 1 == n_iter:
            correct_list.append(e[1])
            wrong_list.append(e[2])
        print(epoch, train_losses[-1], train_acc[-1], val_acc[-1], flush=True)
    return correct_list, wrong_list


～(略)～

# 5. execute training.
net.to("cuda:0")
correct_list, wrong_list = train_net(net, train_loader, test_loader, n_iter=1, device="cuda:0")

# 6. display processing time.
# The clock is stopped here, so the plotting below is not part of the
# elapsed time that is printed at the end.
end = time.time()


def stack_first_channel(dataset, indexes):
    """Stack channel 0 of the images found at ``indexes`` of ``dataset``.

    Each ``dataset[i]`` is expected to be an ``(image, label)`` pair whose
    image is a (C, H, W) tensor; the result is (len(indexes), 1, H, W).
    """
    # image[0][None, :, :] turns (H, W) back into (1, H, W).
    return torch.stack([dataset[index][0][0][None, :, :] for index in indexes])


# The images are taken from the dataset behind test_loader rather than from
# its first mini-batch: a mini-batch holds only batch_size images, so any
# index beyond it could not be found there.
# NOTE(review): assumes the indexes returned by train_net are positions in
# test_loader.dataset (i.e. test_loader does not shuffle) - confirm.
test_dataset = test_loader.dataset

print('--- display 9 wrong answers ------------------------------------------')
# Each entry is [index, correct label, predicted label].
print(wrong_list[0][0:9])
indexes_for_wrong_list_image = [x[0] for x in wrong_list[0][0:9]]
print(str(indexes_for_wrong_list_image)) # ex. [17, 23, 40, 42, 46, 49, 68, 74, 98]
if indexes_for_wrong_list_image:  # torch.stack raises on an empty list
    wrong_images_list = stack_first_channel(test_dataset, indexes_for_wrong_list_image)
    print(wrong_images_list.size()) # torch.Size([9, 1, 28, 28])
    wrong_images = torchvision.utils.make_grid(wrong_images_list, nrow=3, padding=1)
    plt.subplot(121)
    plt.title('wrong')
    imshow(wrong_images)

print('--- display 9 correct answers ----------------------------------------')
print(correct_list[0][0:9])
indexes_for_correct_list_image = [x[0] for x in correct_list[0][0:9]]
print(str(indexes_for_correct_list_image)) # ex. [0, 1, 2, 3, 4, 5, 6, 7, 8]
if indexes_for_correct_list_image:  # torch.stack raises on an empty list
    correct_images_list = stack_first_channel(test_dataset, indexes_for_correct_list_image)
    correct_images = torchvision.utils.make_grid(correct_images_list, nrow=3, padding=1)
    plt.subplot(122)
    plt.title('correct')
    imshow(correct_images)

print('--------------------------------------------------')
print('Elapsed Time: ' + str(end - start) + "[sec]")

100

101

102

103

104

105

106

107

108

109

110

111

112

113

114

115

116

117

118

119

120

121

122

123

124

125

126

127

128

129

130

131

132

133

134

135

136

# -*- coding: utf-8 -*-

# tqdm を下記コマンドで, install.

# conda install -c conda-forge tqdm

# 1. library import.

from __future__ import print_function

import torch

import torchvision

from torchvision.datasets import FashionMNIST

from torchvision import transforms

from torch.utils.data import DataLoader

import os, time

from torch import nn, optim

from tqdm import tqdm

import numpy as np

import matplotlib.pyplot as plt

# 2. declare functions.

# 2-1. display image function.

def imshow(inp, title=None,
           mean=(0.485, 0.456, 0.406), std=(0.229, 0.224, 0.225)):
    """Draw a channel-first image tensor on the current matplotlib axes.

    The tensor is copied to host memory, rearranged from (C, H, W) to
    (H, W, C), de-normalized as ``std * inp + mean`` and clipped to [0, 1]
    before it is passed to ``plt.imshow``.

    Args:
        inp: 3-D image tensor laid out as (C, H, W), for example the result
            of ``torchvision.utils.make_grid``.
        title: Optional axes title; no title is set when ``None``.
        mean: Per-channel offset added after scaling.
        std: Per-channel scale applied before ``mean`` is added.

    Note:
        The default ``mean``/``std`` only reproduce the original pixel values
        when the data was normalized with the same numbers.
        NOTE(review): if the dataset transform does not normalize, call this
        with ``mean=0, std=1`` - confirm against the transform in use.
    """
    # detach() + cpu() make tensors that track gradients or live on a GPU
    # convertible; for a plain CPU tensor they change nothing.
    img = inp.detach().cpu().numpy().transpose((1, 2, 0))
    img = np.asarray(std) * img + np.asarray(mean)
    img = np.clip(img, 0, 1)
    plt.axis('off')
    plt.imshow(img)
    if title is not None:
        plt.title(title)

# 2-2. A layer that flattens a Tensor of shape (N, C, H, W) to (N, C * H * W).

# required to pass the output of convolution layer to MLP.

class FlattenLayer(nn.Module):
    """Collapse every dimension after the first into a single one."""

    def forward(self, x):
        """Return ``x`` viewed as (x.size(0), -1)."""
        sizes = x.size()
        return x.view(sizes[0], -1)

～(略)～

# 2-4. eval helper function.

def eval_net(net, data_loader, device="cpu"):

# invalidate Dropout and BatchNorm.

～(略)～

# a = [1, 2, 3, 4, 5]

# b = [1, 3, 4, 3, 5]

# c = [i for i, j in zip(a, b) if i == j]

# print(c) # [1, 5]

# [index, i, j] は, 誤検知画像のindex, 正解ラベル, 予測ラベルの意味.

correct, wrong = [], []

for index, (i, j) in enumerate(zip(ys, ypreds)):

if i == j:

correct.append([index, i, j])

else:

wrong.append([index, i, j])

return acc.item(), correct, wrong

～(略)～

# 2-5. train net helper function.

def train_net(net, train_loader, test_loader, optimizer_cls=optim.Adam,

loss_fn=nn.CrossEntropyLoss(), n_iter=10, device="cpu"):

train_losses, train_acc, val_acc = [], [], []

optimizer = optimizer_cls(net.parameters())

correct_list, wrong_list = [], []

～(略)～

e = eval_net(net, test_loader, device)

val_acc.append(e[0])

if epoch + 1 == n_iter:

correct_list.append(e[1])

wrong_list.append(e[2])

print(epoch, train_losses[-1], train_acc[-1], val_acc[-1], flush=True)

return correct_list, wrong_list

～(略)～

# 5. execute training.
net.to("cuda:0")
correct_list, wrong_list = train_net(net, train_loader, test_loader, n_iter=1, device="cuda:0")

# 6. display processing time.
# The clock is stopped here, so the plotting below is not part of the
# elapsed time that is printed at the end.
end = time.time()


def stack_first_channel(dataset, indexes):
    """Stack channel 0 of the images found at ``indexes`` of ``dataset``.

    Each ``dataset[i]`` is expected to be an ``(image, label)`` pair whose
    image is a (C, H, W) tensor; the result is (len(indexes), 1, H, W).
    """
    # image[0][None, :, :] turns (H, W) back into (1, H, W).
    return torch.stack([dataset[index][0][0][None, :, :] for index in indexes])


# The images are taken from the dataset behind test_loader rather than from
# its first mini-batch: a mini-batch holds only batch_size images, so any
# index beyond it could not be found there.
# NOTE(review): assumes the indexes returned by train_net are positions in
# test_loader.dataset (i.e. test_loader does not shuffle) - confirm.
test_dataset = test_loader.dataset

print('--- display 9 wrong answers ------------------------------------------')
# Each entry is [index, correct label, predicted label].
print(wrong_list[0][0:9])
indexes_for_wrong_list_image = [x[0] for x in wrong_list[0][0:9]]
print(str(indexes_for_wrong_list_image)) # ex. [17, 23, 40, 42, 46, 49, 68, 74, 98]
if indexes_for_wrong_list_image:  # torch.stack raises on an empty list
    wrong_images_list = stack_first_channel(test_dataset, indexes_for_wrong_list_image)
    print(wrong_images_list.size()) # torch.Size([9, 1, 28, 28])
    wrong_images = torchvision.utils.make_grid(wrong_images_list, nrow=3, padding=1)
    plt.subplot(121)
    plt.title('wrong')
    imshow(wrong_images)

print('--- display 9 correct answers ----------------------------------------')
print(correct_list[0][0:9])
indexes_for_correct_list_image = [x[0] for x in correct_list[0][0:9]]
print(str(indexes_for_correct_list_image)) # ex. [0, 1, 2, 3, 4, 5, 6, 7, 8]
if indexes_for_correct_list_image:  # torch.stack raises on an empty list
    correct_images_list = stack_first_channel(test_dataset, indexes_for_correct_list_image)
    correct_images = torchvision.utils.make_grid(correct_images_list, nrow=3, padding=1)
    plt.subplot(122)
    plt.title('correct')
    imshow(correct_images)

print('--------------------------------------------------')
print('Elapsed Time: ' + str(end - start) + "[sec]")

■実行結果(epoch = 1).

100%|██████████| 469/469 [00:10<00:00, 46.54it/s]
0 0.46340912513625926 0.8374666666666667 0.8877999782562256
--- display 9 wrong answers ------------------------------------------
[[12, tensor(7, device='cuda:0'), tensor(5, device='cuda:0')], [17, tensor(4, device='cuda:0'), tensor(2, device='cuda:0')], [23, tensor(9, device='cuda:0'), tensor(5, device='cuda:0')], [25, tensor(4, device='cuda:0'), tensor(6, device='cuda:0')], [42, tensor(3, device='cuda:0'), tensor(6, device='cuda:0')], [46, tensor(2, device='cuda:0'), tensor(6, device='cuda:0')], [49, tensor(2, device='cuda:0'), tensor(6, device='cuda:0')], [57, tensor(4, device='cuda:0'), tensor(6, device='cuda:0')], [66, tensor(2, device='cuda:0'), tensor(6, device='cuda:0')]]
[12, 17, 23, 25, 42, 46, 49, 57, 66]
torch.Size([9, 1, 28, 28])
--- display 9 correct answers ----------------------------------------
[[0, tensor(9, device='cuda:0'), tensor(9, device='cuda:0')], [1, tensor(2, device='cuda:0'), tensor(2, device='cuda:0')], [2, tensor(1, device='cuda:0'), tensor(1, device='cuda:0')], [3, tensor(1, device='cuda:0'), tensor(1, device='cuda:0')], [4, tensor(6, device='cuda:0'), tensor(6, device='cuda:0')], [5, tensor(1, device='cuda:0'), tensor(1, device='cuda:0')], [6, tensor(4, device='cuda:0'), tensor(4, device='cuda:0')], [7, tensor(6, device='cuda:0'), tensor(6, device='cuda:0')], [8, tensor(5, device='cuda:0'), tensor(5, device='cuda:0')]]
[0, 1, 2, 3, 4, 5, 6, 7, 8]
--------------------------------------------------
Elapsed Time: 12.64216923713684[sec]

100%|██████████| 469/469 [00:10<00:00, 46.54it/s]

0 0.46340912513625926 0.8374666666666667 0.8877999782562256

--- display 9 wrong answers ------------------------------------------

[[12, tensor(7, device='cuda:0'), tensor(5, device='cuda:0')], [17, tensor(4, device='cuda:0'), tensor(2, device='cuda:0')], [23, tensor(9, device='cuda:0'), tensor(5, device='cuda:0')], [25, tensor(4, device='cuda:0'), tensor(6, device='cuda:0')], [42, tensor(3, device='cuda:0'), tensor(6, device='cuda:0')], [46, tensor(2, device='cuda:0'), tensor(6, device='cuda:0')], [49, tensor(2, device='cuda:0'), tensor(6, device='cuda:0')], [57, tensor(4, device='cuda:0'), tensor(6, device='cuda:0')], [66, tensor(2, device='cuda:0'), tensor(6, device='cuda:0')]]

[12, 17, 23, 25, 42, 46, 49, 57, 66]

torch.Size([9, 1, 28, 28])

--- display 9 correct answers ----------------------------------------

[[0, tensor(9, device='cuda:0'), tensor(9, device='cuda:0')], [1, tensor(2, device='cuda:0'), tensor(2, device='cuda:0')], [2, tensor(1, device='cuda:0'), tensor(1, device='cuda:0')], [3, tensor(1, device='cuda:0'), tensor(1, device='cuda:0')], [4, tensor(6, device='cuda:0'), tensor(6, device='cuda:0')], [5, tensor(1, device='cuda:0'), tensor(1, device='cuda:0')], [6, tensor(4, device='cuda:0'), tensor(4, device='cuda:0')], [7, tensor(6, device='cuda:0'), tensor(6, device='cuda:0')], [8, tensor(5, device='cuda:0'), tensor(5, device='cuda:0')]]

[0, 1, 2, 3, 4, 5, 6, 7, 8]

--------------------------------------------------

Elapsed Time: 12.64216923713684[sec]

■実行結果(epoch = 3).

100%|██████████| 469/469 [00:10<00:00, 44.76it/s]
0 0.4758336953500397 0.83515 0.8811999559402466
100%|██████████| 469/469 [00:09<00:00, 48.26it/s]
1 0.31819574741853607 0.8837833333333334 0.8960999846458435
100%|██████████| 469/469 [00:09<00:00, 48.05it/s]
2 0.2854099352326658 0.8958166666666667 0.899899959564209
--- display 9 wrong answers ------------------------------------------
[[17, tensor(4, device='cuda:0'), tensor(6, device='cuda:0')], [23, tensor(9, device='cuda:0'), tensor(5, device='cuda:0')], [25, tensor(4, device='cuda:0'), tensor(6, device='cuda:0')], [42, tensor(3, device='cuda:0'), tensor(6, device='cuda:0')], [43, tensor(7, device='cuda:0'), tensor(9, device='cuda:0')], [49, tensor(2, device='cuda:0'), tensor(6, device='cuda:0')], [66, tensor(2, device='cuda:0'), tensor(3, device='cuda:0')], [67, tensor(3, device='cuda:0'), tensor(4, device='cuda:0')], [68, tensor(9, device='cuda:0'), tensor(7, device='cuda:0')]]
[17, 23, 25, 42, 43, 49, 66, 67, 68]
torch.Size([9, 1, 28, 28])
--- display 9 correct answers ----------------------------------------
[[0, tensor(9, device='cuda:0'), tensor(9, device='cuda:0')], [1, tensor(2, device='cuda:0'), tensor(2, device='cuda:0')], [2, tensor(1, device='cuda:0'), tensor(1, device='cuda:0')], [3, tensor(1, device='cuda:0'), tensor(1, device='cuda:0')], [4, tensor(6, device='cuda:0'), tensor(6, device='cuda:0')], [5, tensor(1, device='cuda:0'), tensor(1, device='cuda:0')], [6, tensor(4, device='cuda:0'), tensor(4, device='cuda:0')], [7, tensor(6, device='cuda:0'), tensor(6, device='cuda:0')], [8, tensor(5, device='cuda:0'), tensor(5, device='cuda:0')]]
[0, 1, 2, 3, 4, 5, 6, 7, 8]
--------------------------------------------------
Elapsed Time: 37.92949438095093[sec]

100%|██████████| 469/469 [00:10<00:00, 44.76it/s]

0 0.4758336953500397 0.83515 0.8811999559402466

100%|██████████| 469/469 [00:09<00:00, 48.26it/s]

1 0.31819574741853607 0.8837833333333334 0.8960999846458435

100%|██████████| 469/469 [00:09<00:00, 48.05it/s]

2 0.2854099352326658 0.8958166666666667 0.899899959564209

--- display 9 wrong answers ------------------------------------------

[[17, tensor(4, device='cuda:0'), tensor(6, device='cuda:0')], [23, tensor(9, device='cuda:0'), tensor(5, device='cuda:0')], [25, tensor(4, device='cuda:0'), tensor(6, device='cuda:0')], [42, tensor(3, device='cuda:0'), tensor(6, device='cuda:0')], [43, tensor(7, device='cuda:0'), tensor(9, device='cuda:0')], [49, tensor(2, device='cuda:0'), tensor(6, device='cuda:0')], [66, tensor(2, device='cuda:0'), tensor(3, device='cuda:0')], [67, tensor(3, device='cuda:0'), tensor(4, device='cuda:0')], [68, tensor(9, device='cuda:0'), tensor(7, device='cuda:0')]]

[17, 23, 25, 42, 43, 49, 66, 67, 68]

torch.Size([9, 1, 28, 28])

--- display 9 correct answers ----------------------------------------

[0, 1, 2, 3, 4, 5, 6, 7, 8]

--------------------------------------------------

Elapsed Time: 37.92949438095093[sec]

■以上の実行結果から, 以下のことが分かった.
① 例えば, epoch = 1 の場合, Fashion-MNIST のテスト画像の (index的に)12番目について,
“Sandal” と予想(tensor(5, device='cuda:0')) したが, “Sneaker” が正解(tensor(7, device='cuda:0')) との情報が得られた.

② また, 例えば, epoch = 3 の場合, Fashion-MNIST のテスト画像の (index的に)25番目について,
“Shirt” と予想(tensor(6, device='cuda:0')) したが, “Coat” が正解(tensor(4, device='cuda:0')) との情報が得られた.

③ なお, epoch = 1, 3 のいずれも, (index的に)0～8番目について, 予想と正解が一致しているとの情報が得られた.

■参照サイト
Adding a dimension to a tensor in PyTorch.
How to turn a list of tensor to tensor?
Fashion-MNIST

■参考書籍
現場で使える! PyTorch開発入門深層学習モデルの作成とアプリケーションへの実装 (AI & TECHNOLOGY)

2018年10月7日2018年10月7日

C++ の動作確認をしてみた（２４）

C++の練習を兼ねて, AtCoder Beginner Contest 112 の問題C（Pyramid), 問題D（Partition) を解いてみた.

■感想.
1. 問題D は, 時間内で, テストケース C030_scrambled を除いて, 通過したが, ロジック修正を, 自力で出来なかったため, コンテスト終了後, 解説を見て, ロジック修正した.
2. 問題C は, 時間内で, 外枠だけコーディングしたが, 問題の意図を理解できなかったので, コンテスト終了後, 再度解き直した.
3. 問題C は, テストケース in04.txt, in06.txt, in20.txt の Wrong Answer を, 解説見ても, 自力で修正できなかったので, 正解者のコーディングを参照したところ, N個のピラミッド情報で, ピラミッド高度に関する降順 sort が, 必要なことが分かった(※初回取得で, 高度 0 を取得させないようにするため)ので, ロジック修正した.
4. 個人的には, ここ最近, ABCコンテストの難易度が, かなり上昇気味に感じた, 復習がかなり大変となっている模様(汗).

本家のサイトABC 112 解説をご覧下さい.

■C++版プログラム(問題C).

// 解き直し.
// ABC 112 解説.
// https://img.atcoder.jp/abc112/editorial.pdf
#include <bits/stdc++.h>

using namespace std;

typedef long long LL;

#define FOR(i, a, b) for(int i = (a); i < (b); ++i)

// One input record: main() reads the three fields in the order x, y, h.
struct pyramid {
    int x;    // x-coordinate of the pyramid.
    int y;    // y-coordinate of the pyramid.
    LL  h;    // altitude of the pyramid.
};

int main() {

    // 1. Read the N records (x, y, h).
    int N;
    cin >> N;
    vector<pyramid> v;
    FOR(i, 0, N) {
        pyramid p;
        cin >> p.x >> p.y >> p.h;
        v.push_back(p);
    }

    // 2. Sort the records by altitude, highest first.
    // Step 3-1 reconstructs the candidate peak height from the first record.
    // That is only valid when the record has h > 0: step 3-2 clamps
    // altitudes at 0, so a record with h == 0 does not pin down the peak.
    sort(v.begin(), v.end(), [](const pyramid& x, const pyramid& y) {return x.h > y.h;});

    // 3. Brute-force the centre: try every (pCx, pCy) in [0, 100] x [0, 100].
    int cx = 0;
    int cy = 0;
    LL  h  = 0LL;
    bool found = false;
    FOR(pCx, 0, 101) {
        FOR(pCy, 0, 101) {
            bool isCenter = true;
            LL lh = -1LL;   // candidate peak height; -1 means "not derived yet".
            for (auto &p : v) {
                // 3-1. Derive the candidate peak height from the first record.
                if(lh == -1LL) {
                    lh = p.h + abs(p.x - pCx) + abs(p.y - pCy);
                    continue;
                }

                // 3-2. Every other record must match the altitude this
                // candidate predicts: max(lh - |x - pCx| - |y - pCy|, 0).
                LL lh2 = max(lh - abs(p.x - pCx) - abs(p.y - pCy), 0LL);
                if(p.h != lh2) {
                    isCenter = false;
                    break;
                }
            }

            // 3-3. Keep the accepted centre and its height.
            if(isCenter) {
                cx = pCx;
                cy = pCy;
                h  = lh;
                found = true;
                break;
            }
        }
        // The break above only leaves the pCy loop. Stop the pCx loop as
        // well, so the accepted centre is not overwritten by a later
        // candidate and no further candidates are scanned.
        if(found) break;
    }

    // 4. Output.
    cout << cx << " " << cy << " " << h << endl;
    return 0;

}

// 解き直し.

// ABC 112 解説.

// https://img.atcoder.jp/abc112/editorial.pdf

#include <bits/stdc++.h>

using namespace std;

typedef long long LL;

#define FOR(i, a, b) for(int i = (a); i < (b); ++i)

// One input record: main() reads the three fields in the order x, y, h.
struct pyramid {

int x; // x-coordinate of the pyramid.

int y; // y-coordinate of the pyramid.

LL h; // altitude of the pyramid.

};

int main() {

// 1. 入力情報取得.

int N;

cin >> N;

vector<pyramid> v;

FOR(i, 0, N) {

pyramid p;

cin >> p.x >> p.y >> p.h;

v.push_back(p);

}

// 2. ピラミッドの高度に関して, 降順sort のロジック追加.

// テストケース in04.txt, in06.txt, in20.txt の Wrong Answer を, 自力で修正できなかったので,

// 正解者のコーディングを参照したところ, 下記 3-1. のロジックで,

// ピラミッドの高度が 0 より大きいものが取れている必要があるとの情報が得られたため.

sort(v.begin(), v.end(), [](const pyramid& x, const pyramid& y) {return x.h > y.h;});

// 3. ピラミッド中心座標を計算.

// 中心が, (pCx, pCy) だったとして, 全部調査してみる.

int cx = 0;

int cy = 0;

LL h = 0LL;

FOR(pCx, 0, 101) {

FOR(pCy, 0, 101) {

bool isCenter = true;

LL lh = -1LL;

for (auto &p : v) {

// 3-1. とりあえず, 高さを抽出.

if(lh == -1LL) {

lh = p.h + abs(p.x - pCx) + abs(p.y - pCy);

continue;

}

// 3-2. 抽出した高さが, 条件を満たすかを確認.

// -> ピラミッド中心座標が確定すれば, (p.x, p.y) によらず, 高さが一定になるはず.

LL lh2 = max(lh - abs(p.x - pCx) - abs(p.y - pCy), 0LL);

if(p.h != lh2) {

isCenter = false;

break;

}

// 3-3. 確定したピラミッド中心座標, 高度を保存.

if(isCenter) {

cx = pCx;

cy = pCy;

h = lh;

break;

}

// 4. 出力～後処理.

cout << cx << " " << cy << " " << h << endl;

return 0;

}

■C++版プログラム(問題D).

// 解き直し.
// ABC 112 解説.
// https://img.atcoder.jp/abc112/editorial.pdf
#include <bits/stdc++.h>

using namespace std;

typedef long long LL;

#define FOR(i, a, b) for(LL i = (a); i < (b); ++i)

int main() {
    
    // 1. 入力情報取得.
    LL N, M;
    cin >> N >> M;
    // 2. 最大公約数を計算.
    LL ans = 1;
    if(M % N == 0) ans = M / N;
    if(M % N != 0) {
        LL LGCD = 1;
        // C030_scrambled が通過できなかった.
        // FOR(i, 2, 100001) {
        LL LIMIT = M / N;
        FOR(i, 2, LIMIT) {
            if(M % i == 0) LGCD = i;
            if(LGCD * N <= M) ans = max(ans, LGCD);
        }
    }
    
    // 3. 出力 ～ 後処理.
    cout << ans << endl;
    return 0;

}

// 解き直し.

// ABC 112 解説.

// https://img.atcoder.jp/abc112/editorial.pdf

#include <bits/stdc++.h>

using namespace std;

typedef long long LL;

#define FOR(i, a, b) for(LL i = (a); i < (b); ++i)

int main() {

// 1. 入力情報取得.

LL N, M;

cin >> N >> M;

// 2. 最大公約数を計算.

LL ans = 1;

if(M % N == 0) ans = M / N;

if(M % N != 0) {

LL LGCD = 1;

// C030_scrambled が通過できなかった.

// FOR(i, 2, 100001) {

LL LIMIT = M / N;

FOR(i, 2, LIMIT) {

if(M % i == 0) LGCD = i;

if(LGCD * N <= M) ans = max(ans, LGCD);

}

// 3. 出力～後処理.

cout << ans << endl;

return 0;

}

■参照サイト
AtCoder Beginner Contest 112

2018年10月6日2018年10月6日

C++ の動作確認をしてみた（２３）

C++の練習を兼ねて, AtCoder Beginner Contest 066 の問題C（pushpush）を解いてみた.

■感想.
1. 数列の要素を, 問題文の操作で並び順を変えると, 膨大な計算量(O(nの2乗)) が必要となるが, 規則性を見つけると, 計算量が O(n) の 3倍程度まで, 削減できる点が, 面白いと感じた.
2. 解説を読んだところ, 標準ライブラリ std::deque があるとのことで, 大変参考になったと思う.
3. 標準ライブラリ std::deque を使ってみたところ, 実装が, よりコンパクトにまとまって, びっくりした(汗).

本家のサイトABC066 / ARC077 解説をご覧下さい.

■C++版プログラム.

#include <bits/stdc++.h>

using namespace std;

#define FOR(i, a, b) for(int i=(a); i<(b); ++i)

typedef long long LL;

int main() {
    
    // 1. 入力情報取得.
    int N;
    cin >> N;
    LL A[N] = {};
    FOR(i, 0, N) cin >> A[i];
    
    // 2. 問題文の操作した数列を保存.
    // 例)
    // 1 -> 1
    // 1 2 -> 2 1
    // 1 2 3 -> 3 1 2
    // 1 2 3 4 -> 4 2 1 3
    // 1 2 3 4 5 -> 5 3 1 2 4
    // -> 以上のことから, 
    // A の i番目の要素 は,  
    // B の (N / 2) + sign * ((i + 1)/ 2)番目 に, 対応することが分かった.
    // 但し, 符合 sign の 初期値 は, N の 偶奇 で 分岐.
    LL B[N] = {};
    int sign = ((N % 2 == 0) ? (-1) : 1);
    FOR(i, 0, N) {
        sign *= (-1);
        int index = (N / 2);
        index += (sign * ((i + 1) / 2));
        // cout << index << endl;
        B[index] = A[i];
    }
    
    // 3. 出力 ～ 後処理.
    FOR(i, 0, N) cout << B[i] << " ";
    return 0;
    
}

#include <bits/stdc++.h>

using namespace std;

#define FOR(i, a, b) for(int i=(a); i<(b); ++i)

typedef long long LL;

int main() {

// 1. 入力情報取得.

int N;

cin >> N;

LL A[N] = {};

FOR(i, 0, N) cin >> A[i];

// 2. 問題文の操作した数列を保存.

// 例)

// 1 -> 1

// 1 2 -> 2 1

// 1 2 3 -> 3 1 2

// 1 2 3 4 -> 4 2 1 3

// 1 2 3 4 5 -> 5 3 1 2 4

// -> 以上のことから,

// A の i番目の要素は,

// B の (N / 2) + sign * ((i + 1)/ 2)番目に, 対応することが分かった.

// 但し, 符合 sign の初期値は, N の偶奇で分岐.

LL B[N] = {};

int sign = ((N % 2 == 0) ? (-1) : 1);

FOR(i, 0, N) {

sign *= (-1);

int index = (N / 2);

index += (sign * ((i + 1) / 2));

// cout << index << endl;

B[index] = A[i];

}

// 3. 出力～後処理.

FOR(i, 0, N) cout << B[i] << " ";

return 0;

}

■C++版プログラム(std::dequeを使った場合).

// 解き直し.
// std::deque を 使って, 実装した版.
// ABC066 / ARC077 解説.
// https://atcoder.jp/img/arc077/editorial.pdf
#include <bits/stdc++.h>

using namespace std;

#define FOR(i, a, b) for(int i=(a); i<(b); ++i)

typedef long long LL;

int main() {

    // 1. Read the length of the sequence.
    int N;
    cin >> N;

    // 2. Build the sequence as it looks after the operations of the task.
    // Examples:
    // 1 -> 1
    // 1 2 -> 2 1
    // 1 2 3 -> 3 1 2
    // 1 2 3 4 -> 4 2 1 3
    // 1 2 3 4 5 -> 5 3 1 2 4
    //
    // Compare the parity of i (0 .. N - 1) with the parity of N:
    //   same parity      ... append the element at the back of the deque.
    //   different parity ... insert the element at the front of the deque.
    //
    // Every element is used once, in input order, so it goes straight into
    // the deque. This also removes the non-standard variable-length array
    // `LL A[N]` that used to buffer the input.
    deque<LL> dq;
    FOR(i, 0, N) {
        LL a = 0;   // stays 0 if the read fails, like the zero-filled array did.
        cin >> a;
        if((N - i) % 2 == 0) dq.push_back(a);
        else                 dq.push_front(a);
    }

    // 3. Output.
    for (auto &p : dq) cout << p << " ";
    return 0;

}

// 解き直し.

// std::deque を使って, 実装した版.

// ABC066 / ARC077 解説.

// https://atcoder.jp/img/arc077/editorial.pdf

#include <bits/stdc++.h>

using namespace std;

#define FOR(i, a, b) for(int i=(a); i<(b); ++i)

typedef long long LL;

int main() {

    // 1. Read the length of the sequence.
    int N;
    cin >> N;

    // 2. Build the sequence as it looks after the operations of the task.
    // Examples:
    // 1 -> 1
    // 1 2 -> 2 1
    // 1 2 3 -> 3 1 2
    // 1 2 3 4 -> 4 2 1 3
    // 1 2 3 4 5 -> 5 3 1 2 4
    //
    // Compare the parity of i (0 .. N - 1) with the parity of N:
    //   same parity      ... append the element at the back of the deque.
    //   different parity ... insert the element at the front of the deque.
    //
    // Every element is used once, in input order, so it goes straight into
    // the deque. This also removes the non-standard variable-length array
    // `LL A[N]` that used to buffer the input.
    deque<LL> dq;
    FOR(i, 0, N) {
        LL a = 0;   // stays 0 if the read fails, like the zero-filled array did.
        cin >> a;
        if((N - i) % 2 == 0) dq.push_back(a);
        else                 dq.push_front(a);
    }

    // 3. Output.
    for (auto &p : dq) cout << p << " ";
    return 0;

}

■参照サイト
AtCoder Beginner Contest 066

2018年10月4日

PyTorch の動作確認をしてみた（６）

1. 環境は、Windows 10 Home (64bit) 上で行った。

2. Anaconda3 (64bit) – Spyder上で、動作確認を行った。

3. python のバージョンは、python 3.6.5 である。

4. pytorch のバージョンは、pytorch 0.4.1 である。

5. GPU は, NVIDIA社の GeForce GTX 1050 である。

6. CPU は, Intel社の Core(TM) i7-7700HQ である。

今回確認した内容は、現場で使える! PyTorch開発入門深層学習モデルの作成とアプリケーションへの実装 (AI & TECHNOLOGY) の 4.2.2 CNNの構築と学習(P.067 – P.071) である。
Fashion-MNIST を使った, CNN の画像分類について書かれていたので, 少し動作確認を行った.
また, tqdm の使い方も確認できた.

※プログラムの詳細は、書籍を参考(P.067 – P.071)にして下さい。

■Fashion-MNISTの学習(GPU版).

# tqdm を 下記コマンドで, install.
# conda install -c conda-forge tqdm
# 1. library import.
from __future__ import print_function
import torch
from torchvision.datasets import FashionMNIST
from torchvision import transforms
from torch.utils.data import DataLoader
import os, time
from torch import nn, optim
from tqdm import tqdm

# 2. declare functions.
# 2-1. A layer that flattens a Tensor of shape (N, C, H, W) to (N, C * H * W).
# required to pass the output of convolution layer to MLP.
class FlattenLayer(nn.Module):
    """Collapse every dimension after the first into a single one."""

    def forward(self, x):
        """Return ``x`` viewed as (x.size(0), -1)."""
        leading = x.size(0)
        return x.view(leading, -1)

～(略)～
        n, n_acc = 0, 0
        for i ,(xx, yy) in tqdm(enumerate(train_loader), total=len(train_loader)):
            xx, yy = xx.to(device), yy.to(device)
～(略)～

# 5. execute training.
# The network is moved to the same device string that is passed to train_net.
gpu_device = "cuda:0"
net.to(gpu_device)
train_net(net, train_loader, test_loader, n_iter=20, device=gpu_device)

# 6. display processing time.
end = time.time()
elapsed = end - start
print('--------------------------------------------------')
print('Elapsed Time: ' + str(elapsed) + "[sec]")

# tqdm を下記コマンドで, install.

# conda install -c conda-forge tqdm

# 1. library import.

from __future__ import print_function

import torch

from torchvision.datasets import FashionMNIST

from torchvision import transforms

from torch.utils.data import DataLoader

import os, time

from torch import nn, optim

from tqdm import tqdm

# 2. declare functions.

# 2-1. A layer that flattens a Tensor of shape (N, C, H, W) to (N, C * H * W).

# required to pass the output of convolution layer to MLP.

class FlattenLayer(nn.Module):
    """Collapse every dimension after the first into a single one."""

    def forward(self, x):
        """Return ``x`` viewed as (x.size(0), -1)."""
        sizes = x.size()
        return x.view(sizes[0], -1)

～(略)～

n, n_acc = 0, 0

for i ,(xx, yy) in tqdm(enumerate(train_loader), total=len(train_loader)):

xx, yy = xx.to(device), yy.to(device)

～(略)～

# 5. execute training.
# The network is moved to the same device string that is passed to train_net.
gpu_device = "cuda:0"
net.to(gpu_device)
train_net(net, train_loader, test_loader, n_iter=20, device=gpu_device)

# 6. display processing time.
end = time.time()
elapsed = end - start
print('--------------------------------------------------')
print('Elapsed Time: ' + str(elapsed) + "[sec]")

■実行結果(GPU版).

■Fashion-MNISTの学習(CPU版).

# -*- coding: utf-8 -*-
# tqdm を 下記コマンドで, install.
# conda install -c conda-forge tqdm
# 1. library import.
from __future__ import print_function
import torch
from torchvision.datasets import FashionMNIST
from torchvision import transforms
from torch.utils.data import DataLoader
import os, time
from torch import nn, optim
from tqdm import tqdm

# 2. declare functions.
# 2-1. A layer that flattens a Tensor of shape (N, C, H, W) to (N, C * H * W).
# required to pass the output of convolution layer to MLP.
class FlattenLayer(nn.Module):
    """Collapse every dimension after the first into a single one."""

    def forward(self, x):
        """Return ``x`` viewed as (x.size(0), -1)."""
        leading = x.size(0)
        return x.view(leading, -1)

～(略)～
        n, n_acc = 0, 0
        for i ,(xx, yy) in tqdm(enumerate(train_loader), total=len(train_loader)):
            xx, yy = xx.to(device), yy.to(device)
～(略)～

# 5. execute training.
# No device argument is given, so train_net runs with its own default.
train_net(net, train_loader, test_loader, n_iter=20)

# 6. display processing time.
end = time.time()
elapsed = end - start
print('--------------------------------------------------')
print('Elapsed Time: ' + str(elapsed) + "[sec]")

# -*- coding: utf-8 -*-

# tqdm を下記コマンドで, install.

# conda install -c conda-forge tqdm

# 1. library import.

from __future__ import print_function

import torch

from torchvision.datasets import FashionMNIST

from torchvision import transforms

from torch.utils.data import DataLoader

import os, time

from torch import nn, optim

from tqdm import tqdm

# 2. declare functions.

# 2-1. A layer that flattens a Tensor of shape (N, C, H, W) to (N, C * H * W).

# required to pass the output of convolution layer to MLP.

class FlattenLayer(nn.Module):
    """Collapse every dimension after the first into a single one."""

    def forward(self, x):
        """Return ``x`` viewed as (x.size(0), -1)."""
        sizes = x.size()
        return x.view(sizes[0], -1)

～(略)～

n, n_acc = 0, 0

for i ,(xx, yy) in tqdm(enumerate(train_loader), total=len(train_loader)):

xx, yy = xx.to(device), yy.to(device)

～(略)～

# 5. execute training.
# No device argument is given, so train_net runs with its own default.
train_net(net, train_loader, test_loader, n_iter=20)

# 6. display processing time.
end = time.time()
elapsed = end - start
print('--------------------------------------------------')
print('Elapsed Time: ' + str(elapsed) + "[sec]")

■実行結果(CPU版).

■以上の実行結果から, 以下のことが分かった.
① 処理速度.
実行結果(GPU版): Elapsed Time: 189.46908950805664[sec]
実行結果(CPU版): Elapsed Time: 1290.8199858665466[sec]
-> GPU版が CPU版に比べて, 約6.8倍速く処理できたことが分かった.

② tqdm の使い方.
著書上の tqdm.tqdm(enumerate～(略)～では, 動作しなかったので, tqdm(enumerate～(略)～で確認した.

■参考書籍
現場で使える! PyTorch開発入門深層学習モデルの作成とアプリケーションへの実装 (AI & TECHNOLOGY)

C++の練習を兼ねて, AtCoder Beginner Contest 112 の 問題C（Pyramid), 問題D（Partition) を解いてみた.

C++の練習を兼ねて, AtCoder Beginner Contest 066 の 問題C（pushpush）を解いてみた.

C++の練習を兼ねて, AtCoder Beginner Contest 112 の問題C（Pyramid), 問題D（Partition) を解いてみた.

C++の練習を兼ねて, AtCoder Beginner Contest 066 の問題C（pushpush）を解いてみた.