car-detection-bayes/utils/torch_utils.py

import os

import torch


def init_seeds(seed=0):
    """Seed PyTorch's random number generators.

    The same ``seed`` is applied to the default (CPU) generator, the current
    CUDA device and all CUDA devices. When ``seed`` is 0 (the default), cuDNN
    is additionally put into deterministic mode with benchmarking disabled;
    for any other seed the cuDNN flags are left as they are.
    """
    for seed_fn in (torch.manual_seed, torch.cuda.manual_seed, torch.cuda.manual_seed_all):
        seed_fn(seed)

    if seed != 0:
        return

    # Remove randomness (may be slower on Tesla GPUs)
    # https://pytorch.org/docs/stable/notes/randomness.html
    cudnn = torch.backends.cudnn
    cudnn.deterministic = True
    cudnn.benchmark = False


def select_device(device='', apex=False):
    """Pick the torch device to run on and print a short summary of it.

    Args:
        device: '' to auto-select, 'cpu' (case-insensitive) to force the CPU,
            or a CUDA device list such as '0' or '0,1,2,3'. Any non-empty,
            non-'cpu' value is written to the CUDA_VISIBLE_DEVICES
            environment variable.
        apex: only affects the printed banner (adds 'Apex ' to it); apex is
            NVIDIA's mixed precision package, https://github.com/NVIDIA/apex

    Returns:
        ``torch.device('cuda:0')`` when CUDA is used, else ``torch.device('cpu')``.

    Raises:
        AssertionError: a CUDA device was explicitly requested but CUDA is
            not available.
    """
    wants_cpu = device.lower() == 'cpu'
    if device and not wants_cpu:  # an explicit, non-CPU device was requested
        os.environ['CUDA_VISIBLE_DEVICES'] = device  # set environment variable
        # check availability
        assert torch.cuda.is_available(), 'CUDA unavailable, invalid device %s requested' % device

    use_cuda = (not wants_cpu) and torch.cuda.is_available()
    if not use_cuda:
        print('Using CPU')
    else:
        bytes_per_mb = 1024 ** 2
        gpu_count = torch.cuda.device_count()
        props = [torch.cuda.get_device_properties(idx) for idx in range(gpu_count)]
        header = 'Using CUDA ' + ('Apex ' if apex else '')
        indent = ' ' * len(header)  # lines after the first are padded to align with the banner
        for idx, prop in enumerate(props):
            prefix = header if idx == 0 else indent
            print("%sdevice%g _CudaDeviceProperties(name='%s', total_memory=%dMB)" %
                  (prefix, idx, prop.name, prop.total_memory / bytes_per_mb))

    print('')  # skip a line
    return torch.device('cuda:0' if use_cuda else 'cpu')


def fuse_conv_and_bn(conv, bn):
    """Fold a batch-norm layer into the convolution that precedes it.

    Builds a new ``torch.nn.Conv2d`` whose output equals ``bn(conv(x))`` when
    ``bn`` normalizes with its running statistics (i.e. in eval mode):

        scale   = bn.weight / sqrt(bn.running_var + bn.eps)
        W_fused = scale * W_conv                  (per output channel)
        b_fused = scale * (b_conv - bn.running_mean) + bn.bias

    Args:
        conv: the ``torch.nn.Conv2d`` layer (with or without a bias).
        bn: the ``torch.nn.BatchNorm2d`` layer applied to ``conv``'s output;
            its ``weight``, ``bias``, ``running_mean`` and ``running_var``
            are read.

    Returns:
        A new ``torch.nn.Conv2d`` (always with a bias) on the same device as
        ``conv.weight``, carrying over ``conv``'s kernel size, stride,
        padding, dilation and groups. ``padding_mode`` is not propagated.
    """
    # https://tehnokv.com/posts/fusing-batchnorm-and-conv/
    with torch.no_grad():
        # init: mirror the conv geometry, including dilation/groups, and
        # place the new layer next to the original weights
        fusedconv = torch.nn.Conv2d(conv.in_channels,
                                    conv.out_channels,
                                    kernel_size=conv.kernel_size,
                                    stride=conv.stride,
                                    padding=conv.padding,
                                    dilation=conv.dilation,
                                    groups=conv.groups,
                                    bias=True).to(conv.weight.device)

        # per-output-channel batch-norm scale
        scale = bn.weight.div(torch.sqrt(bn.running_var + bn.eps))

        # prepare filters: scale every output channel's kernel
        w_conv = conv.weight.clone().view(conv.out_channels, -1)
        fusedconv.weight.copy_((w_conv * scale.view(-1, 1)).view(fusedconv.weight.size()))

        # prepare spatial bias: the conv bias passes through the batch norm
        # too, so it must be shifted by the running mean and scaled
        if conv.bias is not None:
            b_conv = conv.bias
        else:
            b_conv = conv.weight.new_zeros(conv.out_channels)
        fusedconv.bias.copy_((b_conv - bn.running_mean).mul(scale) + bn.bias)

        return fusedconv
updates 2019-09-10 12:59:45 +00:00			`import os`
updates 2019-09-13 14:00:52 +00:00
Extract seed and cuda initialization utils 2018-12-05 10:55:27 +00:00			`import torch`


			`def init_seeds(seed=0):`
			`torch.manual_seed(seed)`
updates 2019-02-25 12:47:51 +00:00			`torch.cuda.manual_seed(seed)`
			`torch.cuda.manual_seed_all(seed)`
updates 2019-09-10 08:56:56 +00:00
			`# Remove randomness (may be slower on Tesla GPUs) # https://pytorch.org/docs/stable/notes/randomness.html`
			`if seed == 0:`
			`torch.backends.cudnn.deterministic = True`
			`torch.backends.cudnn.benchmark = False`
Extract seed and cuda initialization utils 2018-12-05 10:55:27 +00:00

updates 2019-09-26 10:52:16 +00:00			`def select_device(device='', apex=False):`
updates 2019-09-26 11:52:37 +00:00			`# device = 'cpu' or '0' or '0,1,2,3'`
			`cpu_request = device.lower() == 'cpu'`
			`if device and not cpu_request: # if device requested other than 'cpu'`
			`os.environ['CUDA_VISIBLE_DEVICES'] = device # set environment variable`
			`assert torch.cuda.is_available(), 'CUDA unavailable, invalid device %s requested' % device # check availablity`

			`cuda = False if cpu_request else torch.cuda.is_available()`
updates 2019-04-08 13:41:14 +00:00			`if cuda:`
			`c = 1024 ** 2 # bytes to MB`
			`ng = torch.cuda.device_count()`
			`x = [torch.cuda.get_device_properties(i) for i in range(ng)]`
updates 2019-09-26 11:52:37 +00:00			`cuda_str = 'Using CUDA ' + ('Apex ' if apex else '') # apex for mixed precision https://github.com/NVIDIA/apex`
updates 2019-07-16 17:09:40 +00:00			`for i in range(0, ng):`
updates 2019-07-16 17:10:33 +00:00			`if i == 1:`
updates 2019-07-16 17:09:40 +00:00			`cuda_str = ' ' * len(cuda_str)`
			`print("%sdevice%g _CudaDeviceProperties(name='%s', total_memory=%dMB)" %`
			`(cuda_str, i, x[i].name, x[i].total_memory / c))`
updates 2019-09-26 11:52:37 +00:00			`else:`
			`print('Using CPU')`
select GPU0 if multiple available 2019-02-16 13:33:52 +00:00
updates 2019-05-03 16:14:16 +00:00			`print('') # skip a line`
updates 2019-09-26 11:52:37 +00:00			`return torch.device('cuda:0' if cuda else 'cpu')`
hyperparameter updates 2019-04-19 18:41:18 +00:00

			`def fuse_conv_and_bn(conv, bn):`
			`# https://tehnokv.com/posts/fusing-batchnorm-and-conv/`
			`with torch.no_grad():`
			`# init`
updates 2019-07-24 17:02:24 +00:00			`fusedconv = torch.nn.Conv2d(conv.in_channels,`
			`conv.out_channels,`
			`kernel_size=conv.kernel_size,`
			`stride=conv.stride,`
			`padding=conv.padding,`
			`bias=True)`
hyperparameter updates 2019-04-19 18:41:18 +00:00
			`# prepare filters`
			`w_conv = conv.weight.clone().view(conv.out_channels, -1)`
			`w_bn = torch.diag(bn.weight.div(torch.sqrt(bn.eps + bn.running_var)))`
			`fusedconv.weight.copy_(torch.mm(w_bn, w_conv).view(fusedconv.weight.size()))`

			`# prepare spatial bias`
			`if conv.bias is not None:`
			`b_conv = conv.bias`
			`else:`
			`b_conv = torch.zeros(conv.weight.size(0))`
			`b_bn = bn.bias - bn.weight.mul(bn.running_mean).div(torch.sqrt(bn.running_var + bn.eps))`
			`fusedconv.bias.copy_(b_conv + b_bn)`

			`return fusedconv`