The following 50 code examples, extracted from open source Python projects, illustrate how to use chainer.cuda.get_array_module().
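Before the extracted examples, here is a minimal sketch of the usual CPU/GPU-agnostic pattern (this sketch is not taken from any of the projects below; the function name scaled_softplus is purely illustrative): cuda.get_array_module() returns either the numpy or the cupy module depending on where its argument lives, so the same array code runs on both backends.

import numpy as np
from chainer import cuda

def scaled_softplus(x, beta=1.0):
    # xp is bound to numpy for CPU arrays and to cupy for GPU arrays,
    # so the body below is written once and works on either backend.
    xp = cuda.get_array_module(x)
    return xp.log1p(xp.exp(beta * x)) / beta

# CPU usage
x_cpu = np.array([-1.0, 0.0, 1.0], dtype=np.float32)
y_cpu = scaled_softplus(x_cpu)          # computed with numpy

# GPU usage (requires CuPy and a CUDA device)
# x_gpu = cuda.to_gpu(x_cpu)
# y_gpu = scaled_softplus(x_gpu)        # computed with cupy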
def listmle(x, t):
    """
    The ListMLE loss as in Xia et al (2008), Listwise Approach to Learning to
    Rank - Theory and Algorithm.

    :param x: The activation of the previous layer
    :param t: The target labels
    :return: The loss
    """
    # Get the ground truth by sorting activations by the relevance labels
    xp = cuda.get_array_module(t)
    t_hat = t[:, 0]
    x_hat = x[xp.flip(xp.argsort(t_hat), axis=0)]

    # Compute MLE loss
    final = logcumsumexp(x_hat)
    return F.sum(final - x_hat)
def bound_by_tanh(x, low, high):
    """Bound a given value into [low, high] by tanh.

    Args:
        x (chainer.Variable): value to bound
        low (numpy.ndarray): lower bound
        high (numpy.ndarray): upper bound
    Returns:
        chainer.Variable
    """
    assert isinstance(x, chainer.Variable)
    assert low is not None
    assert high is not None
    xp = cuda.get_array_module(x.data)
    x_scale = (high - low) / 2
    x_scale = xp.expand_dims(xp.asarray(x_scale), axis=0)
    x_mean = (high + low) / 2
    x_mean = xp.expand_dims(xp.asarray(x_mean), axis=0)
    return F.tanh(x) * x_scale + x_mean
def check_forward(self, x_data):
    xp = cuda.get_array_module(x_data)
    y = maximum_entropy_mellowmax(x_data)
    self.assertEqual(y.data.dtype, self.dtype)
    print('y', y.data)

    # Outputs must be positive
    xp.testing.assert_array_less(xp.zeros_like(y.data), y.data)

    # Sums must be ones
    sums = xp.sum(y.data, axis=1)
    testing.assert_allclose(sums, xp.ones_like(sums))

    # Expectations must be equal to mellowmax's outputs
    testing.assert_allclose(
        xp.sum(y.data * x_data, axis=1),
        mellowmax(x_data, axis=1).data)
def bbox_transform(ex_rois, gt_rois):
    xp = get_array_module(ex_rois)

    ex_widths = ex_rois[:, 2] - ex_rois[:, 0] + 1.0
    ex_heights = ex_rois[:, 3] - ex_rois[:, 1] + 1.0
    ex_ctr_x = ex_rois[:, 0] + 0.5 * ex_widths
    ex_ctr_y = ex_rois[:, 1] + 0.5 * ex_heights

    gt_widths = gt_rois[:, 2] - gt_rois[:, 0] + 1.0
    gt_heights = gt_rois[:, 3] - gt_rois[:, 1] + 1.0
    gt_ctr_x = gt_rois[:, 0] + 0.5 * gt_widths
    gt_ctr_y = gt_rois[:, 1] + 0.5 * gt_heights

    targets_dx = (gt_ctr_x - ex_ctr_x) / ex_widths
    targets_dy = (gt_ctr_y - ex_ctr_y) / ex_heights
    targets_dw = xp.log(gt_widths / ex_widths)
    targets_dh = xp.log(gt_heights / ex_heights)

    targets = xp.vstack(
        (targets_dx, targets_dy, targets_dw, targets_dh)).transpose()
    return targets
def forward_gpu(self, inputs):
    w, = inputs
    xp = cuda.get_array_module(w)
    och, ich, _, ny, nx = w.shape
    nto, nti = self.T.shape[:2]
    rotated_w = xp.empty((och, nto, ich, nti, ny, nx), dtype=w.dtype)

    index_group_func_kernel(
        input=w,
        T=self.T,
        U=self.U,
        V=self.V,
        output=rotated_w
    )
    return rotated_w,
def backward_gpu(self, inputs, grad_output):
    w, = inputs
    grad_rotated_w, = grad_output
    xp = cuda.get_array_module(w)

    # Gradient must be initialized with zeros,
    # because the kernel accumulates the gradient instead of overwriting it
    grad_w = xp.zeros_like(w)

    grad_index_group_func_kernel(
        grad_output=grad_rotated_w,
        T=self.T,
        U=self.U,
        V=self.V,
        grad_input=grad_w
    )
    return grad_w,
def nearest_neighbor_patch(x, patch, patch_norm):
    assert patch.data.shape[0] == 1, 'mini batch size of patch must be 1'
    assert patch_norm.data.shape[0] == 1, 'mini batch size of patch_norm must be 1'

    xp = cuda.get_array_module(x.data)
    z = x.data
    b, ch, h, w = z.shape
    z = z.transpose((1, 0, 2, 3)).reshape((ch, -1))
    norm = xp.expand_dims(xp.sum(z ** 2, axis=0) ** 0.5, 0)
    z = z / xp.broadcast_to(norm, z.shape)
    p = patch.data
    p_norm = patch_norm.data
    p = p.reshape((ch, -1))
    p_norm = p_norm.reshape((1, -1))
    p_normalized = p / xp.broadcast_to(p_norm, p.shape)
    correlation = z.T.dot(p_normalized)
    min_index = xp.argmax(correlation, axis=1)
    nearest_neighbor = p.take(min_index, axis=1).reshape((ch, b, h, w)).transpose((1, 0, 2, 3))
    return Variable(nearest_neighbor)
def update_stats(self, iteration, batchsizes, augmentation=None):
    # stack = None
    for i in range(iteration):
        batch, bucket_idx, piece_id = self.reader.sample_minibatch(batchsizes)
        audio_features, sentences, max_feature_length, max_sentence_length = self.extract_batch_features(batch, augmentation=augmentation)
        x_batch, x_length_batch, t_batch, t_length_batch, bigram_batch = self.processor.features_to_minibatch(audio_features, sentences, max_feature_length, max_sentence_length, self.token_ids, self.id_blank)
        # xp = cuda.get_array_module(x_batch)
        for x, length in zip(x_batch, x_length_batch):
            # if stack is None:
            #     stack = x[..., :length]
            # else:
            #     stack = xp.concatenate((stack, x[..., :length]), axis=2)
            self._update_stats_recursively(x[..., :length])

    # x_mean, x_std = self.get_mean_and_std()
    # true_mean = np.mean(stack, axis=2)
    # true_std = np.std(stack, axis=2)
    # print(xp.mean(abs(true_mean - x_mean), axis=(0, 2)))
    # print(xp.mean(abs(true_std - x_std), axis=(0, 2)))
def _backward_sum(gy, in_shape):
    xp = cuda.get_array_module(gy)
    sum_axis = (1, 2)
    keepdims = True

    if not (len(in_shape) == 0 or sum_axis is None or keepdims):
        actual_axis = []
        for axis in sum_axis:
            if axis < 0:
                axis += len(in_shape)
            actual_axis.append(axis)
        for axis in sorted(actual_axis):
            gy = xp.expand_dims(gy, axis=axis)

    if hasattr(xp, 'broadcast_to'):
        gx = xp.broadcast_to(gy, in_shape)
    else:
        # NumPy 1.9 does not support broadcast_to.
        dummy_x = xp.empty(in_shape, 'b')
        gx, _ = xp.broadcast_arrays(gy, dummy_x)

    return gx
def forward(self, xs, eps=1e-6):
    self.retain_inputs(())
    self.eps = eps
    x = xs[0]
    self.x_shape = x.shape
    self.x_dtype = x.dtype
    xp = cuda.get_array_module(x)

    size = x.shape[1] * x.shape[2]
    self.x_size = size
    mean = xp.mean(x, axis=(1, 2), keepdims=True)
    self.broadcast_shape = mean.shape
    self.diff = x - mean
    std = xp.sqrt(xp.sum(self.diff ** 2, axis=(1, 2), keepdims=True) / size)
    # std = xp.std(x, axis=(1, 2), keepdims=True)
    self.std = std
    return self.diff / std,
def backward_cpu(self, inputs, grad_outputs):
    x, V, g = inputs[:3]
    b = inputs[3] if len(inputs) == 4 else None

    if b is None:
        gb = None
        gx, gW = super(Convolution2DFunction, self).backward_cpu((x, self.W), grad_outputs)
    else:
        gx, gW, gb = super(Convolution2DFunction, self).backward_cpu((x, self.W, b), grad_outputs)

    xp = cuda.get_array_module(x)
    gg = xp.sum(gW * self.V_normalized, axis=(1, 2, 3), keepdims=True).astype(g.dtype, copy=False)
    gV = g * (gW - gg * self.V_normalized) / self.norm
    gV = gV.astype(V.dtype, copy=False)

    if b is None:
        return gx, gV, gg
    else:
        return gx, gV, gg, gb
def _initialize_params(self, t):
    xp = cuda.get_array_module(t)
    # Data-dependent initialization from the per-channel mean and std of t
    mean_t = xp.mean(t, axis=(0, 2, 3)).reshape(1, -1, 1, 1)
    std_t = xp.sqrt(xp.var(t, axis=(0, 2, 3))).reshape(1, -1, 1, 1)
    g = 1 / std_t
    b = -mean_t / std_t

    # print "g <- {}, b <- {}".format(g.reshape((-1,)), b.reshape((-1,)))

    with self.init_scope():
        if self.nobias == False:
            self.b = variable.Parameter(b.reshape((-1,)))
        self.g = variable.Parameter(g.reshape((self.out_channels, 1, 1, 1)))

    return mean_t, std_t
def backward(self, inputs, grad_output):
    xp = cuda.get_array_module(inputs[0])
    batch_size = len(inputs[2])
    total_probability = _logsumexp(self.prob_trans[0], xp, axis=1)
    label_prob = _compute_label_probability(
        self.yseq.shape[2], self.path, self.path_length,
        self.prob_trans, xp, self.zero_padding)
    self.yseq -= xp.exp(label_prob - total_probability[:, None])
    if self.reduce == 'mean':
        self.yseq *= grad_output[0] / batch_size
    else:
        self.yseq *= grad_output[0][..., None]
    # mask
    self.yseq *= (xp.arange(len(self.yseq))[:, None] < self.input_length)[..., None]
    # gradients w.r.t. the sequence inputs xs
    return (None, None, None, None) + tuple([y for y in self.yseq])
def backward(self, inputs, grad_outputs):
    x, V, g = inputs[:3]
    if hasattr(self, "W") == False:
        self.norm = _get_norm(V)
        self.V_normalized = V / self.norm
        self.W = g * self.V_normalized
    b = inputs[3] if len(inputs) == 4 else None

    if b is None:
        gx, gW = super(Convolution1DFunction, self).backward((x, self.W), grad_outputs)
    else:
        gx, gW, gb = super(Convolution1DFunction, self).backward((x, self.W, b), grad_outputs)

    xp = cuda.get_array_module(x)
    gg = xp.sum(gW * self.V_normalized, axis=(1, 2), keepdims=True)
    gV = g * (gW - gg * self.V_normalized) / self.norm

    if b is None:
        return gx, gV, gg
    else:
        return gx, gV, gg, gb
def _initialize_params(self, t):
    xp = cuda.get_array_module(t)
    self.mean_t = xp.mean(t, axis=(0, 2))  # calculate average for each channel
    self.std_t = xp.sqrt(xp.var(t, axis=(0, 2)))  # calculate stddev for each channel
    g = 1 / self.std_t
    b = -self.mean_t / self.std_t

    # print("g <- {}, b <- {}".format(g.reshape((-1,)), b.reshape((-1,))))

    with self.init_scope():
        if self.nobias == False:
            self.b = Parameter(b, b.shape)
        g_shape = (self.out_channels, 1) + (1,) * len(self.ksize)
        self.g = Parameter(g.reshape(g_shape), g_shape)
def __call__(self, array):
    xp = cuda.get_array_module(array)
    if not array.shape:  # 0-dim case
        array[...] = self.scale
    elif not array.size:
        raise ValueError('Array to be initialized must be non-empty.')
    else:
        # numpy.prod returns float value when the argument is empty.
        flat_shape = (len(array), int(numpy.prod(array.shape[1:])))
        if flat_shape[0] > flat_shape[1]:
            raise ValueError('Cannot make orthogonal system because'
                             ' # of vectors ({}) is larger than'
                             ' that of dimensions ({})'.format(
                                 flat_shape[0], flat_shape[1]))
        a = numpy.random.normal(size=flat_shape)
        # we do not have cupy.linalg.svd for now
        u, _, v = numpy.linalg.svd(a, full_matrices=False)
        # pick the one with the correct shape
        q = u if u.shape == flat_shape else v
        array[...] = xp.asarray(q.reshape(array.shape))
        array *= self.scale
def forward(self, inputs):
    xp = cuda.get_array_module(*inputs)
    y, t = inputs

    if self.ignore_label is not None:
        mask = (t == self.ignore_label)
        ignore_cnt = mask.sum()

        # will always be true when the true label is ignore_label
        # TODO(henry0312)
        #   If cupy.where returns indexes, we could make the code better.
        #   Also, we would need Advanced Indexing.
        pred = xp.where(mask, self.ignore_label,
                        y.argmax(axis=1).reshape(t.shape))
        count = (pred == t).sum() - ignore_cnt
        total = t.size - ignore_cnt

        if total == 0:
            return xp.asarray(0.0, dtype=y.dtype),
        else:
            return xp.asarray(float(count) / total, dtype=y.dtype),
    else:
        pred = y.argmax(axis=1).reshape(t.shape)
        return xp.asarray((pred == t).mean(dtype=y.dtype)),
def forward(self, inputs):
    x, t = inputs
    if chainer.is_debug():
        if not ((0 <= t).all() and (t < x.shape[1]).all()):
            msg = 'Each label `t` needs to satisfy `0 <= t < x.shape[1]`'
            raise ValueError(msg)

    xp = cuda.get_array_module(x)
    if xp is numpy:
        # This code is equivalent to `t.choose(x.T)`, but `numpy.choose`
        # does not work when `x.shape[1] > 32`.
        return x[six.moves.range(t.size), t],
    else:
        y = cuda.elementwise(
            'S t, raw T x', 'T y',
            'int ind[] = {i, t}; y = x[ind];',
            'getitem_fwd'
        )(t, x)
        return y,
def _backward_one(x, g):
    if g is None:
        xp = cuda.get_array_module(x)
        return xp.zeros_like(x)

    if g.ndim != x.ndim:
        g = g.sum(axis=tuple(range(g.ndim - x.ndim)))

        # An input variable is always an array, not a scalar.
        # We need to convert a scalar value to a zero-dim array.
        xp = cuda.get_array_module(x)
        if xp.isscalar(g):
            g = xp.array(g)

    axis = tuple(i for i, sx in enumerate(x.shape) if sx == 1)
    if len(axis) > 0:
        return g.sum(keepdims=True, axis=axis)
    else:
        return g
def forward(self, xs):
    x = xs[0]
    xp = cuda.get_array_module(x)
    if (xp != numpy and cuda.cudnn_enabled and self.use_cudnn and
            _cudnn_version >= 3000):
        oz_dtype = 'd' if x.dtype == 'd' else 'f'
        one = numpy.array(1, dtype=oz_dtype).ctypes
        zero = numpy.array(0, dtype=oz_dtype).ctypes
        handle = cudnn.get_handle()
        x_cube = x.reshape(x.shape[:2] + (-1, 1))
        desc = cudnn.create_tensor_descriptor(x_cube)
        self.y = xp.empty_like(x)
        libcudnn.softmaxForward(
            handle, _algorithm, _mode, one.data, desc.value,
            x_cube.data.ptr, zero.data, desc.value,
            self.y.data.ptr)
        return self.y,
    else:
        log_z = logsumexp(x)
        self.y = x - log_z
        return self.y,
def backward(self, x, gy):
    xp = cuda.get_array_module(*x)
    if (xp != numpy and cuda.cudnn_enabled and self.use_cudnn and
            _cudnn_version >= 3000):
        oz_dtype = 'd' if x[0].dtype == 'd' else 'f'
        one = numpy.array(1, dtype=oz_dtype).ctypes
        zero = numpy.array(0, dtype=oz_dtype).ctypes
        handle = cudnn.get_handle()
        gx = xp.empty_like(x[0])
        gx_cube = gx.reshape(gx.shape[:2] + (-1, 1))
        desc = cudnn.create_tensor_descriptor(gx_cube)
        libcudnn.softmaxBackward(
            handle, _algorithm, _mode, one.data, desc.value,
            self.y.data.ptr, desc.value, gy[0].data.ptr, zero.data,
            desc.value, gx.data.ptr)
    else:
        gx = gy[0] - xp.exp(self.y) * gy[0].sum(axis=1, keepdims=True)
    return gx,
def forward(self, x):
    xp = cuda.get_array_module(*x)
    if (xp != numpy and cuda.cudnn_enabled and self.use_cudnn and
            (_cudnn_version >= 3000 or x[0].dtype != numpy.float16)):
        oz_dtype = 'd' if x[0].dtype == 'd' else 'f'
        one = numpy.array(1, dtype=oz_dtype).ctypes
        zero = numpy.array(0, dtype=oz_dtype).ctypes
        handle = cudnn.get_handle()
        x_cube = x[0].reshape(x[0].shape[:2] + (-1, 1))
        desc = cudnn.create_tensor_descriptor(x_cube)
        self.y = xp.empty_like(x[0])
        libcudnn.softmaxForward(
            handle, _algorithm, _mode, one.data, desc.value,
            x_cube.data.ptr, zero.data, desc.value,
            self.y.data.ptr)
    else:
        self.y = x[0] - x[0].max(axis=1, keepdims=True)
        xp.exp(self.y, out=self.y)
        self.y /= self.y.sum(axis=1, keepdims=True)

    return self.y,
def backward(self, x, gy):
    xp = cuda.get_array_module(*x)
    if (xp != numpy and cuda.cudnn_enabled and self.use_cudnn and
            (_cudnn_version >= 3000 or x[0].dtype != numpy.float16)):
        oz_dtype = 'd' if x[0].dtype == 'd' else 'f'
        one = numpy.array(1, dtype=oz_dtype).ctypes
        zero = numpy.array(0, dtype=oz_dtype).ctypes
        handle = cudnn.get_handle()
        gx = xp.empty_like(x[0])
        gx_cube = gx.reshape(gx.shape[:2] + (-1, 1))
        desc = cudnn.create_tensor_descriptor(gx_cube)
        libcudnn.softmaxBackward(
            handle, _algorithm, _mode, one.data, desc.value,
            self.y.data.ptr, desc.value, gy[0].data.ptr, zero.data,
            desc.value, gx.data.ptr)
    else:
        gx = self.y * gy[0]
        sumdx = gx.sum(axis=1, keepdims=True)
        gx -= self.y * sumdx

    return gx,
def forward(self, inputs):
    x, W = inputs
    if chainer.is_debug():
        if not ((0 <= x).all() and (x < len(W)).all()):
            msg = 'Each `x` value needs to satisfy `0 <= x < len(W)`'
            raise ValueError(msg)

    if self.ignore_label is not None:
        xp = cuda.get_array_module(*inputs)
        mask = (x == self.ignore_label)
        return xp.where(
            mask[..., None], 0, W.take(xp.where(mask, 0, x), axis=0)),

    return W.take(x, axis=0),
def forward(self, inputs):
    xp = cuda.get_array_module(inputs[0])
    self.input_length = inputs[0]

    # The length of path is (2 * label_length + 1)
    self.path_length = 2 * inputs[1] + 1

    batch_size = len(inputs[2])
    yseq_shape = (len(inputs) - 3,) + inputs[3].shape
    self.yseq = _softmax(xp.vstack(inputs[3::]).reshape(yseq_shape), xp)
    log_yseq = self.log_matrix(self.yseq, xp)
    self.path = _label_to_path(inputs[2], self.blank_symbol, xp)
    self.prob_trans = self.calc_trans(self.path, log_yseq, xp)

    loss = utils.force_array(xp.sum(
        _logsumexp(self.prob_trans[0], xp, axis=1)))
    loss /= -batch_size
    return loss,
def backward(self, inputs, gy):
    xp = cuda.get_array_module(*inputs)
    x0, x1, y = inputs
    x_dim = x0.shape[1]
    y = xp.repeat(y[:, None], x_dim, axis=1)
    alpha = gy[0] / y.shape[0]
    dist = xp.repeat(self.dist[:, None], x_dim, axis=1)

    # similar pair
    gx0 = alpha * y * self.diff
    # dissimilar pair
    mdist = xp.repeat(self.mdist[:, None], x_dim, axis=1)
    mdist_p = xp.array(mdist > 0, dtype=xp.int32)
    gx0 += alpha * (1 - y) * mdist_p * mdist * -(self.diff / dist)
    gx0 = gx0.astype(xp.float32)

    return gx0, -gx0, None
def backward(self, x, gy):
    xp = cuda.get_array_module(*x)
    gx = xp.empty_like(x[0])
    if self.axis is None:
        gx[:] = gy[0]
    else:
        gy = gy[0]
        actual_axis = []
        for axis in self.axis:
            if axis < 0:
                axis = len(gx.shape) + axis
            actual_axis.append(axis)
        for axis in sorted(actual_axis):
            gy = xp.expand_dims(gy, axis=axis)
        gx[:] = gy
    return gx,
def check_forward(self, t_data, xs_data, l_length, x_length):
    x = tuple(chainer.Variable(x_data) for x_data in xs_data)
    t = chainer.Variable(t_data)
    args = (x, t, self.blank_symbol)
    if self.use_length:
        args += (chainer.Variable(x_length), chainer.Variable(l_length))
    loss = functions.connectionist_temporal_classification(*args)
    loss_value = float(loss.data)

    # compute expected value by recursive computation.
    xp = cuda.get_array_module(self.x)
    xt = xp.swapaxes(self.x, 0, 1)
    for b in range(xt.shape[0]):
        for t in range(xt.shape[1]):
            xt[b][t] = numpy.exp(xt[b][t]) / numpy.sum(numpy.exp(xt[b][t]))
    loss_expect = 0
    batch_size = xt.shape[0]
    path_length = 2 * l_length + 1
    for xtb, lb, xlb, plb in zip(xt, self.l, x_length, path_length):
        loss_expect += -math.log(
            self.alpha(xtb, lb, int(xlb - 1), int(plb - 1)) +
            self.alpha(xtb, lb, int(xlb - 1), int(plb - 2)))
    loss_expect /= batch_size
    self.assertAlmostEqual(loss_expect, loss_value, places=5)
def check_backward(self, x_data, W_data, b_data, y_grad):
    xp = cuda.get_array_module(x_data)
    if not self.c_contiguous:
        x_data = xp.asfortranarray(x_data)
        W_data = xp.asfortranarray(W_data)
        y_grad = xp.asfortranarray(y_grad)
        self.assertFalse(x_data.flags.c_contiguous)
        self.assertFalse(W_data.flags.c_contiguous)
        self.assertFalse(y_grad.flags.c_contiguous)
        if b_data is not None:
            b = xp.empty((len(b_data) * 2,), dtype=self.b.dtype)
            b[::2] = b_data
            b_data = b[::2]
            self.assertFalse(b_data.flags.c_contiguous)

    args = (x_data, W_data)
    if b_data is not None:
        args = args + (b_data,)

    gradient_check.check_backward(
        convolution_2d.Convolution2DFunction(
            self.stride, self.pad, self.use_cudnn, self.cover_all),
        args, y_grad, eps=1e-2)
def check_backward(self, x_data, W_data, b_data, y_grad):
    xp = cuda.get_array_module(x_data)
    if not self.c_contiguous:
        x_data = xp.asfortranarray(x_data)
        W_data = xp.asfortranarray(W_data)
        y_grad = xp.asfortranarray(y_grad)
        self.assertFalse(x_data.flags.c_contiguous)
        self.assertFalse(W_data.flags.c_contiguous)
        self.assertFalse(y_grad.flags.c_contiguous)
        if b_data is not None:
            b = xp.empty((len(b_data) * 2,), dtype=self.b.dtype)
            b[::2] = b_data
            b_data = b[::2]
            self.assertFalse(b_data.flags.c_contiguous)

    args = (x_data, W_data)
    if b_data is not None:
        args = args + (b_data,)

    gradient_check.check_backward(
        deconvolution_2d.Deconvolution2DFunction(
            self.stride, self.pad, self.outsize, self.use_cudnn),
        args, y_grad, eps=1e-2)
def check_type_mismatch(self, x_data):
    xp = cuda.get_array_module(x_data)

    class DummyFunction(chainer.Function):
        label = 'dummy_function'

        def forward(self, inputs):
            return xp.array(1, np.float32),

        def backward(self, inputs, grads):
            return [1]

    x = chainer.Variable(x_data)
    y = DummyFunction()(x)
    with six.assertRaisesRegex(self, TypeError, 'dummy_function'):
        y.backward()
def check_dtype_mismatch(self, x_data):
    xp = cuda.get_array_module(x_data)

    class DummyFunction(chainer.Function):
        label = 'dummy_function'

        def forward(self, inputs):
            return xp.array(1, np.float32),

        def backward(self, inputs, grads):
            return xp.array([1], np.int32),

    x = chainer.Variable(x_data)
    y = DummyFunction()(x)
    with six.assertRaisesRegex(self, TypeError, 'dummy_function'):
        y.backward()
def check_shape_mismatch(self, x_data):
    xp = cuda.get_array_module(x_data)

    class DummyFunction(chainer.Function):
        label = 'dummy_function'

        def forward(self, inputs):
            return xp.array(1, np.float32),

        def backward(self, inputs, grads):
            return xp.array([1, 2], np.float32),

    x = chainer.Variable(x_data)
    y = DummyFunction()(x)
    with six.assertRaisesRegex(self, ValueError, 'dummy_function'):
        y.backward()
def check_traceback(self, x_data):
    xp = cuda.get_array_module(x_data)

    class DummyFunction(chainer.Function):
        label = 'dummy_function'

        def forward(self, inputs):
            return xp.array(1, np.float32),

        def backward(self, inputs, grads):
            return xp.array([1, 2], np.float32),

    x = chainer.Variable(x_data)
    line = inspect.currentframe().f_lineno + 1
    y = DummyFunction()(x)  # `line` is THIS line
    try:
        y.backward()
        self.fail()
    except ValueError as e:
        self.assertIn('Stacktrace', str(e))
        self.assertIn('line %d' % line, str(e))
def check_forward(self, f_data, f_p_data, l2_reg):
    xp = cuda.get_array_module(f_data)
    num_examples = len(f_data)

    f = chainer.Variable(f_data)
    f_p = chainer.Variable(f_p_data)
    loss = n_pair_mc_loss(f, f_p, l2_reg)

    loss_for_each = []
    for i in range(num_examples):
        exps = []
        for j in set(range(num_examples)) - {i}:
            exp_ij = xp.exp(f_data[i].dot(f_p_data[j]) -
                            f_data[i].dot(f_p_data[i]))
            exps.append(exp_ij)
        loss_i = xp.log(1.0 + sum(exps))
        loss_for_each.append(loss_i)
    loss_expected = xp.asarray(loss_for_each, dtype=np.float32).mean()

    testing.assert_allclose(loss.data, loss_expected, atol=1e-2)
def forward(self, inputs):
    xp = cuda.get_array_module(*inputs)
    anchor, positive, negative = inputs
    N = anchor.shape[0]

    def euclidean_d(v1, v2):
        return chainer.functions.sum(chainer.functions.math.sqrt((v1 - v2) ** 2), axis=1)

    d_ap = euclidean_d(anchor, positive)
    d_an = euclidean_d(anchor, negative)

    dist_p = chainer.functions.exp(d_ap) \
        / (chainer.functions.exp(d_ap)
           + chainer.functions.exp(d_an))

    loss = chainer.functions.sum(dist_p * dist_p) / N
    return xp.array(loss, dtype=numpy.float32),
def entropy_filter(self, x, b, ent_T):
    xp = cuda.get_array_module(b)
    eb = entropy(F.softmax(b)) / np.log(b.shape[1])
    eb.to_cpu()
    if hasattr(eb.data, 'get'):
        with cuda.get_device(eb.data):
            exited = eb.data < ent_T
        exited = exited.get()
    else:
        exited = eb.data < ent_T

    y_exit = []
    y_cont = []
    for i, idx in enumerate(exited):
        if idx:
            y_exit.append(b[i:i + 1])
        else:
            y_cont.append(x[i:i + 1])

    if len(y_exit) > 0:
        y_exit = F.vstack(y_exit)
    if len(y_cont) > 0:
        y_cont = F.vstack(y_cont)

    return y_exit, y_cont, exited
def backward_cpu(self, inputs, grad_outputs):
    x, V, g = inputs[:3]
    b = inputs[3] if len(inputs) == 4 else None

    if b is None:
        gb = None
        gx, gW = super(Convolution2DFunction, self).backward_cpu((x, self.W), grad_outputs)
    else:
        gx, gW, gb = super(Convolution2DFunction, self).backward_cpu((x, self.W, b), grad_outputs)

    xp = cuda.get_array_module(x)
    gg = xp.sum(gW * self.normalizedV, axis=(1, 2, 3), keepdims=True).astype(g.dtype, copy=False)
    gV = g * (gW - gg * self.normalizedV) / self.normV
    gV = gV.astype(V.dtype, copy=False)

    if b is None:
        return gx, gV, gg
    else:
        return gx, gV, gg, gb
def backward_cpu(self, inputs, grad_outputs):
    x, V, g = inputs[:3]
    b = inputs[3] if len(inputs) == 4 else None

    if b is None:
        gb = None
        gx, gW = super(Deconvolution2DFunction, self).backward_cpu((x, self.W), grad_outputs)
    else:
        gx, gW, gb = super(Deconvolution2DFunction, self).backward_cpu((x, self.W, b), grad_outputs)

    xp = cuda.get_array_module(x)
    gg = xp.sum(gW * self.normalizedV, axis=(0, 2, 3), keepdims=True).astype(g.dtype, copy=False)
    gV = g * (gW - gg * self.normalizedV) / self.normV
    gV = gV.astype(V.dtype, copy=False)

    if b is None:
        return gx, gV, gg
    else:
        return gx, gV, gg, gb
def _enumerate_shifted_anchor(anchor_base, feat_stride, height, width):
    # Enumerate all shifted anchors:
    #
    # add A anchors (1, A, 4) to
    # cell K shifts (K, 1, 4) to get
    # shift anchors (K, A, 4)
    # reshape to (K*A, 4) shifted anchors
    xp = cuda.get_array_module(anchor_base)
    shift_y = xp.arange(0, height * feat_stride, feat_stride)
    shift_x = xp.arange(0, width * feat_stride, feat_stride)
    shift_x, shift_y = xp.meshgrid(shift_x, shift_y)
    shift = xp.stack((shift_y.ravel(), shift_x.ravel(),
                      shift_y.ravel(), shift_x.ravel()), axis=1)

    A = anchor_base.shape[0]
    K = shift.shape[0]
    anchor = anchor_base.reshape((1, A, 4)) + \
        shift.reshape((1, K, 4)).transpose((1, 0, 2))
    anchor = anchor.reshape((K * A, 4)).astype(np.float32)
    return anchor
def add_noise(h, test, sigma=0.2):
    xp = cuda.get_array_module(h.data)
    if test:
        return h
    else:
        return h + sigma * xp.random.randn(*h.data.shape)
def multi_overlap(x1, len1, x2, len2):
    len1_half = len1 / 2
    len2_half = len2 / 2

    xp = cuda.get_array_module(x1)
    left = xp.maximum(x1 - len1_half, x2 - len2_half)
    right = xp.minimum(x1 + len1_half, x2 + len2_half)

    return right - left
def multi_box_intersection(a, b):
    w = multi_overlap(a.x, a.w, b.x, b.w)
    h = multi_overlap(a.y, a.h, b.y, b.h)
    xp = cuda.get_array_module(w)
    zeros = xp.zeros_like(w)

    w = xp.maximum(w, zeros)
    h = xp.maximum(h, zeros)

    area = w * h
    return area
def forward(self, inputs):
    xp = cuda.get_array_module(*inputs)
    y, t = inputs

    # Assert arrays have the same shape
    if t.shape != y.shape:
        raise ValueError("Input arrays have different shapes")

    # Computing nDCG on empty array should just return 0.0
    if t.shape[0] == 0:
        return xp.asarray(0.0),

    # Compute predicted indices by arg sorting
    predicted_indices = xp.argsort(y)
    best_indices = xp.argsort(t)

    # Predicted and theoretically best relevance labels
    predicted_relevance = xp.flip(t[predicted_indices], axis=0)
    best_relevance = xp.flip(t[best_indices], axis=0)

    # Compute needed statistics
    length = predicted_relevance.shape[0]
    arange = xp.arange(length)
    last = min(self.k, length)
    if last < 1:
        last = length

    # Compute regular DCG
    dcg_numerator = 2 ** predicted_relevance[:last] - 1
    dcg_denominator = xp.log2(arange[:last] + 2)
    dcg = xp.sum(dcg_numerator / dcg_denominator)

    # Compute iDCG for normalization
    idcg_numerator = (2 ** best_relevance[:last] - 1)
    idcg_denominator = (xp.log2(arange[:last] + 2))
    idcg = xp.sum(idcg_numerator / idcg_denominator)

    if idcg == 0.0:
        return xp.asarray(1.0),

    return xp.asarray(dcg / idcg),
def forward(self, inputs):
    xp = cuda.get_array_module(*inputs)
    x, = inputs
    m = x.max(axis=0, keepdims=True)
    y = x - m
    xp.exp(y, out=y)
    y_sum = xp.flip(xp.cumsum(xp.flip(y, axis=0)), axis=0)
    self.y = xp.transpose(xp.asarray(xp.log(y_sum) + m))
    return self.y,
def backward(self, inputs, grads):
    xp = cuda.get_array_module(*inputs)
    x, = inputs
    gy, = grads
    y = self.y

    gx = gy * xp.exp(x) * xp.cumsum(xp.exp(-y), axis=0)
    return gx,
def _pl_sample(t, α):
    """
    Sample from the plackett luce distribution directly

    :param t: The target labels
    :return: A random permutation from the plackett-luce distribution
             parameterized by the target labels
    """
    xp = cuda.get_array_module(t)
    t = t[:, 0]

    probs = xp.exp(t * α)
    probs /= xp.sum(probs)
    return xp.random.choice(probs.shape[0], probs.shape[0], replace=False,
                            p=probs)
def __init__(self, q_values, q_values_formatter=lambda x: x):
    assert isinstance(q_values, chainer.Variable)
    self.xp = cuda.get_array_module(q_values.data)
    self.q_values = q_values
    self.n_actions = q_values.data.shape[1]
    self.q_values_formatter = q_values_formatter
def __init__(self, mu, mat, v, min_action=None, max_action=None):
    self.xp = cuda.get_array_module(mu.data)
    self.mu = mu
    self.mat = mat
    self.v = v
    if min_action is None:
        self.min_action = None
    else:
        self.min_action = self.xp.asarray(min_action, dtype=np.float32)
    if max_action is None:
        self.max_action = None
    else:
        self.max_action = self.xp.asarray(max_action, dtype=np.float32)
    self.batch_size = self.mu.data.shape[0]