Source: owl_utils_conv.ml (p.owl-base.0.3.8.doc.src.owl-base)

# 1 "src/base/misc/owl_utils_conv.ml"
(*
 * OWL - an OCaml numerical library for scientific computing
 * Copyright (c) 2016-2018 Liang Wang <liang.wang@cl.cam.ac.uk>
 *)

open Owl_types


(* This module contains helper functions for ndarray convolution functions. *)


(* Per-axis helpers shared by the 1d, 2d and 3d functions below. *)

(* Output size of a convolution along a single axis.

   [SAME]  gives ceil (input / stride); [kernel] is not used in this case.
   [VALID] gives ceil ((input - kernel + 1) / stride).

   The division is carried out on floats and the result is rounded up with
   [ceil]. [stride] is expected to be positive: with a zero stride the float
   division yields infinity or nan, for which the result of [int_of_float]
   is unspecified. *)
let calc_conv_output_dim padding input kernel stride =
  let input = float_of_int input in
  let kernel = float_of_int kernel in
  let stride = float_of_int stride in
  match padding with
  | SAME  -> (input /. stride) |> ceil |> int_of_float
  | VALID -> ((input -. kernel +. 1.) /. stride) |> ceil |> int_of_float


(* Output size of a transpose convolution along a single axis.

   [SAME]  gives input * stride.
   [VALID] gives input * stride + max (kernel - stride) 0. *)
let calc_transpose_conv_output_dim padding input kernel stride =
  match padding with
  | SAME  -> input * stride
  | VALID -> input * stride + (max (kernel - stride) 0)


(* Padding along a single axis, returned as [(before, after)].

   The total padding is max ((output - 1) * stride + kernel - input) 0.
   It is split by integer division, so when the total is odd the extra
   element goes to [after]. *)
let calc_conv_padding_dim input kernel output stride =
  let pad_total = max ((output - 1) * stride + kernel - input) 0 in
  let pad_before = pad_total / 2 in
  pad_before, pad_total - pad_before


(* calculate the output shape of [conv2d] given input and kernel and stride.
   Note the argument order: sizes are passed columns first, strides are
   passed rows first. Returns [(output_cols, output_rows)]. *)
let calc_conv2d_output_shape
  padding input_cols input_rows kernel_cols kernel_rows row_stride col_stride
  =
  let output_cols =
    calc_conv_output_dim padding input_cols kernel_cols col_stride in
  let output_rows =
    calc_conv_output_dim padding input_rows kernel_rows row_stride in
  (output_cols, output_rows)


(* calculate the output shape of [transpose_conv2d] given input and kernel and
   stride. Returns [(output_cols, output_rows)]. *)
let calc_transpose_conv2d_output_shape
  padding input_cols input_rows kernel_cols kernel_rows row_stride col_stride
  =
  let output_cols =
    calc_transpose_conv_output_dim padding input_cols kernel_cols col_stride in
  let output_rows =
    calc_transpose_conv_output_dim padding input_rows kernel_rows row_stride in
  (output_cols, output_rows)


(* calculate the padding size along width and height.
   Returns [(pad_top, pad_left, pad_bottom, pad_right)]; when the padding
   along an axis is odd, the extra element goes to the bottom / right. *)
let calc_conv2d_padding
  input_cols input_rows kernel_cols kernel_rows output_cols output_rows
  row_stride col_stride
  =
  let pad_top, pad_bottom =
    calc_conv_padding_dim input_rows kernel_rows output_rows row_stride in
  let pad_left, pad_right =
    calc_conv_padding_dim input_cols kernel_cols output_cols col_stride in
  pad_top, pad_left, pad_bottom, pad_right


(* calc_conv1d_output_shape actually calls its 2d version, with a single row,
   a single-row kernel and a row stride of 1, and keeps the column size. *)
let calc_conv1d_output_shape padding input_cols kernel_cols col_stride =
  let input_rows = 1 in
  let kernel_rows = 1 in
  let row_stride = 1 in
  calc_conv2d_output_shape padding input_cols input_rows kernel_cols kernel_rows row_stride col_stride
  |> fst


(* calc_transpose_conv1d_output_shape actually calls its 2d version, with a
   single row, a single-row kernel and a row stride of 1, and keeps the
   column size. *)
let calc_transpose_conv1d_output_shape padding input_cols kernel_cols col_stride =
  let input_rows = 1 in
  let kernel_rows = 1 in
  let row_stride = 1 in
  calc_transpose_conv2d_output_shape padding input_cols input_rows kernel_cols kernel_rows row_stride col_stride
  |> fst


(* calculate the output shape of [conv3d] given input and kernel and stride.
   Sizes are passed in the order columns, rows, depths; strides in the order
   rows, columns, depths. Returns [(output_cols, output_rows, output_dpts)]. *)
let calc_conv3d_output_shape
  padding input_cols input_rows input_dpts kernel_cols kernel_rows kernel_dpts
  row_stride col_stride dpt_stride
  =
  let output_cols =
    calc_conv_output_dim padding input_cols kernel_cols col_stride in
  let output_rows =
    calc_conv_output_dim padding input_rows kernel_rows row_stride in
  let output_dpts =
    calc_conv_output_dim padding input_dpts kernel_dpts dpt_stride in
  (output_cols, output_rows, output_dpts)


(* calculate the output shape of [transpose_conv3d] given input and kernel and
   stride. Returns [(output_cols, output_rows, output_dpts)]. *)
let calc_transpose_conv3d_output_shape
  padding input_cols input_rows input_dpts kernel_cols kernel_rows kernel_dpts
  row_stride col_stride dpt_stride
  =
  let output_cols =
    calc_transpose_conv_output_dim padding input_cols kernel_cols col_stride in
  let output_rows =
    calc_transpose_conv_output_dim padding input_rows kernel_rows row_stride in
  let output_dpts =
    calc_transpose_conv_output_dim padding input_dpts kernel_dpts dpt_stride in
  (output_cols, output_rows, output_dpts)


(* calculate the padding size along width, height, and depth.
   Returns [(pad_top, pad_left, pad_shallow, pad_bottom, pad_right, pad_deep)];
   when the padding along an axis is odd, the extra element goes to the
   bottom / right / deep side. *)
let calc_conv3d_padding
  input_cols input_rows input_depth kernel_cols kernel_rows kernel_depth
  output_cols output_rows output_depth row_stride col_stride depth_stride
  =
  let pad_top, pad_bottom =
    calc_conv_padding_dim input_rows kernel_rows output_rows row_stride in
  let pad_left, pad_right =
    calc_conv_padding_dim input_cols kernel_cols output_cols col_stride in
  let pad_shallow, pad_deep =
    calc_conv_padding_dim input_depth kernel_depth output_depth depth_stride in
  pad_top, pad_left, pad_shallow, pad_bottom, pad_right, pad_deep