From 1741ed0ab57fbd51e5ad3fb5508f30b66b8a0da9 Mon Sep 17 00:00:00 2001 From: Anatoly Baksheev Date: Thu, 5 Jul 2018 18:45:41 +0300 Subject: [PATCH 1/8] formatting, if name == main --- convert_torch.py | 230 ++++++++++++++++++++++++----------------------- 1 file changed, 119 insertions(+), 111 deletions(-) diff --git a/convert_torch.py b/convert_torch.py index b639f73..62ec8fc 100644 --- a/convert_torch.py +++ b/convert_torch.py @@ -14,6 +14,7 @@ from torch.autograd import Variable from torch.utils.serialization import load_lua + class LambdaBase(nn.Sequential): def __init__(self, fn, *args): super(LambdaBase, self).__init__(*args) @@ -25,134 +26,139 @@ def forward_prepare(self, input): output.append(module(input)) return output if output else input + class Lambda(LambdaBase): def forward(self, input): return self.lambda_func(self.forward_prepare(input)) + class LambdaMap(LambdaBase): def forward(self, input): # result is Variables list [Variable1, Variable2, ...] - return list(map(self.lambda_func,self.forward_prepare(input))) + return list(map(self.lambda_func, self.forward_prepare(input))) + class LambdaReduce(LambdaBase): def forward(self, input): # result is a Variable - return reduce(self.lambda_func,self.forward_prepare(input)) + return reduce(self.lambda_func, self.forward_prepare(input)) -def copy_param(m,n): +def copy_param(m, n): if m.weight is not None: n.weight.data.copy_(m.weight) if m.bias is not None: n.bias.data.copy_(m.bias) - if hasattr(n,'running_mean'): n.running_mean.copy_(m.running_mean) - if hasattr(n,'running_var'): n.running_var.copy_(m.running_var) + if hasattr(n, 'running_mean'): n.running_mean.copy_(m.running_mean) + if hasattr(n, 'running_var'): n.running_var.copy_(m.running_var) + def add_submodule(seq, *args): for n in args: - seq.add_module(str(len(seq._modules)),n) + seq.add_module(str(len(seq._modules)), n) + -def lua_recursive_model(module,seq): +def lua_recursive_model(module, seq): for m in module.modules: name = type(m).__name__ real = m if name == 'TorchObject': - name = m._typename.replace('cudnn.','') + name = m._typename.replace('cudnn.', '') m = m._obj if name == 'SpatialConvolution' or name == 'nn.SpatialConvolutionMM': - if not hasattr(m,'groups') or m.groups is None: m.groups=1 - n = nn.Conv2d(m.nInputPlane,m.nOutputPlane,(m.kW,m.kH),(m.dW,m.dH),(m.padW,m.padH),1,m.groups,bias=(m.bias is not None)) - copy_param(m,n) - add_submodule(seq,n) + if not hasattr(m, 'groups') or m.groups is None: m.groups = 1 + n = nn.Conv2d(m.nInputPlane, m.nOutputPlane, (m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), 1, m.groups, bias=(m.bias is not None)) + copy_param(m, n) + add_submodule(seq, n) elif name == 'SpatialBatchNormalization': n = nn.BatchNorm2d(m.running_mean.size(0), m.eps, m.momentum, m.affine) - copy_param(m,n) - add_submodule(seq,n) + copy_param(m, n) + add_submodule(seq, n) elif name == 'VolumetricBatchNormalization': n = nn.BatchNorm3d(m.running_mean.size(0), m.eps, m.momentum, m.affine) copy_param(m, n) add_submodule(seq, n) elif name == 'ReLU': n = nn.ReLU() - add_submodule(seq,n) + add_submodule(seq, n) elif name == 'Sigmoid': n = nn.Sigmoid() - add_submodule(seq,n) + add_submodule(seq, n) elif name == 'SpatialMaxPooling': - n = nn.MaxPool2d((m.kW,m.kH),(m.dW,m.dH),(m.padW,m.padH),ceil_mode=m.ceil_mode) - add_submodule(seq,n) + n = nn.MaxPool2d((m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), ceil_mode=m.ceil_mode) + add_submodule(seq, n) elif name == 'SpatialAveragePooling': - n = 
nn.AvgPool2d((m.kW,m.kH),(m.dW,m.dH),(m.padW,m.padH),ceil_mode=m.ceil_mode) - add_submodule(seq,n) + n = nn.AvgPool2d((m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), ceil_mode=m.ceil_mode) + add_submodule(seq, n) elif name == 'SpatialUpSamplingNearest': n = nn.UpsamplingNearest2d(scale_factor=m.scale_factor) - add_submodule(seq,n) + add_submodule(seq, n) elif name == 'View': - n = Lambda(lambda x: x.view(x.size(0),-1)) - add_submodule(seq,n) + n = Lambda(lambda x: x.view(x.size(0), -1)) + add_submodule(seq, n) elif name == 'Reshape': - n = Lambda(lambda x: x.view(x.size(0),-1)) - add_submodule(seq,n) + n = Lambda(lambda x: x.view(x.size(0), -1)) + add_submodule(seq, n) elif name == 'Linear': # Linear in pytorch only accept 2D input - n1 = Lambda(lambda x: x.view(1,-1) if 1==len(x.size()) else x ) - n2 = nn.Linear(m.weight.size(1),m.weight.size(0),bias=(m.bias is not None)) - copy_param(m,n2) - n = nn.Sequential(n1,n2) - add_submodule(seq,n) + n1 = Lambda(lambda x: x.view(1, -1) if 1 == len(x.size()) else x) + n2 = nn.Linear(m.weight.size(1), m.weight.size(0), bias=(m.bias is not None)) + copy_param(m, n2) + n = nn.Sequential(n1, n2) + add_submodule(seq, n) elif name == 'Dropout': m.inplace = False n = nn.Dropout(m.p) - add_submodule(seq,n) + add_submodule(seq, n) elif name == 'SoftMax': n = nn.Softmax() - add_submodule(seq,n) + add_submodule(seq, n) elif name == 'Identity': - n = Lambda(lambda x: x) # do nothing - add_submodule(seq,n) + n = Lambda(lambda x: x) # do nothing + add_submodule(seq, n) elif name == 'SpatialFullConvolution': - n = nn.ConvTranspose2d(m.nInputPlane,m.nOutputPlane,(m.kW,m.kH),(m.dW,m.dH),(m.padW,m.padH),(m.adjW,m.adjH)) - copy_param(m,n) - add_submodule(seq,n) + n = nn.ConvTranspose2d(m.nInputPlane, m.nOutputPlane, (m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), (m.adjW, m.adjH)) + copy_param(m, n) + add_submodule(seq, n) elif name == 'VolumetricFullConvolution': - n = nn.ConvTranspose3d(m.nInputPlane,m.nOutputPlane,(m.kT,m.kW,m.kH),(m.dT,m.dW,m.dH),(m.padT,m.padW,m.padH),(m.adjT,m.adjW,m.adjH),m.groups) - copy_param(m,n) + n = nn.ConvTranspose3d(m.nInputPlane, m.nOutputPlane, (m.kT, m.kW, m.kH), (m.dT, m.dW, m.dH), (m.padT, m.padW, m.padH), (m.adjT, m.adjW, m.adjH), m.groups) + copy_param(m, n) add_submodule(seq, n) elif name == 'SpatialReplicationPadding': - n = nn.ReplicationPad2d((m.pad_l,m.pad_r,m.pad_t,m.pad_b)) - add_submodule(seq,n) + n = nn.ReplicationPad2d((m.pad_l, m.pad_r, m.pad_t, m.pad_b)) + add_submodule(seq, n) elif name == 'SpatialReflectionPadding': - n = nn.ReflectionPad2d((m.pad_l,m.pad_r,m.pad_t,m.pad_b)) - add_submodule(seq,n) + n = nn.ReflectionPad2d((m.pad_l, m.pad_r, m.pad_t, m.pad_b)) + add_submodule(seq, n) elif name == 'Copy': - n = Lambda(lambda x: x) # do nothing - add_submodule(seq,n) + n = Lambda(lambda x: x) # do nothing + add_submodule(seq, n) elif name == 'Narrow': - n = Lambda(lambda x,a=(m.dimension,m.index,m.length): x.narrow(*a)) - add_submodule(seq,n) + n = Lambda(lambda x, a=(m.dimension, m.index, m.length): x.narrow(*a)) + add_submodule(seq, n) elif name == 'SpatialCrossMapLRN': - lrn = lnn.SpatialCrossMapLRN(m.size,m.alpha,m.beta,m.k) - n = Lambda(lambda x,lrn=lrn: Variable(lrn.forward(x.data))) - add_submodule(seq,n) + lrn = lnn.SpatialCrossMapLRN(m.size, m.alpha, m.beta, m.k) + n = Lambda(lambda x, lrn=lrn: Variable(lrn.forward(x.data))) + add_submodule(seq, n) elif name == 'Sequential': n = nn.Sequential() - lua_recursive_model(m,n) - add_submodule(seq,n) - elif name == 'ConcatTable': # output is list + 
lua_recursive_model(m, n) + add_submodule(seq, n) + elif name == 'ConcatTable': # output is list n = LambdaMap(lambda x: x) - lua_recursive_model(m,n) - add_submodule(seq,n) - elif name == 'CAddTable': # input is list - n = LambdaReduce(lambda x,y: x+y) - add_submodule(seq,n) + lua_recursive_model(m, n) + add_submodule(seq, n) + elif name == 'CAddTable': # input is list + n = LambdaReduce(lambda x, y: x + y) + add_submodule(seq, n) elif name == 'Concat': dim = m.dimension - n = LambdaReduce(lambda x,y,dim=dim: torch.cat((x,y),dim)) - lua_recursive_model(m,n) - add_submodule(seq,n) + n = LambdaReduce(lambda x, y, dim=dim: torch.cat((x, y), dim)) + lua_recursive_model(m, n) + add_submodule(seq, n) elif name == 'TorchObject': - print('Not Implement',name,real._typename) + print('Not Implement', name, real._typename) else: - print('Not Implement',name) + print('Not Implement', name) def lua_recursive_source(module): @@ -161,13 +167,13 @@ def lua_recursive_source(module): name = type(m).__name__ real = m if name == 'TorchObject': - name = m._typename.replace('cudnn.','') + name = m._typename.replace('cudnn.', '') m = m._obj if name == 'SpatialConvolution' or name == 'nn.SpatialConvolutionMM': - if not hasattr(m,'groups') or m.groups is None: m.groups=1 + if not hasattr(m, 'groups') or m.groups is None: m.groups = 1 s += ['nn.Conv2d({},{},{},{},{},{},{},bias={}),#Conv2d'.format(m.nInputPlane, - m.nOutputPlane,(m.kW,m.kH),(m.dW,m.dH),(m.padW,m.padH),1,m.groups,m.bias is not None)] + m.nOutputPlane, (m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), 1, m.groups, m.bias is not None)] elif name == 'SpatialBatchNormalization': s += ['nn.BatchNorm2d({},{},{},{}),#BatchNorm2d'.format(m.running_mean.size(0), m.eps, m.momentum, m.affine)] elif name == 'VolumetricBatchNormalization': @@ -177,9 +183,9 @@ def lua_recursive_source(module): elif name == 'Sigmoid': s += ['nn.Sigmoid()'] elif name == 'SpatialMaxPooling': - s += ['nn.MaxPool2d({},{},{},ceil_mode={}),#MaxPool2d'.format((m.kW,m.kH),(m.dW,m.dH),(m.padW,m.padH),m.ceil_mode)] + s += ['nn.MaxPool2d({},{},{},ceil_mode={}),#MaxPool2d'.format((m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), m.ceil_mode)] elif name == 'SpatialAveragePooling': - s += ['nn.AvgPool2d({},{},{},ceil_mode={}),#AvgPool2d'.format((m.kW,m.kH),(m.dW,m.dH),(m.padW,m.padH),m.ceil_mode)] + s += ['nn.AvgPool2d({},{},{},ceil_mode={}),#AvgPool2d'.format((m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), m.ceil_mode)] elif name == 'SpatialUpSamplingNearest': s += ['nn.UpsamplingNearest2d(scale_factor={})'.format(m.scale_factor)] elif name == 'View': @@ -188,8 +194,8 @@ def lua_recursive_source(module): s += ['Lambda(lambda x: x.view(x.size(0),-1)), # Reshape'] elif name == 'Linear': s1 = 'Lambda(lambda x: x.view(1,-1) if 1==len(x.size()) else x )' - s2 = 'nn.Linear({},{},bias={})'.format(m.weight.size(1),m.weight.size(0),(m.bias is not None)) - s += ['nn.Sequential({},{}),#Linear'.format(s1,s2)] + s2 = 'nn.Linear({},{},bias={})'.format(m.weight.size(1), m.weight.size(0), (m.bias is not None)) + s += ['nn.Sequential({},{}),#Linear'.format(s1, s2)] elif name == 'Dropout': s += ['nn.Dropout({})'.format(m.p)] elif name == 'SoftMax': @@ -198,20 +204,21 @@ def lua_recursive_source(module): s += ['Lambda(lambda x: x), # Identity'] elif name == 'SpatialFullConvolution': s += ['nn.ConvTranspose2d({},{},{},{},{},{})'.format(m.nInputPlane, - m.nOutputPlane,(m.kW,m.kH),(m.dW,m.dH),(m.padW,m.padH),(m.adjW,m.adjH))] + m.nOutputPlane, (m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), (m.adjW, m.adjH))] elif name == 
'VolumetricFullConvolution': s += ['nn.ConvTranspose3d({},{},{},{},{},{},{})'.format(m.nInputPlane, - m.nOutputPlane,(m.kT,m.kW,m.kH),(m.dT,m.dW,m.dH),(m.padT,m.padW,m.padH),(m.adjT,m.adjW,m.adjH),m.groups)] + m.nOutputPlane, (m.kT, m.kW, m.kH), (m.dT, m.dW, m.dH), (m.padT, m.padW, m.padH), (m.adjT, m.adjW, m.adjH), + m.groups)] elif name == 'SpatialReplicationPadding': - s += ['nn.ReplicationPad2d({})'.format((m.pad_l,m.pad_r,m.pad_t,m.pad_b))] + s += ['nn.ReplicationPad2d({})'.format((m.pad_l, m.pad_r, m.pad_t, m.pad_b))] elif name == 'SpatialReflectionPadding': - s += ['nn.ReflectionPad2d({})'.format((m.pad_l,m.pad_r,m.pad_t,m.pad_b))] + s += ['nn.ReflectionPad2d({})'.format((m.pad_l, m.pad_r, m.pad_t, m.pad_b))] elif name == 'Copy': s += ['Lambda(lambda x: x), # Copy'] elif name == 'Narrow': - s += ['Lambda(lambda x,a={}: x.narrow(*a))'.format((m.dimension,m.index,m.length))] + s += ['Lambda(lambda x,a={}: x.narrow(*a))'.format((m.dimension, m.index, m.length))] elif name == 'SpatialCrossMapLRN': - lrn = 'lnn.SpatialCrossMapLRN(*{})'.format((m.size,m.alpha,m.beta,m.k)) + lrn = 'lnn.SpatialCrossMapLRN(*{})'.format((m.size, m.alpha, m.beta, m.k)) s += ['Lambda(lambda x,lrn={}: Variable(lrn.forward(x.data)))'.format(lrn)] elif name == 'Sequential': @@ -231,33 +238,35 @@ def lua_recursive_source(module): s += [')'] else: s += '# ' + name + ' Not Implement,\n' - s = map(lambda x: '\t{}'.format(x),s) + s = map(lambda x: '\t{}'.format(x), s) return s + def simplify_source(s): - s = map(lambda x: x.replace(',(1, 1),(0, 0),1,1,bias=True),#Conv2d',')'),s) - s = map(lambda x: x.replace(',(0, 0),1,1,bias=True),#Conv2d',')'),s) - s = map(lambda x: x.replace(',1,1,bias=True),#Conv2d',')'),s) - s = map(lambda x: x.replace(',bias=True),#Conv2d',')'),s) - s = map(lambda x: x.replace('),#Conv2d',')'),s) - s = map(lambda x: x.replace(',1e-05,0.1,True),#BatchNorm2d',')'),s) - s = map(lambda x: x.replace('),#BatchNorm2d',')'),s) - s = map(lambda x: x.replace(',(0, 0),ceil_mode=False),#MaxPool2d',')'),s) - s = map(lambda x: x.replace(',ceil_mode=False),#MaxPool2d',')'),s) - s = map(lambda x: x.replace('),#MaxPool2d',')'),s) - s = map(lambda x: x.replace(',(0, 0),ceil_mode=False),#AvgPool2d',')'),s) - s = map(lambda x: x.replace(',ceil_mode=False),#AvgPool2d',')'),s) - s = map(lambda x: x.replace(',bias=True)),#Linear',')), # Linear'),s) - s = map(lambda x: x.replace(')),#Linear',')), # Linear'),s) - - s = map(lambda x: '{},\n'.format(x),s) - s = map(lambda x: x[1:],s) - s = reduce(lambda x,y: x+y, s) + s = map(lambda x: x.replace(',(1, 1),(0, 0),1,1,bias=True),#Conv2d', ')'), s) + s = map(lambda x: x.replace(',(0, 0),1,1,bias=True),#Conv2d', ')'), s) + s = map(lambda x: x.replace(',1,1,bias=True),#Conv2d', ')'), s) + s = map(lambda x: x.replace(',bias=True),#Conv2d', ')'), s) + s = map(lambda x: x.replace('),#Conv2d', ')'), s) + s = map(lambda x: x.replace(',1e-05,0.1,True),#BatchNorm2d', ')'), s) + s = map(lambda x: x.replace('),#BatchNorm2d', ')'), s) + s = map(lambda x: x.replace(',(0, 0),ceil_mode=False),#MaxPool2d', ')'), s) + s = map(lambda x: x.replace(',ceil_mode=False),#MaxPool2d', ')'), s) + s = map(lambda x: x.replace('),#MaxPool2d', ')'), s) + s = map(lambda x: x.replace(',(0, 0),ceil_mode=False),#AvgPool2d', ')'), s) + s = map(lambda x: x.replace(',ceil_mode=False),#AvgPool2d', ')'), s) + s = map(lambda x: x.replace(',bias=True)),#Linear', ')), # Linear'), s) + s = map(lambda x: x.replace(')),#Linear', ')), # Linear'), s) + + s = map(lambda x: '{},\n'.format(x), s) + s = map(lambda x: x[1:], s) 
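
The generated source leans on the Lambda helpers defined at the top of this file; a minimal sketch of that idiom, where a Torch ConcatTable feeding a CAddTable becomes LambdaMap plus LambdaReduce (class bodies copied from above; the two Linear layers and the input shape are purely illustrative):

    import torch
    import torch.nn as nn
    from functools import reduce

    # Helper classes as defined in convert_torch.py above.
    class LambdaBase(nn.Sequential):
        def __init__(self, fn, *args):
            super(LambdaBase, self).__init__(*args)
            self.lambda_func = fn

        def forward_prepare(self, input):
            output = [module(input) for module in self._modules.values()]
            return output if output else input

    class LambdaMap(LambdaBase):
        def forward(self, input):
            # apply lambda_func to each branch output
            return list(map(self.lambda_func, self.forward_prepare(input)))

    class LambdaReduce(LambdaBase):
        def forward(self, input):
            # fold the branch outputs into a single tensor
            return reduce(self.lambda_func, self.forward_prepare(input))

    # ConcatTable -> two parallel branches; CAddTable -> elementwise sum.
    branches = LambdaMap(lambda x: x, nn.Linear(4, 4), nn.Linear(4, 4))
    cadd = LambdaReduce(lambda x, y: x + y)
    out = cadd(branches(torch.randn(2, 4)))  # shape: (2, 4)
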
+ s = reduce(lambda x, y: x + y, s) return s -def torch_to_pytorch(t7_filename,outputname=None): - model = load_lua(t7_filename,unknown_classes=True) - if type(model).__name__=='hashable_uniq_dict': model=model.model + +def torch_to_pytorch(t7_filename, outputname=None): + model = load_lua(t7_filename, unknown_classes=True) + if type(model).__name__ == 'hashable_uniq_dict': model = model.model model.gradInput = None slist = lua_recursive_source(lnn.Sequential().add(model)) s = simplify_source(slist) @@ -292,23 +301,22 @@ class LambdaReduce(LambdaBase): def forward(self, input): return reduce(self.lambda_func,self.forward_prepare(input)) ''' - varname = t7_filename.replace('.t7','').replace('.','_').replace('-','_') - s = '{}\n\n{} = {}'.format(header,varname,s[:-2]) + varname = t7_filename.replace('.t7', '').replace('.', '_').replace('-', '_') + s = '{}\n\n{} = {}'.format(header, varname, s[:-2]) - if outputname is None: outputname=varname - with open(outputname+'.py', "w") as pyfile: + if outputname is None: outputname = varname + with open(outputname + '.py', "w") as pyfile: pyfile.write(s) n = nn.Sequential() - lua_recursive_model(model,n) - torch.save(n.state_dict(),outputname+'.pth') + lua_recursive_model(model, n) + torch.save(n.state_dict(), outputname + '.pth') -parser = argparse.ArgumentParser(description='Convert torch t7 model to pytorch') -parser.add_argument('--model','-m', type=str, required=True, - help='torch model file in t7 format') -parser.add_argument('--output', '-o', type=str, default=None, - help='output file name prefix, xxx.py xxx.pth') -args = parser.parse_args() +if __name__ == '__main__': + parser = argparse.ArgumentParser(description='Convert torch t7 model to pytorch') + parser.add_argument('--model', '-m', type=str, required=True, help='torch model file in t7 format') + parser.add_argument('--output', '-o', type=str, default=None, help='output file name prefix, xxx.py xxx.pth') + args = parser.parse_args() -torch_to_pytorch(args.model,args.output) + torch_to_pytorch(args.model, args.output) From b0ee72c35b42d0279ccbae116c7f927d2d41df0e Mon Sep 17 00:00:00 2001 From: Anatoly Baksheev Date: Fri, 6 Jul 2018 11:53:24 +0300 Subject: [PATCH 2/8] formatting --- convert_torch.py | 42 +++++++++--------------------------------- header.py | 0 2 files changed, 9 insertions(+), 33 deletions(-) create mode 100644 header.py diff --git a/convert_torch.py b/convert_torch.py index 62ec8fc..84d8545 100644 --- a/convert_torch.py +++ b/convert_torch.py @@ -14,41 +14,18 @@ from torch.autograd import Variable from torch.utils.serialization import load_lua - -class LambdaBase(nn.Sequential): - def __init__(self, fn, *args): - super(LambdaBase, self).__init__(*args) - self.lambda_func = fn - - def forward_prepare(self, input): - output = [] - for module in self._modules.values(): - output.append(module(input)) - return output if output else input - - -class Lambda(LambdaBase): - def forward(self, input): - return self.lambda_func(self.forward_prepare(input)) - - -class LambdaMap(LambdaBase): - def forward(self, input): - # result is Variables list [Variable1, Variable2, ...] 
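
copy_param is the single funnel through which every converted layer receives its trained values, so the hasattr guards introduced in this patch matter for layers without a bias or running statistics. A minimal usage sketch, with two nn.Conv2d modules standing in for a loaded Lua layer and its freshly built PyTorch counterpart:

    import torch
    import torch.nn as nn

    def copy_param(m, n):
        # As in convert_torch.py: weights, optional bias, optional BN statistics.
        if m.weight is not None:
            n.weight.data.copy_(m.weight)
        if hasattr(m, 'bias') and m.bias is not None:
            n.bias.data.copy_(m.bias)
        if hasattr(n, 'running_mean'):
            n.running_mean.copy_(m.running_mean)
        if hasattr(n, 'running_var'):
            n.running_var.copy_(m.running_var)

    src = nn.Conv2d(3, 8, 3)  # stands in for the module read via load_lua
    dst = nn.Conv2d(3, 8, 3)
    copy_param(src, dst)
    assert torch.equal(src.weight.data, dst.weight.data)
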
- return list(map(self.lambda_func, self.forward_prepare(input))) - - -class LambdaReduce(LambdaBase): - def forward(self, input): - # result is a Variable - return reduce(self.lambda_func, self.forward_prepare(input)) +from header import LambdaBase, Lambda, LambdaMap, LambdaReduce def copy_param(m, n): - if m.weight is not None: n.weight.data.copy_(m.weight) - if m.bias is not None: n.bias.data.copy_(m.bias) - if hasattr(n, 'running_mean'): n.running_mean.copy_(m.running_mean) - if hasattr(n, 'running_var'): n.running_var.copy_(m.running_var) + if m.weight is not None: + n.weight.data.copy_(m.weight, broadcast=False) + if hasattr(m, 'bias') and m.bias is not None: + n.bias.data.copy_(m.bias, broadcast=False) + if hasattr(n, 'running_mean'): + n.running_mean.copy_(m.running_mean, broadcast=False) + if hasattr(n, 'running_var'): + n.running_var.copy_(m.running_var, broadcast=False) def add_submodule(seq, *args): @@ -165,7 +142,6 @@ def lua_recursive_source(module): s = [] for m in module.modules: name = type(m).__name__ - real = m if name == 'TorchObject': name = m._typename.replace('cudnn.', '') m = m._obj diff --git a/header.py b/header.py new file mode 100644 index 0000000..e69de29 From 944a34654693bd580d8161f40f121ff5547050d6 Mon Sep 17 00:00:00 2001 From: Anatoly Baksheev Date: Fri, 6 Jul 2018 11:54:05 +0300 Subject: [PATCH 3/8] moved source to separate header file --- convert_torch.py | 37 +++------------- header.py | 111 +++++++++++++++++++++++++++++++++++++++++++++++ 2 files changed, 117 insertions(+), 31 deletions(-) diff --git a/convert_torch.py b/convert_torch.py index 84d8545..54a0b96 100644 --- a/convert_torch.py +++ b/convert_torch.py @@ -242,42 +242,17 @@ def simplify_source(s): def torch_to_pytorch(t7_filename, outputname=None): model = load_lua(t7_filename, unknown_classes=True) - if type(model).__name__ == 'hashable_uniq_dict': model = model.model + if type(model).__name__ == 'hashable_uniq_dict': + model = model.model model.gradInput = None + slist = lua_recursive_source(lnn.Sequential().add(model)) s = simplify_source(slist) - header = ''' -import torch -import torch.nn as nn -import torch.legacy.nn as lnn - -from functools import reduce -from torch.autograd import Variable - -class LambdaBase(nn.Sequential): - def __init__(self, fn, *args): - super(LambdaBase, self).__init__(*args) - self.lambda_func = fn - - def forward_prepare(self, input): - output = [] - for module in self._modules.values(): - output.append(module(input)) - return output if output else input - -class Lambda(LambdaBase): - def forward(self, input): - return self.lambda_func(self.forward_prepare(input)) -class LambdaMap(LambdaBase): - def forward(self, input): - return list(map(self.lambda_func,self.forward_prepare(input))) + varname = os.path.basename(t7_filename).replace('.t7', '').replace('.', '_').replace('-', '_') -class LambdaReduce(LambdaBase): - def forward(self, input): - return reduce(self.lambda_func,self.forward_prepare(input)) -''' - varname = t7_filename.replace('.t7', '').replace('.', '_').replace('-', '_') + with open("header.py") as f: + header = f.read() s = '{}\n\n{} = {}'.format(header, varname, s[:-2]) if outputname is None: outputname = varname diff --git a/header.py b/header.py index e69de29..3fb1099 100644 --- a/header.py +++ b/header.py @@ -0,0 +1,111 @@ +import torch +import torch.nn as nn + +from functools import reduce +from torch.autograd import Variable + + +class LambdaBase(nn.Sequential): + def __init__(self, fn, *args): + super(LambdaBase, self).__init__(*args) + 
self.lambda_func = fn + + def forward_prepare(self, input): + output = [] + for module in self._modules.values(): + output.append(module(input)) + return output if output else input + + +class Lambda(LambdaBase): + def forward(self, input): + return self.lambda_func(self.forward_prepare(input)) + + +class LambdaMap(LambdaBase): + def forward(self, input): + # result is Variables list [Variable1, Variable2, ...] + return list(map(self.lambda_func, self.forward_prepare(input))) + + +class LambdaReduce(LambdaBase): + def forward(self, input): + # result is a Variable + return reduce(self.lambda_func, self.forward_prepare(input)) + + +class Padding(nn.Module): + # pad puts in [pad] amount of [value] over dimension [dim], starting at + # index [index] in that dimension. If pad<0, index counts from the left. + # If pad>0 index counts from the right. + # When nInputDim is provided, inputs larger than that value will be considered batches + # where the actual dim to be padded will be dimension dim + 1. + def __init__(self, dim, pad, value, index, nInputDim): + super(Padding, self).__init__() + self.value = value + # self.index = index + self.dim = dim + self.pad = pad + self.nInputDim = nInputDim + if index != 0: + raise NotImplementedError("Padding: index != 0 not implemented") + + def forward(self, input): + dim = self.dim + if self.nInputDim != 0: + dim += input.dim() - self.nInputDim + pad_size = list(input.size()) + pad_size[dim] = self.pad + padder = Variable(input.data.new(*pad_size).fill_(self.value)) + + if self.pad < 0: + padded = torch.cat((padder, input), dim) + else: + padded = torch.cat((input, padder), dim) + return padded + + +class Dropout(nn.Dropout): + """ + Cancel out PyTorch rescaling by 1/(1-p) + """ + def forward(self, input): + input = input * (1 - self.p) + return super(Dropout, self).forward(input) + + +class Dropout2d(nn.Dropout2d): + """ + Cancel out PyTorch rescaling by 1/(1-p) + """ + def forward(self, input): + input = input * (1 - self.p) + return super(Dropout2d, self).forward(input) + + +class StatefulMaxPool2d(nn.MaxPool2d): # object keeps indices and input sizes + + def __init__(self, *args, **kwargs): + super(StatefulMaxPool2d, self).__init__(*args, **kwargs) + self.indices = None + self.input_size = None + + def forward(self, x): + return_indices, self.return_indices = self.return_indices, True + output, indices = super(StatefulMaxPool2d, self).forward(x) + self.return_indices = return_indices + self.indices = indices + self.input_size = x.size() + if return_indices: + return output, indices + return output + + +class StatefulMaxUnpool2d(nn.Module): + def __init__(self, pooling): + super(StatefulMaxUnpool2d, self).__init__() + self.pooling = pooling + self.unpooling = nn.MaxUnpool2d(pooling.kernel_size, pooling.stride, pooling.padding) + + def forward(self, x): + return self.unpooling.forward(x, self.pooling.indices, self.pooling.input_size) From 82f5b6d43ab4ad0bd4bc7c0ba2a2b304eaaad301 Mon Sep 17 00:00:00 2001 From: Anatoly Baksheev Date: Fri, 6 Jul 2018 13:04:48 +0300 Subject: [PATCH 4/8] formatting --- convert_torch.py | 11 ++++++----- header.py | 2 +- 2 files changed, 7 insertions(+), 6 deletions(-) diff --git a/convert_torch.py b/convert_torch.py index 54a0b96..d746bcb 100644 --- a/convert_torch.py +++ b/convert_torch.py @@ -1,6 +1,7 @@ from __future__ import print_function import os +import re import math import torch import argparse @@ -14,18 +15,18 @@ from torch.autograd import Variable from torch.utils.serialization import load_lua -from header import 
LambdaBase, Lambda, LambdaMap, LambdaReduce +from header import LambdaBase, Lambda, LambdaMap, LambdaReduce, StatefulMaxPool2d, StatefulMaxUnpool2d def copy_param(m, n): if m.weight is not None: - n.weight.data.copy_(m.weight, broadcast=False) + n.weight.data.copy_(m.weight) if hasattr(m, 'bias') and m.bias is not None: - n.bias.data.copy_(m.bias, broadcast=False) + n.bias.data.copy_(m.bias) if hasattr(n, 'running_mean'): - n.running_mean.copy_(m.running_mean, broadcast=False) + n.running_mean.copy_(m.running_mean) if hasattr(n, 'running_var'): - n.running_var.copy_(m.running_var, broadcast=False) + n.running_var.copy_(m.running_var) def add_submodule(seq, *args): diff --git a/header.py b/header.py index 3fb1099..2b84a50 100644 --- a/header.py +++ b/header.py @@ -83,7 +83,7 @@ def forward(self, input): return super(Dropout2d, self).forward(input) -class StatefulMaxPool2d(nn.MaxPool2d): # object keeps indices and input sizes +class StatefulMaxPool2d(nn.MaxPool2d): # object keeps indices and input sizes def __init__(self, *args, **kwargs): super(StatefulMaxPool2d, self).__init__(*args, **kwargs) From e77709fb574ba7210adfda50a6b77a5fbc42f0c5 Mon Sep 17 00:00:00 2001 From: Anatoly Baksheev Date: Fri, 6 Jul 2018 13:07:34 +0300 Subject: [PATCH 5/8] moved to class, added MaxUnpool support --- convert_torch.py | 428 +++++++++++++++++++++++++---------------------- 1 file changed, 227 insertions(+), 201 deletions(-) diff --git a/convert_torch.py b/convert_torch.py index d746bcb..53d49a8 100644 --- a/convert_torch.py +++ b/convert_torch.py @@ -34,211 +34,236 @@ def add_submodule(seq, *args): seq.add_module(str(len(seq._modules)), n) -def lua_recursive_model(module, seq): - for m in module.modules: - name = type(m).__name__ - real = m - if name == 'TorchObject': - name = m._typename.replace('cudnn.', '') - m = m._obj +class Convertor(object): - if name == 'SpatialConvolution' or name == 'nn.SpatialConvolutionMM': - if not hasattr(m, 'groups') or m.groups is None: m.groups = 1 - n = nn.Conv2d(m.nInputPlane, m.nOutputPlane, (m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), 1, m.groups, bias=(m.bias is not None)) - copy_param(m, n) - add_submodule(seq, n) - elif name == 'SpatialBatchNormalization': - n = nn.BatchNorm2d(m.running_mean.size(0), m.eps, m.momentum, m.affine) - copy_param(m, n) - add_submodule(seq, n) - elif name == 'VolumetricBatchNormalization': - n = nn.BatchNorm3d(m.running_mean.size(0), m.eps, m.momentum, m.affine) - copy_param(m, n) - add_submodule(seq, n) - elif name == 'ReLU': - n = nn.ReLU() - add_submodule(seq, n) - elif name == 'Sigmoid': - n = nn.Sigmoid() - add_submodule(seq, n) - elif name == 'SpatialMaxPooling': - n = nn.MaxPool2d((m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), ceil_mode=m.ceil_mode) - add_submodule(seq, n) - elif name == 'SpatialAveragePooling': - n = nn.AvgPool2d((m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), ceil_mode=m.ceil_mode) - add_submodule(seq, n) - elif name == 'SpatialUpSamplingNearest': - n = nn.UpsamplingNearest2d(scale_factor=m.scale_factor) - add_submodule(seq, n) - elif name == 'View': - n = Lambda(lambda x: x.view(x.size(0), -1)) - add_submodule(seq, n) - elif name == 'Reshape': - n = Lambda(lambda x: x.view(x.size(0), -1)) - add_submodule(seq, n) - elif name == 'Linear': - # Linear in pytorch only accept 2D input - n1 = Lambda(lambda x: x.view(1, -1) if 1 == len(x.size()) else x) - n2 = nn.Linear(m.weight.size(1), m.weight.size(0), bias=(m.bias is not None)) - copy_param(m, n2) - n = nn.Sequential(n1, n2) - add_submodule(seq, n) - elif name == 
'Dropout': - m.inplace = False - n = nn.Dropout(m.p) - add_submodule(seq, n) - elif name == 'SoftMax': - n = nn.Softmax() - add_submodule(seq, n) - elif name == 'Identity': - n = Lambda(lambda x: x) # do nothing - add_submodule(seq, n) - elif name == 'SpatialFullConvolution': - n = nn.ConvTranspose2d(m.nInputPlane, m.nOutputPlane, (m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), (m.adjW, m.adjH)) - copy_param(m, n) - add_submodule(seq, n) - elif name == 'VolumetricFullConvolution': - n = nn.ConvTranspose3d(m.nInputPlane, m.nOutputPlane, (m.kT, m.kW, m.kH), (m.dT, m.dW, m.dH), (m.padT, m.padW, m.padH), (m.adjT, m.adjW, m.adjH), m.groups) - copy_param(m, n) - add_submodule(seq, n) - elif name == 'SpatialReplicationPadding': - n = nn.ReplicationPad2d((m.pad_l, m.pad_r, m.pad_t, m.pad_b)) - add_submodule(seq, n) - elif name == 'SpatialReflectionPadding': - n = nn.ReflectionPad2d((m.pad_l, m.pad_r, m.pad_t, m.pad_b)) - add_submodule(seq, n) - elif name == 'Copy': - n = Lambda(lambda x: x) # do nothing - add_submodule(seq, n) - elif name == 'Narrow': - n = Lambda(lambda x, a=(m.dimension, m.index, m.length): x.narrow(*a)) - add_submodule(seq, n) - elif name == 'SpatialCrossMapLRN': - lrn = lnn.SpatialCrossMapLRN(m.size, m.alpha, m.beta, m.k) - n = Lambda(lambda x, lrn=lrn: Variable(lrn.forward(x.data))) - add_submodule(seq, n) - elif name == 'Sequential': - n = nn.Sequential() - lua_recursive_model(m, n) - add_submodule(seq, n) - elif name == 'ConcatTable': # output is list - n = LambdaMap(lambda x: x) - lua_recursive_model(m, n) - add_submodule(seq, n) - elif name == 'CAddTable': # input is list - n = LambdaReduce(lambda x, y: x + y) - add_submodule(seq, n) - elif name == 'Concat': - dim = m.dimension - n = LambdaReduce(lambda x, y, dim=dim: torch.cat((x, y), dim)) - lua_recursive_model(m, n) - add_submodule(seq, n) - elif name == 'TorchObject': - print('Not Implement', name, real._typename) - else: - print('Not Implement', name) + def __init__(self): + self.prefix_code = [] + self.t2pt_names = dict() + self.t2pt_layers = dict() + def lua_recursive_model(self, module, seq): + for m in module.modules: + name = type(m).__name__ + real = m + if name == 'TorchObject': + name = m._typename.replace('cudnn.', '') + m = m._obj -def lua_recursive_source(module): - s = [] - for m in module.modules: - name = type(m).__name__ - if name == 'TorchObject': - name = m._typename.replace('cudnn.', '') - m = m._obj + if name == 'SpatialConvolution' or name == 'nn.SpatialConvolutionMM': + if not hasattr(m, 'groups') or m.groups is None: m.groups = 1 + n = nn.Conv2d(m.nInputPlane, m.nOutputPlane, (m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), 1, m.groups, bias=(m.bias is not None)) + copy_param(m, n) + add_submodule(seq, n) + elif name == 'SpatialBatchNormalization': + n = nn.BatchNorm2d(m.running_mean.size(0), m.eps, m.momentum, m.affine) + copy_param(m, n) + add_submodule(seq, n) + elif name == 'VolumetricBatchNormalization': + n = nn.BatchNorm3d(m.running_mean.size(0), m.eps, m.momentum, m.affine) + copy_param(m, n) + add_submodule(seq, n) + elif name == 'ReLU': + n = nn.ReLU() + add_submodule(seq, n) + elif name == 'Sigmoid': + n = nn.Sigmoid() + add_submodule(seq, n) + elif name == 'SpatialMaxPooling': + # n = nn.MaxPool2d((m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), ceil_mode=m.ceil_mode) + n = StatefulMaxPool2d((m.kH, m.kW), (m.dH, m.dW), (m.padH, m.padW), ceil_mode=m.ceil_mode) + self.t2pt_layers[m] = n + add_submodule(seq, n) + elif name == 'SpatialMaxUnpooling': + if m.pooling in self.t2pt_layers: + n = 
StatefulMaxUnpool2d(self.t2pt_layers[m.pooling]) + add_submodule(seq, n) + else: + print('Not Implement {}. Can\'t find corresponding MaxPool layer'.format(name)) + elif name == 'SpatialAveragePooling': + n = nn.AvgPool2d((m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), ceil_mode=m.ceil_mode) + add_submodule(seq, n) + elif name == 'SpatialUpSamplingNearest': + n = nn.UpsamplingNearest2d(scale_factor=m.scale_factor) + add_submodule(seq, n) + elif name == 'View': + n = Lambda(lambda x: x.view(x.size(0), -1)) + add_submodule(seq, n) + elif name == 'Reshape': + n = Lambda(lambda x: x.view(x.size(0), -1)) + add_submodule(seq, n) + elif name == 'Linear': + # Linear in pytorch only accept 2D input + n1 = Lambda(lambda x: x.view(1, -1) if 1 == len(x.size()) else x) + n2 = nn.Linear(m.weight.size(1), m.weight.size(0), bias=(m.bias is not None)) + copy_param(m, n2) + n = nn.Sequential(n1, n2) + add_submodule(seq, n) + elif name == 'Dropout': + m.inplace = False + n = nn.Dropout(m.p) + add_submodule(seq, n) + elif name == 'SoftMax': + n = nn.Softmax() + add_submodule(seq, n) + elif name == 'Identity': + n = Lambda(lambda x: x) # do nothing + add_submodule(seq, n) + elif name == 'SpatialFullConvolution': + n = nn.ConvTranspose2d(m.nInputPlane, m.nOutputPlane, (m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), (m.adjW, m.adjH)) + copy_param(m, n) + add_submodule(seq, n) + elif name == 'VolumetricFullConvolution': + n = nn.ConvTranspose3d(m.nInputPlane, m.nOutputPlane, (m.kT, m.kW, m.kH), (m.dT, m.dW, m.dH), (m.padT, m.padW, m.padH), (m.adjT, m.adjW, m.adjH), m.groups) + copy_param(m, n) + add_submodule(seq, n) + elif name == 'SpatialReplicationPadding': + n = nn.ReplicationPad2d((m.pad_l, m.pad_r, m.pad_t, m.pad_b)) + add_submodule(seq, n) + elif name == 'SpatialReflectionPadding': + n = nn.ReflectionPad2d((m.pad_l, m.pad_r, m.pad_t, m.pad_b)) + add_submodule(seq, n) + elif name == 'Copy': + n = Lambda(lambda x: x) # do nothing + add_submodule(seq, n) + elif name == 'Narrow': + n = Lambda(lambda x, a=(m.dimension, m.index, m.length): x.narrow(*a)) + add_submodule(seq, n) + elif name == 'SpatialCrossMapLRN': + lrn = lnn.SpatialCrossMapLRN(m.size, m.alpha, m.beta, m.k) + n = Lambda(lambda x, lrn=lrn: Variable(lrn.forward(x.data))) + add_submodule(seq, n) + elif name == 'Sequential': + n = nn.Sequential() + self.lua_recursive_model(m, n) + add_submodule(seq, n) + elif name == 'ConcatTable': # output is list + n = LambdaMap(lambda x: x) + self.lua_recursive_model(m, n) + add_submodule(seq, n) + elif name == 'CAddTable': # input is list + n = LambdaReduce(lambda x, y: x + y) + add_submodule(seq, n) + elif name == 'Concat': + dim = m.dimension + n = LambdaReduce(lambda x, y, dim=dim: torch.cat((x, y), dim)) + self.lua_recursive_model(m, n) + add_submodule(seq, n) + elif name == 'TorchObject': + print('Not Implement', name, real._typename) + else: + print('Not Implement', name) - if name == 'SpatialConvolution' or name == 'nn.SpatialConvolutionMM': - if not hasattr(m, 'groups') or m.groups is None: m.groups = 1 - s += ['nn.Conv2d({},{},{},{},{},{},{},bias={}),#Conv2d'.format(m.nInputPlane, - m.nOutputPlane, (m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), 1, m.groups, m.bias is not None)] - elif name == 'SpatialBatchNormalization': - s += ['nn.BatchNorm2d({},{},{},{}),#BatchNorm2d'.format(m.running_mean.size(0), m.eps, m.momentum, m.affine)] - elif name == 'VolumetricBatchNormalization': - s += ['nn.BatchNorm3d({},{},{},{}),#BatchNorm3d'.format(m.running_mean.size(0), m.eps, m.momentum, m.affine)] - elif name == 'ReLU': 
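
The pooling/unpooling pairing above works because StatefulMaxPool2d memorizes the indices and input size of its last forward pass and StatefulMaxUnpool2d reads them back (both classes defined in header.py above). A minimal round-trip sketch; the tensor shape is illustrative:

    import torch
    from header import StatefulMaxPool2d, StatefulMaxUnpool2d

    pool = StatefulMaxPool2d(2, 2)       # records indices and input size on forward
    unpool = StatefulMaxUnpool2d(pool)   # reuses them to invert the pooling

    x = torch.randn(1, 1, 4, 4)
    y = pool(x)      # side effect: pool.indices and pool.input_size are set
    z = unpool(y)    # places each max back at its recorded position
    # x: (1,1,4,4) -> y: (1,1,2,2) -> z: (1,1,4,4), zeros elsewhere
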
- s += ['nn.ReLU()'] - elif name == 'Sigmoid': - s += ['nn.Sigmoid()'] - elif name == 'SpatialMaxPooling': - s += ['nn.MaxPool2d({},{},{},ceil_mode={}),#MaxPool2d'.format((m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), m.ceil_mode)] - elif name == 'SpatialAveragePooling': - s += ['nn.AvgPool2d({},{},{},ceil_mode={}),#AvgPool2d'.format((m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), m.ceil_mode)] - elif name == 'SpatialUpSamplingNearest': - s += ['nn.UpsamplingNearest2d(scale_factor={})'.format(m.scale_factor)] - elif name == 'View': - s += ['Lambda(lambda x: x.view(x.size(0),-1)), # View'] - elif name == 'Reshape': - s += ['Lambda(lambda x: x.view(x.size(0),-1)), # Reshape'] - elif name == 'Linear': - s1 = 'Lambda(lambda x: x.view(1,-1) if 1==len(x.size()) else x )' - s2 = 'nn.Linear({},{},bias={})'.format(m.weight.size(1), m.weight.size(0), (m.bias is not None)) - s += ['nn.Sequential({},{}),#Linear'.format(s1, s2)] - elif name == 'Dropout': - s += ['nn.Dropout({})'.format(m.p)] - elif name == 'SoftMax': - s += ['nn.Softmax()'] - elif name == 'Identity': - s += ['Lambda(lambda x: x), # Identity'] - elif name == 'SpatialFullConvolution': - s += ['nn.ConvTranspose2d({},{},{},{},{},{})'.format(m.nInputPlane, - m.nOutputPlane, (m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), (m.adjW, m.adjH))] - elif name == 'VolumetricFullConvolution': - s += ['nn.ConvTranspose3d({},{},{},{},{},{},{})'.format(m.nInputPlane, - m.nOutputPlane, (m.kT, m.kW, m.kH), (m.dT, m.dW, m.dH), (m.padT, m.padW, m.padH), (m.adjT, m.adjW, m.adjH), - m.groups)] - elif name == 'SpatialReplicationPadding': - s += ['nn.ReplicationPad2d({})'.format((m.pad_l, m.pad_r, m.pad_t, m.pad_b))] - elif name == 'SpatialReflectionPadding': - s += ['nn.ReflectionPad2d({})'.format((m.pad_l, m.pad_r, m.pad_t, m.pad_b))] - elif name == 'Copy': - s += ['Lambda(lambda x: x), # Copy'] - elif name == 'Narrow': - s += ['Lambda(lambda x,a={}: x.narrow(*a))'.format((m.dimension, m.index, m.length))] - elif name == 'SpatialCrossMapLRN': - lrn = 'lnn.SpatialCrossMapLRN(*{})'.format((m.size, m.alpha, m.beta, m.k)) - s += ['Lambda(lambda x,lrn={}: Variable(lrn.forward(x.data)))'.format(lrn)] + def lua_recursive_source(self, module): + s = [] - elif name == 'Sequential': - s += ['nn.Sequential( # Sequential'] - s += lua_recursive_source(m) - s += [')'] - elif name == 'ConcatTable': - s += ['LambdaMap(lambda x: x, # ConcatTable'] - s += lua_recursive_source(m) - s += [')'] - elif name == 'CAddTable': - s += ['LambdaReduce(lambda x,y: x+y), # CAddTable'] - elif name == 'Concat': - dim = m.dimension - s += ['LambdaReduce(lambda x,y,dim={}: torch.cat((x,y),dim), # Concat'.format(m.dimension)] - s += lua_recursive_source(m) - s += [')'] - else: - s += '# ' + name + ' Not Implement,\n' - s = map(lambda x: '\t{}'.format(x), s) - return s + for m in module.modules: + name = type(m).__name__ + if name == 'TorchObject': + name = m._typename.replace('cudnn.', '') + m = m._obj + if name == 'SpatialConvolution' or name == 'nn.SpatialConvolutionMM': + if not hasattr(m, 'groups') or m.groups is None: m.groups = 1 + s += ['nn.Conv2d({},{},{},{},{},{},{},bias={}),#Conv2d'.format(m.nInputPlane, + m.nOutputPlane, (m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), 1, m.groups, m.bias is not None)] + elif name == 'SpatialBatchNormalization': + s += ['nn.BatchNorm2d({},{},{},{}),#BatchNorm2d'.format(m.running_mean.size(0), m.eps, m.momentum, m.affine)] + elif name == 'VolumetricBatchNormalization': + s += ['nn.BatchNorm3d({},{},{},{}),#BatchNorm3d'.format(m.running_mean.size(0), m.eps, 
m.momentum, m.affine)] + elif name == 'ReLU': + s += ['nn.ReLU()'] + elif name == 'Sigmoid': + s += ['nn.Sigmoid()'] + elif name == 'SpatialMaxPooling': + # s += ['nn.MaxPool2d({},{},{},ceil_mode={}),#MaxPool2d'.format((m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), m.ceil_mode)] + suffixes = sorted(int(re.match('pooling_(\d*)', v).group(1)) for v in self.t2pt_names.values()) + name = 'pooling_{}'.format(suffixes[-1] + 1 if suffixes else 1) + s += [name] + self.t2pt_names[m] = name + self.prefix_code += ['{} = StatefulMaxPool2d({}, {}, {}, ceil_mode={})'.format(name, (m.kH, m.kW), (m.dH, m.dW), (m.padH, m.padW), m.ceil_mode)] + elif name == 'SpatialMaxUnpooling': + if m.pooling in self.t2pt_names: + s += ['StatefulMaxUnpool2d({}), #SpatialMaxUnpooling'.format(self.t2pt_names[m.pooling])] + else: + s += ['# ' + name + ' Not Implement (can\'t find corresponding SpatialMaxUnpooling,\n'] + elif name == 'SpatialAveragePooling': + s += ['nn.AvgPool2d({},{},{},ceil_mode={}),#AvgPool2d'.format((m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), m.ceil_mode)] + elif name == 'SpatialUpSamplingNearest': + s += ['nn.UpsamplingNearest2d(scale_factor={})'.format(m.scale_factor)] + elif name == 'View': + s += ['Lambda(lambda x: x.view(x.size(0),-1)), # View'] + elif name == 'Reshape': + s += ['Lambda(lambda x: x.view(x.size(0),-1)), # Reshape'] + elif name == 'Linear': + s1 = 'Lambda(lambda x: x.view(1,-1) if 1==len(x.size()) else x )' + s2 = 'nn.Linear({},{},bias={})'.format(m.weight.size(1), m.weight.size(0), (m.bias is not None)) + s += ['nn.Sequential({},{}),#Linear'.format(s1, s2)] + elif name == 'Dropout': + s += ['nn.Dropout({})'.format(m.p)] + elif name == 'SoftMax': + s += ['nn.Softmax()'] + elif name == 'Identity': + s += ['Lambda(lambda x: x), # Identity'] + elif name == 'SpatialFullConvolution': + s += ['nn.ConvTranspose2d({},{},{},{},{},{})'.format(m.nInputPlane, + m.nOutputPlane, (m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), (m.adjW, m.adjH))] + elif name == 'VolumetricFullConvolution': + s += ['nn.ConvTranspose3d({},{},{},{},{},{},{})'.format(m.nInputPlane, + m.nOutputPlane, (m.kT, m.kW, m.kH), (m.dT, m.dW, m.dH), (m.padT, m.padW, m.padH), (m.adjT, m.adjW, m.adjH), + m.groups)] + elif name == 'SpatialReplicationPadding': + s += ['nn.ReplicationPad2d({})'.format((m.pad_l, m.pad_r, m.pad_t, m.pad_b))] + elif name == 'SpatialReflectionPadding': + s += ['nn.ReflectionPad2d({})'.format((m.pad_l, m.pad_r, m.pad_t, m.pad_b))] + elif name == 'Copy': + s += ['Lambda(lambda x: x), # Copy'] + elif name == 'Narrow': + s += ['Lambda(lambda x,a={}: x.narrow(*a))'.format((m.dimension, m.index, m.length))] + elif name == 'SpatialCrossMapLRN': + lrn = 'lnn.SpatialCrossMapLRN(*{})'.format((m.size, m.alpha, m.beta, m.k)) + s += ['Lambda(lambda x,lrn={}: Variable(lrn.forward(x.data)))'.format(lrn)] -def simplify_source(s): - s = map(lambda x: x.replace(',(1, 1),(0, 0),1,1,bias=True),#Conv2d', ')'), s) - s = map(lambda x: x.replace(',(0, 0),1,1,bias=True),#Conv2d', ')'), s) - s = map(lambda x: x.replace(',1,1,bias=True),#Conv2d', ')'), s) - s = map(lambda x: x.replace(',bias=True),#Conv2d', ')'), s) - s = map(lambda x: x.replace('),#Conv2d', ')'), s) - s = map(lambda x: x.replace(',1e-05,0.1,True),#BatchNorm2d', ')'), s) - s = map(lambda x: x.replace('),#BatchNorm2d', ')'), s) - s = map(lambda x: x.replace(',(0, 0),ceil_mode=False),#MaxPool2d', ')'), s) - s = map(lambda x: x.replace(',ceil_mode=False),#MaxPool2d', ')'), s) - s = map(lambda x: x.replace('),#MaxPool2d', ')'), s) - s = map(lambda x: x.replace(',(0, 
0),ceil_mode=False),#AvgPool2d', ')'), s) - s = map(lambda x: x.replace(',ceil_mode=False),#AvgPool2d', ')'), s) - s = map(lambda x: x.replace(',bias=True)),#Linear', ')), # Linear'), s) - s = map(lambda x: x.replace(')),#Linear', ')), # Linear'), s) + elif name == 'Sequential': + s += ['nn.Sequential( # Sequential'] + s += self.lua_recursive_source(m) + s += [')'] + elif name == 'ConcatTable': + s += ['LambdaMap(lambda x: x, # ConcatTable'] + s += self.lua_recursive_source(m) + s += [')'] + elif name == 'CAddTable': + s += ['LambdaReduce(lambda x,y: x+y), # CAddTable'] + elif name == 'Concat': + s += ['LambdaReduce(lambda x,y,dim={}: torch.cat((x,y),dim), # Concat'.format(m.dimension)] + s += self.lua_recursive_source(m) + s += [')'] + else: + s += ['# ' + name + ' Not Implement,\n'] - s = map(lambda x: '{},\n'.format(x), s) - s = map(lambda x: x[1:], s) - s = reduce(lambda x, y: x + y, s) - return s + s = map(lambda x: '\t{}'.format(x), s) + return list(s) + + @staticmethod + def simplify_source(s): + s = map(lambda x: x.replace(',(1, 1),(0, 0),1,1,bias=True),#Conv2d', ')'), s) + s = map(lambda x: x.replace(',(0, 0),1,1,bias=True),#Conv2d', ')'), s) + s = map(lambda x: x.replace(',1,1,bias=True),#Conv2d', ')'), s) + s = map(lambda x: x.replace(',bias=True),#Conv2d', ')'), s) + s = map(lambda x: x.replace('),#Conv2d', ')'), s) + s = map(lambda x: x.replace(',1e-05,0.1,True),#BatchNorm2d', ')'), s) + s = map(lambda x: x.replace('),#BatchNorm2d', ')'), s) + s = map(lambda x: x.replace(',(0, 0),ceil_mode=False),#MaxPool2d', ')'), s) + s = map(lambda x: x.replace(',ceil_mode=False),#MaxPool2d', ')'), s) + s = map(lambda x: x.replace('),#MaxPool2d', ')'), s) + s = map(lambda x: x.replace(',(0, 0),ceil_mode=False),#AvgPool2d', ')'), s) + s = map(lambda x: x.replace(',ceil_mode=False),#AvgPool2d', ')'), s) + s = map(lambda x: x.replace(',bias=True)),#Linear', ')), # Linear'), s) + s = map(lambda x: x.replace(')),#Linear', ')), # Linear'), s) + + s = map(lambda x: '{},\n'.format(x), s) + s = map(lambda x: x[1:], s) + s = reduce(lambda x, y: x + y, s) + return s def torch_to_pytorch(t7_filename, outputname=None): @@ -247,21 +272,22 @@ def torch_to_pytorch(t7_filename, outputname=None): model = model.model model.gradInput = None - slist = lua_recursive_source(lnn.Sequential().add(model)) - s = simplify_source(slist) + cvt = Convertor() + slist = cvt.lua_recursive_source(lnn.Sequential().add(model)) + s = cvt.simplify_source(slist) varname = os.path.basename(t7_filename).replace('.t7', '').replace('.', '_').replace('-', '_') with open("header.py") as f: header = f.read() - s = '{}\n\n{} = {}'.format(header, varname, s[:-2]) + s = '{}\n{}\n\n{} = {}'.format(header, '\n'.join(cvt.prefix_code), varname, s[:-2]) if outputname is None: outputname = varname with open(outputname + '.py', "w") as pyfile: pyfile.write(s) n = nn.Sequential() - lua_recursive_model(model, n) + cvt.lua_recursive_model(model, n) torch.save(n.state_dict(), outputname + '.pth') From a0ea3e4161493af3526944e86fe011cadcbd93ee Mon Sep 17 00:00:00 2001 From: Anatoly Baksheev Date: Fri, 6 Jul 2018 13:40:39 +0300 Subject: [PATCH 6/8] formatting + use nn.MaxPool2d if no SpatialMaxUnpooling --- convert_torch.py | 91 ++++++++++++++++++++++++++++++------------------ 1 file changed, 57 insertions(+), 34 deletions(-) diff --git a/convert_torch.py b/convert_torch.py index 53d49a8..7841084 100644 --- a/convert_torch.py +++ b/convert_torch.py @@ -36,11 +36,27 @@ def add_submodule(seq, *args): class Convertor(object): - def __init__(self): + def 
__init__(self, model): self.prefix_code = [] self.t2pt_names = dict() self.t2pt_layers = dict() + self.have_max_unpool = False + + modules = [] + modules.extend(model.modules) + containers = ['Sequential', 'Concat'] + + while modules: + m = modules.pop() + name = type(m).__name__ + if name in containers: + modules.extend(m.modules) + + self.have_max_unpool = name == 'SpatialMaxUnpooling' + if self.have_max_unpool: + break + def lua_recursive_model(self, module, seq): for m in module.modules: name = type(m).__name__ @@ -69,9 +85,11 @@ def lua_recursive_model(self, module, seq): n = nn.Sigmoid() add_submodule(seq, n) elif name == 'SpatialMaxPooling': - # n = nn.MaxPool2d((m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), ceil_mode=m.ceil_mode) - n = StatefulMaxPool2d((m.kH, m.kW), (m.dH, m.dW), (m.padH, m.padW), ceil_mode=m.ceil_mode) - self.t2pt_layers[m] = n + if not self.have_max_unpool: + n = nn.MaxPool2d((m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), ceil_mode=m.ceil_mode) + else: + n = StatefulMaxPool2d((m.kH, m.kW), (m.dH, m.dW), (m.padH, m.padW), ceil_mode=m.ceil_mode) + self.t2pt_layers[m] = n add_submodule(seq, n) elif name == 'SpatialMaxUnpooling': if m.pooling in self.t2pt_layers: @@ -164,10 +182,11 @@ def lua_recursive_source(self, module): if name == 'SpatialConvolution' or name == 'nn.SpatialConvolutionMM': if not hasattr(m, 'groups') or m.groups is None: m.groups = 1 - s += ['nn.Conv2d({},{},{},{},{},{},{},bias={}),#Conv2d'.format(m.nInputPlane, - m.nOutputPlane, (m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), 1, m.groups, m.bias is not None)] + s += ['nn.Conv2d({}, {}, {}, {}, {}, {}, {},bias={}), #Conv2d'.format(m.nInputPlane, + m.nOutputPlane, (m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), 1, m.groups, + m.bias is not None)] elif name == 'SpatialBatchNormalization': - s += ['nn.BatchNorm2d({},{},{},{}),#BatchNorm2d'.format(m.running_mean.size(0), m.eps, m.momentum, m.affine)] + s += ['nn.BatchNorm2d({}, {}, {}, {}), #BatchNorm2d'.format(m.running_mean.size(0), m.eps, m.momentum, m.affine)] elif name == 'VolumetricBatchNormalization': s += ['nn.BatchNorm3d({},{},{},{}),#BatchNorm3d'.format(m.running_mean.size(0), m.eps, m.momentum, m.affine)] elif name == 'ReLU': @@ -175,19 +194,21 @@ def lua_recursive_source(self, module): elif name == 'Sigmoid': s += ['nn.Sigmoid()'] elif name == 'SpatialMaxPooling': - # s += ['nn.MaxPool2d({},{},{},ceil_mode={}),#MaxPool2d'.format((m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), m.ceil_mode)] - suffixes = sorted(int(re.match('pooling_(\d*)', v).group(1)) for v in self.t2pt_names.values()) - name = 'pooling_{}'.format(suffixes[-1] + 1 if suffixes else 1) - s += [name] - self.t2pt_names[m] = name - self.prefix_code += ['{} = StatefulMaxPool2d({}, {}, {}, ceil_mode={})'.format(name, (m.kH, m.kW), (m.dH, m.dW), (m.padH, m.padW), m.ceil_mode)] + if not self.have_max_unpool: + s += ['nn.MaxPool2d({}, {}, {}, ceil_mode={}), #MaxPool2d'.format((m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), m.ceil_mode)] + else: + suffixes = sorted(int(re.match('pooling_(\d*)', v).group(1)) for v in self.t2pt_names.values()) + name = 'pooling_{}'.format(suffixes[-1] + 1 if suffixes else 1) + s += [name] + self.t2pt_names[m] = name + self.prefix_code += ['{} = StatefulMaxPool2d({}, {}, {}, ceil_mode={})'.format(name, (m.kH, m.kW), (m.dH, m.dW), (m.padH, m.padW), m.ceil_mode)] elif name == 'SpatialMaxUnpooling': if m.pooling in self.t2pt_names: s += ['StatefulMaxUnpool2d({}), #SpatialMaxUnpooling'.format(self.t2pt_names[m.pooling])] else: s += ['# ' + name + ' Not Implement 
(can\'t find corresponding SpatialMaxUnpooling,\n'] elif name == 'SpatialAveragePooling': - s += ['nn.AvgPool2d({},{},{},ceil_mode={}),#AvgPool2d'.format((m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), m.ceil_mode)] + s += ['nn.AvgPool2d({}, {}, {}, ceil_mode={}), #AvgPool2d'.format((m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), m.ceil_mode)] elif name == 'SpatialUpSamplingNearest': s += ['nn.UpsamplingNearest2d(scale_factor={})'.format(m.scale_factor)] elif name == 'View': @@ -197,7 +218,7 @@ def lua_recursive_source(self, module): elif name == 'Linear': s1 = 'Lambda(lambda x: x.view(1,-1) if 1==len(x.size()) else x )' s2 = 'nn.Linear({},{},bias={})'.format(m.weight.size(1), m.weight.size(0), (m.bias is not None)) - s += ['nn.Sequential({},{}),#Linear'.format(s1, s2)] + s += ['nn.Sequential({}, {}), #Linear'.format(s1, s2)] elif name == 'Dropout': s += ['nn.Dropout({})'.format(m.p)] elif name == 'SoftMax': @@ -245,20 +266,20 @@ def lua_recursive_source(self, module): @staticmethod def simplify_source(s): - s = map(lambda x: x.replace(',(1, 1),(0, 0),1,1,bias=True),#Conv2d', ')'), s) - s = map(lambda x: x.replace(',(0, 0),1,1,bias=True),#Conv2d', ')'), s) - s = map(lambda x: x.replace(',1,1,bias=True),#Conv2d', ')'), s) - s = map(lambda x: x.replace(',bias=True),#Conv2d', ')'), s) - s = map(lambda x: x.replace('),#Conv2d', ')'), s) - s = map(lambda x: x.replace(',1e-05,0.1,True),#BatchNorm2d', ')'), s) - s = map(lambda x: x.replace('),#BatchNorm2d', ')'), s) - s = map(lambda x: x.replace(',(0, 0),ceil_mode=False),#MaxPool2d', ')'), s) - s = map(lambda x: x.replace(',ceil_mode=False),#MaxPool2d', ')'), s) - s = map(lambda x: x.replace('),#MaxPool2d', ')'), s) - s = map(lambda x: x.replace(',(0, 0),ceil_mode=False),#AvgPool2d', ')'), s) - s = map(lambda x: x.replace(',ceil_mode=False),#AvgPool2d', ')'), s) - s = map(lambda x: x.replace(',bias=True)),#Linear', ')), # Linear'), s) - s = map(lambda x: x.replace(')),#Linear', ')), # Linear'), s) + s = map(lambda x: x.replace(', (1, 1), (0, 0), 1, 1, bias=True), #Conv2d', ')'), s) + s = map(lambda x: x.replace(', (0, 0), 1, 1, bias=True), #Conv2d', ')'), s) + s = map(lambda x: x.replace(', 1, 1, bias=True), #Conv2d', ')'), s) + s = map(lambda x: x.replace(', bias=True), #Conv2d', ')'), s) + s = map(lambda x: x.replace('), #Conv2d', ')'), s) + s = map(lambda x: x.replace(', 1e-05, 0.1, True), #BatchNorm2d', ')'), s) + s = map(lambda x: x.replace('), #BatchNorm2d', ')'), s) + s = map(lambda x: x.replace(', (0, 0), ceil_mode=False), #MaxPool2d', ')'), s) + s = map(lambda x: x.replace(', ceil_mode=False), #MaxPool2d', ')'), s) + s = map(lambda x: x.replace('), #MaxPool2d', ')'), s) + s = map(lambda x: x.replace(', (0, 0), ceil_mode=False), #AvgPool2d', ')'), s) + s = map(lambda x: x.replace(', ceil_mode=False), #AvgPool2d', ')'), s) + s = map(lambda x: x.replace(', bias=True)), #Linear', ')), # Linear'), s) + s = map(lambda x: x.replace(')), #Linear', ')), # Linear'), s) s = map(lambda x: '{},\n'.format(x), s) s = map(lambda x: x[1:], s) @@ -272,9 +293,9 @@ def torch_to_pytorch(t7_filename, outputname=None): model = model.model model.gradInput = None - cvt = Convertor() - slist = cvt.lua_recursive_source(lnn.Sequential().add(model)) - s = cvt.simplify_source(slist) + cvt = Convertor(model) + s = cvt.lua_recursive_source(lnn.Sequential().add(model)) + s = cvt.simplify_source(s) varname = os.path.basename(t7_filename).replace('.t7', '').replace('.', '_').replace('-', '_') @@ -282,7 +303,9 @@ def torch_to_pytorch(t7_filename, outputname=None): header = 
f.read() s = '{}\n{}\n\n{} = {}'.format(header, '\n'.join(cvt.prefix_code), varname, s[:-2]) - if outputname is None: outputname = varname + if outputname is None: + outputname = varname + with open(outputname + '.py', "w") as pyfile: pyfile.write(s) @@ -294,7 +317,7 @@ def torch_to_pytorch(t7_filename, outputname=None): if __name__ == '__main__': parser = argparse.ArgumentParser(description='Convert torch t7 model to pytorch') parser.add_argument('--model', '-m', type=str, required=True, help='torch model file in t7 format') - parser.add_argument('--output', '-o', type=str, default=None, help='output file name prefix, xxx.py xxx.pth') + parser.add_argument('--output', '-o', type=str, default='/tmp/model', help='output file name prefix, xxx.py xxx.pth') args = parser.parse_args() torch_to_pytorch(args.model, args.output) From bf26724078501224edcd385447c30955caee2d4a Mon Sep 17 00:00:00 2001 From: Anatoly Baksheev Date: Fri, 6 Jul 2018 14:18:45 +0300 Subject: [PATCH 7/8] restore copying modelfilename by default --- convert_torch.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/convert_torch.py b/convert_torch.py index 7841084..fcdb7bd 100644 --- a/convert_torch.py +++ b/convert_torch.py @@ -304,7 +304,7 @@ def torch_to_pytorch(t7_filename, outputname=None): s = '{}\n{}\n\n{} = {}'.format(header, '\n'.join(cvt.prefix_code), varname, s[:-2]) if outputname is None: - outputname = varname + outputname = os.path.join('/tmp', varname) with open(outputname + '.py', "w") as pyfile: pyfile.write(s) @@ -317,7 +317,7 @@ def torch_to_pytorch(t7_filename, outputname=None): if __name__ == '__main__': parser = argparse.ArgumentParser(description='Convert torch t7 model to pytorch') parser.add_argument('--model', '-m', type=str, required=True, help='torch model file in t7 format') - parser.add_argument('--output', '-o', type=str, default='/tmp/model', help='output file name prefix, xxx.py xxx.pth') + parser.add_argument('--output', '-o', type=str, default=None, help='output file name prefix, xxx.py xxx.pth') args = parser.parse_args() torch_to_pytorch(args.model, args.output) From 1d5e5d92854704507162edc2c5272677656555c2 Mon Sep 17 00:00:00 2001 From: Anatoly Baksheev Date: Fri, 6 Jul 2018 14:32:32 +0300 Subject: [PATCH 8/8] formatting --- convert_torch.py | 8 ++++---- 1 file changed, 4 insertions(+), 4 deletions(-) diff --git a/convert_torch.py b/convert_torch.py index fcdb7bd..5793afe 100644 --- a/convert_torch.py +++ b/convert_torch.py @@ -182,7 +182,7 @@ def lua_recursive_source(self, module): if name == 'SpatialConvolution' or name == 'nn.SpatialConvolutionMM': if not hasattr(m, 'groups') or m.groups is None: m.groups = 1 - s += ['nn.Conv2d({}, {}, {}, {}, {}, {}, {},bias={}), #Conv2d'.format(m.nInputPlane, + s += ['nn.Conv2d({}, {}, {}, {}, {}, {}, {}, bias={}), #Conv2d'.format(m.nInputPlane, m.nOutputPlane, (m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), 1, m.groups, m.bias is not None)] elif name == 'SpatialBatchNormalization': @@ -217,7 +217,7 @@ def lua_recursive_source(self, module): s += ['Lambda(lambda x: x.view(x.size(0),-1)), # Reshape'] elif name == 'Linear': s1 = 'Lambda(lambda x: x.view(1,-1) if 1==len(x.size()) else x )' - s2 = 'nn.Linear({},{},bias={})'.format(m.weight.size(1), m.weight.size(0), (m.bias is not None)) + s2 = 'nn.Linear({}, {}, bias={})'.format(m.weight.size(1), m.weight.size(0), (m.bias is not None)) s += ['nn.Sequential({}, {}), #Linear'.format(s1, s2)] elif name == 'Dropout': s += ['nn.Dropout({})'.format(m.p)] @@ -226,10 +226,10 @@ def 
lua_recursive_source(self, module): elif name == 'Identity': s += ['Lambda(lambda x: x), # Identity'] elif name == 'SpatialFullConvolution': - s += ['nn.ConvTranspose2d({},{},{},{},{},{})'.format(m.nInputPlane, + s += ['nn.ConvTranspose2d({}, {}, {}, {}, {}, {})'.format(m.nInputPlane, m.nOutputPlane, (m.kW, m.kH), (m.dW, m.dH), (m.padW, m.padH), (m.adjW, m.adjH))] elif name == 'VolumetricFullConvolution': - s += ['nn.ConvTranspose3d({},{},{},{},{},{},{})'.format(m.nInputPlane, + s += ['nn.ConvTranspose3d({}, {}, {}, {}, {}, {}, {})'.format(m.nInputPlane, m.nOutputPlane, (m.kT, m.kW, m.kH), (m.dT, m.dW, m.dH), (m.padT, m.padW, m.padH), (m.adjT, m.adjW, m.adjH), m.groups)] elif name == 'SpatialReplicationPadding':
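
Patch 6's pre-scan is what lets the converter fall back to plain nn.MaxPool2d when the net contains no SpatialMaxUnpooling. A minimal sketch of that walk over the loaded Lua graph, mirroring the detection loop in Convertor.__init__ (the .modules attribute follows torch.legacy containers; the model object is assumed to come from load_lua):

    def contains_max_unpooling(model, containers=('Sequential', 'Concat')):
        # Depth-first scan, descending only into known container types,
        # mirroring the have_max_unpool detection in Convertor.__init__.
        stack = list(model.modules)
        while stack:
            m = stack.pop()
            name = type(m).__name__
            if name in containers:
                stack.extend(m.modules)
            if name == 'SpatialMaxUnpooling':
                return True
        return False

Convertor stores this flag as self.have_max_unpool and branches on it in both lua_recursive_model and lua_recursive_source, so nets without unpooling keep stock nn.MaxPool2d layers and emit no prefix_code.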