Training: Use e-lab's torch-toolbox sanitize.

2016-01-09 17:17:20 -05:00 · 2016-01-09 17:17:20 -05:00 · 8155840989
parent 6029baf48e
commit 8155840989
2 changed files with 96 additions and 16 deletions
--- a/training/sanitize.lua
+++ b/training/sanitize.lua
@ -0,0 +1,95 @@
 -- From https://github.com/e-lab/torch-toolbox/blob/master/Sanitize/sanitize.lua
 require('torch')
 require('nn')
 require('cunn')
 require('cudnn')
 -- common obj name to be freed
 local common = {'output', 'gradInput'}
 -- temporary buffer name other than output/gradInput
 local t = {
   -- convolution
   ['nn.SpatialConvolution'] = {'finput', 'fgradInput'},
   ['nn.SpatialConvolutionMM'] = {'finput', 'fgradInput'},
   -- pooling
   ['nn.SpatialMaxPooling'] = {'indices'},
   ['nn.TemporalMaxPooling'] = {'indices'},
   ['nn.VolumetricMaxPooling'] = {'indices'},
   ['nn.SpatialFractionalMaxPooling'] = {'indices'},
   -- regularizer
   ['nn.BatchNormalization'] = {'buffer', 'buffer2', 'centered', 'normalized'},
   ['nn.SpatialBatchNormalization'] = {'buffer', 'buffer2','centered', 'normalized'},
   ['nn.Dropout'] = {'noise'},
   ['nn.SpatialDropout'] = {'noise'},
   -- transfer
   ['nn.PReLU'] = {'gradWeightBuf', 'gradWeightBuf2'},
   ['nn.LogSigmoid'] = {'buffer'},
   -- etc
   ['nn.Mean'] = {'_gradInput'},
   ['nn.Normalize'] = {'_output', 'norm', 'normp'},
   ['nn.PairwiseDistance'] = {'diff'},
   ['nn.Reshape'] = {'_input', '_gradOutput'},
   -- fbcunn
   ['nn.AbstractParallel'] = {'homeGradBuffers', 'input_gpu', 'gradOutput_gpu', 'gradInput_gpu'},
   ['nn.DataParallel'] = {'homeGradBuffers', 'input_gpu', 'gradOutput_gpu', 'gradInput_gpu'},
   ['nn.ModelParallel'] = {'homeGradBuffers', 'input_gpu', 'gradOutput_gpu', 'gradInput_gpu'},
 }
 local function free_table_or_tensor(val, name, field)
   if type(val[name]) == 'table' then
      val[name] = {}
   elseif type(val[name]) == 'userdata' then
      val[name] = field.new()
   end
 end
 local function is_member(name, t)
   if t == nil then
      return false
   end
   for _, value in pairs(t) do
      if name == value then
         return true
      end
   end
   return false
 end
 -- Taken and modified from Soumith's imagenet-multiGPU.torch code
 -- https://github.com/soumith/imagenet-multiGPU.torch/blob/master/train.lua
 local function sanitize(model)
   local list = model:listModules()
   for _,val in ipairs(list) do
      for name,field in pairs(val) do
         -- remove ffi obj
         if torch.type(field) == 'cdata' then
            val[name] = nil
         -- remove common obj
         elseif is_member(name, common) then
            free_table_or_tensor(val, name, field)
         -- remove specific obj
         elseif is_member(name, t[val.__typename]) then
            free_table_or_tensor(val, name, field)
         end
      end
   end
   return model
 end
 return sanitize
--- a/training/train.lua
+++ b/training/train.lua
@ -23,6 +23,7 @@ require 'torchx' --for concetration the table of tensors
 paths.dofile("OpenFaceOptim.lua")
 local sanitize = paths.dofile('sanitize.lua')
 local optimMethod = optim.adadelta
 local optimState = {} -- Use for other algorithms like SGD
@ -34,22 +35,6 @@ local batchNumber
 local triplet_loss
 local function sanitize(net)
   net:apply(function (val)
         for name,field in pairs(val) do
            if torch.type(field) == 'cdata' then val[name] = nil end
            if name == 'homeGradBuffers' then val[name] = nil end
            if name == 'input_gpu' then val['input_gpu'] = {} end
            if name == 'gradOutput_gpu' then val['gradOutput_gpu'] = {} end
            if name == 'gradInput_gpu' then val['gradInput_gpu'] = {} end
            if (name == 'output' or name == 'gradInput')
            and torch.type(field) == 'torch.CudaTensor' then
               cutorch.withDevice(field:getDevice(), function() val[name] = field.new() end)
            end
         end
   end)
 end
 -- From https://groups.google.com/d/msg/torch7/i8sJYlgQPeA/wiHlPSa5-HYJ
 local function replaceModules(net, orig_class_name, replacer)
   local nodes, container_nodes = net:findModules(orig_class_name)