-- learn_autoencoder.lua

require 'torch'
require 'nn'
require 'optim'
require 'image'
require 'xlua'
require 'math'
require 'string'
require 'cunn'
require 'nngraph'
--local cuda = pcall(require, 'cutorch') -- Use CUDA if available

require 'Get_Images_Set'
require 'functions'

require 'const'


-- Optimizer bookkeeping for AE_Training, one entry per model. The optim
-- routines store their running statistics (step counter, moment estimates, ...)
-- inside the table they are given, so that table has to survive between calls.
-- Keys are weak so an entry does not keep its model alive.
local ae_optim_states = setmetatable({}, {__mode = 'k'})
-- Reconstruction criterion, built on first use and shared by every call.
local ae_criterion

-- Runs one optimisation step of the auto-encoder on `batch`.
--
-- The network is trained to reproduce `batch`; when the global NOISE is truthy
-- the network input is `batch` plus torch.rand noise divided by 3, while the
-- target stays the clean batch (denoising set-up).
--
-- Reads the globals `parameters` / `gradParameters` (flattened model
-- parameters and gradients), LR, LR_DECAY and NOISE.
--
-- @param model      network exposing :forward / :backward
-- @param batch      input tensor; the caller in this file passes a CUDA tensor
-- @param optimizer  optim-style function called as optimizer(feval, x, state)
-- @return first entry of the loss table returned by `optimizer`
function AE_Training(model, batch, optimizer)
   local expected = batch
   local input = batch

   if NOISE then
      -- the noise is moved to the GPU so it can be added to the batch
      local noise = (torch.rand(batch:size()) / 3):cuda()
      input = input + noise
   end

   ae_criterion = ae_criterion or nn.SmoothL1Criterion():cuda()

   -- closure evaluating f(X) and df/dX for the optimizer
   local function feval(x)
      -- just in case:
      collectgarbage()
      -- pick up new parameters if the optimizer hands us a different tensor
      if x ~= parameters then
         parameters:copy(x)
      end
      gradParameters:zero()

      local output = model:forward(input)
      local loss = ae_criterion:forward(output, expected)
      model:backward(input, ae_criterion:backward(output, expected))
      return loss, gradParameters
   end

   -- Re-use the state of the previous step. A fresh table on every call would
   -- reset the optimizer's counters and running averages each iteration and
   -- make learningRateDecay a no-op. The state is rebuilt only when a
   -- different optimizer function is used for this model.
   local entry = ae_optim_states[model]
   if entry == nil or entry.optimizer ~= optimizer then
      entry = {
         optimizer = optimizer,
         state = {learningRate = LR, learningRateDecay = LR_DECAY},
      }
      ae_optim_states[model] = entry
   end

   local _, fx = optimizer(feval, parameters, entry.state)
   return fx[1]
end

-- Forwards one randomly drawn image through `model` and, when the global
-- VISUALIZE_AE is truthy, displays the input together with the model output
-- in the window held by the global `w`.
--
-- An earlier version (disabled) iterated over the held-out sequences at the
-- end of `list_folders_images` via load_seq_by_id; only the single-image
-- check is active now.
--
-- @param model                network exposing :forward
-- @param list_folders_images  currently unused; kept for the callers' signature
function test_model(model, list_folders_images)
   -- a batch of one image, viewed as 1x3x224x224 and moved to the GPU
   local img = getRandomBatchFromSeparateList(1, 'regular'):view(1,3,224,224):cuda()
   local output = model:forward(img)

   if VISUALIZE_AE then
      local img_compare = image.toDisplayTensor({img[1], output})
      image.display{image=img_compare,win=w}
   end
end

-- Serialises the second sub-module of `model` (model.modules[2]) to
-- LOG_FOLDER..NAME_SAVE/<NAME_SAVE>_decoder.t7.
-- NOTE(review): the function name says "decoder" while the previous inline
-- comment called this the encoding module — confirm which half modules[2] is.
--
-- @param model  container whose `modules[2]` entry is written to disk
local function save_decoder(model)
   local path = LOG_FOLDER..NAME_SAVE
   -- best effort: the directory may already exist
   lfs.mkdir(path)
   local file_string = path..'/'..NAME_SAVE..'_decoder'..'.t7'

   -- Write the float copy rather than the live module: the clone was already
   -- being built for this purpose but the original module was saved instead.
   local saved = model.modules[2]:clone():float()
   torch.save(file_string, saved)
end

-- Trains the global `model` for NB_EPOCHS epochs and runs test_model once at
-- the end.
--
-- Each epoch performs floor(AVG_FRAMES_PER_RECORD * NB_SEQUENCES / BATCH_SIZE)
-- steps on random batches, prints the accumulated loss divided by
-- (iterations * BATCH_SIZE), then saves the auto-encoder and the decoder.
--
-- @param optimizer            optim-style function forwarded to AE_Training
-- @param list_folders_images  forwarded to test_model
-- @param list_txt             unused
-- @param Log_Folder           unused
function train_Epoch(optimizer, list_folders_images,list_txt,Log_Folder)
   local totImg = AVG_FRAMES_PER_RECORD*NB_SEQUENCES
   print("total Imges: ",totImg)
   local nbIter = math.floor(totImg/BATCH_SIZE)

   -- checkpoint period in epochs (1 = after every epoch)
   local save_every = 1

   print("Begin Learning... "..NB_EPOCHS.." epochs")
   for epoch=1,NB_EPOCHS do
      local epoch_loss = 0
      print('--------------Epoch : '..epoch..' ---------------')
      for iter=1, nbIter do
         -- just taking random images from all sequences
         local batch = getRandomBatchFromSeparateList(BATCH_SIZE, 'regular'):cuda()

         epoch_loss = epoch_loss + AE_Training(model, batch, optimizer)
         xlua.progress(iter, nbIter)
      end
      -- NOTE(review): if the criterion already averages over the batch, the
      -- extra division by BATCH_SIZE under-reports the loss — confirm.
      print("DAE Mean Loss : "..epoch_loss/(nbIter*BATCH_SIZE))

      if epoch % save_every == 0 then
         -- NOTE(review): `name_save` is not defined in this file (NAME_SAVE
         -- is); left untouched because save_autoencoder is defined elsewhere.
         save_autoencoder(model,name_save)
         save_decoder(model)
      end
   end
   test_model(model, list_folders_images)
end

-- Sets the global hyperparameters used for auto-encoder training and selects
-- the optimizer named by `params.optimiser`.
--
-- MODEL_ARCHITECTURE_FILE is assigned before set_hyperparams is called on
-- purpose: per the original note, DIFFERENT_FORMAT is derived from it there.
-- The values assigned afterwards override whatever set_hyperparams chose.
--
-- @param params  parsed command-line table; `optimiser` must be one of
--                "sgd", "rmsprop" or "adam"
-- @return the matching optim function (also stored in the global `optimizer`)
-- Raises an error when `params.optimiser` is not one of the supported names.
function set_AE_hyperparams(params)
   -- TODO idea (from the original author): pass MODEL_ARCHITECTURE_FILE as a
   -- default cmd param that differs per script.
   MODEL_ARCHITECTURE_FILE = AENET
   set_hyperparams(params, 'AE', true)

   -- auto-encoder specific overrides
   LR = 0.0001
   LR_DECAY = 3*1e-6
   BATCH_SIZE = 20
   NB_EPOCHS = 50
   NUM_HIDDEN = DIMENSION_OUT
   NOISE = true

   local known_optimizers = {
      sgd = optim.sgd,
      rmsprop = optim.rmsprop,
      adam = optim.adam,
   }
   local chosen = known_optimizers[params.optimiser]
   if chosen == nil then
      -- previously an unknown name silently returned nil, or whatever a
      -- previous call had left in the global `optimizer`
      error(string.format(
         "set_AE_hyperparams: unknown optimiser '%s' (expected adam|sgd|rmsprop)",
         tostring(params.optimiser)), 2)
   end

   -- kept as a global for backward compatibility with existing callers
   optimizer = chosen
   return chosen
end

-- Script entry point: configures the hyperparameters, builds the auto-encoder,
-- trains it and reports the hyperparameters used.
--
-- Most assignments below are deliberate globals (NAME_SAVE, NB_TEST,
-- NB_SEQUENCES, ALL_SEQ, model, parameters, ...) read by the other functions
-- of this file; their order matters.
--
-- @param params  table returned by cmd:parse
local function main(params)
   print("\n\n>> learn_autoencoder.lua")
   optimizer = set_AE_hyperparams(params)
   print('cmd default params (overridden by following set_hyperparams): ')
   print(params)
   print_hyperparameters(false, 'learn_autoencoder.lua hyperparams:')

   -- display window reused by test_model
   if VISUALIZE_AE then
      w = image.display(torch.Tensor(3,200,400))
   end

   -- The former DIFFERENT_FORMAT sanity check is not needed any more: per the
   -- original note, the auto-encoder now uses resnet.

   NAME_SAVE = 'AE_'..DATA_FOLDER..NUM_HIDDEN..NAME_SAVE
   print('NAME SAVE IN set_AE_hyp:  '..NAME_SAVE)

   local image_folders, txt_files = Get_HeadCamera_View_Files(DATA_FOLDER)

   -- the last NB_TEST sequences are held out as test data
   NB_TEST = 3
   NB_SEQUENCES = #image_folders - NB_TEST

   ALL_SEQ = precompute_all_seq(NB_SEQUENCES)

   image_width = IM_LENGTH
   image_height = IM_HEIGHT

   -- build the network and move it to the GPU
   require('./models/autoencoder_conv')
   model = getModel(NUM_HIDDEN)
   print(model)
   model = model:cuda()

   -- flattened views used by AE_Training
   parameters, gradParameters = model:getParameters()

   train_Epoch(optimizer, image_folders, txt_files, Log_Folder)
   print_hyperparameters(false, "Experiment run successfully for hyperparams: ")

   -- drop the reference held by the global `imgs`
   imgs = {}
end


-- Command-line options.
-- Only `optimiser` is read directly in this file (set_AE_hyperparams); the
-- whole table is also handed to set_hyperparams, defined elsewhere.
local cmd = torch.CmdLine()
cmd:option('-optimiser', 'adam', 'Optimiser : adam|sgd|rmsprop')
cmd:option('-model', 'DAE', 'model : AE|DAE')
-- The two help texts below used to announce "false (default)" although the
-- declared default is true.
cmd:option('-use_cuda', true, 'true (default) to use GPU, false for CPU only mode')
cmd:option('-use_continuous', true, 'true (default) to use a continuous action space, false for discrete one (0.5 range actions)')
cmd:option('-data_folder', STATIC_BUTTON_SIMPLEST, 'Possible Datasets to use: staticButtonSimplest, mobileRobot, staticButtonSimplest, simpleData3D, pushingButton3DAugmented, babbling')
cmd:option('-mcd', 0.5, 'Max cosine distance')
-- NOTE(review): this help text is identical to -mcd's and looks copy-pasted;
-- confirm what sigma controls before rewording it.
cmd:option('-sigma', 0.1, 'Max cosine distance')
cmd:option('-states_dimension', -1, "states_dimension: Default DIMENSION_OUT, i.e., dimensionality of the states learned (default is 3)")

local params = cmd:parse(arg)
main(params)