forked from lvdmaaten/fb.resnet.torch
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathcifar10-gen.lua
67 lines (57 loc) · 1.96 KB
/
cifar10-gen.lua
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
--
-- Copyright (c) 2016, Facebook, Inc.
-- All rights reserved.
--
-- This source code is licensed under the BSD-style license found in the
-- LICENSE file in the root directory of this source tree. An additional grant
-- of patent rights can be found in the PATENTS file in the same directory.
--
-- Script to compute list of ImageNet filenames and classes
--
-- This automatically downloads the CIFAR-10 dataset from
-- http://torch7.s3-website-us-east-1.amazonaws.com/data/cifar-10-torch.tar.gz
--
local URL = 'http://torch7.s3-website-us-east-1.amazonaws.com/data/cifar-10-torch.tar.gz'
local M = {}
local function convertToTensor(files)
local data, labels
for _, file in ipairs(files) do
local m = torch.load(file, 'ascii')
if not data then
data = m.data:t()
labels = m.labels:squeeze()
else
data = torch.cat(data, m.data:t(), 1)
labels = torch.cat(labels, m.labels:squeeze())
end
end
-- This is *very* important. The downloaded files have labels 0-9, which do
-- not work with CrossEntropyCriterion
labels:add(1)
return {
data = data:contiguous():view(-1, 3, 32, 32),
labels = labels,
}
end
function M.exec(opt, cacheFile)
print("=> Downloading CIFAR-10 dataset from " .. URL)
local ok = os.execute('curl ' .. URL .. ' | tar xz -C gen/')
assert(ok == true or ok == 0, 'error downloading CIFAR-10')
print(" | combining dataset into a single file")
local trainData = convertToTensor({
'gen/cifar-10-batches-t7/data_batch_1.t7',
'gen/cifar-10-batches-t7/data_batch_2.t7',
'gen/cifar-10-batches-t7/data_batch_3.t7',
'gen/cifar-10-batches-t7/data_batch_4.t7',
'gen/cifar-10-batches-t7/data_batch_5.t7',
})
local testData = convertToTensor({
'gen/cifar-10-batches-t7/test_batch.t7',
})
print(" | saving CIFAR-10 dataset to " .. cacheFile)
torch.save(cacheFile, {
train = trainData,
val = testData,
})
end
return M