1 Star 0 Fork 0

GhMa/variational-autoencoder

加入 Gitee
与超过 1200万 开发者一起发现、参与优秀开源项目,私有仓库也完全免费 :)
免费加入
文件
克隆/下载
data.py 1.61 KB
一键复制 编辑 原始数据 按行查看 历史
"""Get the binarized MNIST dataset and convert to hdf5.
From https://github.com/yburda/iwae/blob/master/datasets.py
"""
import urllib.request
import os
import numpy as np
import h5py
def parse_binary_mnist(data_dir):
def lines_to_np_array(lines):
return np.array([[int(i) for i in line.split()] for line in lines])
with open(os.path.join(data_dir, 'binarized_mnist_train.amat')) as f:
lines = f.readlines()
train_data = lines_to_np_array(lines).astype('float32')
with open(os.path.join(data_dir, 'binarized_mnist_valid.amat')) as f:
lines = f.readlines()
validation_data = lines_to_np_array(lines).astype('float32')
with open(os.path.join(data_dir, 'binarized_mnist_test.amat')) as f:
lines = f.readlines()
test_data = lines_to_np_array(lines).astype('float32')
return train_data, validation_data, test_data
def download_binary_mnist(fname):
data_dir = '/tmp/'
subdatasets = ['train', 'valid', 'test']
for subdataset in subdatasets:
filename = 'binarized_mnist_{}.amat'.format(subdataset)
url = 'http://www.cs.toronto.edu/~larocheh/public/datasets/binarized_mnist/binarized_mnist_{}.amat'.format(
subdataset)
local_filename = os.path.join(data_dir, filename)
urllib.request.urlretrieve(url, local_filename)
train, validation, test = parse_binary_mnist(data_dir)
data_dict = {'train': train, 'valid': validation, 'test': test}
f = h5py.File(fname, 'w')
f.create_dataset('train', data=data_dict['train'])
f.create_dataset('valid', data=data_dict['valid'])
f.create_dataset('test', data=data_dict['test'])
f.close()
print(f'Saved binary MNIST data to: {fname}')
Loading...
马建仓 AI 助手
尝试更多
代码解读
代码找茬
代码优化
1
https://gitee.com/ghma/variational-autoencoder.git
git@gitee.com:ghma/variational-autoencoder.git
ghma
variational-autoencoder
variational-autoencoder
master

搜索帮助