编程 Python

pytorch制作自己的LMDB数据操作示例

Posted in Python on December 18, 2019

本文实例讲述了pytorch制作自己的LMDB数据操作。分享给大家供大家参考，具体如下：

前言

记录下pytorch里如何使用lmdb的code，自用

制作部分的Code

code就是ASTER里数据制作部分的代码改了点，aster_train.txt里面就是图片的完整路径，每行一个；图片同目录下有同名的txt，里面记着jpg的标签

import os
import lmdb # install lmdb by "pip install lmdb"
import cv2
import numpy as np
from tqdm import tqdm
import six
from PIL import Image
import scipy.io as sio
from tqdm import tqdm
import re
def checkImageIsValid(imageBin):
    """Return True if ``imageBin`` decodes to an image with non-zero area.

    Args:
        imageBin: Raw encoded image bytes (for example the contents of a file
            opened in ``'rb'`` mode), or None.

    Returns:
        False when ``imageBin`` is None or empty, when OpenCV cannot decode
        it, or when the decoded image has zero height or width; True otherwise.
    """
    if imageBin is None or len(imageBin) == 0:
        return False
    # np.frombuffer replaces the deprecated binary mode of np.fromstring.
    imageBuf = np.frombuffer(imageBin, dtype=np.uint8)
    img = cv2.imdecode(imageBuf, cv2.IMREAD_GRAYSCALE)
    # cv2.imdecode signals undecodable data by returning None, not by raising.
    if img is None:
        return False
    imgH, imgW = img.shape[0], img.shape[1]
    return imgH * imgW != 0
def writeCache(env, cache):
    """Store every entry of ``cache`` in ``env`` inside one write transaction.

    Args:
        env: Object whose ``begin(write=True)`` returns a context-managed
            transaction exposing ``put(key, value)``.
        cache: Mapping of ``str`` keys to values. Keys are converted with
            ``str.encode()``; values are passed to ``put`` unchanged.
    """
    with env.begin(write=True) as txn:
        for key in cache:
            txn.put(key.encode(), cache[key])
def _is_difficult(word):
 assert isinstance(word, str)
 return not re.match('^[\w]+$', word)
def createDataset(outputPath, imagePathList, labelList, lexiconList=None, checkValid=True):
    """
    Create LMDB dataset for CRNN training.

    Samples are stored under the keys ``image-%09d`` / ``label-%09d`` (and
    ``lexicon-%09d`` when lexicons are given), numbered from 1 in the order
    they are accepted. The number of stored samples is written under
    ``num-samples``. Samples with an empty label, a missing image file, or
    (when ``checkValid`` is true) an image that fails validation are skipped.

    ARGS:
      outputPath    : LMDB output path
      imagePathList : list of image path
      labelList     : list of corresponding groundtruth texts
      lexiconList   : (optional) list of lexicon lists
      checkValid    : if true, check the validity of every image
    """
    assert(len(imagePathList) == len(labelList))
    nSamples = len(imagePathList)
    # map_size caps the database size: 1099511627776 bytes = 2**40 = 1 TiB.
    env = lmdb.open(outputPath, map_size=1099511627776)
    try:
        cache = {}
        cnt = 1
        for i, (imagePath, label) in enumerate(zip(imagePathList, labelList)):
            if len(label) == 0:
                continue
            if not os.path.exists(imagePath):
                print('%s does not exist' % imagePath)
                continue
            with open(imagePath, 'rb') as f:
                imageBin = f.read()
            if checkValid:
                if not checkImageIsValid(imageBin):
                    print('%s is not a valid image' % imagePath)
                    continue
            # Every value stored in the database must be binary data.
            imageKey = 'image-%09d' % cnt  # zero-padded to 9 digits
            labelKey = 'label-%09d' % cnt
            cache[imageKey] = imageBin
            cache[labelKey] = label.encode()
            if lexiconList:
                lexiconKey = 'lexicon-%09d' % cnt
                # Encode like the label: a str value is not binary data.
                cache[lexiconKey] = ' '.join(lexiconList[i]).encode()
            # Flush in batches of 1000 samples to bound memory use.
            if cnt % 1000 == 0:
                writeCache(env, cache)
                cache = {}
                print('Written %d / %d' % (cnt, nSamples))
            cnt += 1
        nSamples = cnt - 1
        cache['num-samples'] = str(nSamples).encode()
        writeCache(env, cache)
    finally:
        # Release the environment even if writing failed part-way.
        env.close()
    print('Created dataset with %d samples' % nSamples)
def get_sample_list(txt_path:str):
    """Collect image paths and their labels from an index file.

    ``txt_path`` lists one image path per line. For each image, the label is
    the stripped first line of the text file that has the same path with its
    extension replaced by ``.txt``. Blank lines and images without such a
    label file are skipped.

    Args:
        txt_path: Path of the index file.

    Returns:
        tuple: ``(image_paths, labels)`` — two lists of equal length, in the
        order the images appear in the index file.

    Raises:
        UnicodeDecodeError: If a label file cannot be decoded; the offending
            path is printed before the error is re-raised.
    """
    jpg_list = []
    txt_content_list = []
    with open(txt_path, 'r') as fr:
        for line in fr:
            image_path = line.strip()
            if not image_path:
                continue
            # Swap only the real extension; str.replace would also rewrite a
            # '.jpg' inside a directory name and leave non-.jpg paths unchanged.
            label_path = os.path.splitext(image_path)[0] + '.txt'
            if not os.path.exists(label_path):
                continue
            with open(label_path, 'r') as label_file:
                try:
                    first_line = label_file.readline()
                except UnicodeDecodeError:
                    print(label_path)
                    raise
            jpg_list.append(image_path)
            txt_content_list.append(first_line.strip())
    return jpg_list, txt_content_list
if __name__ == "__main__":
    # Destination directory of the LMDB database.
    lmdb_output_path = '/home/gpu-server/project/aster/dataset/train'
    # Index file listing one image path per line.
    txt_path = '/home/gpu-server/disk/disk1/NumberData/8NumberSample/aster_train.txt'
    createDataset(lmdb_output_path, *get_sample_list(txt_path))

读取部分

这里用的pytorch的dataloader，简单记录一下，人比较懒，代码就直接抄过来，不整理拆分了，重点看__getitem__

from __future__ import absolute_import
# import sys
# sys.path.append('./')
import os
# import moxing as mox
import pickle
from tqdm import tqdm
from PIL import Image, ImageFile
import numpy as np
import random
import cv2
import lmdb
import sys
import six
import torch
from torch.utils import data
from torch.utils.data import sampler
from torchvision import transforms
from lib.utils.labelmaps import get_vocabulary, labels2strs
from lib.utils import to_numpy
ImageFile.LOAD_TRUNCATED_IMAGES = True
from config import get_args
# Parse the command-line options once at import time; LmdbDataset reads
# ``global_args.run_on_remote`` to decide where the database is opened from.
global_args = get_args(sys.argv[1:])
if global_args.run_on_remote:
 # moxing is imported only for remote runs, where it copies the dataset.
 import moxing as mox
 # moxing is a distributed framework; not covered here
class LmdbDataset(data.Dataset):
    """Dataset that reads images and text labels from an LMDB database.

    The database is read through the keys ``num-samples``, ``image-%09d`` and
    ``label-%09d``; sample keys are numbered from 1. Each item is a tuple
    ``(img, label, label_len)``: the RGB image (after ``transform`` if one is
    given), the label as a fixed-length id array padded with the PADDING id,
    and the number of meaningful ids including the trailing EOS id.
    """

    def __init__(self, root, voc_type, max_len, num_samples, transform=None):
        """Open the database and build the vocabulary tables.

        Args:
            root: Path of the LMDB database. When
                ``global_args.run_on_remote`` is set, it is first copied to
                ``/cache/<basename>`` with moxing.
            voc_type: One of 'LOWERCASE', 'ALLCASES', 'ALLCASES_SYMBOLS',
                'DIGITS'.
            max_len: Length of every returned label array.
            num_samples: Upper bound on the number of samples exposed.
            transform: Optional callable applied to each image.

        Raises:
            ValueError: If running remotely and ``root`` does not exist.
        """
        super(LmdbDataset, self).__init__()
        # Validate before touching the database so nothing is opened in vain.
        assert voc_type in ['LOWERCASE', 'ALLCASES', 'ALLCASES_SYMBOLS','DIGITS']
        if global_args.run_on_remote:
            dataset_name = os.path.basename(root)
            data_cache_url = "/cache/%s" % dataset_name
            if not os.path.exists(data_cache_url):
                os.makedirs(data_cache_url)
            if mox.file.exists(root):
                mox.file.copy_parallel(root, data_cache_url)
            else:
                raise ValueError("%s not exists!" % root)
            self.env = lmdb.open(data_cache_url, max_readers=32, readonly=True)
        else:
            self.env = lmdb.open(root, max_readers=32, readonly=True)
        assert self.env is not None, "cannot create lmdb from %s" % root
        self.txn = self.env.begin()
        self.voc_type = voc_type
        self.transform = transform
        self.max_len = max_len
        # Never expose more samples than the database says it holds.
        self.nSamples = int(self.txn.get(b"num-samples"))
        self.nSamples = min(self.nSamples, num_samples)
        self.EOS = 'EOS'
        self.PADDING = 'PADDING'
        self.UNKNOWN = 'UNKNOWN'
        self.voc = get_vocabulary(voc_type, EOS=self.EOS, PADDING=self.PADDING, UNKNOWN=self.UNKNOWN)
        self.char2id = dict(zip(self.voc, range(len(self.voc))))
        self.id2char = dict(zip(range(len(self.voc)), self.voc))
        self.rec_num_classes = len(self.voc)
        self.lowercase = (voc_type == 'LOWERCASE')

    def __len__(self):
        """Return the number of samples exposed by the dataset."""
        return self.nSamples

    def _encode_label(self, word):
        """Convert ``word`` into a padded id array plus its real length.

        Characters missing from the vocabulary are mapped to the UNKNOWN id,
        and an EOS id is appended after the last character.

        Returns:
            tuple: ``(label, label_len)`` where ``label`` has length
            ``self.max_len`` and ``label_len`` counts the ids before padding.
        """
        # ``int`` is what the removed ``np.int`` alias stood for.
        label = np.full((self.max_len,), self.char2id[self.PADDING], dtype=int)
        label_list = []
        for char in word:
            if char in self.char2id:
                label_list.append(self.char2id[char])
            else:
                # Fall back to the unknown token.
                print('{0} is out of vocabulary.'.format(char))
                label_list.append(self.char2id[self.UNKNOWN])
        # Terminate the sequence with the stop token.
        label_list = label_list + [self.char2id[self.EOS]]
        assert len(label_list) <= self.max_len
        label[:len(label_list)] = np.array(label_list)
        return label, len(label_list)

    def __getitem__(self, index):
        """Return ``(img, label, label_len)`` for the 0-based ``index``.

        If the stored image cannot be opened, the next sample is returned
        instead, wrapping around to the first sample after the last one.
        """
        assert 0 <= index < len(self), 'index range error'
        # Database keys are 1-based while dataset indices are 0-based.
        key_index = index + 1
        img_key = b'image-%09d' % key_index
        imgbuf = self.txn.get(img_key)
        # Image.open needs a file-like object, so wrap the raw bytes.
        buf = six.BytesIO()
        buf.write(imgbuf)
        buf.seek(0)
        try:
            img = Image.open(buf).convert('RGB')
        except IOError:
            print('Corrupted image for %d' % key_index)
            # Retry with the following sample; the modulo keeps it in range.
            return self[(index + 1) % len(self)]
        # Recognition label.
        label_key = b'label-%09d' % key_index
        word = self.txn.get(label_key).decode()
        if self.lowercase:
            word = word.lower()
        # The encoded label always holds at least the EOS id, so no
        # empty-label check is needed afterwards.
        label, label_len = self._encode_label(word)
        if self.transform is not None:
            img = self.transform(img)
        return img, label, label_len

更多关于Python相关内容可查看本站专题：《Python数学运算技巧总结》、《Python图片操作技巧总结》、《Python数据结构与算法教程》、《Python函数使用技巧总结》、《Python字符串操作技巧汇总》及《Python入门与进阶经典教程》

希望本文所述对大家Python程序设计有所帮助。

pytorch制作自己的LMDB数据操作示例

- Author -

团长sama

声明：登载此文出于传递更多信息之目的，并不意味着赞同其观点或证实其描述。

Python 相关文章推荐

Python中内置数据类型list,tuple,dict,set的区别和用法

Dec 14 Python

Python3实战之爬虫抓取网易云音乐的热门评论

Oct 09 Python

Python中的pygal安装和绘制直方图代码分享

Dec 08 Python

微信跳一跳python辅助脚本（总结）

Jan 11 Python

Python的numpy库中将矩阵转换为列表等函数的方法

Apr 04 Python

python多进程控制学习小结

Oct 31 Python

Python多线程同步---文件读写控制方法

Feb 12 Python

windows系统中Python多版本与jupyter notebook使用虚拟环境的过程

May 15 Python

解决Django Static内容不能加载显示的问题

Jul 28 Python

Python SQLAlchemy库的使用方法

Oct 13 Python

Pytorch 使用tensor特定条件判断索引

Apr 08 Python

Django使用echarts进行可视化展示的实践

Jun 10 Python

Python Gluon参数和模块命名操作教程

Dec 18 #Python

python turtle 绘制太极图的实例

Dec 18 #Python

Python使用gluon/mxnet模块实现的mnist手写数字识别功能完整示例

Dec 18 #Python

简单了解Python读取大文件代码实例

Dec 18 #Python

python 比较2张图片的相似度的方法示例

Dec 18 #Python

使用Python的Turtle库绘制森林的实例

Dec 18 #Python

python3 requests库实现多图片爬取教程

Dec 18 #Python

You might like

Codeigniter出现错误提示Error with CACHE directory的解决方案

2014/06/12 PHP

php switch语句多个值匹配同一代码块应用示例

2014/07/29 PHP

PHP实现的json类实例

2015/07/28 PHP

PHP面向对象程序设计（OOP）之方法重写（override）操作示例

2018/12/21 PHP

预加载css或javascript的js代码

2010/04/23 Javascript

cnblogs中在闪存中屏蔽某人的实现代码

2010/11/14 Javascript

JQuery 返回布尔值Is()条件判断方法代码

2012/05/14 Javascript

jqGrid日期格式的判断示例代码(开始日期与结束日期)

2013/11/08 Javascript

jquery批量设置属性readonly和disabled的方法

2014/01/24 Javascript

Javascript的&&和||的另类用法

2014/07/23 Javascript

nodejs 整合kindEditor实现图片上传

2015/02/03 NodeJs

javascript框架设计之框架分类及主要功能

2015/06/23 Javascript

JavaScript 节流函数 Throttle 详解

2016/07/04 Javascript

Vue Router去掉url中默认的锚点#

2018/08/01 Javascript

vue实现滑动切换效果（仅在手机模式下可用）

2020/06/29 Javascript

原生js实现随机点名功能

2019/11/05 Javascript

微信小程序wxs实现吸顶效果

2020/01/08 Javascript

Vue中qs插件的使用详解

2020/02/07 Javascript

原生js实现五子棋游戏

2020/05/28 Javascript

vue实现信息管理系统

2020/05/30 Javascript

python实现用户登陆邮件通知的方法

2015/07/09 Python

使用FastCGI部署Python的Django应用的教程

2015/07/22 Python

利用标准库fractions模块让Python支持分数类型的方法详解

2017/08/11 Python

python实现神经网络感知器算法

2017/12/20 Python

Python算法的时间复杂度和空间复杂度(实例解析)

2019/11/19 Python

python中使用paramiko模块并实现远程连接服务器执行上传下载功能

2020/02/29 Python

Python tornado上传文件的功能

2020/03/26 Python

python实现图像外边界跟踪操作

2020/07/13 Python

一款纯css3实现的响应式导航

2014/10/31 HTML / CSS

英国虚拟主机服务商：eUKhost

2016/08/16 全球购物

介绍一下HDLC(High-Level Data Link Control)高层数据链路协议

2012/01/21 面试题

老师对学生的寄语

2014/04/09 职场文书

志愿者个人总结

2015/03/03 职场文书

试用期工作表现自我评价

2015/03/06 职场文书

关于Python OS模块常用文件/目录函数详解

2021/07/01 Python

Redis基本数据类型Set常用操作命令

2022/06/01 Redis