编程 Python

pytorch中获取模型input/output shape实例

Posted in Python on December 30, 2019

Pytorch官方目前无法像tensorflow, caffe那样直接给出shape信息，详见

https://github.com/pytorch/pytorch/pull/3043

以下代码算一种workaround。由于CNN, RNN等模块实现不一样，添加其他模块支持可能需要改代码。

例如RNN中bias是bool类型，其权重也不是存于weight属性中（因此下面统计出的RNN参数量为0），不过我们只关注shape，这样就够用了。

该方法必须先构造一个输入并执行一次forward（即调用model(x)）之后，才能获取各层的shape。

#coding:utf-8
from collections import OrderedDict
import torch
from torch.autograd import Variable
import torch.nn as nn
import models.crnn as crnn
import json
 
 
def get_output_size(summary_dict, output):
    """Record the shape(s) of a module's forward output in ``summary_dict``.

    Args:
        summary_dict: Mutable mapping that receives the result; it is
            modified in place and also returned.
        output: Either an object exposing ``size()`` (its shape is stored
            under the ``'output_shape'`` key as a list), or a tuple/list of
            such outputs, possibly nested (e.g. what an LSTM returns).

    Returns:
        ``summary_dict``. For a sequence output, each element is described by
        a nested ``OrderedDict`` stored under its integer position.
    """
    if isinstance(output, (tuple, list)):
        # Recurse so nested outputs such as (out, (h_n, c_n)) keep their
        # structure in the summary.
        for idx, item in enumerate(output):
            summary_dict[idx] = get_output_size(OrderedDict(), item)
    else:
        summary_dict['output_shape'] = list(output.size())
    return summary_dict
 
def summary(input_size, model):
    """Collect per-layer input/output shapes by running one forward pass.

    A forward hook is registered on every sub-module of ``model`` except
    ``nn.Sequential`` / ``nn.ModuleList`` containers and ``model`` itself.
    A random input with batch size 1 is then fed through the model and each
    hook records what its module saw.

    Args:
        input_size: Shape of one input without the batch dimension, e.g.
            ``[1, 32, 128]``; or a list/tuple of such shapes when the model
            takes several inputs (they are passed as separate positional
            arguments).
        model: The ``nn.Module`` to inspect.

    Returns:
        An ``OrderedDict`` keyed by ``'<ClassName>-<n>'`` in hook execution
        order. Each value holds ``'input_shape'`` (shape of the first
        positional input), the output shape(s) as written by
        ``get_output_size``, ``'nb_params'`` (element count of the module's
        ``weight`` only; bias is not counted) and, for modules that have a
        weight, ``'trainable'``.
    """
    layers = OrderedDict()
    hooks = []

    def hook(module, inputs, output):
        m_key = '%s-%i' % (module.__class__.__name__, len(layers) + 1)
        entry = OrderedDict()
        layers[m_key] = entry
        entry['input_shape'] = list(inputs[0].size())
        get_output_size(entry, output)

        params = 0
        # ``weight`` may exist but be None, so test the value rather than
        # relying on hasattr().
        weight = getattr(module, 'weight', None)
        if weight is not None:
            # numel() yields a plain int, which keeps the result
            # JSON-serializable.
            params += weight.numel()
            entry['trainable'] = bool(weight.requires_grad)
        entry['nb_params'] = params

    def register_hook(module):
        # Containers and the root model only wrap other modules; reporting
        # them would duplicate the shapes of their children.
        if isinstance(module, (nn.Sequential, nn.ModuleList)) or module is model:
            return
        hooks.append(module.register_forward_hook(hook))

    # Check whether the network takes multiple inputs.
    if isinstance(input_size[0], (list, tuple)):
        inputs = [Variable(torch.rand(1, *in_size)) for in_size in input_size]
    else:
        inputs = [Variable(torch.rand(1, *input_size))]

    model.apply(register_hook)
    try:
        model(*inputs)
    finally:
        # Always detach the hooks, even if the forward pass fails, so the
        # model is left unmodified.
        for handle in hooks:
            handle.remove()

    return layers
 
# Example: summarize the PyTorch CRNN model for a 1x32x128 input and print
# the result as JSON. A separate name is used for the instance so the
# imported ``crnn`` module is not shadowed.
model = crnn.CRNN(32, 1, 3755, 256, 1)
x = summary([1, 32, 128], model)
# Parenthesized form works as a print statement on Python 2 and as the print
# function on Python 3.
print(json.dumps(x))

以pytorch版CRNN为例，输出shape如下

{
"Conv2d-1": {
"input_shape": [1, 1, 32, 128],
"output_shape": [1, 64, 32, 128],
"trainable": true,
"nb_params": 576
},
"ReLU-2": {
"input_shape": [1, 64, 32, 128],
"output_shape": [1, 64, 32, 128],
"nb_params": 0
},
"MaxPool2d-3": {
"input_shape": [1, 64, 32, 128],
"output_shape": [1, 64, 16, 64],
"nb_params": 0
},
"Conv2d-4": {
"input_shape": [1, 64, 16, 64],
"output_shape": [1, 128, 16, 64],
"trainable": true,
"nb_params": 73728
},
"ReLU-5": {
"input_shape": [1, 128, 16, 64],
"output_shape": [1, 128, 16, 64],
"nb_params": 0
},
"MaxPool2d-6": {
"input_shape": [1, 128, 16, 64],
"output_shape": [1, 128, 8, 32],
"nb_params": 0
},
"Conv2d-7": {
"input_shape": [1, 128, 8, 32],
"output_shape": [1, 256, 8, 32],
"trainable": true,
"nb_params": 294912
},
"BatchNorm2d-8": {
"input_shape": [1, 256, 8, 32],
"output_shape": [1, 256, 8, 32],
"trainable": true,
"nb_params": 256
},
"ReLU-9": {
"input_shape": [1, 256, 8, 32],
"output_shape": [1, 256, 8, 32],
"nb_params": 0
},
"Conv2d-10": {
"input_shape": [1, 256, 8, 32],
"output_shape": [1, 256, 8, 32],
"trainable": true,
"nb_params": 589824
},
"ReLU-11": {
"input_shape": [1, 256, 8, 32],
"output_shape": [1, 256, 8, 32],
"nb_params": 0
},
"MaxPool2d-12": {
"input_shape": [1, 256, 8, 32],
"output_shape": [1, 256, 4, 33],
"nb_params": 0
},
"Conv2d-13": {
"input_shape": [1, 256, 4, 33],
"output_shape": [1, 512, 4, 33],
"trainable": true,
"nb_params": 1179648
},
"BatchNorm2d-14": {
"input_shape": [1, 512, 4, 33],
"output_shape": [1, 512, 4, 33],
"trainable": true,
"nb_params": 512
},
"ReLU-15": {
"input_shape": [1, 512, 4, 33],
"output_shape": [1, 512, 4, 33],
"nb_params": 0
},
"Conv2d-16": {
"input_shape": [1, 512, 4, 33],
"output_shape": [1, 512, 4, 33],
"trainable": true,
"nb_params": 2359296
},
"ReLU-17": {
"input_shape": [1, 512, 4, 33],
"output_shape": [1, 512, 4, 33],
"nb_params": 0
},
"MaxPool2d-18": {
"input_shape": [1, 512, 4, 33],
"output_shape": [1, 512, 2, 34],
"nb_params": 0
},
"Conv2d-19": {
"input_shape": [1, 512, 2, 34],
"output_shape": [1, 512, 1, 33],
"trainable": true,
"nb_params": 1048576
},
"BatchNorm2d-20": {
"input_shape": [1, 512, 1, 33],
"output_shape": [1, 512, 1, 33],
"trainable": true,
"nb_params": 512
},
"ReLU-21": {
"input_shape": [1, 512, 1, 33],
"output_shape": [1, 512, 1, 33],
"nb_params": 0
},
"LSTM-22": {
"input_shape": [33, 1, 512],
"0": {
"output_shape": [33, 1, 512]
},
"1": {
"0": {
"output_shape": [2, 1, 256]
},
"1": {
"output_shape": [2, 1, 256]
}
},
"nb_params": 0
},
"Linear-23": {
"input_shape": [33, 512],
"output_shape": [33, 256],
"trainable": true,
"nb_params": 131072
},
"BidirectionalLSTM-24": {
"input_shape": [33, 1, 512],
"output_shape": [33, 1, 256],
"nb_params": 0
},
"LSTM-25": {
"input_shape": [33, 1, 256],
"0": {
"output_shape": [33, 1, 512]
},
"1": {
"0": {
"output_shape": [2, 1, 256]
},
"1": {
"output_shape": [2, 1, 256]
}
},
"nb_params": 0
},
"Linear-26": {
"input_shape": [33, 512],
"output_shape": [33, 3755],
"trainable": true,
"nb_params": 1922560
},
"BidirectionalLSTM-27": {
"input_shape": [33, 1, 256],
"output_shape": [33, 1, 3755],
"nb_params": 0
}
}

以上这篇pytorch中获取模型input/output shape实例就是小编分享给大家的全部内容了，希望能给大家一个参考，也希望大家多多支持三水点靠木。

pytorch中获取模型input/output shape实例

- Author -

mylibrary1

声明：登载此文出于传递更多信息之目的，并不意味着赞同其观点或证实其描述。

Python 相关文章推荐

Python中3种内建数据结构：列表、元组和字典

Nov 30 Python

Python-OpenCV基本操作方法详解

Apr 02 Python

对matplotlib改变colorbar位置和方向的方法详解

Dec 13 Python

Django实现web端tailf日志文件功能及实例详解

Jul 28 Python

简单了解django orm中介模型

Jul 30 Python

python 发送json数据操作实例分析

Oct 15 Python

Python web如何在IIS发布应用过程解析

May 27 Python

Python 高效编程技巧分享

Sep 10 Python

python3字符串输出常见面试题总结

Dec 01 Python

python实现xml转json文件的示例代码

Dec 30 Python

通用的Django注册功能模块实现方法

Feb 05 Python

Python 多线程处理任务实例

Nov 07 Python

Python读取csv文件实例解析

Dec 30 #Python

Pytorch Tensor的统计属性实例讲解

Dec 30 #Python

PyTorch中permute的用法详解

Dec 30 #Python

python实现多进程按序号批量修改文件名的方法示例

Dec 30 #Python

Pytorch Tensor基本数学运算详解

Dec 30 #Python

python垃圾回收机制(GC)原理解析

Dec 30 #Python

利用Python代码实现一键抠背景功能

Dec 29 #Python

You might like

php桌面中心(三) 修改数据库

2007/03/11 PHP

php时间不正确的解决方法

2008/04/09 PHP

PHP开发负载均衡指南

2010/07/17 PHP

PHP删除非空目录的函数代码小结

2013/02/28 PHP

php文件上传的简单实例

2013/10/19 PHP

WordPress中注册菜单与调用菜单的方法详解

2015/12/18 PHP

如何使用PHP给图片加水印

2016/10/12 PHP

PHP使用递归算法无限遍历数组示例

2017/01/13 PHP

thinkphp分页集成实例

2017/07/24 PHP

PHP数据对象映射模式实例分析

2019/03/29 PHP

js或者jquery判断图片是否加载完成实现代码

2013/03/20 Javascript

javascript调试过程中找不到哪里出错的可能原因

2013/12/16 Javascript

js中call与apply的用法小结

2013/12/28 Javascript

js和jquery设置disabled属性为true使按钮失效

2014/08/07 Javascript

js操作数据库实现注册和登陆的简单实例

2016/05/26 Javascript

JS实现简单的tab切换选项卡效果

2016/09/21 Javascript

js中string和number类型互转换技巧(分享)

2016/11/28 Javascript

基于JS实现翻书效果的页面切换样式

2017/02/16 Javascript

JavaScript代码判断输入的字符串是否含有特殊字符和表情代码实例

2017/08/17 Javascript

JS实现获取当前所在周的周六、周日示例分析

2019/05/11 Javascript

JS数组中对象去重操作示例

2019/06/04 Javascript

Electron+vue从零开始打造一个本地播放器的方法示例

2020/10/27 Javascript

使用python分析git log日志示例

2014/02/27 Python

Python+Pyqt实现简单GUI电子时钟

2021/02/22 Python

快速解决docker-py api版本不兼容的问题

2019/08/30 Python

python 的 openpyxl模块读取 Excel文件的方法

2019/09/09 Python

Python的赋值、深拷贝与浅拷贝的区别详解

2020/02/12 Python

OpenCV+python实现实时目标检测功能

2020/06/24 Python

Agoda西班牙：全球特价酒店预订

2017/06/03 全球购物

Desigual德国官网：在线购买原创服装

2018/03/27 全球购物

法人代表任命书范本

2014/06/05 职场文书

2014年个人债务授权委托书范本

2014/09/22 职场文书

2016大学生暑期三下乡心得体会

2016/01/23 职场文书

MySQL中in和exists区别详解

2021/06/03 MySQL

mysql如何能有效防止删库跑路

2021/10/05 MySQL

css常用字体属性与背景属性介绍

2022/02/28 HTML / CSS