Last active
July 8, 2018 13:51
-
-
Save ugai/da60093f236915c093f2f5c49a773ee7 to your computer and use it in GitHub Desktop.
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| global_config { | |
| default_context { | |
| array_class: "CudaCachedArray" | |
| device_id: "0" | |
| backends: "cudnn:float" | |
| backends: "cuda:float" | |
| backends: "cpu:float" | |
| } | |
| } | |
| training_config { | |
| max_epoch: 1000 | |
| iter_per_epoch: 78 | |
| save_best: true | |
| monitor_interval: 10 | |
| } | |
| network { | |
| name: "Main" | |
| batch_size: 256 | |
| variable { | |
| name: "Input" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Input_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Input_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "DelayInput" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_4/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "Affine_4/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "Affine_5/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "Affine_5/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "Affine/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "Affine/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "Affine_2/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 784 dim: 3 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "Affine_2/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 3 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "CategoricalCrossEntropy_T" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 } | |
| } | |
| variable { | |
| name: "Concatenate" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 2 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_4" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_5" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "RSubScalar" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Concatenate_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 2 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Tanh" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Add2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Concatenate_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 2 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_7" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_4" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_5" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_4" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "RSubScalar_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Concatenate_4" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 2 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_5" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_6" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Tanh_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_6" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Add2_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Concatenate_5" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 2 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_8" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_10" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_6" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_7" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_7" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "RSubScalar_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Concatenate_6" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 2 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_8" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_9" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Tanh_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_9" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Add2_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 3 } | |
| } | |
| variable { | |
| name: "Softmax" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 3 } | |
| } | |
| variable { | |
| name: "CategoricalCrossEntropy" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 } | |
| } | |
| function { | |
| name: "Concatenate" | |
| type: "Concatenate" | |
| input: "Input" | |
| input: "DelayInput" | |
| output: "Concatenate" | |
| concatenate_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Affine_4" | |
| type: "Affine" | |
| input: "Concatenate" | |
| input: "Affine_4/affine/W" | |
| input: "Affine_4/affine/b" | |
| output: "Affine_4" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Affine_5" | |
| type: "Affine" | |
| input: "Concatenate" | |
| input: "Affine_5/affine/W" | |
| input: "Affine_5/affine/b" | |
| output: "Affine_5" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Sigmoid" | |
| type: "Sigmoid" | |
| input: "Affine_4" | |
| output: "Sigmoid" | |
| } | |
| function { | |
| name: "Sigmoid_2" | |
| type: "Sigmoid" | |
| input: "Affine_5" | |
| output: "Sigmoid_2" | |
| } | |
| function { | |
| name: "Mul2" | |
| type: "Mul2" | |
| input: "Sigmoid" | |
| input: "DelayInput" | |
| output: "Mul2" | |
| } | |
| function { | |
| name: "RSubScalar" | |
| type: "RSubScalar" | |
| input: "Sigmoid_2" | |
| output: "RSubScalar" | |
| r_sub_scalar_param { | |
| val: 1 | |
| } | |
| } | |
| function { | |
| name: "Concatenate_2" | |
| type: "Concatenate" | |
| input: "Mul2" | |
| input: "Input" | |
| output: "Concatenate_2" | |
| concatenate_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Mul2_2" | |
| type: "Mul2" | |
| input: "RSubScalar" | |
| input: "DelayInput" | |
| output: "Mul2_2" | |
| } | |
| function { | |
| name: "Affine" | |
| type: "Affine" | |
| input: "Concatenate_2" | |
| input: "Affine/affine/W" | |
| input: "Affine/affine/b" | |
| output: "Affine" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Tanh" | |
| type: "Tanh" | |
| input: "Affine" | |
| output: "Tanh" | |
| } | |
| function { | |
| name: "Mul2_3" | |
| type: "Mul2" | |
| input: "Tanh" | |
| input: "Sigmoid_2" | |
| output: "Mul2_3" | |
| } | |
| function { | |
| name: "Add2" | |
| type: "Add2" | |
| input: "Mul2_2" | |
| input: "Mul2_3" | |
| output: "Add2" | |
| add2_param { | |
| inplace: True | |
| } | |
| } | |
| function { | |
| name: "Concatenate_3" | |
| type: "Concatenate" | |
| input: "Input_2" | |
| input: "Add2" | |
| output: "Concatenate_3" | |
| concatenate_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Affine_3" | |
| type: "Affine" | |
| input: "Concatenate_3" | |
| input: "Affine_4/affine/W" | |
| input: "Affine_4/affine/b" | |
| output: "Affine_3" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Affine_7" | |
| type: "Affine" | |
| input: "Concatenate_3" | |
| input: "Affine_5/affine/W" | |
| input: "Affine_5/affine/b" | |
| output: "Affine_7" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Sigmoid_4" | |
| type: "Sigmoid" | |
| input: "Affine_3" | |
| output: "Sigmoid_4" | |
| } | |
| function { | |
| name: "Sigmoid_5" | |
| type: "Sigmoid" | |
| input: "Affine_7" | |
| output: "Sigmoid_5" | |
| } | |
| function { | |
| name: "Mul2_4" | |
| type: "Mul2" | |
| input: "Sigmoid_4" | |
| input: "Add2" | |
| output: "Mul2_4" | |
| } | |
| function { | |
| name: "RSubScalar_2" | |
| type: "RSubScalar" | |
| input: "Sigmoid_5" | |
| output: "RSubScalar_2" | |
| r_sub_scalar_param { | |
| val: 1 | |
| } | |
| } | |
| function { | |
| name: "Concatenate_4" | |
| type: "Concatenate" | |
| input: "Mul2_4" | |
| input: "Input_2" | |
| output: "Concatenate_4" | |
| concatenate_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Mul2_5" | |
| type: "Mul2" | |
| input: "RSubScalar_2" | |
| input: "Add2" | |
| output: "Mul2_5" | |
| } | |
| function { | |
| name: "Affine_6" | |
| type: "Affine" | |
| input: "Concatenate_4" | |
| input: "Affine/affine/W" | |
| input: "Affine/affine/b" | |
| output: "Affine_6" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Tanh_2" | |
| type: "Tanh" | |
| input: "Affine_6" | |
| output: "Tanh_2" | |
| } | |
| function { | |
| name: "Mul2_6" | |
| type: "Mul2" | |
| input: "Tanh_2" | |
| input: "Sigmoid_5" | |
| output: "Mul2_6" | |
| } | |
| function { | |
| name: "Add2_2" | |
| type: "Add2" | |
| input: "Mul2_5" | |
| input: "Mul2_6" | |
| output: "Add2_2" | |
| add2_param { | |
| inplace: True | |
| } | |
| } | |
| function { | |
| name: "Concatenate_5" | |
| type: "Concatenate" | |
| input: "Add2_2" | |
| input: "Input_3" | |
| output: "Concatenate_5" | |
| concatenate_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Affine_8" | |
| type: "Affine" | |
| input: "Concatenate_5" | |
| input: "Affine_4/affine/W" | |
| input: "Affine_4/affine/b" | |
| output: "Affine_8" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Affine_10" | |
| type: "Affine" | |
| input: "Concatenate_5" | |
| input: "Affine_5/affine/W" | |
| input: "Affine_5/affine/b" | |
| output: "Affine_10" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Sigmoid_6" | |
| type: "Sigmoid" | |
| input: "Affine_8" | |
| output: "Sigmoid_6" | |
| } | |
| function { | |
| name: "Sigmoid_7" | |
| type: "Sigmoid" | |
| input: "Affine_10" | |
| output: "Sigmoid_7" | |
| } | |
| function { | |
| name: "Mul2_7" | |
| type: "Mul2" | |
| input: "Sigmoid_6" | |
| input: "Add2_2" | |
| output: "Mul2_7" | |
| } | |
| function { | |
| name: "RSubScalar_3" | |
| type: "RSubScalar" | |
| input: "Sigmoid_7" | |
| output: "RSubScalar_3" | |
| r_sub_scalar_param { | |
| val: 1 | |
| } | |
| } | |
| function { | |
| name: "Concatenate_6" | |
| type: "Concatenate" | |
| input: "Mul2_7" | |
| input: "Input_3" | |
| output: "Concatenate_6" | |
| concatenate_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Mul2_8" | |
| type: "Mul2" | |
| input: "RSubScalar_3" | |
| input: "Add2_2" | |
| output: "Mul2_8" | |
| } | |
| function { | |
| name: "Affine_9" | |
| type: "Affine" | |
| input: "Concatenate_6" | |
| input: "Affine/affine/W" | |
| input: "Affine/affine/b" | |
| output: "Affine_9" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Tanh_3" | |
| type: "Tanh" | |
| input: "Affine_9" | |
| output: "Tanh_3" | |
| } | |
| function { | |
| name: "Mul2_9" | |
| type: "Mul2" | |
| input: "Tanh_3" | |
| input: "Sigmoid_7" | |
| output: "Mul2_9" | |
| } | |
| function { | |
| name: "Add2_3" | |
| type: "Add2" | |
| input: "Mul2_8" | |
| input: "Mul2_9" | |
| output: "Add2_3" | |
| add2_param { | |
| inplace: True | |
| } | |
| } | |
| function { | |
| name: "Affine_2" | |
| type: "Affine" | |
| input: "Add2_3" | |
| input: "Affine_2/affine/W" | |
| input: "Affine_2/affine/b" | |
| output: "Affine_2" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Softmax" | |
| type: "Softmax" | |
| input: "Affine_2" | |
| output: "Softmax" | |
| softmax_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "CategoricalCrossEntropy" | |
| type: "CategoricalCrossEntropy" | |
| input: "Softmax" | |
| input: "CategoricalCrossEntropy_T" | |
| output: "CategoricalCrossEntropy" | |
| categorical_cross_entropy_param { | |
| axis: 1 | |
| } | |
| } | |
| } | |
| network { | |
| name: "MainValidation" | |
| batch_size: 256 | |
| variable { | |
| name: "Input" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Input_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Input_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "DelayInput" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_4/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "Affine_4/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "Affine_5/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "Affine_5/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "Affine/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "Affine/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "Affine_2/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 784 dim: 3 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "Affine_2/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 3 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "CategoricalCrossEntropy_T" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 } | |
| } | |
| variable { | |
| name: "Concatenate" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 2 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_4" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_5" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "RSubScalar" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Concatenate_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 2 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Tanh" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Add2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Concatenate_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 2 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_7" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_4" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_5" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_4" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "RSubScalar_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Concatenate_4" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 2 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_5" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_6" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Tanh_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_6" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Add2_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Concatenate_5" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 2 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_8" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_10" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_6" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_7" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_7" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "RSubScalar_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Concatenate_6" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 2 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_8" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_9" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Tanh_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_9" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Add2_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 3 } | |
| } | |
| variable { | |
| name: "Softmax" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 3 } | |
| } | |
| variable { | |
| name: "CategoricalCrossEntropy" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 } | |
| } | |
| function { | |
| name: "Concatenate" | |
| type: "Concatenate" | |
| input: "Input" | |
| input: "DelayInput" | |
| output: "Concatenate" | |
| concatenate_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Affine_4" | |
| type: "Affine" | |
| input: "Concatenate" | |
| input: "Affine_4/affine/W" | |
| input: "Affine_4/affine/b" | |
| output: "Affine_4" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Affine_5" | |
| type: "Affine" | |
| input: "Concatenate" | |
| input: "Affine_5/affine/W" | |
| input: "Affine_5/affine/b" | |
| output: "Affine_5" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Sigmoid" | |
| type: "Sigmoid" | |
| input: "Affine_4" | |
| output: "Sigmoid" | |
| } | |
| function { | |
| name: "Sigmoid_2" | |
| type: "Sigmoid" | |
| input: "Affine_5" | |
| output: "Sigmoid_2" | |
| } | |
| function { | |
| name: "Mul2" | |
| type: "Mul2" | |
| input: "Sigmoid" | |
| input: "DelayInput" | |
| output: "Mul2" | |
| } | |
| function { | |
| name: "RSubScalar" | |
| type: "RSubScalar" | |
| input: "Sigmoid_2" | |
| output: "RSubScalar" | |
| r_sub_scalar_param { | |
| val: 1 | |
| } | |
| } | |
| function { | |
| name: "Concatenate_2" | |
| type: "Concatenate" | |
| input: "Mul2" | |
| input: "Input" | |
| output: "Concatenate_2" | |
| concatenate_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Mul2_2" | |
| type: "Mul2" | |
| input: "RSubScalar" | |
| input: "DelayInput" | |
| output: "Mul2_2" | |
| } | |
| function { | |
| name: "Affine" | |
| type: "Affine" | |
| input: "Concatenate_2" | |
| input: "Affine/affine/W" | |
| input: "Affine/affine/b" | |
| output: "Affine" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Tanh" | |
| type: "Tanh" | |
| input: "Affine" | |
| output: "Tanh" | |
| } | |
| function { | |
| name: "Mul2_3" | |
| type: "Mul2" | |
| input: "Tanh" | |
| input: "Sigmoid_2" | |
| output: "Mul2_3" | |
| } | |
| function { | |
| name: "Add2" | |
| type: "Add2" | |
| input: "Mul2_2" | |
| input: "Mul2_3" | |
| output: "Add2" | |
| add2_param { | |
| inplace: True | |
| } | |
| } | |
| function { | |
| name: "Concatenate_3" | |
| type: "Concatenate" | |
| input: "Input_2" | |
| input: "Add2" | |
| output: "Concatenate_3" | |
| concatenate_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Affine_3" | |
| type: "Affine" | |
| input: "Concatenate_3" | |
| input: "Affine_4/affine/W" | |
| input: "Affine_4/affine/b" | |
| output: "Affine_3" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Affine_7" | |
| type: "Affine" | |
| input: "Concatenate_3" | |
| input: "Affine_5/affine/W" | |
| input: "Affine_5/affine/b" | |
| output: "Affine_7" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Sigmoid_4" | |
| type: "Sigmoid" | |
| input: "Affine_3" | |
| output: "Sigmoid_4" | |
| } | |
| function { | |
| name: "Sigmoid_5" | |
| type: "Sigmoid" | |
| input: "Affine_7" | |
| output: "Sigmoid_5" | |
| } | |
| function { | |
| name: "Mul2_4" | |
| type: "Mul2" | |
| input: "Sigmoid_4" | |
| input: "Add2" | |
| output: "Mul2_4" | |
| } | |
| function { | |
| name: "RSubScalar_2" | |
| type: "RSubScalar" | |
| input: "Sigmoid_5" | |
| output: "RSubScalar_2" | |
| r_sub_scalar_param { | |
| val: 1 | |
| } | |
| } | |
| function { | |
| name: "Concatenate_4" | |
| type: "Concatenate" | |
| input: "Mul2_4" | |
| input: "Input_2" | |
| output: "Concatenate_4" | |
| concatenate_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Mul2_5" | |
| type: "Mul2" | |
| input: "RSubScalar_2" | |
| input: "Add2" | |
| output: "Mul2_5" | |
| } | |
| function { | |
| name: "Affine_6" | |
| type: "Affine" | |
| input: "Concatenate_4" | |
| input: "Affine/affine/W" | |
| input: "Affine/affine/b" | |
| output: "Affine_6" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Tanh_2" | |
| type: "Tanh" | |
| input: "Affine_6" | |
| output: "Tanh_2" | |
| } | |
| function { | |
| name: "Mul2_6" | |
| type: "Mul2" | |
| input: "Tanh_2" | |
| input: "Sigmoid_5" | |
| output: "Mul2_6" | |
| } | |
| function { | |
| name: "Add2_2" | |
| type: "Add2" | |
| input: "Mul2_5" | |
| input: "Mul2_6" | |
| output: "Add2_2" | |
| add2_param { | |
| inplace: True | |
| } | |
| } | |
| function { | |
| name: "Concatenate_5" | |
| type: "Concatenate" | |
| input: "Add2_2" | |
| input: "Input_3" | |
| output: "Concatenate_5" | |
| concatenate_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Affine_8" | |
| type: "Affine" | |
| input: "Concatenate_5" | |
| input: "Affine_4/affine/W" | |
| input: "Affine_4/affine/b" | |
| output: "Affine_8" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Affine_10" | |
| type: "Affine" | |
| input: "Concatenate_5" | |
| input: "Affine_5/affine/W" | |
| input: "Affine_5/affine/b" | |
| output: "Affine_10" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Sigmoid_6" | |
| type: "Sigmoid" | |
| input: "Affine_8" | |
| output: "Sigmoid_6" | |
| } | |
| function { | |
| name: "Sigmoid_7" | |
| type: "Sigmoid" | |
| input: "Affine_10" | |
| output: "Sigmoid_7" | |
| } | |
| function { | |
| name: "Mul2_7" | |
| type: "Mul2" | |
| input: "Sigmoid_6" | |
| input: "Add2_2" | |
| output: "Mul2_7" | |
| } | |
| function { | |
| name: "RSubScalar_3" | |
| type: "RSubScalar" | |
| input: "Sigmoid_7" | |
| output: "RSubScalar_3" | |
| r_sub_scalar_param { | |
| val: 1 | |
| } | |
| } | |
| function { | |
| name: "Concatenate_6" | |
| type: "Concatenate" | |
| input: "Mul2_7" | |
| input: "Input_3" | |
| output: "Concatenate_6" | |
| concatenate_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Mul2_8" | |
| type: "Mul2" | |
| input: "RSubScalar_3" | |
| input: "Add2_2" | |
| output: "Mul2_8" | |
| } | |
| function { | |
| name: "Affine_9" | |
| type: "Affine" | |
| input: "Concatenate_6" | |
| input: "Affine/affine/W" | |
| input: "Affine/affine/b" | |
| output: "Affine_9" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Tanh_3" | |
| type: "Tanh" | |
| input: "Affine_9" | |
| output: "Tanh_3" | |
| } | |
| function { | |
| name: "Mul2_9" | |
| type: "Mul2" | |
| input: "Tanh_3" | |
| input: "Sigmoid_7" | |
| output: "Mul2_9" | |
| } | |
| function { | |
| name: "Add2_3" | |
| type: "Add2" | |
| input: "Mul2_8" | |
| input: "Mul2_9" | |
| output: "Add2_3" | |
| add2_param { | |
| inplace: True | |
| } | |
| } | |
| function { | |
| name: "Affine_2" | |
| type: "Affine" | |
| input: "Add2_3" | |
| input: "Affine_2/affine/W" | |
| input: "Affine_2/affine/b" | |
| output: "Affine_2" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Softmax" | |
| type: "Softmax" | |
| input: "Affine_2" | |
| output: "Softmax" | |
| softmax_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "CategoricalCrossEntropy" | |
| type: "CategoricalCrossEntropy" | |
| input: "Softmax" | |
| input: "CategoricalCrossEntropy_T" | |
| output: "CategoricalCrossEntropy" | |
| categorical_cross_entropy_param { | |
| axis: 1 | |
| } | |
| } | |
| } | |
| network { | |
| name: "MainRuntime" | |
| batch_size: 256 | |
| variable { | |
| name: "Input" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Input_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Input_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "DelayInput" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_4/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "Affine_4/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "Affine_5/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "Affine_5/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "Affine/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "Affine/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "Affine_2/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 784 dim: 3 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "Affine_2/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 3 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "Concatenate" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 2 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_4" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_5" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "RSubScalar" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Concatenate_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 2 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Tanh" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Add2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Concatenate_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 2 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_7" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_4" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_5" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_4" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "RSubScalar_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Concatenate_4" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 2 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_5" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_6" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Tanh_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_6" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Add2_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Concatenate_5" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 2 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_8" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_10" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_6" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_7" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_7" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "RSubScalar_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Concatenate_6" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 2 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_8" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_9" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Tanh_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_9" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Add2_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 3 } | |
| } | |
| variable { | |
| name: "Softmax" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 3 } | |
| } | |
| function { | |
| name: "Concatenate" | |
| type: "Concatenate" | |
| input: "Input" | |
| input: "DelayInput" | |
| output: "Concatenate" | |
| concatenate_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Affine_4" | |
| type: "Affine" | |
| input: "Concatenate" | |
| input: "Affine_4/affine/W" | |
| input: "Affine_4/affine/b" | |
| output: "Affine_4" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Affine_5" | |
| type: "Affine" | |
| input: "Concatenate" | |
| input: "Affine_5/affine/W" | |
| input: "Affine_5/affine/b" | |
| output: "Affine_5" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Sigmoid" | |
| type: "Sigmoid" | |
| input: "Affine_4" | |
| output: "Sigmoid" | |
| } | |
| function { | |
| name: "Sigmoid_2" | |
| type: "Sigmoid" | |
| input: "Affine_5" | |
| output: "Sigmoid_2" | |
| } | |
| function { | |
| name: "Mul2" | |
| type: "Mul2" | |
| input: "Sigmoid" | |
| input: "DelayInput" | |
| output: "Mul2" | |
| } | |
| function { | |
| name: "RSubScalar" | |
| type: "RSubScalar" | |
| input: "Sigmoid_2" | |
| output: "RSubScalar" | |
| r_sub_scalar_param { | |
| val: 1 | |
| } | |
| } | |
| function { | |
| name: "Concatenate_2" | |
| type: "Concatenate" | |
| input: "Mul2" | |
| input: "Input" | |
| output: "Concatenate_2" | |
| concatenate_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Mul2_2" | |
| type: "Mul2" | |
| input: "RSubScalar" | |
| input: "DelayInput" | |
| output: "Mul2_2" | |
| } | |
| function { | |
| name: "Affine" | |
| type: "Affine" | |
| input: "Concatenate_2" | |
| input: "Affine/affine/W" | |
| input: "Affine/affine/b" | |
| output: "Affine" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Tanh" | |
| type: "Tanh" | |
| input: "Affine" | |
| output: "Tanh" | |
| } | |
| function { | |
| name: "Mul2_3" | |
| type: "Mul2" | |
| input: "Tanh" | |
| input: "Sigmoid_2" | |
| output: "Mul2_3" | |
| } | |
| function { | |
| name: "Add2" | |
| type: "Add2" | |
| input: "Mul2_2" | |
| input: "Mul2_3" | |
| output: "Add2" | |
| add2_param { | |
| inplace: True | |
| } | |
| } | |
| function { | |
| name: "Concatenate_3" | |
| type: "Concatenate" | |
| input: "Input_2" | |
| input: "Add2" | |
| output: "Concatenate_3" | |
| concatenate_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Affine_3" | |
| type: "Affine" | |
| input: "Concatenate_3" | |
| input: "Affine_4/affine/W" | |
| input: "Affine_4/affine/b" | |
| output: "Affine_3" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Affine_7" | |
| type: "Affine" | |
| input: "Concatenate_3" | |
| input: "Affine_5/affine/W" | |
| input: "Affine_5/affine/b" | |
| output: "Affine_7" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Sigmoid_4" | |
| type: "Sigmoid" | |
| input: "Affine_3" | |
| output: "Sigmoid_4" | |
| } | |
| function { | |
| name: "Sigmoid_5" | |
| type: "Sigmoid" | |
| input: "Affine_7" | |
| output: "Sigmoid_5" | |
| } | |
| function { | |
| name: "Mul2_4" | |
| type: "Mul2" | |
| input: "Sigmoid_4" | |
| input: "Add2" | |
| output: "Mul2_4" | |
| } | |
| function { | |
| name: "RSubScalar_2" | |
| type: "RSubScalar" | |
| input: "Sigmoid_5" | |
| output: "RSubScalar_2" | |
| r_sub_scalar_param { | |
| val: 1 | |
| } | |
| } | |
| function { | |
| name: "Concatenate_4" | |
| type: "Concatenate" | |
| input: "Mul2_4" | |
| input: "Input_2" | |
| output: "Concatenate_4" | |
| concatenate_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Mul2_5" | |
| type: "Mul2" | |
| input: "RSubScalar_2" | |
| input: "Add2" | |
| output: "Mul2_5" | |
| } | |
| function { | |
| name: "Affine_6" | |
| type: "Affine" | |
| input: "Concatenate_4" | |
| input: "Affine/affine/W" | |
| input: "Affine/affine/b" | |
| output: "Affine_6" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Tanh_2" | |
| type: "Tanh" | |
| input: "Affine_6" | |
| output: "Tanh_2" | |
| } | |
| function { | |
| name: "Mul2_6" | |
| type: "Mul2" | |
| input: "Tanh_2" | |
| input: "Sigmoid_5" | |
| output: "Mul2_6" | |
| } | |
| function { | |
| name: "Add2_2" | |
| type: "Add2" | |
| input: "Mul2_5" | |
| input: "Mul2_6" | |
| output: "Add2_2" | |
| add2_param { | |
| inplace: True | |
| } | |
| } | |
| function { | |
| name: "Concatenate_5" | |
| type: "Concatenate" | |
| input: "Add2_2" | |
| input: "Input_3" | |
| output: "Concatenate_5" | |
| concatenate_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Affine_8" | |
| type: "Affine" | |
| input: "Concatenate_5" | |
| input: "Affine_4/affine/W" | |
| input: "Affine_4/affine/b" | |
| output: "Affine_8" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Affine_10" | |
| type: "Affine" | |
| input: "Concatenate_5" | |
| input: "Affine_5/affine/W" | |
| input: "Affine_5/affine/b" | |
| output: "Affine_10" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Sigmoid_6" | |
| type: "Sigmoid" | |
| input: "Affine_8" | |
| output: "Sigmoid_6" | |
| } | |
| function { | |
| name: "Sigmoid_7" | |
| type: "Sigmoid" | |
| input: "Affine_10" | |
| output: "Sigmoid_7" | |
| } | |
| function { | |
| name: "Mul2_7" | |
| type: "Mul2" | |
| input: "Sigmoid_6" | |
| input: "Add2_2" | |
| output: "Mul2_7" | |
| } | |
| function { | |
| name: "RSubScalar_3" | |
| type: "RSubScalar" | |
| input: "Sigmoid_7" | |
| output: "RSubScalar_3" | |
| r_sub_scalar_param { | |
| val: 1 | |
| } | |
| } | |
| function { | |
| name: "Concatenate_6" | |
| type: "Concatenate" | |
| input: "Mul2_7" | |
| input: "Input_3" | |
| output: "Concatenate_6" | |
| concatenate_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Mul2_8" | |
| type: "Mul2" | |
| input: "RSubScalar_3" | |
| input: "Add2_2" | |
| output: "Mul2_8" | |
| } | |
| function { | |
| name: "Affine_9" | |
| type: "Affine" | |
| input: "Concatenate_6" | |
| input: "Affine/affine/W" | |
| input: "Affine/affine/b" | |
| output: "Affine_9" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Tanh_3" | |
| type: "Tanh" | |
| input: "Affine_9" | |
| output: "Tanh_3" | |
| } | |
| function { | |
| name: "Mul2_9" | |
| type: "Mul2" | |
| input: "Tanh_3" | |
| input: "Sigmoid_7" | |
| output: "Mul2_9" | |
| } | |
| function { | |
| name: "Add2_3" | |
| type: "Add2" | |
| input: "Mul2_8" | |
| input: "Mul2_9" | |
| output: "Add2_3" | |
| add2_param { | |
| inplace: True | |
| } | |
| } | |
| function { | |
| name: "Affine_2" | |
| type: "Affine" | |
| input: "Add2_3" | |
| input: "Affine_2/affine/W" | |
| input: "Affine_2/affine/b" | |
| output: "Affine_2" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Softmax" | |
| type: "Softmax" | |
| input: "Affine_2" | |
| output: "Softmax" | |
| softmax_param { | |
| axis: 1 | |
| } | |
| } | |
| } | |
| dataset { | |
| name: "Training" | |
| uri: "F:\\neural_network_console_120\\samples\\sample_dataset\\MNIST\\hoge1_training.csv" | |
| cache_dir: "F:\\neural_network_console_120\\samples\\sample_dataset\\MNIST\\hoge1_training.cache" | |
| overwrite_cache: False | |
| create_cache_explicitly: True | |
| shuffle: true | |
| no_image_normalization: False | |
| batch_size: 256 | |
| } | |
| dataset { | |
| name: "Validation" | |
| uri: "F:\\neural_network_console_120\\samples\\sample_dataset\\MNIST\\hoge1_validation.csv" | |
| cache_dir: "F:\\neural_network_console_120\\samples\\sample_dataset\\MNIST\\hoge1_validation.cache" | |
| overwrite_cache: False | |
| create_cache_explicitly: True | |
| shuffle: false | |
| no_image_normalization: False | |
| batch_size: 256 | |
| } | |
| optimizer { | |
| name: "Optimizer" | |
| update_interval: 1 | |
| network_name: "Main" | |
| dataset_name: "Training" | |
| solver { | |
| type: "Adam" | |
| weight_decay: 0 | |
| lr_decay: 1 | |
| lr_decay_interval: 78 | |
| adam_param { | |
| alpha: 0.001 | |
| beta1: 0.9 | |
| beta2: 0.999 | |
| eps: 1e-08 | |
| } | |
| } | |
| data_variable { | |
| variable_name: "Input" | |
| data_name: "x1" | |
| } | |
| data_variable { | |
| variable_name: "Input_2" | |
| data_name: "x2" | |
| } | |
| data_variable { | |
| variable_name: "Input_3" | |
| data_name: "x3" | |
| } | |
| generator_variable { | |
| variable_name: "DelayInput" | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| data_variable { | |
| variable_name: "CategoricalCrossEntropy_T" | |
| data_name: "y" | |
| } | |
| loss_variable { | |
| variable_name: "CategoricalCrossEntropy" | |
| } | |
| parameter_variable { | |
| variable_name: "Affine_4/affine/W" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "Affine_4/affine/b" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "Affine_5/affine/W" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "Affine_5/affine/b" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "Affine/affine/W" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "Affine/affine/b" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "Affine_2/affine/W" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "Affine_2/affine/b" | |
| learning_rate_multiplier: 1 | |
| } | |
| } | |
| monitor { | |
| name: "train_error" | |
| network_name: "MainValidation" | |
| dataset_name: "Training" | |
| data_variable { | |
| variable_name: "Input" | |
| data_name: "x1" | |
| } | |
| data_variable { | |
| variable_name: "Input_2" | |
| data_name: "x2" | |
| } | |
| data_variable { | |
| variable_name: "Input_3" | |
| data_name: "x3" | |
| } | |
| generator_variable { | |
| variable_name: "DelayInput" | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| data_variable { | |
| variable_name: "CategoricalCrossEntropy_T" | |
| data_name: "y" | |
| } | |
| monitor_variable { | |
| type: "Error" | |
| variable_name: "CategoricalCrossEntropy" | |
| } | |
| } | |
| monitor { | |
| name: "valid_error" | |
| network_name: "MainValidation" | |
| dataset_name: "Validation" | |
| data_variable { | |
| variable_name: "Input" | |
| data_name: "x1" | |
| } | |
| data_variable { | |
| variable_name: "Input_2" | |
| data_name: "x2" | |
| } | |
| data_variable { | |
| variable_name: "Input_3" | |
| data_name: "x3" | |
| } | |
| generator_variable { | |
| variable_name: "DelayInput" | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| data_variable { | |
| variable_name: "CategoricalCrossEntropy_T" | |
| data_name: "y" | |
| } | |
| monitor_variable { | |
| type: "Error" | |
| variable_name: "CategoricalCrossEntropy" | |
| } | |
| } | |
| executor { | |
| name: "Executor" | |
| network_name: "MainRuntime" | |
| num_evaluations: 1 | |
| repeat_evaluation_type: "mean" | |
| need_back_propagation: false | |
| data_variable { | |
| variable_name: "Input" | |
| data_name: "x1" | |
| } | |
| data_variable { | |
| variable_name: "Input_2" | |
| data_name: "x2" | |
| } | |
| data_variable { | |
| variable_name: "Input_3" | |
| data_name: "x3" | |
| } | |
| generator_variable { | |
| variable_name: "DelayInput" | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| output_variable { | |
| variable_name: "Softmax" | |
| data_name: "y'" | |
| } | |
| parameter_variable { | |
| variable_name: "Affine_4/affine/W" | |
| } | |
| parameter_variable { | |
| variable_name: "Affine_4/affine/b" | |
| } | |
| parameter_variable { | |
| variable_name: "Affine_5/affine/W" | |
| } | |
| parameter_variable { | |
| variable_name: "Affine_5/affine/b" | |
| } | |
| parameter_variable { | |
| variable_name: "Affine/affine/W" | |
| } | |
| parameter_variable { | |
| variable_name: "Affine/affine/b" | |
| } | |
| parameter_variable { | |
| variable_name: "Affine_2/affine/W" | |
| } | |
| parameter_variable { | |
| variable_name: "Affine_2/affine/b" | |
| } | |
| } |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| global_config { | |
| default_context { | |
| array_class: "CudaCachedArray" | |
| device_id: "0" | |
| backends: "cudnn:float" | |
| backends: "cuda:float" | |
| backends: "cpu:float" | |
| } | |
| } | |
| training_config { | |
| max_epoch: 1000 | |
| iter_per_epoch: 78 | |
| save_best: true | |
| monitor_interval: 10 | |
| } | |
| network { | |
| name: "Main" | |
| batch_size: 256 | |
| variable { | |
| name: "Input" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Input_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Input_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "DelayInput" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "Affine/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "InputGate/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "InputGate/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "ForgetGate/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "ForgetGate/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "OutputGate/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "OutputGate/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "Affine_2/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "Affine_2/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "InputGate_2/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "InputGate_2/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "ForgetGate_2/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "ForgetGate_2/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "OutputGate_2/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "OutputGate_2/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "Affine_3/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "Affine_3/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "InputGate_3/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "InputGate_3/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "ForgetGate_3/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "ForgetGate_3/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "OutputGate_3/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "OutputGate_3/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "Affine_4/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 784 dim: 3 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "Affine_4/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 3 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "CategoricalCrossEntropy_T" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 } | |
| } | |
| variable { | |
| name: "Concatenate" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 2 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "InputGate" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "ForgetGate" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "OutputGate" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Tanh" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_4" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Add2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Tanh_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Concatenate_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 2 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "InputGate_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "ForgetGate_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "OutputGate_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Tanh_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_5" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_6" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_7" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_4" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_5" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Add2_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Tanh_4" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_6" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Concatenate_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 2 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "InputGate_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "ForgetGate_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "OutputGate_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Tanh_5" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_8" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_9" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_10" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_7" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_8" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Add2_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Tanh_6" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_9" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_4" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 3 } | |
| } | |
| variable { | |
| name: "Softmax" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 3 } | |
| } | |
| variable { | |
| name: "CategoricalCrossEntropy" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 } | |
| } | |
| function { | |
| name: "Concatenate" | |
| type: "Concatenate" | |
| input: "Input" | |
| input: "DelayInput" | |
| output: "Concatenate" | |
| concatenate_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Affine" | |
| type: "Affine" | |
| input: "Concatenate" | |
| input: "Affine/affine/W" | |
| input: "Affine/affine/b" | |
| output: "Affine" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "InputGate" | |
| type: "Affine" | |
| input: "Concatenate" | |
| input: "InputGate/affine/W" | |
| input: "InputGate/affine/b" | |
| output: "InputGate" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "ForgetGate" | |
| type: "Affine" | |
| input: "Concatenate" | |
| input: "ForgetGate/affine/W" | |
| input: "ForgetGate/affine/b" | |
| output: "ForgetGate" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "OutputGate" | |
| type: "Affine" | |
| input: "Concatenate" | |
| input: "OutputGate/affine/W" | |
| input: "OutputGate/affine/b" | |
| output: "OutputGate" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Tanh" | |
| type: "Tanh" | |
| input: "Affine" | |
| output: "Tanh" | |
| } | |
| function { | |
| name: "Sigmoid_4" | |
| type: "Sigmoid" | |
| input: "InputGate" | |
| output: "Sigmoid_4" | |
| } | |
| function { | |
| name: "Sigmoid_2" | |
| type: "Sigmoid" | |
| input: "ForgetGate" | |
| output: "Sigmoid_2" | |
| } | |
| function { | |
| name: "Sigmoid_3" | |
| type: "Sigmoid" | |
| input: "OutputGate" | |
| output: "Sigmoid_3" | |
| } | |
| function { | |
| name: "Mul2" | |
| type: "Mul2" | |
| input: "Sigmoid_4" | |
| input: "Tanh" | |
| output: "Mul2" | |
| } | |
| function { | |
| name: "Mul2_2" | |
| type: "Mul2" | |
| input: "Sigmoid_2" | |
| input: "DelayInput" | |
| output: "Mul2_2" | |
| } | |
| function { | |
| name: "Add2" | |
| type: "Add2" | |
| input: "Mul2" | |
| input: "Mul2_2" | |
| output: "Add2" | |
| add2_param { | |
| inplace: True | |
| } | |
| } | |
| function { | |
| name: "Tanh_2" | |
| type: "Tanh" | |
| input: "Add2" | |
| output: "Tanh_2" | |
| } | |
| function { | |
| name: "Mul2_3" | |
| type: "Mul2" | |
| input: "Sigmoid_3" | |
| input: "Tanh_2" | |
| output: "Mul2_3" | |
| } | |
| function { | |
| name: "Concatenate_2" | |
| type: "Concatenate" | |
| input: "Input_2" | |
| input: "Mul2_3" | |
| output: "Concatenate_2" | |
| concatenate_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Affine_2" | |
| type: "Affine" | |
| input: "Concatenate_2" | |
| input: "Affine_2/affine/W" | |
| input: "Affine_2/affine/b" | |
| output: "Affine_2" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "InputGate_2" | |
| type: "Affine" | |
| input: "Concatenate_2" | |
| input: "InputGate_2/affine/W" | |
| input: "InputGate_2/affine/b" | |
| output: "InputGate_2" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "ForgetGate_2" | |
| type: "Affine" | |
| input: "Concatenate_2" | |
| input: "ForgetGate_2/affine/W" | |
| input: "ForgetGate_2/affine/b" | |
| output: "ForgetGate_2" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "OutputGate_2" | |
| type: "Affine" | |
| input: "Concatenate_2" | |
| input: "OutputGate_2/affine/W" | |
| input: "OutputGate_2/affine/b" | |
| output: "OutputGate_2" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Tanh_3" | |
| type: "Tanh" | |
| input: "Affine_2" | |
| output: "Tanh_3" | |
| } | |
| function { | |
| name: "Sigmoid_5" | |
| type: "Sigmoid" | |
| input: "InputGate_2" | |
| output: "Sigmoid_5" | |
| } | |
| function { | |
| name: "Sigmoid_6" | |
| type: "Sigmoid" | |
| input: "ForgetGate_2" | |
| output: "Sigmoid_6" | |
| } | |
| function { | |
| name: "Sigmoid_7" | |
| type: "Sigmoid" | |
| input: "OutputGate_2" | |
| output: "Sigmoid_7" | |
| } | |
| function { | |
| name: "Mul2_4" | |
| type: "Mul2" | |
| input: "Sigmoid_5" | |
| input: "Tanh_3" | |
| output: "Mul2_4" | |
| } | |
| function { | |
| name: "Mul2_5" | |
| type: "Mul2" | |
| input: "Sigmoid_6" | |
| input: "Mul2_3" | |
| output: "Mul2_5" | |
| } | |
| function { | |
| name: "Add2_2" | |
| type: "Add2" | |
| input: "Mul2_4" | |
| input: "Mul2_5" | |
| output: "Add2_2" | |
| add2_param { | |
| inplace: True | |
| } | |
| } | |
| function { | |
| name: "Tanh_4" | |
| type: "Tanh" | |
| input: "Add2_2" | |
| output: "Tanh_4" | |
| } | |
| function { | |
| name: "Mul2_6" | |
| type: "Mul2" | |
| input: "Sigmoid_7" | |
| input: "Tanh_4" | |
| output: "Mul2_6" | |
| } | |
| function { | |
| name: "Concatenate_3" | |
| type: "Concatenate" | |
| input: "Input_3" | |
| input: "Mul2_6" | |
| output: "Concatenate_3" | |
| concatenate_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Affine_3" | |
| type: "Affine" | |
| input: "Concatenate_3" | |
| input: "Affine_3/affine/W" | |
| input: "Affine_3/affine/b" | |
| output: "Affine_3" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "InputGate_3" | |
| type: "Affine" | |
| input: "Concatenate_3" | |
| input: "InputGate_3/affine/W" | |
| input: "InputGate_3/affine/b" | |
| output: "InputGate_3" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "ForgetGate_3" | |
| type: "Affine" | |
| input: "Concatenate_3" | |
| input: "ForgetGate_3/affine/W" | |
| input: "ForgetGate_3/affine/b" | |
| output: "ForgetGate_3" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "OutputGate_3" | |
| type: "Affine" | |
| input: "Concatenate_3" | |
| input: "OutputGate_3/affine/W" | |
| input: "OutputGate_3/affine/b" | |
| output: "OutputGate_3" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Tanh_5" | |
| type: "Tanh" | |
| input: "Affine_3" | |
| output: "Tanh_5" | |
| } | |
| function { | |
| name: "Sigmoid_8" | |
| type: "Sigmoid" | |
| input: "InputGate_3" | |
| output: "Sigmoid_8" | |
| } | |
| function { | |
| name: "Sigmoid_9" | |
| type: "Sigmoid" | |
| input: "ForgetGate_3" | |
| output: "Sigmoid_9" | |
| } | |
| function { | |
| name: "Sigmoid_10" | |
| type: "Sigmoid" | |
| input: "OutputGate_3" | |
| output: "Sigmoid_10" | |
| } | |
| function { | |
| name: "Mul2_7" | |
| type: "Mul2" | |
| input: "Sigmoid_8" | |
| input: "Tanh_5" | |
| output: "Mul2_7" | |
| } | |
| function { | |
| name: "Mul2_8" | |
| type: "Mul2" | |
| input: "Sigmoid_9" | |
| input: "Mul2_6" | |
| output: "Mul2_8" | |
| } | |
| function { | |
| name: "Add2_3" | |
| type: "Add2" | |
| input: "Mul2_7" | |
| input: "Mul2_8" | |
| output: "Add2_3" | |
| add2_param { | |
| inplace: True | |
| } | |
| } | |
| function { | |
| name: "Tanh_6" | |
| type: "Tanh" | |
| input: "Add2_3" | |
| output: "Tanh_6" | |
| } | |
| function { | |
| name: "Mul2_9" | |
| type: "Mul2" | |
| input: "Sigmoid_10" | |
| input: "Tanh_6" | |
| output: "Mul2_9" | |
| } | |
| function { | |
| name: "Affine_4" | |
| type: "Affine" | |
| input: "Mul2_9" | |
| input: "Affine_4/affine/W" | |
| input: "Affine_4/affine/b" | |
| output: "Affine_4" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Softmax" | |
| type: "Softmax" | |
| input: "Affine_4" | |
| output: "Softmax" | |
| softmax_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "CategoricalCrossEntropy" | |
| type: "CategoricalCrossEntropy" | |
| input: "Softmax" | |
| input: "CategoricalCrossEntropy_T" | |
| output: "CategoricalCrossEntropy" | |
| categorical_cross_entropy_param { | |
| axis: 1 | |
| } | |
| } | |
| } | |
| network { | |
| name: "MainValidation" | |
| batch_size: 256 | |
| variable { | |
| name: "Input" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Input_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Input_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "DelayInput" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "Affine/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "InputGate/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "InputGate/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "ForgetGate/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "ForgetGate/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "OutputGate/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "OutputGate/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "Affine_2/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "Affine_2/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "InputGate_2/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "InputGate_2/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "ForgetGate_2/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "ForgetGate_2/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "OutputGate_2/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "OutputGate_2/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "Affine_3/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "Affine_3/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "InputGate_3/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "InputGate_3/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "ForgetGate_3/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "ForgetGate_3/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "OutputGate_3/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "OutputGate_3/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "Affine_4/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 784 dim: 3 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "Affine_4/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 3 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "CategoricalCrossEntropy_T" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 } | |
| } | |
| variable { | |
| name: "Concatenate" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 2 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "InputGate" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "ForgetGate" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "OutputGate" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Tanh" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_4" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Add2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Tanh_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Concatenate_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 2 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "InputGate_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "ForgetGate_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "OutputGate_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Tanh_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_5" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_6" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_7" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_4" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_5" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Add2_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Tanh_4" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_6" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Concatenate_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 2 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "InputGate_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "ForgetGate_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "OutputGate_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Tanh_5" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_8" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_9" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_10" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_7" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_8" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Add2_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Tanh_6" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_9" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_4" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 3 } | |
| } | |
| variable { | |
| name: "Softmax" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 3 } | |
| } | |
| variable { | |
| name: "CategoricalCrossEntropy" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 } | |
| } | |
| function { | |
| name: "Concatenate" | |
| type: "Concatenate" | |
| input: "Input" | |
| input: "DelayInput" | |
| output: "Concatenate" | |
| concatenate_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Affine" | |
| type: "Affine" | |
| input: "Concatenate" | |
| input: "Affine/affine/W" | |
| input: "Affine/affine/b" | |
| output: "Affine" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "InputGate" | |
| type: "Affine" | |
| input: "Concatenate" | |
| input: "InputGate/affine/W" | |
| input: "InputGate/affine/b" | |
| output: "InputGate" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "ForgetGate" | |
| type: "Affine" | |
| input: "Concatenate" | |
| input: "ForgetGate/affine/W" | |
| input: "ForgetGate/affine/b" | |
| output: "ForgetGate" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "OutputGate" | |
| type: "Affine" | |
| input: "Concatenate" | |
| input: "OutputGate/affine/W" | |
| input: "OutputGate/affine/b" | |
| output: "OutputGate" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Tanh" | |
| type: "Tanh" | |
| input: "Affine" | |
| output: "Tanh" | |
| } | |
| function { | |
| name: "Sigmoid_4" | |
| type: "Sigmoid" | |
| input: "InputGate" | |
| output: "Sigmoid_4" | |
| } | |
| function { | |
| name: "Sigmoid_2" | |
| type: "Sigmoid" | |
| input: "ForgetGate" | |
| output: "Sigmoid_2" | |
| } | |
| function { | |
| name: "Sigmoid_3" | |
| type: "Sigmoid" | |
| input: "OutputGate" | |
| output: "Sigmoid_3" | |
| } | |
| function { | |
| name: "Mul2" | |
| type: "Mul2" | |
| input: "Sigmoid_4" | |
| input: "Tanh" | |
| output: "Mul2" | |
| } | |
| function { | |
| name: "Mul2_2" | |
| type: "Mul2" | |
| input: "Sigmoid_2" | |
| input: "DelayInput" | |
| output: "Mul2_2" | |
| } | |
| function { | |
| name: "Add2" | |
| type: "Add2" | |
| input: "Mul2" | |
| input: "Mul2_2" | |
| output: "Add2" | |
| add2_param { | |
| inplace: True | |
| } | |
| } | |
| function { | |
| name: "Tanh_2" | |
| type: "Tanh" | |
| input: "Add2" | |
| output: "Tanh_2" | |
| } | |
| function { | |
| name: "Mul2_3" | |
| type: "Mul2" | |
| input: "Sigmoid_3" | |
| input: "Tanh_2" | |
| output: "Mul2_3" | |
| } | |
| function { | |
| name: "Concatenate_2" | |
| type: "Concatenate" | |
| input: "Input_2" | |
| input: "Mul2_3" | |
| output: "Concatenate_2" | |
| concatenate_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Affine_2" | |
| type: "Affine" | |
| input: "Concatenate_2" | |
| input: "Affine_2/affine/W" | |
| input: "Affine_2/affine/b" | |
| output: "Affine_2" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "InputGate_2" | |
| type: "Affine" | |
| input: "Concatenate_2" | |
| input: "InputGate_2/affine/W" | |
| input: "InputGate_2/affine/b" | |
| output: "InputGate_2" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "ForgetGate_2" | |
| type: "Affine" | |
| input: "Concatenate_2" | |
| input: "ForgetGate_2/affine/W" | |
| input: "ForgetGate_2/affine/b" | |
| output: "ForgetGate_2" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "OutputGate_2" | |
| type: "Affine" | |
| input: "Concatenate_2" | |
| input: "OutputGate_2/affine/W" | |
| input: "OutputGate_2/affine/b" | |
| output: "OutputGate_2" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Tanh_3" | |
| type: "Tanh" | |
| input: "Affine_2" | |
| output: "Tanh_3" | |
| } | |
| function { | |
| name: "Sigmoid_5" | |
| type: "Sigmoid" | |
| input: "InputGate_2" | |
| output: "Sigmoid_5" | |
| } | |
| function { | |
| name: "Sigmoid_6" | |
| type: "Sigmoid" | |
| input: "ForgetGate_2" | |
| output: "Sigmoid_6" | |
| } | |
| function { | |
| name: "Sigmoid_7" | |
| type: "Sigmoid" | |
| input: "OutputGate_2" | |
| output: "Sigmoid_7" | |
| } | |
| function { | |
| name: "Mul2_4" | |
| type: "Mul2" | |
| input: "Sigmoid_5" | |
| input: "Tanh_3" | |
| output: "Mul2_4" | |
| } | |
| function { | |
| name: "Mul2_5" | |
| type: "Mul2" | |
| input: "Sigmoid_6" | |
| input: "Mul2_3" | |
| output: "Mul2_5" | |
| } | |
| function { | |
| name: "Add2_2" | |
| type: "Add2" | |
| input: "Mul2_4" | |
| input: "Mul2_5" | |
| output: "Add2_2" | |
| add2_param { | |
| inplace: True | |
| } | |
| } | |
| function { | |
| name: "Tanh_4" | |
| type: "Tanh" | |
| input: "Add2_2" | |
| output: "Tanh_4" | |
| } | |
| function { | |
| name: "Mul2_6" | |
| type: "Mul2" | |
| input: "Sigmoid_7" | |
| input: "Tanh_4" | |
| output: "Mul2_6" | |
| } | |
| function { | |
| name: "Concatenate_3" | |
| type: "Concatenate" | |
| input: "Input_3" | |
| input: "Mul2_6" | |
| output: "Concatenate_3" | |
| concatenate_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Affine_3" | |
| type: "Affine" | |
| input: "Concatenate_3" | |
| input: "Affine_3/affine/W" | |
| input: "Affine_3/affine/b" | |
| output: "Affine_3" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "InputGate_3" | |
| type: "Affine" | |
| input: "Concatenate_3" | |
| input: "InputGate_3/affine/W" | |
| input: "InputGate_3/affine/b" | |
| output: "InputGate_3" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "ForgetGate_3" | |
| type: "Affine" | |
| input: "Concatenate_3" | |
| input: "ForgetGate_3/affine/W" | |
| input: "ForgetGate_3/affine/b" | |
| output: "ForgetGate_3" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "OutputGate_3" | |
| type: "Affine" | |
| input: "Concatenate_3" | |
| input: "OutputGate_3/affine/W" | |
| input: "OutputGate_3/affine/b" | |
| output: "OutputGate_3" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Tanh_5" | |
| type: "Tanh" | |
| input: "Affine_3" | |
| output: "Tanh_5" | |
| } | |
| function { | |
| name: "Sigmoid_8" | |
| type: "Sigmoid" | |
| input: "InputGate_3" | |
| output: "Sigmoid_8" | |
| } | |
| function { | |
| name: "Sigmoid_9" | |
| type: "Sigmoid" | |
| input: "ForgetGate_3" | |
| output: "Sigmoid_9" | |
| } | |
| function { | |
| name: "Sigmoid_10" | |
| type: "Sigmoid" | |
| input: "OutputGate_3" | |
| output: "Sigmoid_10" | |
| } | |
| function { | |
| name: "Mul2_7" | |
| type: "Mul2" | |
| input: "Sigmoid_8" | |
| input: "Tanh_5" | |
| output: "Mul2_7" | |
| } | |
| function { | |
| name: "Mul2_8" | |
| type: "Mul2" | |
| input: "Sigmoid_9" | |
| input: "Mul2_6" | |
| output: "Mul2_8" | |
| } | |
| function { | |
| name: "Add2_3" | |
| type: "Add2" | |
| input: "Mul2_7" | |
| input: "Mul2_8" | |
| output: "Add2_3" | |
| add2_param { | |
| inplace: True | |
| } | |
| } | |
| function { | |
| name: "Tanh_6" | |
| type: "Tanh" | |
| input: "Add2_3" | |
| output: "Tanh_6" | |
| } | |
| function { | |
| name: "Mul2_9" | |
| type: "Mul2" | |
| input: "Sigmoid_10" | |
| input: "Tanh_6" | |
| output: "Mul2_9" | |
| } | |
| function { | |
| name: "Affine_4" | |
| type: "Affine" | |
| input: "Mul2_9" | |
| input: "Affine_4/affine/W" | |
| input: "Affine_4/affine/b" | |
| output: "Affine_4" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Softmax" | |
| type: "Softmax" | |
| input: "Affine_4" | |
| output: "Softmax" | |
| softmax_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "CategoricalCrossEntropy" | |
| type: "CategoricalCrossEntropy" | |
| input: "Softmax" | |
| input: "CategoricalCrossEntropy_T" | |
| output: "CategoricalCrossEntropy" | |
| categorical_cross_entropy_param { | |
| axis: 1 | |
| } | |
| } | |
| } | |
| network { | |
| name: "MainRuntime" | |
| batch_size: 256 | |
| variable { | |
| name: "Input" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Input_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Input_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "DelayInput" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "Affine/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "InputGate/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "InputGate/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "ForgetGate/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "ForgetGate/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "OutputGate/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "OutputGate/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "Affine_2/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "Affine_2/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "InputGate_2/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "InputGate_2/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "ForgetGate_2/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "ForgetGate_2/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "OutputGate_2/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "OutputGate_2/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "Affine_3/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "Affine_3/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "InputGate_3/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "InputGate_3/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "ForgetGate_3/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "ForgetGate_3/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "OutputGate_3/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 1568 dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "OutputGate_3/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 1 dim: 28 dim: 28 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "Affine_4/affine/W" | |
| type: "Parameter" | |
| shape: { dim: 784 dim: 3 } | |
| initializer { | |
| type: "NormalAffineGlorot" | |
| multiplier: 1 | |
| } | |
| } | |
| variable { | |
| name: "Affine_4/affine/b" | |
| type: "Parameter" | |
| shape: { dim: 3 } | |
| initializer { | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| } | |
| variable { | |
| name: "Concatenate" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 2 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "InputGate" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "ForgetGate" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "OutputGate" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Tanh" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_4" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Add2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Tanh_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Concatenate_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 2 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "InputGate_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "ForgetGate_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "OutputGate_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Tanh_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_5" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_6" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_7" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_4" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_5" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Add2_2" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Tanh_4" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_6" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Concatenate_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 2 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "InputGate_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "ForgetGate_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "OutputGate_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Tanh_5" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_8" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_9" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Sigmoid_10" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_7" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_8" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Add2_3" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Tanh_6" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Mul2_9" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 1 dim: 28 dim: 28 } | |
| } | |
| variable { | |
| name: "Affine_4" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 3 } | |
| } | |
| variable { | |
| name: "Softmax" | |
| type: "Buffer" | |
| shape: { dim:-1 dim: 3 } | |
| } | |
| function { | |
| name: "Concatenate" | |
| type: "Concatenate" | |
| input: "Input" | |
| input: "DelayInput" | |
| output: "Concatenate" | |
| concatenate_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Affine" | |
| type: "Affine" | |
| input: "Concatenate" | |
| input: "Affine/affine/W" | |
| input: "Affine/affine/b" | |
| output: "Affine" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "InputGate" | |
| type: "Affine" | |
| input: "Concatenate" | |
| input: "InputGate/affine/W" | |
| input: "InputGate/affine/b" | |
| output: "InputGate" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "ForgetGate" | |
| type: "Affine" | |
| input: "Concatenate" | |
| input: "ForgetGate/affine/W" | |
| input: "ForgetGate/affine/b" | |
| output: "ForgetGate" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "OutputGate" | |
| type: "Affine" | |
| input: "Concatenate" | |
| input: "OutputGate/affine/W" | |
| input: "OutputGate/affine/b" | |
| output: "OutputGate" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Tanh" | |
| type: "Tanh" | |
| input: "Affine" | |
| output: "Tanh" | |
| } | |
| function { | |
| name: "Sigmoid_4" | |
| type: "Sigmoid" | |
| input: "InputGate" | |
| output: "Sigmoid_4" | |
| } | |
| function { | |
| name: "Sigmoid_2" | |
| type: "Sigmoid" | |
| input: "ForgetGate" | |
| output: "Sigmoid_2" | |
| } | |
| function { | |
| name: "Sigmoid_3" | |
| type: "Sigmoid" | |
| input: "OutputGate" | |
| output: "Sigmoid_3" | |
| } | |
| function { | |
| name: "Mul2" | |
| type: "Mul2" | |
| input: "Sigmoid_4" | |
| input: "Tanh" | |
| output: "Mul2" | |
| } | |
| function { | |
| name: "Mul2_2" | |
| type: "Mul2" | |
| input: "Sigmoid_2" | |
| input: "DelayInput" | |
| output: "Mul2_2" | |
| } | |
| function { | |
| name: "Add2" | |
| type: "Add2" | |
| input: "Mul2" | |
| input: "Mul2_2" | |
| output: "Add2" | |
| add2_param { | |
| inplace: True | |
| } | |
| } | |
| function { | |
| name: "Tanh_2" | |
| type: "Tanh" | |
| input: "Add2" | |
| output: "Tanh_2" | |
| } | |
| function { | |
| name: "Mul2_3" | |
| type: "Mul2" | |
| input: "Sigmoid_3" | |
| input: "Tanh_2" | |
| output: "Mul2_3" | |
| } | |
| function { | |
| name: "Concatenate_2" | |
| type: "Concatenate" | |
| input: "Input_2" | |
| input: "Mul2_3" | |
| output: "Concatenate_2" | |
| concatenate_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Affine_2" | |
| type: "Affine" | |
| input: "Concatenate_2" | |
| input: "Affine_2/affine/W" | |
| input: "Affine_2/affine/b" | |
| output: "Affine_2" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "InputGate_2" | |
| type: "Affine" | |
| input: "Concatenate_2" | |
| input: "InputGate_2/affine/W" | |
| input: "InputGate_2/affine/b" | |
| output: "InputGate_2" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "ForgetGate_2" | |
| type: "Affine" | |
| input: "Concatenate_2" | |
| input: "ForgetGate_2/affine/W" | |
| input: "ForgetGate_2/affine/b" | |
| output: "ForgetGate_2" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "OutputGate_2" | |
| type: "Affine" | |
| input: "Concatenate_2" | |
| input: "OutputGate_2/affine/W" | |
| input: "OutputGate_2/affine/b" | |
| output: "OutputGate_2" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Tanh_3" | |
| type: "Tanh" | |
| input: "Affine_2" | |
| output: "Tanh_3" | |
| } | |
| function { | |
| name: "Sigmoid_5" | |
| type: "Sigmoid" | |
| input: "InputGate_2" | |
| output: "Sigmoid_5" | |
| } | |
| function { | |
| name: "Sigmoid_6" | |
| type: "Sigmoid" | |
| input: "ForgetGate_2" | |
| output: "Sigmoid_6" | |
| } | |
| function { | |
| name: "Sigmoid_7" | |
| type: "Sigmoid" | |
| input: "OutputGate_2" | |
| output: "Sigmoid_7" | |
| } | |
| function { | |
| name: "Mul2_4" | |
| type: "Mul2" | |
| input: "Sigmoid_5" | |
| input: "Tanh_3" | |
| output: "Mul2_4" | |
| } | |
| function { | |
| name: "Mul2_5" | |
| type: "Mul2" | |
| input: "Sigmoid_6" | |
| input: "Mul2_3" | |
| output: "Mul2_5" | |
| } | |
| function { | |
| name: "Add2_2" | |
| type: "Add2" | |
| input: "Mul2_4" | |
| input: "Mul2_5" | |
| output: "Add2_2" | |
| add2_param { | |
| inplace: True | |
| } | |
| } | |
| function { | |
| name: "Tanh_4" | |
| type: "Tanh" | |
| input: "Add2_2" | |
| output: "Tanh_4" | |
| } | |
| function { | |
| name: "Mul2_6" | |
| type: "Mul2" | |
| input: "Sigmoid_7" | |
| input: "Tanh_4" | |
| output: "Mul2_6" | |
| } | |
| function { | |
| name: "Concatenate_3" | |
| type: "Concatenate" | |
| input: "Input_3" | |
| input: "Mul2_6" | |
| output: "Concatenate_3" | |
| concatenate_param { | |
| axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Affine_3" | |
| type: "Affine" | |
| input: "Concatenate_3" | |
| input: "Affine_3/affine/W" | |
| input: "Affine_3/affine/b" | |
| output: "Affine_3" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "InputGate_3" | |
| type: "Affine" | |
| input: "Concatenate_3" | |
| input: "InputGate_3/affine/W" | |
| input: "InputGate_3/affine/b" | |
| output: "InputGate_3" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "ForgetGate_3" | |
| type: "Affine" | |
| input: "Concatenate_3" | |
| input: "ForgetGate_3/affine/W" | |
| input: "ForgetGate_3/affine/b" | |
| output: "ForgetGate_3" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "OutputGate_3" | |
| type: "Affine" | |
| input: "Concatenate_3" | |
| input: "OutputGate_3/affine/W" | |
| input: "OutputGate_3/affine/b" | |
| output: "OutputGate_3" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Tanh_5" | |
| type: "Tanh" | |
| input: "Affine_3" | |
| output: "Tanh_5" | |
| } | |
| function { | |
| name: "Sigmoid_8" | |
| type: "Sigmoid" | |
| input: "InputGate_3" | |
| output: "Sigmoid_8" | |
| } | |
| function { | |
| name: "Sigmoid_9" | |
| type: "Sigmoid" | |
| input: "ForgetGate_3" | |
| output: "Sigmoid_9" | |
| } | |
| function { | |
| name: "Sigmoid_10" | |
| type: "Sigmoid" | |
| input: "OutputGate_3" | |
| output: "Sigmoid_10" | |
| } | |
| function { | |
| name: "Mul2_7" | |
| type: "Mul2" | |
| input: "Sigmoid_8" | |
| input: "Tanh_5" | |
| output: "Mul2_7" | |
| } | |
| function { | |
| name: "Mul2_8" | |
| type: "Mul2" | |
| input: "Sigmoid_9" | |
| input: "Mul2_6" | |
| output: "Mul2_8" | |
| } | |
| function { | |
| name: "Add2_3" | |
| type: "Add2" | |
| input: "Mul2_7" | |
| input: "Mul2_8" | |
| output: "Add2_3" | |
| add2_param { | |
| inplace: True | |
| } | |
| } | |
| function { | |
| name: "Tanh_6" | |
| type: "Tanh" | |
| input: "Add2_3" | |
| output: "Tanh_6" | |
| } | |
| function { | |
| name: "Mul2_9" | |
| type: "Mul2" | |
| input: "Sigmoid_10" | |
| input: "Tanh_6" | |
| output: "Mul2_9" | |
| } | |
| function { | |
| name: "Affine_4" | |
| type: "Affine" | |
| input: "Mul2_9" | |
| input: "Affine_4/affine/W" | |
| input: "Affine_4/affine/b" | |
| output: "Affine_4" | |
| affine_param { | |
| base_axis: 1 | |
| } | |
| } | |
| function { | |
| name: "Softmax" | |
| type: "Softmax" | |
| input: "Affine_4" | |
| output: "Softmax" | |
| softmax_param { | |
| axis: 1 | |
| } | |
| } | |
| } | |
| dataset { | |
| name: "Training" | |
| uri: "F:\\neural_network_console_120\\samples\\sample_dataset\\MNIST\\hoge1_training.csv" | |
| cache_dir: "F:\\neural_network_console_120\\samples\\sample_dataset\\MNIST\\hoge1_training.cache" | |
| overwrite_cache: False | |
| create_cache_explicitly: True | |
| shuffle: true | |
| no_image_normalization: False | |
| batch_size: 256 | |
| } | |
| dataset { | |
| name: "Validation" | |
| uri: "F:\\neural_network_console_120\\samples\\sample_dataset\\MNIST\\hoge1_validation.csv" | |
| cache_dir: "F:\\neural_network_console_120\\samples\\sample_dataset\\MNIST\\hoge1_validation.cache" | |
| overwrite_cache: False | |
| create_cache_explicitly: True | |
| shuffle: false | |
| no_image_normalization: False | |
| batch_size: 256 | |
| } | |
| optimizer { | |
| name: "Optimizer" | |
| update_interval: 1 | |
| network_name: "Main" | |
| dataset_name: "Training" | |
| solver { | |
| type: "Adam" | |
| weight_decay: 0 | |
| lr_decay: 1 | |
| lr_decay_interval: 78 | |
| adam_param { | |
| alpha: 0.001 | |
| beta1: 0.9 | |
| beta2: 0.999 | |
| eps: 1e-08 | |
| } | |
| } | |
| data_variable { | |
| variable_name: "Input" | |
| data_name: "x1" | |
| } | |
| data_variable { | |
| variable_name: "Input_2" | |
| data_name: "x2" | |
| } | |
| data_variable { | |
| variable_name: "Input_3" | |
| data_name: "x3" | |
| } | |
| generator_variable { | |
| variable_name: "DelayInput" | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| data_variable { | |
| variable_name: "CategoricalCrossEntropy_T" | |
| data_name: "y" | |
| } | |
| loss_variable { | |
| variable_name: "CategoricalCrossEntropy" | |
| } | |
| parameter_variable { | |
| variable_name: "Affine/affine/W" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "Affine/affine/b" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "InputGate/affine/W" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "InputGate/affine/b" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "ForgetGate/affine/W" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "ForgetGate/affine/b" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "OutputGate/affine/W" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "OutputGate/affine/b" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "Affine_2/affine/W" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "Affine_2/affine/b" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "InputGate_2/affine/W" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "InputGate_2/affine/b" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "ForgetGate_2/affine/W" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "ForgetGate_2/affine/b" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "OutputGate_2/affine/W" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "OutputGate_2/affine/b" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "Affine_3/affine/W" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "Affine_3/affine/b" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "InputGate_3/affine/W" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "InputGate_3/affine/b" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "ForgetGate_3/affine/W" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "ForgetGate_3/affine/b" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "OutputGate_3/affine/W" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "OutputGate_3/affine/b" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "Affine_4/affine/W" | |
| learning_rate_multiplier: 1 | |
| } | |
| parameter_variable { | |
| variable_name: "Affine_4/affine/b" | |
| learning_rate_multiplier: 1 | |
| } | |
| } | |
| monitor { | |
| name: "train_error" | |
| network_name: "MainValidation" | |
| dataset_name: "Training" | |
| data_variable { | |
| variable_name: "Input" | |
| data_name: "x1" | |
| } | |
| data_variable { | |
| variable_name: "Input_2" | |
| data_name: "x2" | |
| } | |
| data_variable { | |
| variable_name: "Input_3" | |
| data_name: "x3" | |
| } | |
| generator_variable { | |
| variable_name: "DelayInput" | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| data_variable { | |
| variable_name: "CategoricalCrossEntropy_T" | |
| data_name: "y" | |
| } | |
| monitor_variable { | |
| type: "Error" | |
| variable_name: "CategoricalCrossEntropy" | |
| } | |
| } | |
| monitor { | |
| name: "valid_error" | |
| network_name: "MainValidation" | |
| dataset_name: "Validation" | |
| data_variable { | |
| variable_name: "Input" | |
| data_name: "x1" | |
| } | |
| data_variable { | |
| variable_name: "Input_2" | |
| data_name: "x2" | |
| } | |
| data_variable { | |
| variable_name: "Input_3" | |
| data_name: "x3" | |
| } | |
| generator_variable { | |
| variable_name: "DelayInput" | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| data_variable { | |
| variable_name: "CategoricalCrossEntropy_T" | |
| data_name: "y" | |
| } | |
| monitor_variable { | |
| type: "Error" | |
| variable_name: "CategoricalCrossEntropy" | |
| } | |
| } | |
| executor { | |
| name: "Executor" | |
| network_name: "MainRuntime" | |
| num_evaluations: 1 | |
| repeat_evaluation_type: "mean" | |
| need_back_propagation: false | |
| data_variable { | |
| variable_name: "Input" | |
| data_name: "x1" | |
| } | |
| data_variable { | |
| variable_name: "Input_2" | |
| data_name: "x2" | |
| } | |
| data_variable { | |
| variable_name: "Input_3" | |
| data_name: "x3" | |
| } | |
| generator_variable { | |
| variable_name: "DelayInput" | |
| type: "Constant" | |
| multiplier: 0 | |
| } | |
| output_variable { | |
| variable_name: "Softmax" | |
| data_name: "y'" | |
| } | |
| parameter_variable { | |
| variable_name: "Affine/affine/W" | |
| } | |
| parameter_variable { | |
| variable_name: "Affine/affine/b" | |
| } | |
| parameter_variable { | |
| variable_name: "InputGate/affine/W" | |
| } | |
| parameter_variable { | |
| variable_name: "InputGate/affine/b" | |
| } | |
| parameter_variable { | |
| variable_name: "ForgetGate/affine/W" | |
| } | |
| parameter_variable { | |
| variable_name: "ForgetGate/affine/b" | |
| } | |
| parameter_variable { | |
| variable_name: "OutputGate/affine/W" | |
| } | |
| parameter_variable { | |
| variable_name: "OutputGate/affine/b" | |
| } | |
| parameter_variable { | |
| variable_name: "Affine_2/affine/W" | |
| } | |
| parameter_variable { | |
| variable_name: "Affine_2/affine/b" | |
| } | |
| parameter_variable { | |
| variable_name: "InputGate_2/affine/W" | |
| } | |
| parameter_variable { | |
| variable_name: "InputGate_2/affine/b" | |
| } | |
| parameter_variable { | |
| variable_name: "ForgetGate_2/affine/W" | |
| } | |
| parameter_variable { | |
| variable_name: "ForgetGate_2/affine/b" | |
| } | |
| parameter_variable { | |
| variable_name: "OutputGate_2/affine/W" | |
| } | |
| parameter_variable { | |
| variable_name: "OutputGate_2/affine/b" | |
| } | |
| parameter_variable { | |
| variable_name: "Affine_3/affine/W" | |
| } | |
| parameter_variable { | |
| variable_name: "Affine_3/affine/b" | |
| } | |
| parameter_variable { | |
| variable_name: "InputGate_3/affine/W" | |
| } | |
| parameter_variable { | |
| variable_name: "InputGate_3/affine/b" | |
| } | |
| parameter_variable { | |
| variable_name: "ForgetGate_3/affine/W" | |
| } | |
| parameter_variable { | |
| variable_name: "ForgetGate_3/affine/b" | |
| } | |
| parameter_variable { | |
| variable_name: "OutputGate_3/affine/W" | |
| } | |
| parameter_variable { | |
| variable_name: "OutputGate_3/affine/b" | |
| } | |
| parameter_variable { | |
| variable_name: "Affine_4/affine/W" | |
| } | |
| parameter_variable { | |
| variable_name: "Affine_4/affine/b" | |
| } | |
| } |
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| import math | |
| import os | |
| import random | |
| import pandas as pd | |
| base_dir = r"F:\neural_network_console_120\samples\sample_dataset\MNIST" | |
| name = "hoge1" | |
| variable_count = 3 | |
| def hoge(dataset_dirname, count): | |
| rows = [] | |
| files = [] | |
| dataset_dirpath = os.path.join(base_dir, dataset_dirname) | |
| for i in range(10): | |
| dirpath = os.path.join(dataset_dirpath, str(i)) | |
| files.append([fn for fn in os.listdir(dirpath) if os.path.isfile(os.path.join(dirpath, fn))]) | |
| for i in range(count): | |
| row = type('',(object,), { | |
| 'paths': [], | |
| 'digits': [], | |
| 'get_label': lambda self: math.ceil(sum(self.digits) / len(self.digits)), | |
| 'get_csv_header': lambda self: ([f"x{n+1}:image" for n in range(len(self.paths))] + ["y:label"]), | |
| 'get_csv_values': lambda self: self.paths + [self.get_label()], | |
| '__str__': lambda self: f"l: {self.get_label()}, d: {self.digits}, p: {self.paths}", | |
| })() | |
| for n in range(variable_count): | |
| digit = random.randint(0, 9) | |
| class_dirname = f"{digit}" | |
| fileindex = random.randint(0, len(files[digit]) - 1) | |
| path = os.path.join(r".", dataset_dirname, class_dirname, files[digit][fileindex]) | |
| row.paths.append(path) | |
| row.digits.append(digit) | |
| rows.append(row) | |
| values = [row.get_csv_values() for row in rows] | |
| output_path = os.path.join(base_dir, f"{name}_{dataset_dirname}.csv") | |
| df = pd.DataFrame(values, columns=rows[0].get_csv_header()) | |
| df.to_csv(output_path, index=False, encoding="utf-8") | |
| hoge("training", 20000) | |
| hoge("validation", 2000) |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment