Created
November 23, 2018 19:09
-
-
Save aleksas/8dd6f31f03b5b3e78aff1a57c30ed7ea to your computer and use it in GitHub Desktop.
This file has been truncated, but you can view the full file.
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
node { | |
name: "global_step/Initializer/zeros" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@global_step" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT64 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT64 | |
tensor_shape { | |
} | |
int64_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "global_step" | |
op: "VariableV2" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@global_step" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT64 | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "" | |
} | |
} | |
} | |
node { | |
name: "global_step/Assign" | |
op: "Assign" | |
input: "global_step" | |
input: "global_step/Initializer/zeros" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT64 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@global_step" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "use_locking" | |
value { | |
b: true | |
} | |
} | |
attr { | |
key: "validate_shape" | |
value { | |
b: true | |
} | |
} | |
} | |
node { | |
name: "global_step/read" | |
op: "Identity" | |
input: "global_step" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT64 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@global_step" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "global_step/IsVariableInitialized" | |
op: "IsVariableInitialized" | |
input: "global_step" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@global_step" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT64 | |
} | |
} | |
} | |
node { | |
name: "global_step/cond/Switch" | |
op: "Switch" | |
input: "global_step/IsVariableInitialized" | |
input: "global_step/IsVariableInitialized" | |
attr { | |
key: "T" | |
value { | |
type: DT_BOOL | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "global_step/cond/switch_t" | |
op: "Identity" | |
input: "global_step/cond/Switch:1" | |
attr { | |
key: "T" | |
value { | |
type: DT_BOOL | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "global_step/cond/switch_f" | |
op: "Identity" | |
input: "global_step/cond/Switch" | |
attr { | |
key: "T" | |
value { | |
type: DT_BOOL | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "global_step/cond/pred_id" | |
op: "Identity" | |
input: "global_step/IsVariableInitialized" | |
attr { | |
key: "T" | |
value { | |
type: DT_BOOL | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "global_step/cond/read" | |
op: "Identity" | |
input: "global_step/cond/read/Switch:1" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT64 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "global_step/cond/read/Switch" | |
op: "RefSwitch" | |
input: "global_step" | |
input: "global_step/cond/pred_id" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT64 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@global_step" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "global_step/cond/Switch_1" | |
op: "Switch" | |
input: "global_step/Initializer/zeros" | |
input: "global_step/cond/pred_id" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT64 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@global_step" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "global_step/cond/Merge" | |
op: "Merge" | |
input: "global_step/cond/Switch_1" | |
input: "global_step/cond/read" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT64 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "global_step/add/y" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT64 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT64 | |
tensor_shape { | |
} | |
int64_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "global_step/add" | |
op: "Add" | |
input: "global_step/cond/Merge" | |
input: "global_step/add/y" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT64 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "Const" | |
op: "Const" | |
device: "/device:CPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 100 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 100 | |
} | |
} | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00096-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00086-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00028-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00076-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00032-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00051-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00050-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00015-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00057-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00049-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00031-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00010-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00053-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00004-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00033-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00091-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00020-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00009-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00035-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00017-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00059-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00068-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00063-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00095-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00082-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00034-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00062-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00052-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00067-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00099-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00093-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00090-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00075-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00012-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00083-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00037-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00005-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00002-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00038-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00058-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00030-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00011-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00003-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00006-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00029-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00089-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00081-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00044-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00013-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00077-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00080-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00087-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00085-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00007-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00021-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00024-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00054-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00060-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00016-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00040-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00094-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00023-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00061-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00018-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00043-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00069-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00066-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00048-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00092-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00056-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00073-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00014-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00027-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00055-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00098-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00097-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00041-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00072-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00025-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00045-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00088-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00047-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00019-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00070-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00008-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00000-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00079-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00046-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00084-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00078-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00065-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00042-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00074-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00064-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00071-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00026-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00039-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00036-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00022-of-00100" | |
string_val: "/root/t2t_data/translate_ltltstr_wmt32k-train-00001-of-00100" | |
} | |
} | |
} | |
} | |
node { | |
name: "cycle_length" | |
op: "Const" | |
device: "/device:CPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT64 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT64 | |
tensor_shape { | |
} | |
int64_val: 8 | |
} | |
} | |
} | |
} | |
node { | |
name: "block_length" | |
op: "Const" | |
device: "/device:CPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT64 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT64 | |
tensor_shape { | |
} | |
int64_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "sloppy" | |
op: "Const" | |
device: "/device:CPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_BOOL | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_BOOL | |
tensor_shape { | |
} | |
bool_val: true | |
} | |
} | |
} | |
} | |
node { | |
name: "buffer_output_elements" | |
op: "Const" | |
device: "/device:CPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT64 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT64 | |
tensor_shape { | |
} | |
int64_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "prefetch_input_elements" | |
op: "Const" | |
device: "/device:CPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT64 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT64 | |
tensor_shape { | |
} | |
int64_val: 16 | |
} | |
} | |
} | |
} | |
node { | |
name: "num_parallel_calls" | |
op: "Const" | |
device: "/device:CPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 4 | |
} | |
} | |
} | |
} | |
node { | |
name: "count" | |
op: "Const" | |
device: "/device:CPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT64 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT64 | |
tensor_shape { | |
} | |
int64_val: -1 | |
} | |
} | |
} | |
} | |
node { | |
name: "buffer_size" | |
op: "Const" | |
device: "/device:CPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT64 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT64 | |
tensor_shape { | |
} | |
int64_val: 1024 | |
} | |
} | |
} | |
} | |
node { | |
name: "seed" | |
op: "Const" | |
device: "/device:CPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT64 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT64 | |
tensor_shape { | |
} | |
int64_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "seed2" | |
op: "Const" | |
device: "/device:CPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT64 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT64 | |
tensor_shape { | |
} | |
int64_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "count_1" | |
op: "Const" | |
device: "/device:CPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT64 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT64 | |
tensor_shape { | |
} | |
int64_val: -1 | |
} | |
} | |
} | |
} | |
node { | |
name: "count_2" | |
op: "Const" | |
device: "/device:CPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT64 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT64 | |
tensor_shape { | |
} | |
int64_val: 8 | |
} | |
} | |
} | |
} | |
node { | |
name: "num_parallel_calls_1" | |
op: "Const" | |
device: "/device:CPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 4 | |
} | |
} | |
} | |
} | |
node { | |
name: "bucket_by_seq_length/Const" | |
op: "Const" | |
device: "/device:CPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 42 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT64 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT64 | |
tensor_shape { | |
dim { | |
size: 42 | |
} | |
} | |
tensor_content: "\244\001\000\000\000\000\000\000\244\001\000\000\000\000\000\000;\001\000\000\000\000\000\000;\001\000\000\000\000\000\000;\001\000\000\000\000\000\000;\001\000\000\000\000\000\000\374\000\000\000\000\000\000\000\374\000\000\000\000\000\000\000\374\000\000\000\000\000\000\000\322\000\000\000\000\000\000\000\322\000\000\000\000\000\000\000\322\000\000\000\000\000\000\000\264\000\000\000\000\000\000\000\264\000\000\000\000\000\000\000\214\000\000\000\000\000\000\000\214\000\000\000\000\000\000\000\214\000\000\000\000\000\000\000~\000\000\000\000\000\000\000i\000\000\000\000\000\000\000i\000\000\000\000\000\000\000i\000\000\000\000\000\000\000Z\000\000\000\000\000\000\000T\000\000\000\000\000\000\000F\000\000\000\000\000\000\000F\000\000\000\000\000\000\000?\000\000\000\000\000\000\000<\000\000\000\000\000\000\000-\000\000\000\000\000\000\000-\000\000\000\000\000\000\000-\000\000\000\000\000\000\000*\000\000\000\000\000\000\000$\000\000\000\000\000\000\000$\000\000\000\000\000\000\000\036\000\000\000\000\000\000\000\036\000\000\000\000\000\000\000\025\000\000\000\000\000\000\000\025\000\000\000\000\000\000\000\025\000\000\000\000\000\000\000\024\000\000\000\000\000\000\000\022\000\000\000\000\000\000\000\017\000\000\000\000\000\000\000\017\000\000\000\000\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "num_parallel_calls_2" | |
op: "Const" | |
device: "/device:CPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 4 | |
} | |
} | |
} | |
} | |
node { | |
name: "buffer_size_1" | |
op: "Const" | |
device: "/device:CPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT64 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT64 | |
tensor_shape { | |
} | |
int64_val: 512 | |
} | |
} | |
} | |
} | |
node { | |
name: "seed_1" | |
op: "Const" | |
device: "/device:CPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT64 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT64 | |
tensor_shape { | |
} | |
int64_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "seed2_1" | |
op: "Const" | |
device: "/device:CPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT64 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT64 | |
tensor_shape { | |
} | |
int64_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "num_parallel_calls_3" | |
op: "Const" | |
device: "/device:CPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 4 | |
} | |
} | |
} | |
} | |
node { | |
name: "buffer_size_2" | |
op: "Const" | |
device: "/device:CPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT64 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT64 | |
tensor_shape { | |
} | |
int64_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "IteratorV2" | |
op: "IteratorV2" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "output_types" | |
value { | |
list { | |
type: DT_INT32 | |
type: DT_INT32 | |
type: DT_INT32 | |
type: DT_INT32 | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "" | |
} | |
} | |
} | |
node { | |
name: "TensorSliceDataset" | |
op: "TensorSliceDataset" | |
input: "Const" | |
attr { | |
key: "Toutput_types" | |
value { | |
list { | |
type: DT_STRING | |
} | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@IteratorV2" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "ParallelInterleaveDataset" | |
op: "ParallelInterleaveDataset" | |
input: "TensorSliceDataset" | |
input: "cycle_length" | |
input: "block_length" | |
input: "sloppy" | |
input: "buffer_output_elements" | |
input: "prefetch_input_elements" | |
attr { | |
key: "Targuments" | |
value { | |
list { | |
} | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@IteratorV2" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "f" | |
value { | |
func { | |
name: "tf_data_structured_function_wrapper_rl4HI7BWu1A" | |
} | |
} | |
} | |
attr { | |
key: "output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "output_types" | |
value { | |
list { | |
type: DT_INT64 | |
type: DT_INT64 | |
type: DT_INT64 | |
} | |
} | |
} | |
} | |
node { | |
name: "ParallelMapDataset" | |
op: "ParallelMapDataset" | |
input: "ParallelInterleaveDataset" | |
input: "num_parallel_calls" | |
attr { | |
key: "Targuments" | |
value { | |
list { | |
} | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@IteratorV2" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "f" | |
value { | |
func { | |
name: "tf_data_structured_function_wrapper_8BcapRUaa8g" | |
} | |
} | |
} | |
attr { | |
key: "output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "output_types" | |
value { | |
list { | |
type: DT_INT64 | |
type: DT_INT64 | |
type: DT_INT64 | |
} | |
} | |
} | |
attr { | |
key: "use_inter_op_parallelism" | |
value { | |
b: true | |
} | |
} | |
} | |
node { | |
name: "TakeDataset" | |
op: "TakeDataset" | |
input: "ParallelMapDataset" | |
input: "count" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@IteratorV2" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "output_types" | |
value { | |
list { | |
type: DT_INT64 | |
type: DT_INT64 | |
type: DT_INT64 | |
} | |
} | |
} | |
} | |
node { | |
name: "ShuffleDataset" | |
op: "ShuffleDataset" | |
input: "TakeDataset" | |
input: "buffer_size" | |
input: "seed" | |
input: "seed2" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@IteratorV2" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "output_types" | |
value { | |
list { | |
type: DT_INT64 | |
type: DT_INT64 | |
type: DT_INT64 | |
} | |
} | |
} | |
attr { | |
key: "reshuffle_each_iteration" | |
value { | |
b: true | |
} | |
} | |
} | |
node { | |
name: "RepeatDataset" | |
op: "RepeatDataset" | |
input: "ShuffleDataset" | |
input: "count_1" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@IteratorV2" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "output_types" | |
value { | |
list { | |
type: DT_INT64 | |
type: DT_INT64 | |
type: DT_INT64 | |
} | |
} | |
} | |
} | |
node { | |
name: "SkipDataset" | |
op: "SkipDataset" | |
input: "RepeatDataset" | |
input: "count_2" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@IteratorV2" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "output_types" | |
value { | |
list { | |
type: DT_INT64 | |
type: DT_INT64 | |
type: DT_INT64 | |
} | |
} | |
} | |
} | |
node { | |
name: "ParallelMapDataset_1" | |
op: "ParallelMapDataset" | |
input: "SkipDataset" | |
input: "num_parallel_calls_1" | |
attr { | |
key: "Targuments" | |
value { | |
list { | |
} | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@IteratorV2" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "f" | |
value { | |
func { | |
name: "tf_data_structured_function_wrapper_B1ltQpaA30c" | |
} | |
} | |
} | |
attr { | |
key: "output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "output_types" | |
value { | |
list { | |
type: DT_INT32 | |
type: DT_INT32 | |
type: DT_INT32 | |
} | |
} | |
} | |
attr { | |
key: "use_inter_op_parallelism" | |
value { | |
b: true | |
} | |
} | |
} | |
node { | |
name: "FilterDataset" | |
op: "FilterDataset" | |
input: "ParallelMapDataset_1" | |
attr { | |
key: "Targuments" | |
value { | |
list { | |
} | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@IteratorV2" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "output_types" | |
value { | |
list { | |
type: DT_INT32 | |
type: DT_INT32 | |
type: DT_INT32 | |
} | |
} | |
} | |
attr { | |
key: "predicate" | |
value { | |
func { | |
name: "tf_data_structured_function_wrapper_md9cGBlsubY" | |
} | |
} | |
} | |
} | |
node { | |
name: "GroupByWindowDataset" | |
op: "GroupByWindowDataset" | |
input: "FilterDataset" | |
input: "bucket_by_seq_length/Const" | |
input: "bucket_by_seq_length/Const" | |
attr { | |
key: "Tkey_func_other_arguments" | |
value { | |
list { | |
} | |
} | |
} | |
attr { | |
key: "Treduce_func_other_arguments" | |
value { | |
list { | |
type: DT_INT64 | |
} | |
} | |
} | |
attr { | |
key: "Twindow_size_func_other_arguments" | |
value { | |
list { | |
type: DT_INT64 | |
} | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@IteratorV2" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "key_func" | |
value { | |
func { | |
name: "tf_data_structured_function_wrapper_eJST0bGO0eU" | |
} | |
} | |
} | |
attr { | |
key: "output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "output_types" | |
value { | |
list { | |
type: DT_INT32 | |
type: DT_INT32 | |
type: DT_INT32 | |
} | |
} | |
} | |
attr { | |
key: "reduce_func" | |
value { | |
func { | |
name: "tf_data_structured_function_wrapper_uI0tbat6wJg" | |
} | |
} | |
} | |
attr { | |
key: "window_size_func" | |
value { | |
func { | |
name: "tf_data_structured_function_wrapper_AMulhXHnGP4" | |
} | |
} | |
} | |
} | |
node { | |
name: "ParallelMapDataset_2" | |
op: "ParallelMapDataset" | |
input: "GroupByWindowDataset" | |
input: "num_parallel_calls_2" | |
attr { | |
key: "Targuments" | |
value { | |
list { | |
} | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@IteratorV2" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "f" | |
value { | |
func { | |
name: "tf_data_structured_function_wrapper_IEyC79VR4Yg" | |
} | |
} | |
} | |
attr { | |
key: "output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "output_types" | |
value { | |
list { | |
type: DT_INT32 | |
type: DT_INT32 | |
type: DT_INT32 | |
} | |
} | |
} | |
attr { | |
key: "use_inter_op_parallelism" | |
value { | |
b: true | |
} | |
} | |
} | |
node { | |
name: "ShuffleDataset_1" | |
op: "ShuffleDataset" | |
input: "ParallelMapDataset_2" | |
input: "buffer_size_1" | |
input: "seed_1" | |
input: "seed2_1" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@IteratorV2" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "output_types" | |
value { | |
list { | |
type: DT_INT32 | |
type: DT_INT32 | |
type: DT_INT32 | |
} | |
} | |
} | |
attr { | |
key: "reshuffle_each_iteration" | |
value { | |
b: true | |
} | |
} | |
} | |
node { | |
name: "ParallelMapDataset_3" | |
op: "ParallelMapDataset" | |
input: "ShuffleDataset_1" | |
input: "num_parallel_calls_3" | |
attr { | |
key: "Targuments" | |
value { | |
list { | |
} | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@IteratorV2" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "f" | |
value { | |
func { | |
name: "tf_data_structured_function_wrapper_PZOx4pJdhKc" | |
} | |
} | |
} | |
attr { | |
key: "output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "output_types" | |
value { | |
list { | |
type: DT_INT32 | |
type: DT_INT32 | |
type: DT_INT32 | |
type: DT_INT32 | |
} | |
} | |
} | |
attr { | |
key: "use_inter_op_parallelism" | |
value { | |
b: true | |
} | |
} | |
} | |
node { | |
name: "PrefetchDataset" | |
op: "PrefetchDataset" | |
input: "ParallelMapDataset_3" | |
input: "buffer_size_2" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@IteratorV2" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "output_types" | |
value { | |
list { | |
type: DT_INT32 | |
type: DT_INT32 | |
type: DT_INT32 | |
type: DT_INT32 | |
} | |
} | |
} | |
} | |
node { | |
name: "MakeIterator" | |
op: "MakeIterator" | |
input: "PrefetchDataset" | |
input: "IteratorV2" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@IteratorV2" | |
} | |
} | |
} | |
} | |
node { | |
name: "IteratorToStringHandle" | |
op: "IteratorToStringHandle" | |
input: "IteratorV2" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "IteratorGetNext" | |
op: "IteratorGetNext" | |
input: "IteratorV2" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "output_types" | |
value { | |
list { | |
type: DT_INT32 | |
type: DT_INT32 | |
type: DT_INT32 | |
type: DT_INT32 | |
} | |
} | |
} | |
} | |
node { | |
name: "losses_avg/problem_0/total_loss/initial_value" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 100.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "losses_avg/problem_0/total_loss" | |
op: "VariableV2" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "" | |
} | |
} | |
} | |
node { | |
name: "losses_avg/problem_0/total_loss/Assign" | |
op: "Assign" | |
input: "losses_avg/problem_0/total_loss" | |
input: "losses_avg/problem_0/total_loss/initial_value" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@losses_avg/problem_0/total_loss" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "use_locking" | |
value { | |
b: true | |
} | |
} | |
attr { | |
key: "validate_shape" | |
value { | |
b: true | |
} | |
} | |
} | |
node { | |
name: "losses_avg/problem_0/total_loss/read" | |
op: "Identity" | |
input: "losses_avg/problem_0/total_loss" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@losses_avg/problem_0/total_loss" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "losses_avg/problem_0/extra_loss/initial_value" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 100.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "losses_avg/problem_0/extra_loss" | |
op: "VariableV2" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "" | |
} | |
} | |
} | |
node { | |
name: "losses_avg/problem_0/extra_loss/Assign" | |
op: "Assign" | |
input: "losses_avg/problem_0/extra_loss" | |
input: "losses_avg/problem_0/extra_loss/initial_value" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@losses_avg/problem_0/extra_loss" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "use_locking" | |
value { | |
b: true | |
} | |
} | |
attr { | |
key: "validate_shape" | |
value { | |
b: true | |
} | |
} | |
} | |
node { | |
name: "losses_avg/problem_0/extra_loss/read" | |
op: "Identity" | |
input: "losses_avg/problem_0/extra_loss" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@losses_avg/problem_0/extra_loss" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "losses_avg/problem_0/training_loss/initial_value" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 100.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "losses_avg/problem_0/training_loss" | |
op: "VariableV2" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "" | |
} | |
} | |
} | |
node { | |
name: "losses_avg/problem_0/training_loss/Assign" | |
op: "Assign" | |
input: "losses_avg/problem_0/training_loss" | |
input: "losses_avg/problem_0/training_loss/initial_value" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@losses_avg/problem_0/training_loss" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "use_locking" | |
value { | |
b: true | |
} | |
} | |
attr { | |
key: "validate_shape" | |
value { | |
b: true | |
} | |
} | |
} | |
node { | |
name: "losses_avg/problem_0/training_loss/read" | |
op: "Identity" | |
input: "losses_avg/problem_0/training_loss" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@losses_avg/problem_0/training_loss" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "train_stats/problem_0_steps/initial_value" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "train_stats/problem_0_steps" | |
op: "VariableV2" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "" | |
} | |
} | |
} | |
node { | |
name: "train_stats/problem_0_steps/Assign" | |
op: "Assign" | |
input: "train_stats/problem_0_steps" | |
input: "train_stats/problem_0_steps/initial_value" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@train_stats/problem_0_steps" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "use_locking" | |
value { | |
b: true | |
} | |
} | |
attr { | |
key: "validate_shape" | |
value { | |
b: true | |
} | |
} | |
} | |
node { | |
name: "train_stats/problem_0_steps/read" | |
op: "Identity" | |
input: "train_stats/problem_0_steps" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@train_stats/problem_0_steps" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_1" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "moe_loss_coef" | |
string_val: "0.001" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_2" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "clip_grad_norm" | |
string_val: "0.0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_3" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "layer_prepostprocess_dropout" | |
string_val: "0.1" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_4" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "multiply_embedding_mode" | |
string_val: "sqrt_depth" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_5" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "optimizer_adafactor_multiply_by_parameter_scale" | |
string_val: "True" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_6" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "multiproblem_max_target_length" | |
string_val: "-1" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_7" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "train_steps" | |
string_val: "250000" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_8" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "attention_value_channels" | |
string_val: "0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_9" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "moe_overhead_train" | |
string_val: "1.0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_10" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "factored_logits" | |
string_val: "False" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_11" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "compress_steps" | |
string_val: "0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_12" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "num_heads" | |
string_val: "8" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_13" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "multiproblem_schedule_threshold" | |
string_val: "0.5" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_14" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "num_encoder_layers" | |
string_val: "0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_15" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "conv_first_kernel" | |
string_val: "3" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_16" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "self_attention_type" | |
string_val: "dot_product" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_17" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "max_target_seq_length" | |
string_val: "0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_18" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "attention_dropout_broadcast_dims" | |
string_val: "" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_19" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "eval_timeout_mins" | |
string_val: "240" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_20" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "proximity_bias" | |
string_val: "False" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_21" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "shared_embedding_and_softmax_weights" | |
string_val: "True" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_22" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "learning_rate_schedule" | |
string_val: "constant*linear_warmup*rsqrt_decay*rsqrt_hidden_size" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_23" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "optimizer_adafactor_factored" | |
string_val: "True" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_24" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "moe_num_experts" | |
string_val: "16" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_25" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "mode" | |
string_val: "train" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_26" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "moe_k" | |
string_val: "2" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_27" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "multiproblem_mixing_schedule" | |
string_val: "constant" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_28" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "optimizer_adam_epsilon" | |
string_val: "1e-09" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_29" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "symbol_dropout" | |
string_val: "0.0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_30" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "scheduled_sampling_prob" | |
string_val: "0.0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_31" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "use_fixed_batch_size" | |
string_val: "False" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_32" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "initializer" | |
string_val: "uniform_unit_scaling" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_33" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "norm_type" | |
string_val: "layer" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_34" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "filter_size" | |
string_val: "2048" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_35" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "learning_rate_constant" | |
string_val: "2.0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_36" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "weight_decay" | |
string_val: "0.0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_37" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "vocab_divisor" | |
string_val: "1" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_38" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "activation_dtype" | |
string_val: "float32" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_39" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "parameter_attention_key_channels" | |
string_val: "0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_40" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "learning_rate_warmup_steps" | |
string_val: "8000" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_41" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "optimizer_adafactor_memory_exponent" | |
string_val: "0.8" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_42" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "hidden_size" | |
string_val: "512" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_43" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "kernel_height" | |
string_val: "3" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_44" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "ffn_layer" | |
string_val: "dense_relu_dense" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_45" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "std_server_protocol" | |
string_val: "grpc" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_46" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "num_hidden_layers" | |
string_val: "6" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_47" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "schedule" | |
string_val: "continuous_train_and_eval" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_48" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "label_smoothing" | |
string_val: "0.1" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_49" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "use_pad_remover" | |
string_val: "True" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_50" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "batch_size" | |
string_val: "4096" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_51" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "max_relative_position" | |
string_val: "0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_52" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "optimizer_multistep_accumulate_steps" | |
string_val: "None" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_53" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "learning_rate_decay_rate" | |
string_val: "1.0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_54" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "symbol_modality_num_shards" | |
string_val: "16" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_55" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "attention_variables_3d" | |
string_val: "False" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_56" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "max_input_seq_length" | |
string_val: "0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_57" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "optimizer_adafactor_decay_type" | |
string_val: "pow" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_58" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "min_length" | |
string_val: "0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_59" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "kernel_width" | |
string_val: "1" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_60" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "daisy_chain_variables" | |
string_val: "True" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_61" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "split_to_length" | |
string_val: "0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_62" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "min_length_bucket" | |
string_val: "8" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_63" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "layer_prepostprocess_dropout_broadcast_dims" | |
string_val: "" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_64" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "optimizer_adam_beta2" | |
string_val: "0.997" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_65" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "optimizer_adam_beta1" | |
string_val: "0.9" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_66" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "multiproblem_target_eval_only" | |
string_val: "False" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_67" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "initializer_gain" | |
string_val: "1.0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_68" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "layer_postprocess_sequence" | |
string_val: "da" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_69" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "heads_share_relative_embedding" | |
string_val: "False" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_70" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "multiproblem_schedule_max_examples" | |
string_val: "10000000.0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_71" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "learning_rate_cosine_cycle_steps" | |
string_val: "250000" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_72" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "causal_decoder_self_attention" | |
string_val: "True" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_73" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "pos" | |
string_val: "timing" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_74" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "scheduled_sampling_gold_mixin_prob" | |
string_val: "0.5" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_75" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "multiproblem_reweight_label_loss" | |
string_val: "False" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_76" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "nbr_decoder_problems" | |
string_val: "1" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_77" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "attention_key_channels" | |
string_val: "0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_78" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "video_num_target_frames" | |
string_val: "1" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_79" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "prepend_mode" | |
string_val: "none" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_80" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "symbol_modality_skip_top" | |
string_val: "False" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_81" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "summarize_vars" | |
string_val: "False" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_82" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "attention_dropout" | |
string_val: "0.1" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_83" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "optimizer_momentum_nesterov" | |
string_val: "False" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_84" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "no_data_parallelism" | |
string_val: "False" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_85" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "layer_preprocess_sequence" | |
string_val: "n" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_86" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "video_num_input_frames" | |
string_val: "1" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_87" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "pretrained_model_dir" | |
string_val: "" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_88" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "max_length" | |
string_val: "256" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_89" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "summarize_grads" | |
string_val: "False" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_90" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "model_dir" | |
string_val: "/root/train/ltltstr" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_91" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "multiproblem_label_weight" | |
string_val: "0.5" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_92" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "learning_rate_decay_scheme" | |
string_val: "noam" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_93" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "dropout" | |
string_val: "0.2" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_94" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "length_bucket_step" | |
string_val: "1.1" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_95" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "multiproblem_vocab_size" | |
string_val: "-1" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_96" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "num_decoder_layers" | |
string_val: "0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_97" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "force_full_predict" | |
string_val: "False" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_98" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "use_target_space_embedding" | |
string_val: "True" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_99" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "eval_freq_in_steps" | |
string_val: "1000" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_100" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "scheduled_sampling_warmup_steps" | |
string_val: "50000" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_101" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "moe_hidden_sizes" | |
string_val: "2048" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_102" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "norm_epsilon" | |
string_val: "1e-06" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_103" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "relu_dropout_broadcast_dims" | |
string_val: "" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_104" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "eval_steps" | |
string_val: "100" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_105" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "multiproblem_class_loss_multiplier" | |
string_val: "0.0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_106" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "tpu_enable_host_call" | |
string_val: "False" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_107" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "eval_run_autoregressive" | |
string_val: "False" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_108" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "grad_noise_scale" | |
string_val: "0.0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_109" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "eval_drop_long_sequences" | |
string_val: "False" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_110" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "optimizer_momentum_momentum" | |
string_val: "0.9" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_111" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "modality" | |
string_val: "{}" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_112" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "weight_noise" | |
string_val: "0.0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_113" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "data_dir" | |
string_val: "/root/t2t_data" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_114" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "parameter_attention_value_channels" | |
string_val: "0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_115" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "relu_dropout" | |
string_val: "0.1" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_116" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "moe_overhead_eval" | |
string_val: "2.0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_117" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "warm_start_from" | |
string_val: "None" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_118" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "sampling_method" | |
string_val: "argmax" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_119" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "add_relative_to_values" | |
string_val: "False" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_120" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "multiproblem_max_input_length" | |
string_val: "-1" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_121" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "shared_embedding" | |
string_val: "False" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_122" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "optimizer" | |
string_val: "Adam" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_123" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "sampling_temp" | |
string_val: "1.0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_124" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "learning_rate" | |
string_val: "0.2" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_125" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "learning_rate_decay_steps" | |
string_val: "5000" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_126" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "pad_batch" | |
string_val: "False" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_127" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "optimizer_adafactor_beta2" | |
string_val: "0.999" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_128" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "optimizer_adafactor_beta1" | |
string_val: "0.0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_129" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "optimizer_adafactor_clipping_threshold" | |
string_val: "1.0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_130" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "learning_rate_minimum" | |
string_val: "None" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_131" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "learning_rate_decay_staircase" | |
string_val: "False" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_132" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "weight_dtype" | |
string_val: "float32" | |
} | |
} | |
} | |
} | |
node { | |
name: "stack" | |
op: "Pack" | |
input: "Const_1" | |
input: "Const_2" | |
input: "Const_3" | |
input: "Const_4" | |
input: "Const_5" | |
input: "Const_6" | |
input: "Const_7" | |
input: "Const_8" | |
input: "Const_9" | |
input: "Const_10" | |
input: "Const_11" | |
input: "Const_12" | |
input: "Const_13" | |
input: "Const_14" | |
input: "Const_15" | |
input: "Const_16" | |
input: "Const_17" | |
input: "Const_18" | |
input: "Const_19" | |
input: "Const_20" | |
input: "Const_21" | |
input: "Const_22" | |
input: "Const_23" | |
input: "Const_24" | |
input: "Const_25" | |
input: "Const_26" | |
input: "Const_27" | |
input: "Const_28" | |
input: "Const_29" | |
input: "Const_30" | |
input: "Const_31" | |
input: "Const_32" | |
input: "Const_33" | |
input: "Const_34" | |
input: "Const_35" | |
input: "Const_36" | |
input: "Const_37" | |
input: "Const_38" | |
input: "Const_39" | |
input: "Const_40" | |
input: "Const_41" | |
input: "Const_42" | |
input: "Const_43" | |
input: "Const_44" | |
input: "Const_45" | |
input: "Const_46" | |
input: "Const_47" | |
input: "Const_48" | |
input: "Const_49" | |
input: "Const_50" | |
input: "Const_51" | |
input: "Const_52" | |
input: "Const_53" | |
input: "Const_54" | |
input: "Const_55" | |
input: "Const_56" | |
input: "Const_57" | |
input: "Const_58" | |
input: "Const_59" | |
input: "Const_60" | |
input: "Const_61" | |
input: "Const_62" | |
input: "Const_63" | |
input: "Const_64" | |
input: "Const_65" | |
input: "Const_66" | |
input: "Const_67" | |
input: "Const_68" | |
input: "Const_69" | |
input: "Const_70" | |
input: "Const_71" | |
input: "Const_72" | |
input: "Const_73" | |
input: "Const_74" | |
input: "Const_75" | |
input: "Const_76" | |
input: "Const_77" | |
input: "Const_78" | |
input: "Const_79" | |
input: "Const_80" | |
input: "Const_81" | |
input: "Const_82" | |
input: "Const_83" | |
input: "Const_84" | |
input: "Const_85" | |
input: "Const_86" | |
input: "Const_87" | |
input: "Const_88" | |
input: "Const_89" | |
input: "Const_90" | |
input: "Const_91" | |
input: "Const_92" | |
input: "Const_93" | |
input: "Const_94" | |
input: "Const_95" | |
input: "Const_96" | |
input: "Const_97" | |
input: "Const_98" | |
input: "Const_99" | |
input: "Const_100" | |
input: "Const_101" | |
input: "Const_102" | |
input: "Const_103" | |
input: "Const_104" | |
input: "Const_105" | |
input: "Const_106" | |
input: "Const_107" | |
input: "Const_108" | |
input: "Const_109" | |
input: "Const_110" | |
input: "Const_111" | |
input: "Const_112" | |
input: "Const_113" | |
input: "Const_114" | |
input: "Const_115" | |
input: "Const_116" | |
input: "Const_117" | |
input: "Const_118" | |
input: "Const_119" | |
input: "Const_120" | |
input: "Const_121" | |
input: "Const_122" | |
input: "Const_123" | |
input: "Const_124" | |
input: "Const_125" | |
input: "Const_126" | |
input: "Const_127" | |
input: "Const_128" | |
input: "Const_129" | |
input: "Const_130" | |
input: "Const_131" | |
input: "Const_132" | |
attr { | |
key: "N" | |
value { | |
i: 132 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 132 | |
} | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "axis" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer_hparams/tag" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
} | |
string_val: "transformer_hparams" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer_hparams/serialized_summary_metadata" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
} | |
string_val: "\n\006\n\004text" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer_hparams" | |
op: "TensorSummaryV2" | |
input: "transformer_hparams/tag" | |
input: "stack" | |
input: "transformer_hparams/serialized_summary_metadata" | |
attr { | |
key: "T" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_133" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "was_reversed" | |
string_val: "False" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_134" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "was_copy" | |
string_val: "False" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_135" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "loss_multiplier" | |
string_val: "1.0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_136" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "target_space_id" | |
string_val: "0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_137" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "stop_at_eos" | |
string_val: "1" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_138" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "vocabulary" | |
string_val: "{\'inputs\': <tensor2tensor.data_generators.text_encoder.SubwordTextEncoder object at 0x7f6ee2dd5b50>, \'targets\': <tensor2tensor.data_generators.text_encoder.SubwordTextEncoder object at 0x7f6ee2dd5b50>}" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_139" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "batch_size_multiplier" | |
string_val: "1" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_140" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "input_space_id" | |
string_val: "0" | |
} | |
} | |
} | |
} | |
node { | |
name: "Const_141" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
string_val: "modality" | |
string_val: "{\'inputs\': <tensor2tensor.layers.modalities.SymbolModality object at 0x7f6ee3c6d110>, \'targets\': <tensor2tensor.layers.modalities.SymbolModality object at 0x7f6ee8937510>}" | |
} | |
} | |
} | |
} | |
node { | |
name: "stack_1" | |
op: "Pack" | |
input: "Const_133" | |
input: "Const_134" | |
input: "Const_135" | |
input: "Const_136" | |
input: "Const_137" | |
input: "Const_138" | |
input: "Const_139" | |
input: "Const_140" | |
input: "Const_141" | |
attr { | |
key: "N" | |
value { | |
i: 9 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 9 | |
} | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "axis" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer_problem_hparams/tag" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
} | |
string_val: "transformer_problem_hparams" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer_problem_hparams/serialized_summary_metadata" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
} | |
string_val: "\n\006\n\004text" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer_problem_hparams" | |
op: "TensorSummaryV2" | |
input: "transformer_problem_hparams/tag" | |
input: "stack_1" | |
input: "transformer_problem_hparams/serialized_summary_metadata" | |
attr { | |
key: "T" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_space_id" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/target_space_id" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/Shape" | |
op: "Shape" | |
input: "IteratorGetNext" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/strided_slice/stack" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/strided_slice/stack_1" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/strided_slice/stack_2" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/strided_slice" | |
op: "StridedSlice" | |
input: "transformer/input_stats/Shape" | |
input: "transformer/input_stats/strided_slice/stack" | |
input: "transformer/input_stats/strided_slice/stack_1" | |
input: "transformer/input_stats/strided_slice/stack_2" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/floordiv/y" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/floordiv" | |
op: "FloorDiv" | |
input: "transformer/input_stats/strided_slice" | |
input: "transformer/input_stats/floordiv/y" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/batch_prediction_key_batch/tags" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
} | |
string_val: "transformer/input_stats/batch_prediction_key_batch" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/batch_prediction_key_batch" | |
op: "ScalarSummary" | |
input: "transformer/input_stats/batch_prediction_key_batch/tags" | |
input: "transformer/input_stats/floordiv" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/Shape_1" | |
op: "Shape" | |
input: "IteratorGetNext" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/strided_slice_1/stack" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/strided_slice_1/stack_1" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/strided_slice_1/stack_2" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/strided_slice_1" | |
op: "StridedSlice" | |
input: "transformer/input_stats/Shape_1" | |
input: "transformer/input_stats/strided_slice_1/stack" | |
input: "transformer/input_stats/strided_slice_1/stack_1" | |
input: "transformer/input_stats/strided_slice_1/stack_2" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/batch_prediction_key_length/tags" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
} | |
string_val: "transformer/input_stats/batch_prediction_key_length" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/batch_prediction_key_length" | |
op: "ScalarSummary" | |
input: "transformer/input_stats/batch_prediction_key_length/tags" | |
input: "transformer/input_stats/strided_slice_1" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/NotEqual/y" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/NotEqual" | |
op: "NotEqual" | |
input: "IteratorGetNext" | |
input: "transformer/input_stats/NotEqual/y" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/ToFloat" | |
op: "Cast" | |
input: "transformer/input_stats/NotEqual" | |
attr { | |
key: "DstT" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "SrcT" | |
value { | |
type: DT_BOOL | |
} | |
} | |
attr { | |
key: "Truncate" | |
value { | |
b: false | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/Const" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\000\000\000\001\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/Sum" | |
op: "Sum" | |
input: "transformer/input_stats/ToFloat" | |
input: "transformer/input_stats/Const" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/batch_prediction_key_nonpadding_tokens/tags" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
} | |
string_val: "transformer/input_stats/batch_prediction_key_nonpadding_tokens" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/batch_prediction_key_nonpadding_tokens" | |
op: "ScalarSummary" | |
input: "transformer/input_stats/batch_prediction_key_nonpadding_tokens/tags" | |
input: "transformer/input_stats/Sum" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/Const_1" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\000\000\000\001\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/Mean" | |
op: "Mean" | |
input: "transformer/input_stats/ToFloat" | |
input: "transformer/input_stats/Const_1" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/batch_prediction_key_nonpadding_fraction/tags" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
} | |
string_val: "transformer/input_stats/batch_prediction_key_nonpadding_fraction" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/batch_prediction_key_nonpadding_fraction" | |
op: "ScalarSummary" | |
input: "transformer/input_stats/batch_prediction_key_nonpadding_fraction/tags" | |
input: "transformer/input_stats/Mean" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/Shape_2" | |
op: "Shape" | |
input: "IteratorGetNext:1" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/strided_slice_2/stack" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/strided_slice_2/stack_1" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/strided_slice_2/stack_2" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/strided_slice_2" | |
op: "StridedSlice" | |
input: "transformer/input_stats/Shape_2" | |
input: "transformer/input_stats/strided_slice_2/stack" | |
input: "transformer/input_stats/strided_slice_2/stack_1" | |
input: "transformer/input_stats/strided_slice_2/stack_2" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/floordiv_1/y" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/floordiv_1" | |
op: "FloorDiv" | |
input: "transformer/input_stats/strided_slice_2" | |
input: "transformer/input_stats/floordiv_1/y" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/inputs_batch/tags" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
} | |
string_val: "transformer/input_stats/inputs_batch" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/inputs_batch" | |
op: "ScalarSummary" | |
input: "transformer/input_stats/inputs_batch/tags" | |
input: "transformer/input_stats/floordiv_1" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/Shape_3" | |
op: "Shape" | |
input: "IteratorGetNext:1" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/strided_slice_3/stack" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/strided_slice_3/stack_1" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/strided_slice_3/stack_2" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/strided_slice_3" | |
op: "StridedSlice" | |
input: "transformer/input_stats/Shape_3" | |
input: "transformer/input_stats/strided_slice_3/stack" | |
input: "transformer/input_stats/strided_slice_3/stack_1" | |
input: "transformer/input_stats/strided_slice_3/stack_2" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/inputs_length/tags" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
} | |
string_val: "transformer/input_stats/inputs_length" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/inputs_length" | |
op: "ScalarSummary" | |
input: "transformer/input_stats/inputs_length/tags" | |
input: "transformer/input_stats/strided_slice_3" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/NotEqual_1/y" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/NotEqual_1" | |
op: "NotEqual" | |
input: "IteratorGetNext:1" | |
input: "transformer/input_stats/NotEqual_1/y" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/ToFloat_1" | |
op: "Cast" | |
input: "transformer/input_stats/NotEqual_1" | |
attr { | |
key: "DstT" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "SrcT" | |
value { | |
type: DT_BOOL | |
} | |
} | |
attr { | |
key: "Truncate" | |
value { | |
b: false | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/Const_2" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 4 | |
} | |
} | |
tensor_content: "\000\000\000\000\001\000\000\000\002\000\000\000\003\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/Sum_1" | |
op: "Sum" | |
input: "transformer/input_stats/ToFloat_1" | |
input: "transformer/input_stats/Const_2" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/inputs_nonpadding_tokens/tags" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
} | |
string_val: "transformer/input_stats/inputs_nonpadding_tokens" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/inputs_nonpadding_tokens" | |
op: "ScalarSummary" | |
input: "transformer/input_stats/inputs_nonpadding_tokens/tags" | |
input: "transformer/input_stats/Sum_1" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/Const_3" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 4 | |
} | |
} | |
tensor_content: "\000\000\000\000\001\000\000\000\002\000\000\000\003\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/Mean_1" | |
op: "Mean" | |
input: "transformer/input_stats/ToFloat_1" | |
input: "transformer/input_stats/Const_3" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/inputs_nonpadding_fraction/tags" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
} | |
string_val: "transformer/input_stats/inputs_nonpadding_fraction" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/inputs_nonpadding_fraction" | |
op: "ScalarSummary" | |
input: "transformer/input_stats/inputs_nonpadding_fraction/tags" | |
input: "transformer/input_stats/Mean_1" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/Shape_4" | |
op: "Shape" | |
input: "IteratorGetNext:2" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/strided_slice_4/stack" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/strided_slice_4/stack_1" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/strided_slice_4/stack_2" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/strided_slice_4" | |
op: "StridedSlice" | |
input: "transformer/input_stats/Shape_4" | |
input: "transformer/input_stats/strided_slice_4/stack" | |
input: "transformer/input_stats/strided_slice_4/stack_1" | |
input: "transformer/input_stats/strided_slice_4/stack_2" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/floordiv_2/y" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/floordiv_2" | |
op: "FloorDiv" | |
input: "transformer/input_stats/strided_slice_4" | |
input: "transformer/input_stats/floordiv_2/y" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/targets_batch/tags" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
} | |
string_val: "transformer/input_stats/targets_batch" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/targets_batch" | |
op: "ScalarSummary" | |
input: "transformer/input_stats/targets_batch/tags" | |
input: "transformer/input_stats/floordiv_2" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/Shape_5" | |
op: "Shape" | |
input: "IteratorGetNext:2" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/strided_slice_5/stack" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/strided_slice_5/stack_1" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/strided_slice_5/stack_2" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/strided_slice_5" | |
op: "StridedSlice" | |
input: "transformer/input_stats/Shape_5" | |
input: "transformer/input_stats/strided_slice_5/stack" | |
input: "transformer/input_stats/strided_slice_5/stack_1" | |
input: "transformer/input_stats/strided_slice_5/stack_2" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/targets_length/tags" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
} | |
string_val: "transformer/input_stats/targets_length" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/targets_length" | |
op: "ScalarSummary" | |
input: "transformer/input_stats/targets_length/tags" | |
input: "transformer/input_stats/strided_slice_5" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/NotEqual_2/y" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/NotEqual_2" | |
op: "NotEqual" | |
input: "IteratorGetNext:2" | |
input: "transformer/input_stats/NotEqual_2/y" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/ToFloat_2" | |
op: "Cast" | |
input: "transformer/input_stats/NotEqual_2" | |
attr { | |
key: "DstT" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "SrcT" | |
value { | |
type: DT_BOOL | |
} | |
} | |
attr { | |
key: "Truncate" | |
value { | |
b: false | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/Const_4" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 4 | |
} | |
} | |
tensor_content: "\000\000\000\000\001\000\000\000\002\000\000\000\003\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/Sum_2" | |
op: "Sum" | |
input: "transformer/input_stats/ToFloat_2" | |
input: "transformer/input_stats/Const_4" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/targets_nonpadding_tokens/tags" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
} | |
string_val: "transformer/input_stats/targets_nonpadding_tokens" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/targets_nonpadding_tokens" | |
op: "ScalarSummary" | |
input: "transformer/input_stats/targets_nonpadding_tokens/tags" | |
input: "transformer/input_stats/Sum_2" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/Const_5" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 4 | |
} | |
} | |
tensor_content: "\000\000\000\000\001\000\000\000\002\000\000\000\003\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/Mean_2" | |
op: "Mean" | |
input: "transformer/input_stats/ToFloat_2" | |
input: "transformer/input_stats/Const_5" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/targets_nonpadding_fraction/tags" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
} | |
string_val: "transformer/input_stats/targets_nonpadding_fraction" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/input_stats/targets_nonpadding_fraction" | |
op: "ScalarSummary" | |
input: "transformer/input_stats/targets_nonpadding_fraction/tags" | |
input: "transformer/input_stats/Mean_2" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/Shape" | |
op: "Shape" | |
input: "IteratorGetNext" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/strided_slice/stack" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/strided_slice/stack_1" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/strided_slice/stack_2" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/strided_slice" | |
op: "StridedSlice" | |
input: "transformer/Shape" | |
input: "transformer/strided_slice/stack" | |
input: "transformer/strided_slice/stack_1" | |
input: "transformer/strided_slice/stack_2" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/Const" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/split/split_dim" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/split" | |
op: "Split" | |
input: "transformer/split/split_dim" | |
input: "IteratorGetNext" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "num_split" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0/transformer/Identity" | |
op: "Identity" | |
input: "transformer/split" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/Shape_1" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/ExpandDims/dim" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: -1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/ExpandDims" | |
op: "ExpandDims" | |
input: "transformer/input_space_id" | |
input: "transformer/ExpandDims/dim" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tdim" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/ToInt32/x" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/Tile" | |
op: "Tile" | |
input: "transformer/ExpandDims" | |
input: "transformer/ToInt32/x" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tmultiples" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/Const_1" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/split_1/split_dim" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/split_1" | |
op: "Split" | |
input: "transformer/split_1/split_dim" | |
input: "transformer/Tile" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "num_split" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_1/transformer/Identity" | |
op: "Identity" | |
input: "transformer/split_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/Shape_2" | |
op: "Shape" | |
input: "IteratorGetNext:1" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/strided_slice_1/stack" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/strided_slice_1/stack_1" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/strided_slice_1/stack_2" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/strided_slice_1" | |
op: "StridedSlice" | |
input: "transformer/Shape_2" | |
input: "transformer/strided_slice_1/stack" | |
input: "transformer/strided_slice_1/stack_1" | |
input: "transformer/strided_slice_1/stack_2" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/strided_slice_2/stack" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/strided_slice_2/stack_1" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/strided_slice_2/stack_2" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/strided_slice_2" | |
op: "StridedSlice" | |
input: "transformer/Shape_2" | |
input: "transformer/strided_slice_2/stack" | |
input: "transformer/strided_slice_2/stack_1" | |
input: "transformer/strided_slice_2/stack_2" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/Const_2" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/split_2/split_dim" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/split_2" | |
op: "Split" | |
input: "transformer/split_2/split_dim" | |
input: "IteratorGetNext:1" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "num_split" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_2/transformer/Identity" | |
op: "Identity" | |
input: "transformer/split_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/Shape_3" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/ExpandDims_1/dim" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: -1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/ExpandDims_1" | |
op: "ExpandDims" | |
input: "transformer/target_space_id" | |
input: "transformer/ExpandDims_1/dim" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tdim" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/ToInt32_1/x" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/Tile_1" | |
op: "Tile" | |
input: "transformer/ExpandDims_1" | |
input: "transformer/ToInt32_1/x" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tmultiples" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/Const_3" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/split_3/split_dim" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/split_3" | |
op: "Split" | |
input: "transformer/split_3/split_dim" | |
input: "transformer/Tile_1" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "num_split" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_3/transformer/Identity" | |
op: "Identity" | |
input: "transformer/split_3" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/Shape_4" | |
op: "Shape" | |
input: "IteratorGetNext:2" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/strided_slice_3/stack" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/strided_slice_3/stack_1" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/strided_slice_3/stack_2" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/strided_slice_3" | |
op: "StridedSlice" | |
input: "transformer/Shape_4" | |
input: "transformer/strided_slice_3/stack" | |
input: "transformer/strided_slice_3/stack_1" | |
input: "transformer/strided_slice_3/stack_2" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/strided_slice_4/stack" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/strided_slice_4/stack_1" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/strided_slice_4/stack_2" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/strided_slice_4" | |
op: "StridedSlice" | |
input: "transformer/Shape_4" | |
input: "transformer/strided_slice_4/stack" | |
input: "transformer/strided_slice_4/stack_1" | |
input: "transformer/strided_slice_4/stack_2" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/Const_4" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/split_4/split_dim" | |
op: "Const" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/split_4" | |
op: "Split" | |
input: "transformer/split_4/split_dim" | |
input: "IteratorGetNext:2" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "num_split" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_4/transformer/Identity" | |
op: "Identity" | |
input: "transformer/split_4" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/Squeeze" | |
op: "Squeeze" | |
input: "transformer/parallel_0_2/transformer/Identity" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "squeeze_dims" | |
value { | |
list { | |
i: 3 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_0/Initializer/random_normal/shape" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_0" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\361\006\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_0/Initializer/random_normal/mean" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_0" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_0/Initializer/random_normal/stddev" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_0" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0441941730678 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_0/Initializer/random_normal/RandomStandardNormal" | |
op: "RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_0/Initializer/random_normal/shape" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_0" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_0/Initializer/random_normal/mul" | |
op: "Mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_0/Initializer/random_normal/RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_0/Initializer/random_normal/stddev" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_0" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_0/Initializer/random_normal" | |
op: "Add" | |
input: "transformer/symbol_modality_28422_512/shared/weights_0/Initializer/random_normal/mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_0/Initializer/random_normal/mean" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_0" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_0" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_0" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/symbol_modality_28422_512/shared/weights_0" | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_0/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_0" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_0/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_0" | |
input: "transformer/symbol_modality_28422_512/shared/weights_0/Initializer/random_normal" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_0" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_0/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_0" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_0" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_0" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity" | |
op: "Identity" | |
input: "Read/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_1/Initializer/random_normal/shape" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_1" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\361\006\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_1/Initializer/random_normal/mean" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_1" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_1/Initializer/random_normal/stddev" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_1" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0441941730678 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_1/Initializer/random_normal/RandomStandardNormal" | |
op: "RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_1/Initializer/random_normal/shape" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_1" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_1/Initializer/random_normal/mul" | |
op: "Mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_1/Initializer/random_normal/RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_1/Initializer/random_normal/stddev" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_1" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_1/Initializer/random_normal" | |
op: "Add" | |
input: "transformer/symbol_modality_28422_512/shared/weights_1/Initializer/random_normal/mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_1/Initializer/random_normal/mean" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_1" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_1" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_1" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/symbol_modality_28422_512/shared/weights_1" | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_1/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_1/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_1" | |
input: "transformer/symbol_modality_28422_512/shared/weights_1/Initializer/random_normal" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_1" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_1/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_1" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_1/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_1" | |
op: "Identity" | |
input: "Read_1/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_2/Initializer/random_normal/shape" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_2" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\361\006\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_2/Initializer/random_normal/mean" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_2" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_2/Initializer/random_normal/stddev" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_2" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0441941730678 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_2/Initializer/random_normal/RandomStandardNormal" | |
op: "RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_2/Initializer/random_normal/shape" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_2" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_2/Initializer/random_normal/mul" | |
op: "Mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_2/Initializer/random_normal/RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_2/Initializer/random_normal/stddev" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_2" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_2/Initializer/random_normal" | |
op: "Add" | |
input: "transformer/symbol_modality_28422_512/shared/weights_2/Initializer/random_normal/mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_2/Initializer/random_normal/mean" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_2" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_2" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_2" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/symbol_modality_28422_512/shared/weights_2" | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_2/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_2/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_2" | |
input: "transformer/symbol_modality_28422_512/shared/weights_2/Initializer/random_normal" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_2" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_2/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_2" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_2/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_2" | |
op: "Identity" | |
input: "Read_2/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_3/Initializer/random_normal/shape" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_3" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\361\006\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_3/Initializer/random_normal/mean" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_3" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_3/Initializer/random_normal/stddev" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_3" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0441941730678 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_3/Initializer/random_normal/RandomStandardNormal" | |
op: "RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_3/Initializer/random_normal/shape" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_3" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_3/Initializer/random_normal/mul" | |
op: "Mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_3/Initializer/random_normal/RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_3/Initializer/random_normal/stddev" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_3" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_3/Initializer/random_normal" | |
op: "Add" | |
input: "transformer/symbol_modality_28422_512/shared/weights_3/Initializer/random_normal/mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_3/Initializer/random_normal/mean" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_3" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_3" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_3" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/symbol_modality_28422_512/shared/weights_3" | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_3/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_3" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_3/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_3" | |
input: "transformer/symbol_modality_28422_512/shared/weights_3/Initializer/random_normal" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_3" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_3/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_3" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_3" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_3/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_3" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_3" | |
op: "Identity" | |
input: "Read_3/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_4/Initializer/random_normal/shape" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_4" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\361\006\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_4/Initializer/random_normal/mean" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_4" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_4/Initializer/random_normal/stddev" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_4" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0441941730678 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_4/Initializer/random_normal/RandomStandardNormal" | |
op: "RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_4/Initializer/random_normal/shape" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_4" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_4/Initializer/random_normal/mul" | |
op: "Mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_4/Initializer/random_normal/RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_4/Initializer/random_normal/stddev" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_4" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_4/Initializer/random_normal" | |
op: "Add" | |
input: "transformer/symbol_modality_28422_512/shared/weights_4/Initializer/random_normal/mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_4/Initializer/random_normal/mean" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_4" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_4" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_4" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/symbol_modality_28422_512/shared/weights_4" | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_4/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_4" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_4/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_4" | |
input: "transformer/symbol_modality_28422_512/shared/weights_4/Initializer/random_normal" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_4" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_4/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_4" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_4" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_4/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_4" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_4" | |
op: "Identity" | |
input: "Read_4/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_5/Initializer/random_normal/shape" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_5" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\361\006\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_5/Initializer/random_normal/mean" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_5" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_5/Initializer/random_normal/stddev" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_5" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0441941730678 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_5/Initializer/random_normal/RandomStandardNormal" | |
op: "RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_5/Initializer/random_normal/shape" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_5" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_5/Initializer/random_normal/mul" | |
op: "Mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_5/Initializer/random_normal/RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_5/Initializer/random_normal/stddev" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_5" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_5/Initializer/random_normal" | |
op: "Add" | |
input: "transformer/symbol_modality_28422_512/shared/weights_5/Initializer/random_normal/mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_5/Initializer/random_normal/mean" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_5" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_5" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_5" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/symbol_modality_28422_512/shared/weights_5" | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_5/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_5" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_5/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_5" | |
input: "transformer/symbol_modality_28422_512/shared/weights_5/Initializer/random_normal" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_5" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_5/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_5" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_5" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_5/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_5" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_5" | |
op: "Identity" | |
input: "Read_5/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1777 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_6/Initializer/random_normal/shape" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_6" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\360\006\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_6/Initializer/random_normal/mean" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_6" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_6/Initializer/random_normal/stddev" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_6" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0441941730678 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_6/Initializer/random_normal/RandomStandardNormal" | |
op: "RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_6/Initializer/random_normal/shape" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_6" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_6/Initializer/random_normal/mul" | |
op: "Mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_6/Initializer/random_normal/RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_6/Initializer/random_normal/stddev" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_6" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_6/Initializer/random_normal" | |
op: "Add" | |
input: "transformer/symbol_modality_28422_512/shared/weights_6/Initializer/random_normal/mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_6/Initializer/random_normal/mean" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_6" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_6" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_6" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/symbol_modality_28422_512/shared/weights_6" | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_6/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_6" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_6/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_6" | |
input: "transformer/symbol_modality_28422_512/shared/weights_6/Initializer/random_normal" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_6" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_6/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_6" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_6" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_6/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_6" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_6" | |
op: "Identity" | |
input: "Read_6/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_7/Initializer/random_normal/shape" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_7" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\360\006\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_7/Initializer/random_normal/mean" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_7" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_7/Initializer/random_normal/stddev" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_7" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0441941730678 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_7/Initializer/random_normal/RandomStandardNormal" | |
op: "RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_7/Initializer/random_normal/shape" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_7" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_7/Initializer/random_normal/mul" | |
op: "Mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_7/Initializer/random_normal/RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_7/Initializer/random_normal/stddev" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_7" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_7/Initializer/random_normal" | |
op: "Add" | |
input: "transformer/symbol_modality_28422_512/shared/weights_7/Initializer/random_normal/mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_7/Initializer/random_normal/mean" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_7" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_7" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_7" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/symbol_modality_28422_512/shared/weights_7" | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_7/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_7" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_7/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_7" | |
input: "transformer/symbol_modality_28422_512/shared/weights_7/Initializer/random_normal" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_7" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_7/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_7" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_7" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_7/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_7" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_7" | |
op: "Identity" | |
input: "Read_7/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_8/Initializer/random_normal/shape" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_8" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\360\006\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_8/Initializer/random_normal/mean" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_8" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_8/Initializer/random_normal/stddev" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_8" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0441941730678 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_8/Initializer/random_normal/RandomStandardNormal" | |
op: "RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_8/Initializer/random_normal/shape" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_8" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_8/Initializer/random_normal/mul" | |
op: "Mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_8/Initializer/random_normal/RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_8/Initializer/random_normal/stddev" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_8" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_8/Initializer/random_normal" | |
op: "Add" | |
input: "transformer/symbol_modality_28422_512/shared/weights_8/Initializer/random_normal/mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_8/Initializer/random_normal/mean" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_8" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_8" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_8" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/symbol_modality_28422_512/shared/weights_8" | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_8/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_8" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_8/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_8" | |
input: "transformer/symbol_modality_28422_512/shared/weights_8/Initializer/random_normal" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_8" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_8/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_8" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_8" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_8/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_8" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_8" | |
op: "Identity" | |
input: "Read_8/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_9/Initializer/random_normal/shape" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_9" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\360\006\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_9/Initializer/random_normal/mean" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_9" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_9/Initializer/random_normal/stddev" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_9" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0441941730678 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_9/Initializer/random_normal/RandomStandardNormal" | |
op: "RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_9/Initializer/random_normal/shape" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_9" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_9/Initializer/random_normal/mul" | |
op: "Mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_9/Initializer/random_normal/RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_9/Initializer/random_normal/stddev" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_9" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_9/Initializer/random_normal" | |
op: "Add" | |
input: "transformer/symbol_modality_28422_512/shared/weights_9/Initializer/random_normal/mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_9/Initializer/random_normal/mean" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_9" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_9" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_9" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/symbol_modality_28422_512/shared/weights_9" | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_9/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_9" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_9/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_9" | |
input: "transformer/symbol_modality_28422_512/shared/weights_9/Initializer/random_normal" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_9" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_9/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_9" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_9" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_9/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_9" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_9" | |
op: "Identity" | |
input: "Read_9/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_10/Initializer/random_normal/shape" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_10" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\360\006\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_10/Initializer/random_normal/mean" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_10" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_10/Initializer/random_normal/stddev" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_10" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0441941730678 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_10/Initializer/random_normal/RandomStandardNormal" | |
op: "RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_10/Initializer/random_normal/shape" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_10" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_10/Initializer/random_normal/mul" | |
op: "Mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_10/Initializer/random_normal/RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_10/Initializer/random_normal/stddev" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_10" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_10/Initializer/random_normal" | |
op: "Add" | |
input: "transformer/symbol_modality_28422_512/shared/weights_10/Initializer/random_normal/mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_10/Initializer/random_normal/mean" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_10" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_10" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_10" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/symbol_modality_28422_512/shared/weights_10" | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_10/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_10" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_10/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_10" | |
input: "transformer/symbol_modality_28422_512/shared/weights_10/Initializer/random_normal" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_10" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_10/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_10" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_10" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_10/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_10" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_10" | |
op: "Identity" | |
input: "Read_10/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_11/Initializer/random_normal/shape" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_11" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\360\006\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_11/Initializer/random_normal/mean" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_11" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_11/Initializer/random_normal/stddev" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_11" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0441941730678 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_11/Initializer/random_normal/RandomStandardNormal" | |
op: "RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_11/Initializer/random_normal/shape" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_11" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_11/Initializer/random_normal/mul" | |
op: "Mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_11/Initializer/random_normal/RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_11/Initializer/random_normal/stddev" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_11" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_11/Initializer/random_normal" | |
op: "Add" | |
input: "transformer/symbol_modality_28422_512/shared/weights_11/Initializer/random_normal/mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_11/Initializer/random_normal/mean" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_11" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_11" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_11" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/symbol_modality_28422_512/shared/weights_11" | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_11/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_11" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_11/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_11" | |
input: "transformer/symbol_modality_28422_512/shared/weights_11/Initializer/random_normal" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_11" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_11/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_11" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_11" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_11/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_11" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_11" | |
op: "Identity" | |
input: "Read_11/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_12/Initializer/random_normal/shape" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_12" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\360\006\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_12/Initializer/random_normal/mean" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_12" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_12/Initializer/random_normal/stddev" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_12" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0441941730678 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_12/Initializer/random_normal/RandomStandardNormal" | |
op: "RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_12/Initializer/random_normal/shape" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_12" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_12/Initializer/random_normal/mul" | |
op: "Mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_12/Initializer/random_normal/RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_12/Initializer/random_normal/stddev" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_12" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_12/Initializer/random_normal" | |
op: "Add" | |
input: "transformer/symbol_modality_28422_512/shared/weights_12/Initializer/random_normal/mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_12/Initializer/random_normal/mean" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_12" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_12" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_12" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/symbol_modality_28422_512/shared/weights_12" | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_12/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_12" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_12/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_12" | |
input: "transformer/symbol_modality_28422_512/shared/weights_12/Initializer/random_normal" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_12" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_12/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_12" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_12" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_12/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_12" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_12" | |
op: "Identity" | |
input: "Read_12/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_13/Initializer/random_normal/shape" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_13" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\360\006\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_13/Initializer/random_normal/mean" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_13" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_13/Initializer/random_normal/stddev" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_13" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0441941730678 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_13/Initializer/random_normal/RandomStandardNormal" | |
op: "RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_13/Initializer/random_normal/shape" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_13" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_13/Initializer/random_normal/mul" | |
op: "Mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_13/Initializer/random_normal/RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_13/Initializer/random_normal/stddev" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_13" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_13/Initializer/random_normal" | |
op: "Add" | |
input: "transformer/symbol_modality_28422_512/shared/weights_13/Initializer/random_normal/mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_13/Initializer/random_normal/mean" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_13" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_13" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_13" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/symbol_modality_28422_512/shared/weights_13" | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_13/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_13" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_13/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_13" | |
input: "transformer/symbol_modality_28422_512/shared/weights_13/Initializer/random_normal" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_13" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_13/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_13" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_13" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_13/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_13" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_13" | |
op: "Identity" | |
input: "Read_13/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_14/Initializer/random_normal/shape" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_14" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\360\006\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_14/Initializer/random_normal/mean" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_14" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_14/Initializer/random_normal/stddev" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_14" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0441941730678 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_14/Initializer/random_normal/RandomStandardNormal" | |
op: "RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_14/Initializer/random_normal/shape" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_14" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_14/Initializer/random_normal/mul" | |
op: "Mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_14/Initializer/random_normal/RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_14/Initializer/random_normal/stddev" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_14" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_14/Initializer/random_normal" | |
op: "Add" | |
input: "transformer/symbol_modality_28422_512/shared/weights_14/Initializer/random_normal/mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_14/Initializer/random_normal/mean" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_14" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_14" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_14" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/symbol_modality_28422_512/shared/weights_14" | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_14/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_14" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_14/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_14" | |
input: "transformer/symbol_modality_28422_512/shared/weights_14/Initializer/random_normal" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_14" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_14/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_14" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_14" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_14/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_14" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_14" | |
op: "Identity" | |
input: "Read_14/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_15/Initializer/random_normal/shape" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_15" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\360\006\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_15/Initializer/random_normal/mean" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_15" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_15/Initializer/random_normal/stddev" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_15" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0441941730678 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_15/Initializer/random_normal/RandomStandardNormal" | |
op: "RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_15/Initializer/random_normal/shape" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_15" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_15/Initializer/random_normal/mul" | |
op: "Mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_15/Initializer/random_normal/RandomStandardNormal" | |
input: "transformer/symbol_modality_28422_512/shared/weights_15/Initializer/random_normal/stddev" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_15" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_15/Initializer/random_normal" | |
op: "Add" | |
input: "transformer/symbol_modality_28422_512/shared/weights_15/Initializer/random_normal/mul" | |
input: "transformer/symbol_modality_28422_512/shared/weights_15/Initializer/random_normal/mean" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_15" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_15" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_15" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/symbol_modality_28422_512/shared/weights_15" | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_15/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_15" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_15/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_15" | |
input: "transformer/symbol_modality_28422_512/shared/weights_15/Initializer/random_normal" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_15" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/symbol_modality_28422_512/shared/weights_15/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_15" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/symbol_modality_28422_512/shared/weights_15" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_15/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/symbol_modality_28422_512/shared/weights_15" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_15" | |
op: "Identity" | |
input: "Read_15/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1776 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/concat/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/concat" | |
op: "ConcatV2" | |
input: "Identity" | |
input: "Identity_1" | |
input: "Identity_2" | |
input: "Identity_3" | |
input: "Identity_4" | |
input: "Identity_5" | |
input: "Identity_6" | |
input: "Identity_7" | |
input: "Identity_8" | |
input: "Identity_9" | |
input: "Identity_10" | |
input: "Identity_11" | |
input: "Identity_12" | |
input: "Identity_13" | |
input: "Identity_14" | |
input: "Identity_15" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/concat/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 16 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 28422 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/convert_gradient_to_tensor_HBc3xYw22Mw" | |
op: "convert_gradient_to_tensor_HBc3xYw22Mw" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/concat" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 28422 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/Reshape/shape" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: -1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/Reshape" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/Squeeze" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/Reshape/shape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/GatherV2/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/GatherV2" | |
op: "GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/convert_gradient_to_tensor_HBc3xYw22Mw" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/GatherV2/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "Taxis" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tindices" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tparams" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/ExpandDims/dim" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: -1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/ExpandDims" | |
op: "ExpandDims" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/Squeeze" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/ExpandDims/dim" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tdim" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/ExpandDims" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/strided_slice/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/strided_slice/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: -1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/strided_slice/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/strided_slice" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/strided_slice/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/strided_slice/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/strided_slice/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 1 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/Shape_1" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/GatherV2" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/strided_slice_1/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: -1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/strided_slice_1/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/strided_slice_1/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/strided_slice_1" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/Shape_1" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/strided_slice_1/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/strided_slice_1/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/strided_slice_1/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 1 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/concat_1/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/concat_1" | |
op: "ConcatV2" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/strided_slice" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/strided_slice_1" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/concat_1/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/Reshape_1" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/concat_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/mul/y" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 22.6274166107 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/mul" | |
op: "Mul" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/Reshape_1" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/mul/y" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/NotEqual/y" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/NotEqual" | |
op: "NotEqual" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/Squeeze" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/NotEqual/y" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/ToFloat" | |
op: "Cast" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/NotEqual" | |
device: "/device:GPU:0" | |
attr { | |
key: "DstT" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "SrcT" | |
value { | |
type: DT_BOOL | |
} | |
} | |
attr { | |
key: "Truncate" | |
value { | |
b: false | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/ExpandDims_1/dim" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: -1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/ExpandDims_1" | |
op: "ExpandDims" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/ToFloat" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/ExpandDims_1/dim" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tdim" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/mul_1" | |
op: "Mul" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/mul" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/ExpandDims_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/Squeeze" | |
op: "Squeeze" | |
input: "transformer/parallel_0_4/transformer/Identity" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "squeeze_dims" | |
value { | |
list { | |
i: 3 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/concat/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/concat" | |
op: "ConcatV2" | |
input: "Identity" | |
input: "Identity_1" | |
input: "Identity_2" | |
input: "Identity_3" | |
input: "Identity_4" | |
input: "Identity_5" | |
input: "Identity_6" | |
input: "Identity_7" | |
input: "Identity_8" | |
input: "Identity_9" | |
input: "Identity_10" | |
input: "Identity_11" | |
input: "Identity_12" | |
input: "Identity_13" | |
input: "Identity_14" | |
input: "Identity_15" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/concat/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 16 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 28422 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/convert_gradient_to_tensor_HBc3xYw22Mw" | |
op: "convert_gradient_to_tensor_HBc3xYw22Mw" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/concat" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 28422 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/Reshape/shape" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: -1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/Reshape" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/Squeeze" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/Reshape/shape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/GatherV2/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/GatherV2" | |
op: "GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/convert_gradient_to_tensor_HBc3xYw22Mw" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/GatherV2/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "Taxis" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tindices" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tparams" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/ExpandDims/dim" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: -1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/ExpandDims" | |
op: "ExpandDims" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/Squeeze" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/ExpandDims/dim" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tdim" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/ExpandDims" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/strided_slice/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/strided_slice/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: -1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/strided_slice/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/strided_slice" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/strided_slice/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/strided_slice/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/strided_slice/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 1 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/Shape_1" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/GatherV2" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/strided_slice_1/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: -1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/strided_slice_1/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/strided_slice_1/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/strided_slice_1" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/Shape_1" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/strided_slice_1/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/strided_slice_1/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/strided_slice_1/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 1 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/concat_1/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/concat_1" | |
op: "ConcatV2" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/strided_slice" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/strided_slice_1" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/concat_1/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/Reshape_1" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/concat_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/mul/y" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 22.6274166107 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/mul" | |
op: "Mul" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/Reshape_1" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/mul/y" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/NotEqual/y" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/NotEqual" | |
op: "NotEqual" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/Squeeze" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/NotEqual/y" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/ToFloat" | |
op: "Cast" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/NotEqual" | |
device: "/device:GPU:0" | |
attr { | |
key: "DstT" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "SrcT" | |
value { | |
type: DT_BOOL | |
} | |
} | |
attr { | |
key: "Truncate" | |
value { | |
b: false | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/ExpandDims_1/dim" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: -1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/ExpandDims_1" | |
op: "ExpandDims" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/ToFloat" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/ExpandDims_1/dim" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tdim" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/mul_1" | |
op: "Mul" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/mul" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512_1/shared/ExpandDims_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/mul_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/strided_slice/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/strided_slice/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/strided_slice/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/strided_slice" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/strided_slice/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/strided_slice/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/strided_slice/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/strided_slice_1/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/strided_slice_1/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/strided_slice_1/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/strided_slice_1" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/strided_slice_1/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/strided_slice_1/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/strided_slice_1/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/mul/y" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/mul" | |
op: "Mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/strided_slice_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/mul/y" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/Reshape/shape/2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 512 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/Reshape/shape" | |
op: "Pack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/strided_slice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/Reshape/shape/2" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 3 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "axis" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/Reshape" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/symbol_modality_28422_512/shared/mul_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/Reshape/shape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/embedding_to_padding/Abs" | |
op: "Abs" | |
input: "transformer/parallel_0_5/transformer/transformer/body/Reshape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/embedding_to_padding/Sum/reduction_indices" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: -1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/embedding_to_padding/Sum" | |
op: "Sum" | |
input: "transformer/parallel_0_5/transformer/transformer/body/embedding_to_padding/Abs" | |
input: "transformer/parallel_0_5/transformer/transformer/body/embedding_to_padding/Sum/reduction_indices" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/embedding_to_padding/Equal/y" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/embedding_to_padding/Equal" | |
op: "Equal" | |
input: "transformer/parallel_0_5/transformer/transformer/body/embedding_to_padding/Sum" | |
input: "transformer/parallel_0_5/transformer/transformer/body/embedding_to_padding/Equal/y" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/embedding_to_padding/ToFloat" | |
op: "Cast" | |
input: "transformer/parallel_0_5/transformer/transformer/body/embedding_to_padding/Equal" | |
device: "/device:GPU:0" | |
attr { | |
key: "DstT" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "SrcT" | |
value { | |
type: DT_BOOL | |
} | |
} | |
attr { | |
key: "Truncate" | |
value { | |
b: false | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/attention_bias_ignore_padding/mul/y" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: -1000000000.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/attention_bias_ignore_padding/mul" | |
op: "Mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/embedding_to_padding/ToFloat" | |
input: "transformer/parallel_0_5/transformer/transformer/body/attention_bias_ignore_padding/mul/y" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/attention_bias_ignore_padding/ExpandDims/dim" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/attention_bias_ignore_padding/ExpandDims" | |
op: "ExpandDims" | |
input: "transformer/parallel_0_5/transformer/transformer/body/attention_bias_ignore_padding/mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/attention_bias_ignore_padding/ExpandDims/dim" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tdim" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/attention_bias_ignore_padding/ExpandDims_1/dim" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/attention_bias_ignore_padding/ExpandDims_1" | |
op: "ExpandDims" | |
input: "transformer/parallel_0_5/transformer/transformer/body/attention_bias_ignore_padding/ExpandDims" | |
input: "transformer/parallel_0_5/transformer/transformer/body/attention_bias_ignore_padding/ExpandDims_1/dim" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tdim" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/target_space_embedding/kernel/Initializer/random_uniform/shape" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/target_space_embedding/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: " \000\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/target_space_embedding/kernel/Initializer/random_uniform/min" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/target_space_embedding/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: -0.105021007359 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/target_space_embedding/kernel/Initializer/random_uniform/max" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/target_space_embedding/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.105021007359 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/target_space_embedding/kernel/Initializer/random_uniform/RandomUniform" | |
op: "RandomUniform" | |
input: "transformer/body/target_space_embedding/kernel/Initializer/random_uniform/shape" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/target_space_embedding/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 32 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/body/target_space_embedding/kernel/Initializer/random_uniform/sub" | |
op: "Sub" | |
input: "transformer/body/target_space_embedding/kernel/Initializer/random_uniform/max" | |
input: "transformer/body/target_space_embedding/kernel/Initializer/random_uniform/min" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/target_space_embedding/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/target_space_embedding/kernel/Initializer/random_uniform/mul" | |
op: "Mul" | |
input: "transformer/body/target_space_embedding/kernel/Initializer/random_uniform/RandomUniform" | |
input: "transformer/body/target_space_embedding/kernel/Initializer/random_uniform/sub" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/target_space_embedding/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 32 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/target_space_embedding/kernel/Initializer/random_uniform" | |
op: "Add" | |
input: "transformer/body/target_space_embedding/kernel/Initializer/random_uniform/mul" | |
input: "transformer/body/target_space_embedding/kernel/Initializer/random_uniform/min" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/target_space_embedding/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 32 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/target_space_embedding/kernel" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/target_space_embedding/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 32 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/body/target_space_embedding/kernel" | |
} | |
} | |
} | |
node { | |
name: "transformer/body/target_space_embedding/kernel/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/body/target_space_embedding/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/target_space_embedding/kernel/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/body/target_space_embedding/kernel" | |
input: "transformer/body/target_space_embedding/kernel/Initializer/random_uniform" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/target_space_embedding/kernel" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/body/target_space_embedding/kernel/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/target_space_embedding/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/target_space_embedding/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 32 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_16/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/target_space_embedding/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 32 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_16" | |
op: "Identity" | |
input: "Read_16/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 32 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/convert_gradient_to_tensor_HBc3xYw22Mw" | |
op: "convert_gradient_to_tensor_HBc3xYw22Mw" | |
input: "Identity_16" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 32 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/Reshape/shape" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: -1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/Reshape" | |
op: "Reshape" | |
input: "transformer/parallel_0_3/transformer/Identity" | |
input: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/Reshape/shape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/GatherV2/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/GatherV2" | |
op: "GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/convert_gradient_to_tensor_HBc3xYw22Mw" | |
input: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/GatherV2/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "Taxis" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tindices" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tparams" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/ExpandDims/dim" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: -1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/ExpandDims" | |
op: "ExpandDims" | |
input: "transformer/parallel_0_3/transformer/Identity" | |
input: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/ExpandDims/dim" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tdim" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/Shape" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\001\000\000\000\001\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/strided_slice/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/strided_slice/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: -1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/strided_slice/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/strided_slice" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/strided_slice/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/strided_slice/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/strided_slice/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 1 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/Shape_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\001\000\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/strided_slice_1/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: -1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/strided_slice_1/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/strided_slice_1/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/strided_slice_1" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/Shape_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/strided_slice_1/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/strided_slice_1/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/strided_slice_1/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 1 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/concat/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/concat" | |
op: "ConcatV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/strided_slice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/strided_slice_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/concat/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/Reshape_1" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/concat" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/Reshape_1/shape" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 3 | |
} | |
} | |
tensor_content: "\001\000\000\000\001\000\000\000\377\377\377\377" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/Reshape_1" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/target_space_embedding/Reshape_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/Reshape_1/shape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add" | |
op: "Add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/Reshape_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice_1/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice_1/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice_1/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice_1" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice_1/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice_1/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice_1/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/Shape_1" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice_2/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice_2/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice_2/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice_2" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/Shape_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice_2/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice_2/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice_2/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice_3/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice_3/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice_3/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice_3" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/Shape_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice_3/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice_3/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice_3/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/range/start" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/range/delta" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/range" | |
op: "Range" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/range/start" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/range/delta" | |
device: "/device:GPU:0" | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/add/y" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/add" | |
op: "Add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/range" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/add/y" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/ToFloat" | |
op: "Cast" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/add" | |
device: "/device:GPU:0" | |
attr { | |
key: "DstT" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "SrcT" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Truncate" | |
value { | |
b: false | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/ToFloat_1/x" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 256 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/ToFloat_1" | |
op: "Cast" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/ToFloat_1/x" | |
device: "/device:GPU:0" | |
attr { | |
key: "DstT" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "SrcT" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Truncate" | |
value { | |
b: false | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/sub/y" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 1.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/sub" | |
op: "Sub" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/ToFloat_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/sub/y" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Maximum/y" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 1.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Maximum" | |
op: "Maximum" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/sub" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Maximum/y" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/truediv/x" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 9.21034049988 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/truediv" | |
op: "RealDiv" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/truediv/x" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Maximum" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/range_1/start" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/range_1/limit" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 256 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/range_1/delta" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/range_1" | |
op: "Range" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/range_1/start" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/range_1/limit" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/range_1/delta" | |
device: "/device:GPU:0" | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 256 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/ToFloat_2" | |
op: "Cast" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/range_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "DstT" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "SrcT" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Truncate" | |
value { | |
b: false | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 256 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Neg" | |
op: "Neg" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/truediv" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/mul" | |
op: "Mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/ToFloat_2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Neg" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 256 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Exp" | |
op: "Exp" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/mul" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 256 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/mul_1/x" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 1.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/mul_1" | |
op: "Mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/mul_1/x" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Exp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 256 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/ExpandDims/dim" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/ExpandDims" | |
op: "ExpandDims" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/ToFloat" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/ExpandDims/dim" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tdim" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/ExpandDims_1/dim" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/ExpandDims_1" | |
op: "ExpandDims" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/mul_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/ExpandDims_1/dim" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tdim" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 256 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/mul_2" | |
op: "Mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/ExpandDims" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/ExpandDims_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 256 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Sin" | |
op: "Sin" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/mul_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 256 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Cos" | |
op: "Cos" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/mul_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 256 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/concat/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/concat" | |
op: "ConcatV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Sin" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Cos" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/concat/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/FloorMod/x" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 512 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/FloorMod/y" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/FloorMod" | |
op: "FloorMod" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/FloorMod/x" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/FloorMod/y" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Pad/paddings/1/0" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Pad/paddings/1" | |
op: "Pack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Pad/paddings/1/0" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/FloorMod" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "axis" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Pad/paddings/0_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\000\000\000\000\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Pad/paddings" | |
op: "Pack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Pad/paddings/0_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Pad/paddings/1" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "axis" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Pad" | |
op: "Pad" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/concat" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Pad/paddings" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tpaddings" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Reshape/shape/0" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Reshape/shape/2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 512 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Reshape/shape" | |
op: "Pack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Reshape/shape/0" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/strided_slice_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Reshape/shape/2" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 3 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "axis" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Reshape" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Pad" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Reshape/shape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/add" | |
op: "Add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/get_timing_signal_1d/Reshape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/dropout/keep_prob" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.899999976158 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/dropout/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/add" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/dropout/random_uniform/min" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/dropout/random_uniform/max" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 1.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/dropout/random_uniform/RandomUniform" | |
op: "RandomUniform" | |
input: "transformer/parallel_0_5/transformer/transformer/body/dropout/Shape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/dropout/random_uniform/sub" | |
op: "Sub" | |
input: "transformer/parallel_0_5/transformer/transformer/body/dropout/random_uniform/max" | |
input: "transformer/parallel_0_5/transformer/transformer/body/dropout/random_uniform/min" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/dropout/random_uniform/mul" | |
op: "Mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/dropout/random_uniform/RandomUniform" | |
input: "transformer/parallel_0_5/transformer/transformer/body/dropout/random_uniform/sub" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/dropout/random_uniform" | |
op: "Add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/dropout/random_uniform/mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/dropout/random_uniform/min" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/dropout/add" | |
op: "Add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/dropout/keep_prob" | |
input: "transformer/parallel_0_5/transformer/transformer/body/dropout/random_uniform" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/dropout/Floor" | |
op: "Floor" | |
input: "transformer/parallel_0_5/transformer/transformer/body/dropout/add" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/dropout/div" | |
op: "RealDiv" | |
input: "transformer/parallel_0_5/transformer/transformer/body/add_timing_signal_1d/add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/dropout/keep_prob" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/dropout/mul" | |
op: "Mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/dropout/div" | |
input: "transformer/parallel_0_5/transformer/transformer/body/dropout/Floor" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/attention_bias_to_padding/Less/y" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: -1.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/attention_bias_to_padding/Less" | |
op: "Less" | |
input: "transformer/parallel_0_5/transformer/transformer/body/attention_bias_ignore_padding/ExpandDims_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/attention_bias_to_padding/Less/y" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/attention_bias_to_padding/ToFloat" | |
op: "Cast" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/attention_bias_to_padding/Less" | |
device: "/device:GPU:0" | |
attr { | |
key: "DstT" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "SrcT" | |
value { | |
type: DT_BOOL | |
} | |
} | |
attr { | |
key: "Truncate" | |
value { | |
b: false | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: 1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/attention_bias_to_padding/Squeeze" | |
op: "Squeeze" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/attention_bias_to_padding/ToFloat" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "squeeze_dims" | |
value { | |
list { | |
i: 1 | |
i: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/sub/x" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 1.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/sub" | |
op: "Sub" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/sub/x" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/attention_bias_to_padding/Squeeze" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/pad_reduce/get_ids/Reshape/shape" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: -1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/pad_reduce/get_ids/Reshape" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/attention_bias_to_padding/Squeeze" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/pad_reduce/get_ids/Reshape/shape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/pad_reduce/get_ids/Less/y" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 9.99999971718e-10 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/pad_reduce/get_ids/Less" | |
op: "Less" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/pad_reduce/get_ids/Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/pad_reduce/get_ids/Less/y" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/pad_reduce/get_ids/Where" | |
op: "Where" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/pad_reduce/get_ids/Less" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_BOOL | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/pad_reduce/get_ids/ToInt32" | |
op: "Cast" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/pad_reduce/get_ids/Where" | |
device: "/device:GPU:0" | |
attr { | |
key: "DstT" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "SrcT" | |
value { | |
type: DT_INT64 | |
} | |
} | |
attr { | |
key: "Truncate" | |
value { | |
b: false | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/pad_reduce/get_ids/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/pad_reduce/get_ids/Reshape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/pad_reduce/get_ids/strided_slice/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/pad_reduce/get_ids/strided_slice/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/pad_reduce/get_ids/strided_slice/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/pad_reduce/get_ids/strided_slice" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/pad_reduce/get_ids/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/pad_reduce/get_ids/strided_slice/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/pad_reduce/get_ids/strided_slice/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/pad_reduce/get_ids/strided_slice/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 1 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/dropout/mul" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/strided_slice/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/strided_slice/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/strided_slice/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/strided_slice" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/strided_slice/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/strided_slice/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/strided_slice/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/strided_slice_1/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/strided_slice_1/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/strided_slice_1/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/strided_slice_1" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/strided_slice_1/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/strided_slice_1/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/strided_slice_1/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale/Initializer/ones" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
dim { | |
size: 512 | |
} | |
} | |
float_val: 1.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale" | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale" | |
input: "transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale/Initializer/ones" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_17/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_17" | |
op: "Identity" | |
input: "Read_17/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias/Initializer/zeros" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
dim { | |
size: 512 | |
} | |
} | |
float_val: 0.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias" | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias" | |
input: "transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias/Initializer/zeros" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_18/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_18" | |
op: "Identity" | |
input: "Read_18/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/Const" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 9.99999997475e-07 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/Mean/reduction_indices" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: -1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/Mean" | |
op: "Mean" | |
input: "transformer/parallel_0_5/transformer/transformer/body/dropout/mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/Mean/reduction_indices" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: true | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/sub" | |
op: "Sub" | |
input: "transformer/parallel_0_5/transformer/transformer/body/dropout/mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/Mean" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/Square" | |
op: "Square" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/sub" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/Mean_1/reduction_indices" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: -1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/Mean_1" | |
op: "Mean" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/Square" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/Mean_1/reduction_indices" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: true | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/sub_1" | |
op: "Sub" | |
input: "transformer/parallel_0_5/transformer/transformer/body/dropout/mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/Mean" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/add" | |
op: "Add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/Mean_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/Rsqrt" | |
op: "Rsqrt" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/add" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/mul" | |
op: "Mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/sub_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/Rsqrt" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/mul_1" | |
op: "Mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/mul" | |
input: "Identity_17" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/add_1" | |
op: "Add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/mul_1" | |
input: "Identity_18" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel/Initializer/random_uniform/shape" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\002\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel/Initializer/random_uniform/min" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: -0.0765465572476 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel/Initializer/random_uniform/max" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0765465572476 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel/Initializer/random_uniform/RandomUniform" | |
op: "RandomUniform" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel/Initializer/random_uniform/shape" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel/Initializer/random_uniform/sub" | |
op: "Sub" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel/Initializer/random_uniform/max" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel/Initializer/random_uniform/min" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel/Initializer/random_uniform/mul" | |
op: "Mul" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel/Initializer/random_uniform/RandomUniform" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel/Initializer/random_uniform/sub" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel/Initializer/random_uniform" | |
op: "Add" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel/Initializer/random_uniform/mul" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel/Initializer/random_uniform/min" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel" | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel/Initializer/random_uniform" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_19/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/q/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_19" | |
op: "Identity" | |
input: "Read_19/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/axes" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/free" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\000\000\000\001\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/add_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/GatherV2/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/GatherV2" | |
op: "GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/free" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/GatherV2/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "Taxis" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tindices" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tparams" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/GatherV2_1/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/GatherV2_1" | |
op: "GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/axes" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/GatherV2_1/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "Taxis" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tindices" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tparams" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/Const" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/Prod" | |
op: "Prod" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/Const_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/Prod_1" | |
op: "Prod" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/GatherV2_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/Const_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/concat/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/concat" | |
op: "ConcatV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/free" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/axes" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/concat/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/stack" | |
op: "Pack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/Prod" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/Prod_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "axis" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/transpose" | |
op: "Transpose" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/add_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/concat" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tperm" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/Reshape" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/transpose" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/stack" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/transpose_1/perm" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\000\000\000\001\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/transpose_1" | |
op: "Transpose" | |
input: "Identity_19" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/transpose_1/perm" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tperm" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/Reshape_1/shape" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\002\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/Reshape_1" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/transpose_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/Reshape_1/shape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/MatMul" | |
op: "MatMul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/Reshape_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "transpose_a" | |
value { | |
b: false | |
} | |
} | |
attr { | |
key: "transpose_b" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/Const_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 512 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/concat_1/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/concat_1" | |
op: "ConcatV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/Const_2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/concat_1/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/MatMul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot/concat_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel/Initializer/random_uniform/shape" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\002\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel/Initializer/random_uniform/min" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: -0.0765465572476 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel/Initializer/random_uniform/max" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0765465572476 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel/Initializer/random_uniform/RandomUniform" | |
op: "RandomUniform" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel/Initializer/random_uniform/shape" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel/Initializer/random_uniform/sub" | |
op: "Sub" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel/Initializer/random_uniform/max" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel/Initializer/random_uniform/min" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel/Initializer/random_uniform/mul" | |
op: "Mul" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel/Initializer/random_uniform/RandomUniform" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel/Initializer/random_uniform/sub" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel/Initializer/random_uniform" | |
op: "Add" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel/Initializer/random_uniform/mul" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel/Initializer/random_uniform/min" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel" | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel/Initializer/random_uniform" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_20/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/k/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_20" | |
op: "Identity" | |
input: "Read_20/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/axes" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/free" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\000\000\000\001\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/add_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/GatherV2/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/GatherV2" | |
op: "GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/free" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/GatherV2/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "Taxis" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tindices" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tparams" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/GatherV2_1/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/GatherV2_1" | |
op: "GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/axes" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/GatherV2_1/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "Taxis" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tindices" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tparams" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/Const" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/Prod" | |
op: "Prod" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/Const_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/Prod_1" | |
op: "Prod" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/GatherV2_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/Const_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/concat/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/concat" | |
op: "ConcatV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/free" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/axes" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/concat/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/stack" | |
op: "Pack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/Prod" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/Prod_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "axis" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/transpose" | |
op: "Transpose" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/add_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/concat" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tperm" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/Reshape" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/transpose" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/stack" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/transpose_1/perm" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\000\000\000\001\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/transpose_1" | |
op: "Transpose" | |
input: "Identity_20" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/transpose_1/perm" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tperm" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/Reshape_1/shape" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\002\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/Reshape_1" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/transpose_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/Reshape_1/shape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/MatMul" | |
op: "MatMul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/Reshape_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "transpose_a" | |
value { | |
b: false | |
} | |
} | |
attr { | |
key: "transpose_b" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/Const_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 512 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/concat_1/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/concat_1" | |
op: "ConcatV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/Const_2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/concat_1/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/MatMul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot/concat_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel/Initializer/random_uniform/shape" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\002\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel/Initializer/random_uniform/min" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: -0.0765465572476 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel/Initializer/random_uniform/max" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0765465572476 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel/Initializer/random_uniform/RandomUniform" | |
op: "RandomUniform" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel/Initializer/random_uniform/shape" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel/Initializer/random_uniform/sub" | |
op: "Sub" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel/Initializer/random_uniform/max" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel/Initializer/random_uniform/min" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel/Initializer/random_uniform/mul" | |
op: "Mul" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel/Initializer/random_uniform/RandomUniform" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel/Initializer/random_uniform/sub" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel/Initializer/random_uniform" | |
op: "Add" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel/Initializer/random_uniform/mul" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel/Initializer/random_uniform/min" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel" | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel/Initializer/random_uniform" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_21/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/v/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_21" | |
op: "Identity" | |
input: "Read_21/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/axes" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/free" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\000\000\000\001\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/add_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/GatherV2/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/GatherV2" | |
op: "GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/free" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/GatherV2/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "Taxis" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tindices" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tparams" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/GatherV2_1/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/GatherV2_1" | |
op: "GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/axes" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/GatherV2_1/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "Taxis" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tindices" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tparams" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/Const" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/Prod" | |
op: "Prod" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/Const_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/Prod_1" | |
op: "Prod" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/GatherV2_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/Const_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/concat/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/concat" | |
op: "ConcatV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/free" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/axes" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/concat/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/stack" | |
op: "Pack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/Prod" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/Prod_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "axis" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/transpose" | |
op: "Transpose" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_prepostprocess/layer_norm/add_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/concat" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tperm" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/Reshape" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/transpose" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/stack" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/transpose_1/perm" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\000\000\000\001\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/transpose_1" | |
op: "Transpose" | |
input: "Identity_21" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/transpose_1/perm" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tperm" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/Reshape_1/shape" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\002\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/Reshape_1" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/transpose_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/Reshape_1/shape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/MatMul" | |
op: "MatMul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/Reshape_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "transpose_a" | |
value { | |
b: false | |
} | |
} | |
attr { | |
key: "transpose_b" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/Const_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 512 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/concat_1/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/concat_1" | |
op: "ConcatV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/Const_2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/concat_1/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/MatMul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot/concat_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/split_last_dimension/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/split_last_dimension/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice_1/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice_1/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice_1/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice_1" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/split_last_dimension/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice_1/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice_1/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice_1/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/split_last_dimension/Reshape/shape/2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 8 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/split_last_dimension/Reshape/shape/3" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 64 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/split_last_dimension/Reshape/shape" | |
op: "Pack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/split_last_dimension/Reshape/shape/2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/split_last_dimension/Reshape/shape/3" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 4 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "axis" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/split_last_dimension/Reshape" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/q/Tensordot" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/split_last_dimension/Reshape/shape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 8 | |
} | |
dim { | |
size: 64 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/transpose/perm" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 4 | |
} | |
} | |
tensor_content: "\000\000\000\000\002\000\000\000\001\000\000\000\003\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/transpose" | |
op: "Transpose" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/split_last_dimension/Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/transpose/perm" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tperm" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 8 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 64 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/split_last_dimension/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/split_last_dimension/strided_slice/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/split_last_dimension/strided_slice/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/split_last_dimension/strided_slice/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/split_last_dimension/strided_slice" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/split_last_dimension/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/split_last_dimension/strided_slice/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/split_last_dimension/strided_slice/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/split_last_dimension/strided_slice/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/split_last_dimension/strided_slice_1/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/split_last_dimension/strided_slice_1/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/split_last_dimension/strided_slice_1/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/split_last_dimension/strided_slice_1" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/split_last_dimension/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/split_last_dimension/strided_slice_1/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/split_last_dimension/strided_slice_1/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/split_last_dimension/strided_slice_1/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/split_last_dimension/Reshape/shape/2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 8 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/split_last_dimension/Reshape/shape/3" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 64 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/split_last_dimension/Reshape/shape" | |
op: "Pack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/split_last_dimension/strided_slice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/split_last_dimension/strided_slice_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/split_last_dimension/Reshape/shape/2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/split_last_dimension/Reshape/shape/3" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 4 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "axis" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/split_last_dimension/Reshape" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/k/Tensordot" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/split_last_dimension/Reshape/shape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 8 | |
} | |
dim { | |
size: 64 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/transpose/perm" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 4 | |
} | |
} | |
tensor_content: "\000\000\000\000\002\000\000\000\001\000\000\000\003\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/transpose" | |
op: "Transpose" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/split_last_dimension/Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/transpose/perm" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tperm" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 8 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 64 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/split_last_dimension/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/split_last_dimension/strided_slice/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/split_last_dimension/strided_slice/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/split_last_dimension/strided_slice/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/split_last_dimension/strided_slice" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/split_last_dimension/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/split_last_dimension/strided_slice/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/split_last_dimension/strided_slice/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/split_last_dimension/strided_slice/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/split_last_dimension/strided_slice_1/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/split_last_dimension/strided_slice_1/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/split_last_dimension/strided_slice_1/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/split_last_dimension/strided_slice_1" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/split_last_dimension/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/split_last_dimension/strided_slice_1/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/split_last_dimension/strided_slice_1/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/split_last_dimension/strided_slice_1/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/split_last_dimension/Reshape/shape/2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 8 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/split_last_dimension/Reshape/shape/3" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 64 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/split_last_dimension/Reshape/shape" | |
op: "Pack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/split_last_dimension/strided_slice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/split_last_dimension/strided_slice_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/split_last_dimension/Reshape/shape/2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/split_last_dimension/Reshape/shape/3" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 4 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "axis" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/split_last_dimension/Reshape" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/v/Tensordot" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/split_last_dimension/Reshape/shape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 8 | |
} | |
dim { | |
size: 64 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/transpose/perm" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 4 | |
} | |
} | |
tensor_content: "\000\000\000\000\002\000\000\000\001\000\000\000\003\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/transpose" | |
op: "Transpose" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/split_last_dimension/Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/transpose/perm" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tperm" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 8 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 64 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/mul/y" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.125 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/mul" | |
op: "Mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads/transpose" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/mul/y" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 8 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 64 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/MatMul" | |
op: "BatchMatMul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_1/transpose" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 8 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "adj_x" | |
value { | |
b: false | |
} | |
} | |
attr { | |
key: "adj_y" | |
value { | |
b: true | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/add" | |
op: "Add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/MatMul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/attention_bias_ignore_padding/ExpandDims_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 8 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/attention_weights" | |
op: "Softmax" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/add" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 8 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/dropout/keep_prob" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.899999976158 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/dropout/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/attention_weights" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/dropout/random_uniform/min" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/dropout/random_uniform/max" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 1.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/dropout/random_uniform/RandomUniform" | |
op: "RandomUniform" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/dropout/Shape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 8 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/dropout/random_uniform/sub" | |
op: "Sub" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/dropout/random_uniform/max" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/dropout/random_uniform/min" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/dropout/random_uniform/mul" | |
op: "Mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/dropout/random_uniform/RandomUniform" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/dropout/random_uniform/sub" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 8 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/dropout/random_uniform" | |
op: "Add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/dropout/random_uniform/mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/dropout/random_uniform/min" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 8 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/dropout/add" | |
op: "Add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/dropout/keep_prob" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/dropout/random_uniform" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 8 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/dropout/Floor" | |
op: "Floor" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/dropout/add" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 8 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/dropout/div" | |
op: "RealDiv" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/attention_weights" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/dropout/keep_prob" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 8 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/dropout/mul" | |
op: "Mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/dropout/div" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/dropout/Floor" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 8 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/dropout/mul" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/strided_slice/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/strided_slice/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/strided_slice/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/strided_slice" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/strided_slice/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/strided_slice/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/strided_slice/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/strided_slice_1/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/strided_slice_1/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 3 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/strided_slice_1/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/strided_slice_1" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/strided_slice_1/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/strided_slice_1/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/strided_slice_1/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/strided_slice_2/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 3 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/strided_slice_2/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 4 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/strided_slice_2/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/strided_slice_2" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/strided_slice_2/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/strided_slice_2/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/strided_slice_2/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/transpose/perm" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 4 | |
} | |
} | |
tensor_content: "\000\000\000\000\002\000\000\000\003\000\000\000\001\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/transpose" | |
op: "Transpose" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/dropout/mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/transpose/perm" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tperm" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 8 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/Pow/y" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.20000000298 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/Pow" | |
op: "Pow" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/transpose" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/Pow/y" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 8 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/FloorMod/x" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: -8 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/FloorMod/y" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 3 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/FloorMod" | |
op: "FloorMod" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/FloorMod/x" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/FloorMod/y" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/Pad/paddings/3/0" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/Pad/paddings/3" | |
op: "Pack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/Pad/paddings/3/0" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/FloorMod" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "axis" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/Pad/paddings/0_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\000\000\000\000\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/Pad/paddings/1_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\000\000\000\000\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/Pad/paddings/2_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\000\000\000\000\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/Pad/paddings" | |
op: "Pack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/Pad/paddings/0_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/Pad/paddings/1_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/Pad/paddings/2_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/Pad/paddings/3" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 4 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "axis" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/Pad" | |
op: "Pad" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/Pow" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/Pad/paddings" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tpaddings" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 9 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/Pad" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/strided_slice/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/strided_slice/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/strided_slice/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/strided_slice" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/strided_slice/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/strided_slice/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/strided_slice/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/strided_slice_1/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/strided_slice_1/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/strided_slice_1/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/strided_slice_1" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/strided_slice_1/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/strided_slice_1/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/strided_slice_1/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/strided_slice_2/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/strided_slice_2/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 3 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/strided_slice_2/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/strided_slice_2" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/strided_slice_2/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/strided_slice_2/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/strided_slice_2/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/Reshape/shape/3" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 3 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/Reshape/shape/4" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 3 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/Reshape/shape" | |
op: "Pack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/strided_slice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/strided_slice_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/strided_slice_2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/Reshape/shape/3" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/Reshape/shape/4" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 5 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 5 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "axis" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/Reshape" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/Pad" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/Reshape/shape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 3 | |
} | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/Max/reduction_indices" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 4 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/Max" | |
op: "Max" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/split_last_dimension/Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/Max/reduction_indices" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/attention/tag" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_STRING | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_STRING | |
tensor_shape { | |
} | |
string_val: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/attention" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/attention" | |
op: "ImageSummary" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/attention/tag" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/Max" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "bad_color" | |
value { | |
tensor { | |
dtype: DT_UINT8 | |
tensor_shape { | |
dim { | |
size: 4 | |
} | |
} | |
int_val: 255 | |
int_val: 0 | |
int_val: 0 | |
int_val: 255 | |
} | |
} | |
} | |
attr { | |
key: "max_images" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/MatMul_1" | |
op: "BatchMatMul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/dropout/mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/split_heads_2/transpose" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 8 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 64 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "adj_x" | |
value { | |
b: false | |
} | |
} | |
attr { | |
key: "adj_y" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/transpose/perm" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 4 | |
} | |
} | |
tensor_content: "\000\000\000\000\002\000\000\000\001\000\000\000\003\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/transpose" | |
op: "Transpose" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/dot_product_attention/MatMul_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/transpose/perm" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tperm" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 8 | |
} | |
dim { | |
size: 64 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/combine_last_two_dimensions/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/transpose" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/combine_last_two_dimensions/strided_slice/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/combine_last_two_dimensions/strided_slice/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/combine_last_two_dimensions/strided_slice/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/combine_last_two_dimensions/strided_slice" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/combine_last_two_dimensions/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/combine_last_two_dimensions/strided_slice/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/combine_last_two_dimensions/strided_slice/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/combine_last_two_dimensions/strided_slice/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/combine_last_two_dimensions/strided_slice_1/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/combine_last_two_dimensions/strided_slice_1/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/combine_last_two_dimensions/strided_slice_1/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/combine_last_two_dimensions/strided_slice_1" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/combine_last_two_dimensions/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/combine_last_two_dimensions/strided_slice_1/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/combine_last_two_dimensions/strided_slice_1/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/combine_last_two_dimensions/strided_slice_1/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/combine_last_two_dimensions/Reshape/shape/2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 512 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/combine_last_two_dimensions/Reshape/shape" | |
op: "Pack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/combine_last_two_dimensions/strided_slice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/combine_last_two_dimensions/strided_slice_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/combine_last_two_dimensions/Reshape/shape/2" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 3 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "axis" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/combine_last_two_dimensions/Reshape" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/transpose" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/combine_last_two_dimensions/Reshape/shape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel/Initializer/random_uniform/shape" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\002\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel/Initializer/random_uniform/min" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: -0.0765465572476 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel/Initializer/random_uniform/max" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0765465572476 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel/Initializer/random_uniform/RandomUniform" | |
op: "RandomUniform" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel/Initializer/random_uniform/shape" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel/Initializer/random_uniform/sub" | |
op: "Sub" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel/Initializer/random_uniform/max" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel/Initializer/random_uniform/min" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel/Initializer/random_uniform/mul" | |
op: "Mul" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel/Initializer/random_uniform/RandomUniform" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel/Initializer/random_uniform/sub" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel/Initializer/random_uniform" | |
op: "Add" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel/Initializer/random_uniform/mul" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel/Initializer/random_uniform/min" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel" | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel/Initializer/random_uniform" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_22/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_22" | |
op: "Identity" | |
input: "Read_22/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/axes" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/free" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\000\000\000\001\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/combine_last_two_dimensions/Reshape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/GatherV2/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/GatherV2" | |
op: "GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/free" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/GatherV2/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "Taxis" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tindices" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tparams" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/GatherV2_1/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/GatherV2_1" | |
op: "GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/axes" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/GatherV2_1/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "Taxis" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tindices" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tparams" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/Const" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/Prod" | |
op: "Prod" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/Const_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/Prod_1" | |
op: "Prod" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/GatherV2_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/Const_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/concat/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/concat" | |
op: "ConcatV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/free" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/axes" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/concat/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/stack" | |
op: "Pack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/Prod" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/Prod_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "axis" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/transpose" | |
op: "Transpose" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/combine_heads/combine_last_two_dimensions/Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/concat" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tperm" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/Reshape" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/transpose" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/stack" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/transpose_1/perm" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\000\000\000\001\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/transpose_1" | |
op: "Transpose" | |
input: "Identity_22" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/transpose_1/perm" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tperm" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/Reshape_1/shape" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\002\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/Reshape_1" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/transpose_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/Reshape_1/shape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/MatMul" | |
op: "MatMul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/Reshape_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "transpose_a" | |
value { | |
b: false | |
} | |
} | |
attr { | |
key: "transpose_b" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/Const_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 512 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/concat_1/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/concat_1" | |
op: "ConcatV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/Const_2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/concat_1/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/MatMul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot/concat_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/dropout/keep_prob" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.899999976158 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/dropout/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/dropout/random_uniform/min" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/dropout/random_uniform/max" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 1.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/dropout/random_uniform/RandomUniform" | |
op: "RandomUniform" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/dropout/Shape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/dropout/random_uniform/sub" | |
op: "Sub" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/dropout/random_uniform/max" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/dropout/random_uniform/min" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/dropout/random_uniform/mul" | |
op: "Mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/dropout/random_uniform/RandomUniform" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/dropout/random_uniform/sub" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/dropout/random_uniform" | |
op: "Add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/dropout/random_uniform/mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/dropout/random_uniform/min" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/dropout/add" | |
op: "Add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/dropout/keep_prob" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/dropout/random_uniform" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/dropout/Floor" | |
op: "Floor" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/dropout/add" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/dropout/div" | |
op: "RealDiv" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/multihead_attention/output_transform/Tensordot" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/dropout/keep_prob" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/dropout/mul" | |
op: "Mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/dropout/div" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/dropout/Floor" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/add" | |
op: "Add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/dropout/mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/dropout/mul" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/add" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/strided_slice/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/strided_slice/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/strided_slice/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/strided_slice" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/strided_slice/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/strided_slice/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/strided_slice/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/strided_slice_1/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/strided_slice_1/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/strided_slice_1/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/strided_slice_1" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/strided_slice_1/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/strided_slice_1/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/strided_slice_1/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_scale/Initializer/ones" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_scale" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
dim { | |
size: 512 | |
} | |
} | |
float_val: 1.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_scale" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_scale" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_scale" | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_scale/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_scale" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_scale/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_scale" | |
input: "transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_scale/Initializer/ones" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_scale" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_scale/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_scale" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_scale" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_23/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_scale" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_23" | |
op: "Identity" | |
input: "Read_23/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_bias/Initializer/zeros" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_bias" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
dim { | |
size: 512 | |
} | |
} | |
float_val: 0.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_bias" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_bias" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_bias" | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_bias/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_bias" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_bias/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_bias" | |
input: "transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_bias/Initializer/zeros" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_bias" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_bias/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_bias" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_bias" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_24/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/layer_norm_bias" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_24" | |
op: "Identity" | |
input: "Read_24/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/Const" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 9.99999997475e-07 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/Mean/reduction_indices" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: -1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/Mean" | |
op: "Mean" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/Mean/reduction_indices" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: true | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/sub" | |
op: "Sub" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/Mean" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/Square" | |
op: "Square" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/sub" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/Mean_1/reduction_indices" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: -1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/Mean_1" | |
op: "Mean" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/Square" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/Mean_1/reduction_indices" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: true | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/sub_1" | |
op: "Sub" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/Mean" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/add" | |
op: "Add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/Mean_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/Rsqrt" | |
op: "Rsqrt" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/add" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/mul" | |
op: "Mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/sub_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/Rsqrt" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/mul_1" | |
op: "Mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/mul" | |
input: "Identity_23" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/add_1" | |
op: "Add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/mul_1" | |
input: "Identity_24" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/add_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/strided_slice/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/strided_slice/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/strided_slice/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/strided_slice" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/strided_slice/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/strided_slice/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/strided_slice/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/strided_slice_1/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/strided_slice_1/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/strided_slice_1/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/strided_slice_1" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/strided_slice_1/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/strided_slice_1/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/strided_slice_1/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/concat/values_0" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: -1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/concat/values_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 512 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/concat/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/concat" | |
op: "ConcatV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/concat/values_0" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/concat/values_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/concat/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/Reshape" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_prepostprocess/layer_norm/add_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/concat" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/pad_reduce/remove/GatherNd" | |
op: "GatherNd" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/pad_reduce/get_ids/ToInt32" | |
device: "/device:GPU:0" | |
attr { | |
key: "Tindices" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tparams" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/ExpandDims/dim" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/ExpandDims" | |
op: "ExpandDims" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/pad_reduce/remove/GatherNd" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/ExpandDims/dim" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tdim" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv1/kernel/Initializer/random_uniform/shape" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv1/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\002\000\000\000\010\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv1/kernel/Initializer/random_uniform/min" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv1/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: -0.0484122931957 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv1/kernel/Initializer/random_uniform/max" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv1/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0484122931957 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv1/kernel/Initializer/random_uniform/RandomUniform" | |
op: "RandomUniform" | |
input: "transformer/body/encoder/layer_0/ffn/conv1/kernel/Initializer/random_uniform/shape" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv1/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 2048 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv1/kernel/Initializer/random_uniform/sub" | |
op: "Sub" | |
input: "transformer/body/encoder/layer_0/ffn/conv1/kernel/Initializer/random_uniform/max" | |
input: "transformer/body/encoder/layer_0/ffn/conv1/kernel/Initializer/random_uniform/min" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv1/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv1/kernel/Initializer/random_uniform/mul" | |
op: "Mul" | |
input: "transformer/body/encoder/layer_0/ffn/conv1/kernel/Initializer/random_uniform/RandomUniform" | |
input: "transformer/body/encoder/layer_0/ffn/conv1/kernel/Initializer/random_uniform/sub" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv1/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 2048 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv1/kernel/Initializer/random_uniform" | |
op: "Add" | |
input: "transformer/body/encoder/layer_0/ffn/conv1/kernel/Initializer/random_uniform/mul" | |
input: "transformer/body/encoder/layer_0/ffn/conv1/kernel/Initializer/random_uniform/min" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv1/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 2048 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv1/kernel" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv1/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 2048 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/body/encoder/layer_0/ffn/conv1/kernel" | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv1/kernel/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/body/encoder/layer_0/ffn/conv1/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv1/kernel/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/body/encoder/layer_0/ffn/conv1/kernel" | |
input: "transformer/body/encoder/layer_0/ffn/conv1/kernel/Initializer/random_uniform" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv1/kernel" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv1/kernel/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_0/ffn/conv1/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv1/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 2048 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_25/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_0/ffn/conv1/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 2048 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_25" | |
op: "Identity" | |
input: "Read_25/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 2048 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv1/bias/Initializer/zeros/shape_as_tensor" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv1/bias" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2048 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv1/bias/Initializer/zeros/Const" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv1/bias" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv1/bias/Initializer/zeros" | |
op: "Fill" | |
input: "transformer/body/encoder/layer_0/ffn/conv1/bias/Initializer/zeros/shape_as_tensor" | |
input: "transformer/body/encoder/layer_0/ffn/conv1/bias/Initializer/zeros/Const" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv1/bias" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2048 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "index_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv1/bias" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv1/bias" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 2048 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/body/encoder/layer_0/ffn/conv1/bias" | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv1/bias/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/body/encoder/layer_0/ffn/conv1/bias" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv1/bias/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/body/encoder/layer_0/ffn/conv1/bias" | |
input: "transformer/body/encoder/layer_0/ffn/conv1/bias/Initializer/zeros" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv1/bias" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv1/bias/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_0/ffn/conv1/bias" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv1/bias" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2048 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_26/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_0/ffn/conv1/bias" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2048 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_26" | |
op: "Identity" | |
input: "Read_26/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2048 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/axes" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/free" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\000\000\000\001\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/ExpandDims" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/GatherV2/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/GatherV2" | |
op: "GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/free" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/GatherV2/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "Taxis" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tindices" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tparams" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/GatherV2_1/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/GatherV2_1" | |
op: "GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/axes" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/GatherV2_1/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "Taxis" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tindices" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tparams" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/Const" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/Prod" | |
op: "Prod" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/Const_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/Prod_1" | |
op: "Prod" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/GatherV2_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/Const_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/concat/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/concat" | |
op: "ConcatV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/free" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/axes" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/concat/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/stack" | |
op: "Pack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/Prod" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/Prod_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "axis" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/transpose" | |
op: "Transpose" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/ExpandDims" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/concat" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tperm" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/Reshape" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/transpose" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/stack" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/transpose_1/perm" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\000\000\000\001\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/transpose_1" | |
op: "Transpose" | |
input: "Identity_25" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/transpose_1/perm" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tperm" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 2048 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/Reshape_1/shape" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\002\000\000\000\010\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/Reshape_1" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/transpose_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/Reshape_1/shape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 2048 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/MatMul" | |
op: "MatMul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/Reshape_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 2048 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "transpose_a" | |
value { | |
b: false | |
} | |
} | |
attr { | |
key: "transpose_b" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/Const_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2048 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/concat_1/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/concat_1" | |
op: "ConcatV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/Const_2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/concat_1/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/MatMul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot/concat_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 2048 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/BiasAdd" | |
op: "BiasAdd" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Tensordot" | |
input: "Identity_26" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 2048 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "data_format" | |
value { | |
s: "NHWC" | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Relu" | |
op: "Relu" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/BiasAdd" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 2048 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/dropout/keep_prob" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.899999976158 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/dropout/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Relu" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/dropout/random_uniform/min" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/dropout/random_uniform/max" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 1.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/dropout/random_uniform/RandomUniform" | |
op: "RandomUniform" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/dropout/Shape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 2048 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/dropout/random_uniform/sub" | |
op: "Sub" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/dropout/random_uniform/max" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/dropout/random_uniform/min" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/dropout/random_uniform/mul" | |
op: "Mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/dropout/random_uniform/RandomUniform" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/dropout/random_uniform/sub" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 2048 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/dropout/random_uniform" | |
op: "Add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/dropout/random_uniform/mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/dropout/random_uniform/min" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 2048 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/dropout/add" | |
op: "Add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/dropout/keep_prob" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/dropout/random_uniform" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 2048 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/dropout/Floor" | |
op: "Floor" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/dropout/add" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 2048 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/dropout/div" | |
op: "RealDiv" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv1/Relu" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/dropout/keep_prob" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 2048 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/dropout/mul" | |
op: "Mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/dropout/div" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/dropout/Floor" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 2048 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv2/kernel/Initializer/random_uniform/shape" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv2/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\010\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv2/kernel/Initializer/random_uniform/min" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv2/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: -0.0484122931957 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv2/kernel/Initializer/random_uniform/max" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv2/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0484122931957 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv2/kernel/Initializer/random_uniform/RandomUniform" | |
op: "RandomUniform" | |
input: "transformer/body/encoder/layer_0/ffn/conv2/kernel/Initializer/random_uniform/shape" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv2/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2048 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv2/kernel/Initializer/random_uniform/sub" | |
op: "Sub" | |
input: "transformer/body/encoder/layer_0/ffn/conv2/kernel/Initializer/random_uniform/max" | |
input: "transformer/body/encoder/layer_0/ffn/conv2/kernel/Initializer/random_uniform/min" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv2/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv2/kernel/Initializer/random_uniform/mul" | |
op: "Mul" | |
input: "transformer/body/encoder/layer_0/ffn/conv2/kernel/Initializer/random_uniform/RandomUniform" | |
input: "transformer/body/encoder/layer_0/ffn/conv2/kernel/Initializer/random_uniform/sub" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv2/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2048 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv2/kernel/Initializer/random_uniform" | |
op: "Add" | |
input: "transformer/body/encoder/layer_0/ffn/conv2/kernel/Initializer/random_uniform/mul" | |
input: "transformer/body/encoder/layer_0/ffn/conv2/kernel/Initializer/random_uniform/min" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv2/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2048 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv2/kernel" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv2/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 2048 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/body/encoder/layer_0/ffn/conv2/kernel" | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv2/kernel/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/body/encoder/layer_0/ffn/conv2/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv2/kernel/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/body/encoder/layer_0/ffn/conv2/kernel" | |
input: "transformer/body/encoder/layer_0/ffn/conv2/kernel/Initializer/random_uniform" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv2/kernel" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv2/kernel/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_0/ffn/conv2/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv2/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2048 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_27/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_0/ffn/conv2/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2048 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_27" | |
op: "Identity" | |
input: "Read_27/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2048 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv2/bias/Initializer/zeros" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv2/bias" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
dim { | |
size: 512 | |
} | |
} | |
float_val: 0.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv2/bias" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv2/bias" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/body/encoder/layer_0/ffn/conv2/bias" | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv2/bias/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/body/encoder/layer_0/ffn/conv2/bias" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv2/bias/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/body/encoder/layer_0/ffn/conv2/bias" | |
input: "transformer/body/encoder/layer_0/ffn/conv2/bias/Initializer/zeros" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv2/bias" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_0/ffn/conv2/bias/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_0/ffn/conv2/bias" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_0/ffn/conv2/bias" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_28/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_0/ffn/conv2/bias" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_28" | |
op: "Identity" | |
input: "Read_28/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/axes" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/free" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\000\000\000\001\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/dropout/mul" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/GatherV2/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/GatherV2" | |
op: "GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/free" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/GatherV2/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "Taxis" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tindices" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tparams" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/GatherV2_1/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/GatherV2_1" | |
op: "GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/axes" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/GatherV2_1/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "Taxis" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tindices" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tparams" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/Const" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/Prod" | |
op: "Prod" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/Const_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/Prod_1" | |
op: "Prod" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/GatherV2_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/Const_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/concat/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/concat" | |
op: "ConcatV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/free" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/axes" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/concat/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/stack" | |
op: "Pack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/Prod" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/Prod_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "axis" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/transpose" | |
op: "Transpose" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/dropout/mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/concat" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tperm" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 2048 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/Reshape" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/transpose" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/stack" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/transpose_1/perm" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\000\000\000\001\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/transpose_1" | |
op: "Transpose" | |
input: "Identity_27" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/transpose_1/perm" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tperm" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2048 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/Reshape_1/shape" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\010\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/Reshape_1" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/transpose_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/Reshape_1/shape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2048 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/MatMul" | |
op: "MatMul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/Reshape_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "transpose_a" | |
value { | |
b: false | |
} | |
} | |
attr { | |
key: "transpose_b" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/Const_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 512 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/concat_1/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/concat_1" | |
op: "ConcatV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/Const_2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/concat_1/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/MatMul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot/concat_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/BiasAdd" | |
op: "BiasAdd" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/Tensordot" | |
input: "Identity_28" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "data_format" | |
value { | |
s: "NHWC" | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/Squeeze" | |
op: "Squeeze" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/conv2/BiasAdd" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "squeeze_dims" | |
value { | |
list { | |
i: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/pad_reduce/restore/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/Squeeze" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/pad_reduce/restore/strided_slice/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/pad_reduce/restore/strided_slice/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/pad_reduce/restore/strided_slice/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/pad_reduce/restore/strided_slice" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/pad_reduce/restore/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/pad_reduce/restore/strided_slice/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/pad_reduce/restore/strided_slice/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/pad_reduce/restore/strided_slice/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 1 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/pad_reduce/restore/concat/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/pad_reduce/restore/concat" | |
op: "ConcatV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/pad_reduce/get_ids/strided_slice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/pad_reduce/restore/strided_slice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/pad_reduce/restore/concat/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/pad_reduce/restore/ScatterNd" | |
op: "ScatterNd" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/pad_reduce/get_ids/ToInt32" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/Squeeze" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/pad_reduce/restore/concat" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tindices" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/Reshape_1/shape/2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 512 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/Reshape_1/shape" | |
op: "Pack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/strided_slice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/strided_slice_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/Reshape_1/shape/2" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 3 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "axis" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/Reshape_1" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/pad_reduce/restore/ScatterNd" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/Reshape_1/shape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/dropout/keep_prob" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.899999976158 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/dropout/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/Reshape_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/dropout/random_uniform/min" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/dropout/random_uniform/max" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 1.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/dropout/random_uniform/RandomUniform" | |
op: "RandomUniform" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/dropout/Shape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/dropout/random_uniform/sub" | |
op: "Sub" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/dropout/random_uniform/max" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/dropout/random_uniform/min" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/dropout/random_uniform/mul" | |
op: "Mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/dropout/random_uniform/RandomUniform" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/dropout/random_uniform/sub" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/dropout/random_uniform" | |
op: "Add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/dropout/random_uniform/mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/dropout/random_uniform/min" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/dropout/add" | |
op: "Add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/dropout/keep_prob" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/dropout/random_uniform" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/dropout/Floor" | |
op: "Floor" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/dropout/add" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/dropout/div" | |
op: "RealDiv" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/Reshape_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/dropout/keep_prob" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/dropout/mul" | |
op: "Mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/dropout/div" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/dropout/Floor" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/add" | |
op: "Add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/dropout/mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/self_attention/layer_postprocess/add" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/add" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/strided_slice/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/strided_slice/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/strided_slice/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/strided_slice" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/strided_slice/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/strided_slice/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/strided_slice/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/strided_slice_1/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/strided_slice_1/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/strided_slice_1/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/strided_slice_1" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/strided_slice_1/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/strided_slice_1/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/strided_slice_1/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale/Initializer/ones" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
dim { | |
size: 512 | |
} | |
} | |
float_val: 1.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale" | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale" | |
input: "transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale/Initializer/ones" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_29/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_scale" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_29" | |
op: "Identity" | |
input: "Read_29/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias/Initializer/zeros" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
dim { | |
size: 512 | |
} | |
} | |
float_val: 0.0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias" | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias" | |
input: "transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias/Initializer/zeros" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_30/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/layer_norm_bias" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_30" | |
op: "Identity" | |
input: "Read_30/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/Const" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 9.99999997475e-07 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/Mean/reduction_indices" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: -1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/Mean" | |
op: "Mean" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/Mean/reduction_indices" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: true | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/sub" | |
op: "Sub" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/Mean" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/Square" | |
op: "Square" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/sub" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/Mean_1/reduction_indices" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: -1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/Mean_1" | |
op: "Mean" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/Square" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/Mean_1/reduction_indices" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: true | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/sub_1" | |
op: "Sub" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_0/ffn/layer_postprocess/add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/Mean" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/add" | |
op: "Add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/Mean_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/Rsqrt" | |
op: "Rsqrt" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/add" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/mul" | |
op: "Mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/sub_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/Rsqrt" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/mul_1" | |
op: "Mul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/mul" | |
input: "Identity_29" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/add_1" | |
op: "Add" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/mul_1" | |
input: "Identity_30" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel/Initializer/random_uniform/shape" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\002\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel/Initializer/random_uniform/min" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: -0.0765465572476 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel/Initializer/random_uniform/max" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0765465572476 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel/Initializer/random_uniform/RandomUniform" | |
op: "RandomUniform" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel/Initializer/random_uniform/shape" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel/Initializer/random_uniform/sub" | |
op: "Sub" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel/Initializer/random_uniform/max" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel/Initializer/random_uniform/min" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel/Initializer/random_uniform/mul" | |
op: "Mul" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel/Initializer/random_uniform/RandomUniform" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel/Initializer/random_uniform/sub" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel/Initializer/random_uniform" | |
op: "Add" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel/Initializer/random_uniform/mul" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel/Initializer/random_uniform/min" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel" | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel/Initializer/random_uniform" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_31/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/q/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_31" | |
op: "Identity" | |
input: "Read_31/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/axes" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/free" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\000\000\000\001\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/add_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/GatherV2/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/GatherV2" | |
op: "GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/free" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/GatherV2/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "Taxis" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tindices" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tparams" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/GatherV2_1/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/GatherV2_1" | |
op: "GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/axes" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/GatherV2_1/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "Taxis" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tindices" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tparams" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/Const" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/Prod" | |
op: "Prod" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/Const_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/Prod_1" | |
op: "Prod" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/GatherV2_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/Const_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/concat/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/concat" | |
op: "ConcatV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/free" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/axes" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/concat/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/stack" | |
op: "Pack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/Prod" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/Prod_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "axis" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/transpose" | |
op: "Transpose" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/add_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/concat" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tperm" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/Reshape" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/transpose" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/stack" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/transpose_1/perm" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\000\000\000\001\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/transpose_1" | |
op: "Transpose" | |
input: "Identity_31" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/transpose_1/perm" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tperm" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/Reshape_1/shape" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\002\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/Reshape_1" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/transpose_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/Reshape_1/shape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/MatMul" | |
op: "MatMul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/Reshape_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "transpose_a" | |
value { | |
b: false | |
} | |
} | |
attr { | |
key: "transpose_b" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/Const_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 512 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/concat_1/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/concat_1" | |
op: "ConcatV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/Const_2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/concat_1/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/MatMul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot/concat_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel/Initializer/random_uniform/shape" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\002\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel/Initializer/random_uniform/min" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: -0.0765465572476 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel/Initializer/random_uniform/max" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0765465572476 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel/Initializer/random_uniform/RandomUniform" | |
op: "RandomUniform" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel/Initializer/random_uniform/shape" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel/Initializer/random_uniform/sub" | |
op: "Sub" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel/Initializer/random_uniform/max" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel/Initializer/random_uniform/min" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel/Initializer/random_uniform/mul" | |
op: "Mul" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel/Initializer/random_uniform/RandomUniform" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel/Initializer/random_uniform/sub" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel/Initializer/random_uniform" | |
op: "Add" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel/Initializer/random_uniform/mul" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel/Initializer/random_uniform/min" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel" | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel/Initializer/random_uniform" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_32/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/k/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_32" | |
op: "Identity" | |
input: "Read_32/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/axes" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/free" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\000\000\000\001\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/add_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/GatherV2/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/GatherV2" | |
op: "GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/free" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/GatherV2/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "Taxis" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tindices" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tparams" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/GatherV2_1/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/GatherV2_1" | |
op: "GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/axes" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/GatherV2_1/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "Taxis" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tindices" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tparams" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/Const" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/Prod" | |
op: "Prod" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/Const_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/Prod_1" | |
op: "Prod" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/GatherV2_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/Const_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/concat/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/concat" | |
op: "ConcatV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/free" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/axes" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/concat/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/stack" | |
op: "Pack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/Prod" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/Prod_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "axis" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/transpose" | |
op: "Transpose" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/add_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/concat" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tperm" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/Reshape" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/transpose" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/stack" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/transpose_1/perm" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\000\000\000\001\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/transpose_1" | |
op: "Transpose" | |
input: "Identity_32" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/transpose_1/perm" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tperm" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/Reshape_1/shape" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\002\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/Reshape_1" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/transpose_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/Reshape_1/shape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/MatMul" | |
op: "MatMul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/Reshape_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "transpose_a" | |
value { | |
b: false | |
} | |
} | |
attr { | |
key: "transpose_b" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/Const_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 512 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/concat_1/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/concat_1" | |
op: "ConcatV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/Const_2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/concat_1/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/MatMul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot/concat_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel/Initializer/random_uniform/shape" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\002\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel/Initializer/random_uniform/min" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: -0.0765465572476 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel/Initializer/random_uniform/max" | |
op: "Const" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_FLOAT | |
tensor_shape { | |
} | |
float_val: 0.0765465572476 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel/Initializer/random_uniform/RandomUniform" | |
op: "RandomUniform" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel/Initializer/random_uniform/shape" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "seed" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "seed2" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel/Initializer/random_uniform/sub" | |
op: "Sub" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel/Initializer/random_uniform/max" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel/Initializer/random_uniform/min" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel/Initializer/random_uniform/mul" | |
op: "Mul" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel/Initializer/random_uniform/RandomUniform" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel/Initializer/random_uniform/sub" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel/Initializer/random_uniform" | |
op: "Add" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel/Initializer/random_uniform/mul" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel/Initializer/random_uniform/min" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel" | |
op: "VarHandleOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "container" | |
value { | |
s: "" | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "shape" | |
value { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
attr { | |
key: "shared_name" | |
value { | |
s: "transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel" | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel/IsInitialized/VarIsInitializedOp" | |
op: "VarIsInitializedOp" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel/Assign" | |
op: "AssignVariableOp" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel/Initializer/random_uniform" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel" | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel/Read/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_class" | |
value { | |
list { | |
s: "loc:@transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel" | |
} | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Read_33/ReadVariableOp" | |
op: "ReadVariableOp" | |
input: "transformer/body/encoder/layer_1/self_attention/multihead_attention/v/kernel" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
} | |
node { | |
name: "Identity_33" | |
op: "Identity" | |
input: "Read_33/ReadVariableOp" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/axes" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/free" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\000\000\000\001\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/add_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/GatherV2/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/GatherV2" | |
op: "GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/free" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/GatherV2/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "Taxis" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tindices" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tparams" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/GatherV2_1/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/GatherV2_1" | |
op: "GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/axes" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/GatherV2_1/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "Taxis" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tindices" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tparams" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/Const" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/Prod" | |
op: "Prod" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/Const_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/Prod_1" | |
op: "Prod" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/GatherV2_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/Const_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "keep_dims" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/concat/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/concat" | |
op: "ConcatV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/free" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/axes" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/concat/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/stack" | |
op: "Pack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/Prod" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/Prod_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "axis" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/transpose" | |
op: "Transpose" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/layer_prepostprocess/layer_norm/add_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/concat" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tperm" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/Reshape" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/transpose" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/stack" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/transpose_1/perm" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\000\000\000\001\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/transpose_1" | |
op: "Transpose" | |
input: "Identity_33" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/transpose_1/perm" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tperm" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/Reshape_1/shape" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 2 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 2 | |
} | |
} | |
tensor_content: "\000\002\000\000\000\002\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/Reshape_1" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/transpose_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/Reshape_1/shape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 512 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/MatMul" | |
op: "MatMul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/Reshape_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "transpose_a" | |
value { | |
b: false | |
} | |
} | |
attr { | |
key: "transpose_b" | |
value { | |
b: false | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/Const_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 512 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/concat_1/axis" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/concat_1" | |
op: "ConcatV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/GatherV2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/Const_2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/concat_1/axis" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 2 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "Tidx" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/MatMul" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/v/Tensordot/concat_1" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 512 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/split_last_dimension/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/split_last_dimension/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice_1/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice_1/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 2 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice_1/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice_1" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/split_last_dimension/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice_1/stack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice_1/stack_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice_1/stack_2" | |
device: "/device:GPU:0" | |
attr { | |
key: "Index" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "begin_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "ellipsis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "end_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "new_axis_mask" | |
value { | |
i: 0 | |
} | |
} | |
attr { | |
key: "shrink_axis_mask" | |
value { | |
i: 1 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/split_last_dimension/Reshape/shape/2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 8 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/split_last_dimension/Reshape/shape/3" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
} | |
int_val: 64 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/split_last_dimension/Reshape/shape" | |
op: "Pack" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/split_last_dimension/strided_slice_1" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/split_last_dimension/Reshape/shape/2" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/split_last_dimension/Reshape/shape/3" | |
device: "/device:GPU:0" | |
attr { | |
key: "N" | |
value { | |
i: 4 | |
} | |
} | |
attr { | |
key: "T" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "axis" | |
value { | |
i: 0 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/split_last_dimension/Reshape" | |
op: "Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/q/Tensordot" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/split_last_dimension/Reshape/shape" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tshape" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 8 | |
} | |
dim { | |
size: 64 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/transpose/perm" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 4 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 4 | |
} | |
} | |
tensor_content: "\000\000\000\000\002\000\000\000\001\000\000\000\003\000\000\000" | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/transpose" | |
op: "Transpose" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/split_last_dimension/Reshape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads/transpose/perm" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "Tperm" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 8 | |
} | |
dim { | |
size: -1 | |
} | |
dim { | |
size: 64 | |
} | |
} | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads_1/split_last_dimension/Shape" | |
op: "Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/k/Tensordot" | |
device: "/device:GPU:0" | |
attr { | |
key: "T" | |
value { | |
type: DT_FLOAT | |
} | |
} | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 3 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "out_type" | |
value { | |
type: DT_INT32 | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads_1/split_last_dimension/strided_slice/stack" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 0 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads_1/split_last_dimension/strided_slice/stack_1" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads_1/split_last_dimension/strided_slice/stack_2" | |
op: "Const" | |
device: "/device:GPU:0" | |
attr { | |
key: "_output_shapes" | |
value { | |
list { | |
shape { | |
dim { | |
size: 1 | |
} | |
} | |
} | |
} | |
} | |
attr { | |
key: "dtype" | |
value { | |
type: DT_INT32 | |
} | |
} | |
attr { | |
key: "value" | |
value { | |
tensor { | |
dtype: DT_INT32 | |
tensor_shape { | |
dim { | |
size: 1 | |
} | |
} | |
int_val: 1 | |
} | |
} | |
} | |
} | |
node { | |
name: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads_1/split_last_dimension/strided_slice" | |
op: "StridedSlice" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads_1/split_last_dimension/Shape" | |
input: "transformer/parallel_0_5/transformer/transformer/body/encoder/layer_1/self_attention/multihead_attention/split_heads_1/split_last_dimension/strided_slice/stack" | |
input: "transformer/parallel_0_5/transformer/transforme |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment