fix internal_convert_to_tensor shape exception for scalar value.

Oceania2018 · Oceania2018 · commit 0c6f8cd9e4ec · 2019-02-06T05:02:49.000-06:00
diff --git a/docs/source/Variable.md b/docs/source/Variable.md
@@ -1,2 +1,19 @@
 # Chapter. Variable
 
+Variables in TensorFlow are mainly used to represent the mutable parameter values of a machine learning model. Variables can be initialized by the `tf.Variable` function. During graph computation, variables are modified by other operations. Variables exist in the session: as long as they are in the same session, other computing nodes on the network can access the same variable value. Variables are lazily loaded and only request memory space when they are used.
+
+TensorFlow中变量主要用来表示机器学习模型中的可变参数值，变量可以通过`tf.Variable` 类进行初始化。在图运行过程中，通过各种操作对变量进行修改。变量存在于会话当中，只要是在同一个会话里，网络上的其它计算节点都可以访问到相同的变量值。变量采用延迟加载的方式，只有使用的时候才会申请内存空间。
+
+```csharp
+var x = tf.Variable(10, name: "x");
+using (var session = tf.Session())
+{
+    session.run(x.initializer);
+    var result = session.run(x);
+    Console.Write(result); // should be 10
+}
+```
+
+The above code first creates a variable operation, initializes the variable, then runs the session, and finally gets the result. This code is very simple, but it shows the complete process of how TensorFlow operates on variables. When creating a variable, you pass a `tensor` as the initial value to the function `Variable()`. TensorFlow provides a series of operators to initialize the tensor; the initial value is either a constant or a random value.
+
+以上代码先创建变量操作，初始化变量，再运行会话，最后得到结果。这段代码非常简单，但是它体现了整个TensorFlow对变量操作的完整流程。当创建一个变量时，你将一个`张量`作为初始值传入函数`Variable()`。TensorFlow提供了一系列操作符来初始化张量，初始值是常量或是随机值。
diff --git a/src/TensorFlowNET.Core/Operations/OpDefLibrary.cs b/src/TensorFlowNET.Core/Operations/OpDefLibrary.cs
@@ -44,14 +44,13 @@ public Operation _apply_op_helper(string op_type_name, string name = "", dynamic
             var input_types = new List<TF_DataType>();
             var base_types = new List<TF_DataType>();
 
-            Operation op = null;
-            Python.with<ops.name_scope>(new ops.name_scope(name), scope =>
+            return Python.with<ops.name_scope, Operation>(new ops.name_scope(name), scope =>
             {
                 // Perform input type inference
                 foreach (var input_arg in op_def.InputArg)
                 {
-                    var input_name = input_arg.Name;
-                    var values = keywords[input_name];
+                    var input_arg_name = input_arg.Name;
+                    var values = keywords[input_arg_name];
                     // Goals:
                     // * Convert values to Tensors if it contains constants.
                     // * Verify that values is a list if that matches the input_arg's
@@ -64,13 +63,13 @@ public Operation _apply_op_helper(string op_type_name, string name = "", dynamic
                     // * If the input_arg has an explicit type, make sure the input
                     // conforms.
 
+                    DataType dtype = DataType.DtInvalid;
+                    DataType default_dtype = DataType.DtInvalid;
+
                     if (_IsListParameter(input_arg))
                     {
-                        DataType dtype = DataType.DtInvalid;
-                        DataType default_dtype = DataType.DtInvalid;
-
                         if (!_IsListValue(values))
-                            throw new TypeError($"Expected list for '{input_name}' argument to '{op_type_name}' Op, not {values}.");
+                            throw new TypeError($"Expected list for '{input_arg_name}' argument to '{op_type_name}' Op, not {values}.");
                         if(input_arg.Type != DataType.DtInvalid)
                         {
                             dtype = input_arg.Type;
@@ -87,19 +86,22 @@ public Operation _apply_op_helper(string op_type_name, string name = "", dynamic
                     }
                     else
                     {
-                        if (keywords[input_name] is Tensor)
+                        if (default_type_attr_map.ContainsKey(input_arg.TypeAttr))
+                            default_dtype = (DataType)default_type_attr_map[input_arg.TypeAttr];
+
+                        if (keywords[input_arg_name] is Tensor)
                         {
                         }
                         else
                         {
-                            keywords[input_name] = ops.internal_convert_to_tensor(values, name: input_name);
+                            keywords[input_arg_name] = ops.internal_convert_to_tensor(values, name: input_arg_name);
                         }
 
                         if (!String.IsNullOrEmpty(input_arg.TypeAttr))
                         {
-                            attrs[input_arg.TypeAttr] = (keywords[input_name] as Tensor).dtype;
+                            attrs[input_arg.TypeAttr] = (keywords[input_arg_name] as Tensor).dtype;
                         }
-                        values = new Tensor[] { keywords[input_name] as Tensor };
+                        values = new Tensor[] { keywords[input_arg_name] as Tensor };
                     }
 
                     inputs.AddRange(values as Tensor[]);
@@ -122,7 +124,7 @@ public Operation _apply_op_helper(string op_type_name, string name = "", dynamic
                 {
                     var key = attr_def.Name;
                     if (!attrs.ContainsKey(key))
-                        Console.WriteLine($"{key} not found in attr_def.");
+                        Console.WriteLine($"_apply_op_helper: key '{key}' is not found in '{op_def.Name}' operation's attr_def.");
                     var value = attrs[key];
                     var attr_value = new AttrValue();
 
@@ -165,14 +167,14 @@ public Operation _apply_op_helper(string op_type_name, string name = "", dynamic
                 }
 
                 // Add Op to graph
-                op = g.create_op(op_type_name, inputs, output_types.ToArray(),
+                var op = g.create_op(op_type_name, inputs, output_types.ToArray(),
                     name: scope,
                     input_types: input_types.ToArray(),
                     attrs: attr_protos,
                     op_def: op_def);
-            });
 
-            return op;
+                return op;
+            });
         }
 
         public DataType _MakeType(TF_DataType v, AttrDef attr_def)
diff --git a/src/TensorFlowNET.Core/Operations/math_ops.py.cs b/src/TensorFlowNET.Core/Operations/math_ops.py.cs
@@ -20,8 +20,10 @@ public static Tensor reduced_shape(Tensor input_shape, Tensor axes)
             var input_rank = array_ops.size(input_shape);
             axes = (axes + input_rank) % input_rank;
             var axes_shape = array_ops.shape(axes);
-            var a1 = new Tensor[] { input_rank, axes };
-            var a2 = new Tensor[] { input_shape, gen_array_ops.fill(axes_shape, 1) };
+            var rng = math_ops.range(input_rank);
+            var a1 = new Tensor[] { rng, axes };
+            var fill = gen_array_ops.fill(axes_shape, 1);
+            var a2 = new Tensor[] { input_shape, fill };
 
             return gen_data_flow_ops.dynamic_stitch(a1, a2);
         }
@@ -80,8 +82,17 @@ private static Tensor _ReductionDims(Tensor x, Tensor axis)
             }
         }
 
-        public static Tensor range(object start, Tensor limit = null, object delta = null, TF_DataType dtype = TF_DataType.DtInvalid, string name = "range" )
+        public static Tensor range(object start, object limit = null, object delta = null, TF_DataType dtype = TF_DataType.DtInvalid, string name = "range" )
         {
+            if(limit == null)
+            {
+                limit = start;
+                start = 0;
+            }
+
+            if (delta == null)
+                delta = 1;
+
             return Python.with<ops.name_scope, Tensor>(new ops.name_scope(name, "Range", new object[] { start, limit, delta }), scope =>
             {
                 name = scope;
diff --git a/src/TensorFlowNET.Core/ops.py.cs b/src/TensorFlowNET.Core/ops.py.cs
@@ -333,8 +333,12 @@ public static Tensor internal_convert_to_tensor<T>(T value, DataType dtype = Dat
             {
                 case "Tensor":
                     return value as Tensor;
+                case "Int32":
+                    return constant_op.constant(Convert.ToInt32(value), name);
+                case "Double":
+                    return constant_op.constant(Convert.ToDouble(value), name);
                 default:
-                    return constant_op.constant(np.array(value), name);
+                    throw new NotImplementedException($"internal_convert_to_tensor: Can't convert {typeof(T).Name} to Tensor");
             }
         }
     }

Original file line number	Diff line number	Diff line change
`@@ -44,14 +44,13 @@ public Operation _apply_op_helper(string op_type_name, string name = "", dynamic`
`44`	`44`	`var input_types = new List<TF_DataType>();`
`45`	`45`	`var base_types = new List<TF_DataType>();`
`46`	`46`
`47`		`- Operation op = null;`
`48`		`- Python.with<ops.name_scope>(new ops.name_scope(name), scope =>`
	`47`	`+ return Python.with<ops.name_scope, Operation>(new ops.name_scope(name), scope =>`
`49`	`48`	`{`
`50`	`49`	`// Perform input type inference`
`51`	`50`	`foreach (var input_arg in op_def.InputArg)`
`52`	`51`	`{`
`53`		`- var input_name = input_arg.Name;`
`54`		`- var values = keywords[input_name];`
	`52`	`+ var input_arg_name = input_arg.Name;`
	`53`	`+ var values = keywords[input_arg_name];`
`55`	`54`	`// Goals:`
`56`	`55`	`// * Convert values to Tensors if it contains constants.`
`57`	`56`	`// * Verify that values is a list if that matches the input_arg's`
`@@ -64,13 +63,13 @@ public Operation _apply_op_helper(string op_type_name, string name = "", dynamic`
`64`	`63`	`// * If the input_arg has an explicit type, make sure the input`
`65`	`64`	`// conforms.`
`66`	`65`
	`66`	`+ DataType dtype = DataType.DtInvalid;`
	`67`	`+ DataType default_dtype = DataType.DtInvalid;`
	`68`	`+`
`67`	`69`	`if (_IsListParameter(input_arg))`
`68`	`70`	`{`
`69`		`- DataType dtype = DataType.DtInvalid;`
`70`		`- DataType default_dtype = DataType.DtInvalid;`
`71`		`-`
`72`	`71`	`if (!_IsListValue(values))`
`73`		`- throw new TypeError($"Expected list for '{input_name}' argument to '{op_type_name}' Op, not {values}.");`
	`72`	`+ throw new TypeError($"Expected list for '{input_arg_name}' argument to '{op_type_name}' Op, not {values}.");`
`74`	`73`	`if(input_arg.Type != DataType.DtInvalid)`
`75`	`74`	`{`
`76`	`75`	`dtype = input_arg.Type;`
`@@ -87,19 +86,22 @@ public Operation _apply_op_helper(string op_type_name, string name = "", dynamic`
`87`	`86`	`}`
`88`	`87`	`else`
`89`	`88`	`{`
`90`		`- if (keywords[input_name] is Tensor)`
	`89`	`+ if (default_type_attr_map.ContainsKey(input_arg.TypeAttr))`
	`90`	`+ default_dtype = (DataType)default_type_attr_map[input_arg.TypeAttr];`
	`91`	`+`
	`92`	`+ if (keywords[input_arg_name] is Tensor)`
`91`	`93`	`{`
`92`	`94`	`}`
`93`	`95`	`else`
`94`	`96`	`{`
`95`		`- keywords[input_name] = ops.internal_convert_to_tensor(values, name: input_name);`
	`97`	`+ keywords[input_arg_name] = ops.internal_convert_to_tensor(values, name: input_arg_name);`
`96`	`98`	`}`
`97`	`99`
`98`	`100`	`if (!String.IsNullOrEmpty(input_arg.TypeAttr))`
`99`	`101`	`{`
`100`		`- attrs[input_arg.TypeAttr] = (keywords[input_name] as Tensor).dtype;`
	`102`	`+ attrs[input_arg.TypeAttr] = (keywords[input_arg_name] as Tensor).dtype;`
`101`	`103`	`}`
`102`		`- values = new Tensor[] { keywords[input_name] as Tensor };`
	`104`	`+ values = new Tensor[] { keywords[input_arg_name] as Tensor };`
`103`	`105`	`}`
`104`	`106`
`105`	`107`	`inputs.AddRange(values as Tensor[]);`
`@@ -122,7 +124,7 @@ public Operation _apply_op_helper(string op_type_name, string name = "", dynamic`
`122`	`124`	`{`
`123`	`125`	`var key = attr_def.Name;`
`124`	`126`	`if (!attrs.ContainsKey(key))`
`125`		`- Console.WriteLine($"{key} not found in attr_def.");`
	`127`	`+ Console.WriteLine($"_apply_op_helper: key '{key}' is not found in '{op_def.Name}' operation's attr_def.");`
`126`	`128`	`var value = attrs[key];`
`127`	`129`	`var attr_value = new AttrValue();`
`128`	`130`
`@@ -165,14 +167,14 @@ public Operation _apply_op_helper(string op_type_name, string name = "", dynamic`
`165`	`167`	`}`
`166`	`168`
`167`	`169`	`// Add Op to graph`
`168`		`- op = g.create_op(op_type_name, inputs, output_types.ToArray(),`
	`170`	`+ var op = g.create_op(op_type_name, inputs, output_types.ToArray(),`
`169`	`171`	`name: scope,`
`170`	`172`	`input_types: input_types.ToArray(),`
`171`	`173`	`attrs: attr_protos,`
`172`	`174`	`op_def: op_def);`
`173`		`- });`
`174`	`175`
`175`		`- return op;`
	`176`	`+ return op;`
	`177`	`+ });`
`176`	`178`	`}`
`177`	`179`
`178`	`180`	`public DataType _MakeType(TF_DataType v, AttrDef attr_def)`
Original file line number	Diff line number	Diff line change
`@@ -20,8 +20,10 @@ public static Tensor reduced_shape(Tensor input_shape, Tensor axes)`
`20`	`20`	`var input_rank = array_ops.size(input_shape);`
`21`	`21`	`axes = (axes + input_rank) % input_rank;`
`22`	`22`	`var axes_shape = array_ops.shape(axes);`
`23`		`- var a1 = new Tensor[] { input_rank, axes };`
`24`		`- var a2 = new Tensor[] { input_shape, gen_array_ops.fill(axes_shape, 1) };`
	`23`	`+ var rng = math_ops.range(input_rank);`
	`24`	`+ var a1 = new Tensor[] { rng, axes };`
	`25`	`+ var fill = gen_array_ops.fill(axes_shape, 1);`
	`26`	`+ var a2 = new Tensor[] { input_shape, fill };`
`25`	`27`
`26`	`28`	`return gen_data_flow_ops.dynamic_stitch(a1, a2);`
`27`	`29`	`}`
`@@ -80,8 +82,17 @@ private static Tensor _ReductionDims(Tensor x, Tensor axis)`
`80`	`82`	`}`
`81`	`83`	`}`
`82`	`84`
`83`		`- public static Tensor range(object start, Tensor limit = null, object delta = null, TF_DataType dtype = TF_DataType.DtInvalid, string name = "range" )`
	`85`	`+ public static Tensor range(object start, object limit = null, object delta = null, TF_DataType dtype = TF_DataType.DtInvalid, string name = "range" )`
`84`	`86`	`{`
	`87`	`+ if(limit == null)`
	`88`	`+ {`
	`89`	`+ limit = start;`
	`90`	`+ start = 0;`
	`91`	`+ }`
	`92`	`+`
	`93`	`+ if (delta == null)`
	`94`	`+ delta = 1;`
	`95`	`+`
`85`	`96`	`return Python.with<ops.name_scope, Tensor>(new ops.name_scope(name, "Range", new object[] { start, limit, delta }), scope =>`
`86`	`97`	`{`
`87`	`98`	`name = scope;`
Original file line number	Diff line number	Diff line change
`@@ -333,8 +333,12 @@ public static Tensor internal_convert_to_tensor<T>(T value, DataType dtype = Dat`
`333`	`333`	`{`
`334`	`334`	`case "Tensor":`
`335`	`335`	`return value as Tensor;`
	`336`	`+ case "Int32":`
	`337`	`+ return constant_op.constant(Convert.ToInt32(value), name);`
	`338`	`+ case "Double":`
	`339`	`+ return constant_op.constant(Convert.ToDouble(value), name);`
`336`	`340`	`default:`
`337`		`- return constant_op.constant(np.array(value), name);`
	`341`	`+ throw new NotImplementedException($"internal_convert_to_tensor: Can't convert {typeof(T).Name} to Tensor");`
`338`	`342`	`}`
`339`	`343`	`}`
`340`	`344`	`}`