提交 e17a9d1f 编写于 作者: R Ruilong Liu 提交者: GitHub

Merge pull request #993 from codeWorm2015/metal

correct genet
...@@ -31,8 +31,8 @@ kernel void fetch(texture2d_array<float, access::read> inTexture [[texture(0)]], ...@@ -31,8 +31,8 @@ kernel void fetch(texture2d_array<float, access::read> inTexture [[texture(0)]],
int output_to = 4 * input_width * input_height; int output_to = 4 * input_width * input_height;
output[gid.z * output_to + 0 * input_width * input_height + gid.y * input_width + gid.x] = input.x; output[gid.z * output_to + 0 * input_width * input_height + gid.y * input_width + gid.x] = input.x;
output[gid.z * output_to + 1 * input_width * input_height + gid.y * input_width + gid.x] = input.y; output[gid.z * output_to + 1 * input_width * input_height + gid.y * input_width + gid.x] = input.y;
output[gid.z * output_to + 2 * input_width * input_height + gid.y * input_width + gid.x] = input.z; // output[gid.z * output_to + 2 * input_width * input_height + gid.y * input_width + gid.x] = input.z;
output[gid.z * output_to + 3 * input_width * input_height + gid.y * input_width + gid.x] = input.w; // output[gid.z * output_to + 3 * input_width * input_height + gid.y * input_width + gid.x] = input.w;
} }
...@@ -52,8 +52,8 @@ kernel void fetch_half(texture2d_array<half, access::read> inTexture [[texture(0 ...@@ -52,8 +52,8 @@ kernel void fetch_half(texture2d_array<half, access::read> inTexture [[texture(0
int output_to = 4 * input_width * input_height; int output_to = 4 * input_width * input_height;
output[gid.z * output_to + 0 * input_width * input_height + gid.y * input_width + gid.x] = input.x; output[gid.z * output_to + 0 * input_width * input_height + gid.y * input_width + gid.x] = input.x;
output[gid.z * output_to + 1 * input_width * input_height + gid.y * input_width + gid.x] = input.y; output[gid.z * output_to + 1 * input_width * input_height + gid.y * input_width + gid.x] = input.y;
output[gid.z * output_to + 2 * input_width * input_height + gid.y * input_width + gid.x] = input.z; // output[gid.z * output_to + 2 * input_width * input_height + gid.y * input_width + gid.x] = input.z;
output[gid.z * output_to + 3 * input_width * input_height + gid.y * input_width + gid.x] = input.w; // output[gid.z * output_to + 3 * input_width * input_height + gid.y * input_width + gid.x] = input.w;
} }
......
...@@ -164,7 +164,7 @@ public class Executor<P: PrecisionType> { ...@@ -164,7 +164,7 @@ public class Executor<P: PrecisionType> {
// return; // return;
// self!.ops[testTo - 2].delogOutput() // self!.ops[testTo - 2].delogOutput()
// self!.ops[testTo - 1].delogOutput() // self!.ops[testTo - 1].delogOutput()
// self!.ops[60].delogOutput() // self!.ops[5].delogOutput()
// return // return
...@@ -199,5 +199,3 @@ public class Executor<P: PrecisionType> { ...@@ -199,5 +199,3 @@ public class Executor<P: PrecisionType> {
} }
} }
//public let paddle_executor: Executor = Executor.init()
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册