diff options
Diffstat (limited to 'xvmc/shader/mc/read_field_x1y1_uv.g4i')
-rw-r--r-- | xvmc/shader/mc/read_field_x1y1_uv.g4i | 172 |
1 files changed, 172 insertions, 0 deletions
diff --git a/xvmc/shader/mc/read_field_x1y1_uv.g4i b/xvmc/shader/mc/read_field_x1y1_uv.g4i new file mode 100644 index 00000000..162de9a2 --- /dev/null +++ b/xvmc/shader/mc/read_field_x1y1_uv.g4i @@ -0,0 +1,172 @@ +/* + * Copyright © 2008 Intel Corporation + * + * Permission is hereby granted, free of charge, to any person obtaining a + * copy of this software and associated documentation files (the "Software"), + * to deal in the Software without restriction, including without limitation + * the rights to use, copy, modify, merge, publish, distribute, sublicense, + * and/or sell copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following conditions: + * + * The above copyright notice and this permission notice (including the next + * paragraph) shall be included in all copies or substantial portions of the + * Software. + * + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR + * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, + * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL + * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER + * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, + * OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE + * SOFTWARE. + * + * Author: + * Zou Nan hai <nanhai.zou@intel.com> + * Zhang Hua jun <huajun.zhang@intel.com> + * Xing Dong sheng <dongsheng.xing@intel.com> + * + */ +mov (1) g115.8<1>UD 0x07000FUD {align1}; +send (16) 0 g86.0<1>UW g115<16,8,1>UW read(surface_u, 2, 0, 2) mlen 1 rlen 4 {align1};//U +send (16) 0 g91.0<1>UW g115<16,8,1>UW read(surface_v, 2, 0, 2) mlen 1 rlen 4 {align1};//V +and (1) g2.24<1>UD g115.0<1,1,1>UD 3UD {align1}; +mul (1) g2.24<1>UD g2.24<1,1,1>UD 25UD {align1}; +mov (1) g115.8<1>UD 0x01000FUD {align1}; +add (1) g115.4<1>UD g115.4<1,1,1>UD 8UD {align1}; +send (16) 0 g90.0<1>UW g115<16,8,1>UW read(surface_u, 2, 0, 2) mlen 1 rlen 1 {align1}; +send (16) 0 g95.0<1>UW g115<16,8,1>UW read(surface_v, 2, 0, 2) mlen 1 rlen 1 {align1}; +jmpi g2.24<1,1,1>D; +//U +add (16) g78.0<1>UW g86.0<16,8,1>UB g87.0<16,8,1>UB {align1}; +add (16) g79.0<1>UW g87.0<16,8,1>UB g88.0<16,8,1>UB {align1}; +add (16) g80.0<1>UW g88.0<16,8,1>UB g89.0<16,8,1>UB {align1}; +add (16) g81.0<1>UW g89.0<16,8,1>UB g90.0<16,8,1>UB {align1}; + +add (16) g78.0<1>UW g78.0<16,8,1>UW g86.1<16,8,1>UB {align1}; +add (16) g79.0<1>UW g79.0<16,8,1>UW g87.1<16,8,1>UB {align1}; +add (16) g80.0<1>UW g80.0<16,8,1>UW g88.1<16,8,1>UB {align1}; +add (16) g81.0<1>UW g81.0<16,8,1>UW g89.1<16,8,1>UB {align1}; + +add (16) g78.0<1>UW g78.0<16,8,1>UW g87.1<16,8,1>UB {align1}; +add (16) g79.0<1>UW g79.0<16,8,1>UW g88.1<16,8,1>UB {align1}; +add (16) g80.0<1>UW g80.0<16,8,1>UW g89.1<16,8,1>UB {align1}; +add (16) g81.0<1>UW g81.0<16,8,1>UW g90.1<16,8,1>UB {align1}; +//V +add (16) g82.0<1>UW g91.0<16,8,1>UB g92.0<16,8,1>UB {align1}; +add (16) g83.0<1>UW g92.0<16,8,1>UB g93.0<16,8,1>UB {align1}; +add (16) g84.0<1>UW g93.0<16,8,1>UB g94.0<16,8,1>UB {align1}; +add (16) g85.0<1>UW g94.0<16,8,1>UB g95.0<16,8,1>UB {align1}; + +add (16) g82.0<1>UW g82.0<16,8,1>UW g91.1<16,8,1>UB {align1}; +add (16) g83.0<1>UW g83.0<16,8,1>UW g92.1<16,8,1>UB {align1}; +add (16) g84.0<1>UW g84.0<16,8,1>UW g93.1<16,8,1>UB {align1}; +add (16) g85.0<1>UW g85.0<16,8,1>UW g94.1<16,8,1>UB {align1}; + +add (16) g82.0<1>UW g82.0<16,8,1>UW g92.1<16,8,1>UB {align1}; +add (16) g83.0<1>UW g83.0<16,8,1>UW g93.1<16,8,1>UB {align1}; +add (16) g84.0<1>UW g84.0<16,8,1>UW g94.1<16,8,1>UB {align1}; +add (16) g85.0<1>UW g85.0<16,8,1>UW g95.1<16,8,1>UB {align1}; +jmpi out; +//U +add (16) g78.0<1>UW g86.1<16,8,1>UB g87.1<16,8,1>UB {align1}; +add (16) g79.0<1>UW g87.1<16,8,1>UB g88.1<16,8,1>UB {align1}; +add (16) g80.0<1>UW g88.1<16,8,1>UB g89.1<16,8,1>UB {align1}; +add (16) g81.0<1>UW g89.1<16,8,1>UB g90.1<16,8,1>UB {align1}; + +add (16) g78.0<1>UW g78.0<16,8,1>UW g86.2<16,8,1>UB {align1}; +add (16) g79.0<1>UW g79.0<16,8,1>UW g87.2<16,8,1>UB {align1}; +add (16) g80.0<1>UW g80.0<16,8,1>UW g88.2<16,8,1>UB {align1}; +add (16) g81.0<1>UW g81.0<16,8,1>UW g89.2<16,8,1>UB {align1}; + +add (16) g78.0<1>UW g78.0<16,8,1>UW g87.2<16,8,1>UB {align1}; +add (16) g79.0<1>UW g79.0<16,8,1>UW g88.2<16,8,1>UB {align1}; +add (16) g80.0<1>UW g80.0<16,8,1>UW g89.2<16,8,1>UB {align1}; +add (16) g81.0<1>UW g81.0<16,8,1>UW g90.2<16,8,1>UB {align1}; +//V +add (16) g82.0<1>UW g91.1<16,8,1>UB g92.1<16,8,1>UB {align1}; +add (16) g83.0<1>UW g92.1<16,8,1>UB g93.1<16,8,1>UB {align1}; +add (16) g84.0<1>UW g93.1<16,8,1>UB g94.1<16,8,1>UB {align1}; +add (16) g85.0<1>UW g94.1<16,8,1>UB g95.1<16,8,1>UB {align1}; + +add (16) g82.0<1>UW g82.0<16,8,1>UW g91.2<16,8,1>UB {align1}; +add (16) g83.0<1>UW g83.0<16,8,1>UW g92.2<16,8,1>UB {align1}; +add (16) g84.0<1>UW g84.0<16,8,1>UW g93.2<16,8,1>UB {align1}; +add (16) g85.0<1>UW g85.0<16,8,1>UW g94.2<16,8,1>UB {align1}; + +add (16) g82.0<1>UW g82.0<16,8,1>UW g92.2<16,8,1>UB {align1}; +add (16) g83.0<1>UW g83.0<16,8,1>UW g93.2<16,8,1>UB {align1}; +add (16) g84.0<1>UW g84.0<16,8,1>UW g94.2<16,8,1>UB {align1}; +add (16) g85.0<1>UW g85.0<16,8,1>UW g95.2<16,8,1>UB {align1}; +jmpi out; +//U +add (16) g78.0<1>UW g86.2<16,8,1>UB g87.2<16,8,1>UB {align1}; +add (16) g79.0<1>UW g87.2<16,8,1>UB g88.2<16,8,1>UB {align1}; +add (16) g80.0<1>UW g88.2<16,8,1>UB g89.2<16,8,1>UB {align1}; +add (16) g81.0<1>UW g89.2<16,8,1>UB g90.2<16,8,1>UB {align1}; + +add (16) g78.0<1>UW g78.0<16,8,1>UW g86.3<16,8,1>UB {align1}; +add (16) g79.0<1>UW g79.0<16,8,1>UW g87.3<16,8,1>UB {align1}; +add (16) g80.0<1>UW g80.0<16,8,1>UW g88.3<16,8,1>UB {align1}; +add (16) g81.0<1>UW g81.0<16,8,1>UW g89.3<16,8,1>UB {align1}; + +add (16) g78.0<1>UW g78.0<16,8,1>UW g87.3<16,8,1>UB {align1}; +add (16) g79.0<1>UW g79.0<16,8,1>UW g88.3<16,8,1>UB {align1}; +add (16) g80.0<1>UW g80.0<16,8,1>UW g89.3<16,8,1>UB {align1}; +add (16) g81.0<1>UW g81.0<16,8,1>UW g90.3<16,8,1>UB {align1}; +//V +add (16) g82.0<1>UW g91.2<16,8,1>UB g92.2<16,8,1>UB {align1}; +add (16) g83.0<1>UW g92.2<16,8,1>UB g93.2<16,8,1>UB {align1}; +add (16) g84.0<1>UW g93.2<16,8,1>UB g94.2<16,8,1>UB {align1}; +add (16) g85.0<1>UW g94.2<16,8,1>UB g95.2<16,8,1>UB {align1}; + +add (16) g82.0<1>UW g82.0<16,8,1>UW g91.3<16,8,1>UB {align1}; +add (16) g83.0<1>UW g83.0<16,8,1>UW g92.3<16,8,1>UB {align1}; +add (16) g84.0<1>UW g84.0<16,8,1>UW g93.3<16,8,1>UB {align1}; +add (16) g85.0<1>UW g85.0<16,8,1>UW g94.3<16,8,1>UB {align1}; + +add (16) g82.0<1>UW g82.0<16,8,1>UW g92.3<16,8,1>UB {align1}; +add (16) g83.0<1>UW g83.0<16,8,1>UW g93.3<16,8,1>UB {align1}; +add (16) g84.0<1>UW g84.0<16,8,1>UW g94.3<16,8,1>UB {align1}; +add (16) g85.0<1>UW g85.0<16,8,1>UW g95.3<16,8,1>UB {align1}; +jmpi out; +//U +add (16) g78.0<1>UW g86.3<16,8,1>UB g87.3<16,8,1>UB {align1}; +add (16) g79.0<1>UW g87.3<16,8,1>UB g88.3<16,8,1>UB {align1}; +add (16) g80.0<1>UW g88.3<16,8,1>UB g89.3<16,8,1>UB {align1}; +add (16) g81.0<1>UW g89.3<16,8,1>UB g90.3<16,8,1>UB {align1}; + +add (16) g78.0<1>UW g78.0<16,8,1>UW g86.4<16,8,1>UB {align1}; +add (16) g79.0<1>UW g79.0<16,8,1>UW g87.4<16,8,1>UB {align1}; +add (16) g80.0<1>UW g80.0<16,8,1>UW g88.4<16,8,1>UB {align1}; +add (16) g81.0<1>UW g81.0<16,8,1>UW g89.4<16,8,1>UB {align1}; + +add (16) g78.0<1>UW g78.0<16,8,1>UW g87.4<16,8,1>UB {align1}; +add (16) g79.0<1>UW g79.0<16,8,1>UW g88.4<16,8,1>UB {align1}; +add (16) g80.0<1>UW g80.0<16,8,1>UW g89.4<16,8,1>UB {align1}; +add (16) g81.0<1>UW g81.0<16,8,1>UW g90.4<16,8,1>UB {align1}; +//V +add (16) g82.0<1>UW g91.3<16,8,1>UB g92.3<16,8,1>UB {align1}; +add (16) g83.0<1>UW g92.3<16,8,1>UB g93.3<16,8,1>UB {align1}; +add (16) g84.0<1>UW g93.3<16,8,1>UB g94.3<16,8,1>UB {align1}; +add (16) g85.0<1>UW g94.3<16,8,1>UB g95.3<16,8,1>UB {align1}; + +add (16) g82.0<1>UW g82.0<16,8,1>UW g91.4<16,8,1>UB {align1}; +add (16) g83.0<1>UW g83.0<16,8,1>UW g92.4<16,8,1>UB {align1}; +add (16) g84.0<1>UW g84.0<16,8,1>UW g93.4<16,8,1>UB {align1}; +add (16) g85.0<1>UW g85.0<16,8,1>UW g94.4<16,8,1>UB {align1}; + +add (16) g82.0<1>UW g82.0<16,8,1>UW g92.4<16,8,1>UB {align1}; +add (16) g83.0<1>UW g83.0<16,8,1>UW g93.4<16,8,1>UB {align1}; +add (16) g84.0<1>UW g84.0<16,8,1>UW g94.4<16,8,1>UB {align1}; +add (16) g85.0<1>UW g85.0<16,8,1>UW g95.4<16,8,1>UB {align1}; + +out: +shr.sat (16) g78.0<1>UW g78.0<16,16,1>UW 2UW {align1}; +shr.sat (16) g79.0<1>UW g79.0<16,16,1>UW 2UW {align1}; +shr.sat (16) g80.0<1>UW g80.0<16,16,1>UW 2UW {align1}; +shr.sat (16) g81.0<1>UW g81.0<16,16,1>UW 2UW {align1}; +shr.sat (16) g82.0<1>UW g82.0<16,16,1>UW 2UW {align1}; +shr.sat (16) g83.0<1>UW g83.0<16,16,1>UW 2UW {align1}; +shr.sat (16) g84.0<1>UW g84.0<16,16,1>UW 2UW {align1}; +shr.sat (16) g85.0<1>UW g85.0<16,16,1>UW 2UW {align1}; + |