亚洲欧美第一页_禁久久精品乱码_粉嫩av一区二区三区免费野_久草精品视频

? 歡迎來到蟲蟲下載站! | ?? 資源下載 ?? 資源專輯 ?? 關于我們
? 蟲蟲下載站

?? dct_sse2.asm

?? H264EncPlayer,H264協議解碼與播放代碼
?? ASM
字號:
  ;/*****************************************************************************
; *
; *  T264 AVC CODEC
; *
; *  Copyright(C) 2004-2005 llcc <lcgate1@yahoo.com.cn>
; *               2004-2005 visionany <visionany@yahoo.com.cn>
; *
; *  This program is free software ; you can redistribute it and/or modify
; *  it under the terms of the GNU General Public License as published by
; *  the Free Software Foundation ; either version 2 of the License, or
; *  (at your option) any later version.
; *
; *  This program is distributed in the hope that it will be useful,
; *  but WITHOUT ANY WARRANTY ; without even the implied warranty of
; *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
; *  GNU General Public License for more details.
; *
; *  You should have received a copy of the GNU General Public License
; *  along with this program ; if not, write to the Free Software
; *  Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307 USA
; *
; ****************************************************************************/

bits 32

; cglobal NAME -- export a function symbol (idea taken from xvid;
; modified by Thomascatlee@163.com for GCC).
;   NOPREFIX defined   : exports NAME as written.
;   NOPREFIX undefined : exports _NAME and aliases NAME to _NAME for the
;                        remainder of the file.
%macro cglobal 1
	%ifndef NOPREFIX
		global _%1
		%define %1 _%1
	%else
		global %1
	%endif
%endmacro

; cextern NAME -- import an external symbol.
;   NOPREFIX defined   : imports NAME as written.
;   NOPREFIX undefined : imports _NAME and aliases NAME to _NAME for the
;                        remainder of the file.
%macro cextern 1
	%ifndef NOPREFIX
		extern _%1
		%define %1 _%1
	%else
		extern %1
	%endif
%endmacro

; transpose: 4x4 transpose of 16-bit words held in four MMX registers.
;   %1..%4 = input rows 0..3, %5 = scratch.
;   On exit the transposed rows (input columns 0..3) are in %1, %2, %5, %4,
;   i.e. zero-based argument positions 0 1 4 3; %3 is left holding an
;   intermediate value.
;   The per-line comments number the 16 input words 1..16 in row-major order,
;   list register contents from the high word to the low word, and use the
;   register names of the "transpose mm0, mm1, mm2, mm3, mm4" instantiation.
%macro transpose 5
    movq       %5, %1
    punpckhwd  %5, %2  ; mm4 = 8 4 7 3
    punpcklwd  %1, %2  ; mm0 = 6 2 5 1

    movq       %2, %3
    punpckhwd  %2, %4  ; mm1 = 16 12 15 11
    punpcklwd  %3, %4  ; mm2 = 14 10 13 9

    movq       %4, %5
    punpckhdq  %4, %2  ; mm3 = 16 12 8 4
    punpckldq  %5, %2  ; mm4 = 15 11 7 3

    movq       %2, %1
    punpckhdq  %2, %3  ; mm1 = 14 10 6 2
    punpckldq  %1, %3  ; mm0 = 13 9 5 1
%endmacro

; addsub: butterfly on four MMX registers of packed 16-bit words.
;   %1 = a, %2 = b, %3 = c, %4 = d, %5 = scratch.
;   On exit: %1 = a + d, %2 = b + c, %4 = b - c, %5 = a - d; %3 is unchanged.
;   Additions and subtractions are the wrapping (non-saturating) word forms.
%macro addsub 5
    movq  %5, %1
    paddw %1, %4    ; %1 = a + d  (s[0])
    psubw %5, %4    ; %5 = a - d  (s[3])
    movq  %4, %2
    paddw %2, %3    ; %2 = b + c  (s[1])
    psubw %4, %3    ; %4 = b - c  (s[2])
%endmacro

; addsub2: second butterfly stage used by dct4x4_mmx.
;   %1..%4 = s[0]..s[3], %5 = scratch.
;   On exit: %1 = s[0] + s[1]      (d[0])
;            %2 = 2*s[3] + s[2]    (d[1])
;            %5 = s[0] - s[1]      (d[2])
;            %4 = s[3] - 2*s[2]    (d[3])
;            %3 = 2*s[2]           (by-product)
;   i.e. results sit in zero-based argument positions 0 1 4 3.
%macro addsub2 5
    movq  %5, %1   ; %5   = s[0]
    paddw %1, %2   ; d[0] = s[0] + s[1]
    psubw %5, %2   ; d[2] = s[0] - s[1]  (kept in %5)

    movq  %2, %4   ; %2   = s[3]
    paddw %2, %2   ; %2   = 2 * s[3]
    paddw %2, %3   ; d[1] = 2 * s[3] + s[2]
    paddw %3, %3   ; %3   = 2 * s[2]
    psubw %4, %3   ; d[3] = s[3] - 2 * s[2]
%endmacro

; idct_addsub2: first butterfly stage used by idct4x4_mmx.
;   %1..%4 = d[0]..d[3], %5 = scratch.
;   On exit: %1 = d[0] + d[2]          (s[0])
;            %5 = d[0] - d[2]          (s[1])
;            %2 = (d[1] >> 1) - d[3]   (s[2])
;            %3 = d[1] + (d[3] >> 1)   (s[3])
;            %4 = d[3] >> 1            (by-product)
;   i.e. s[0..3] sit in zero-based argument positions 0 4 1 2.
;   The shifts are arithmetic (psraw).
%macro idct_addsub2 5
    movq  %5, %1   ; %5   = d[0]
    paddw %1, %3   ; s[0] = d[0] + d[2]
    psubw %5, %3   ; s[1] = d[0] - d[2]

    movq  %3, %2   ; %3   = d[1]
    psraw %2, 1    ; %2   = d[1] >> 1
    psubw %2, %4   ; s[2] = (d[1] >> 1) - d[3]
    psraw %4, 1    ; %4   = d[3] >> 1
    paddw %3, %4   ; s[3] = d[1] + (d[3] >> 1)
%endmacro

; word2dw: widen the four 16-bit words of an MMX register into the four
; dwords of an XMM register by interleaving them with the words of %3.
;   %1 = MMX source (overwritten), %2 = MMX scratch,
;   %3 = MMX register that must hold zero for a zero-extension,
;   %4 = XMM destination, %5 = XMM scratch.
;   The per-line comments show register contents from high to low, with the
;   source words named d c b a.
;   NOTE(review): not invoked anywhere in the code visible in this file.
%macro word2dw 5
    movq   %2, %1
    punpcklwd %2, %3  ;   dcba->0b0a
    punpckhwd %1, %3  ;   dcba->0d0c
    movq2dq %4, %1   ;   00 00 0d 0c
    pslldq %4, 8      ;   0d 0c 00 00  (move to the upper 8 bytes)
    movq2dq %5, %2   ;   00 00 0b 0a
    por %4, %5      ;   0d 0c 0b 0a
%endmacro

section .rodata data align=16

; Packed 16-bit constants. The SSE2 constants are read with 16-byte-aligned
; memory operands, so every table starts on a 16-byte boundary.
align 16
    sse2_neg1: times 16 dw -1      ; -1 in every word (used to negate words)
    sse2_1:    times 16 dw 1       ; +1 in every word
align 16
    mmx1:      times 4 dw 1        ; rounding term for the (x + 1) >> 1 step
align 16
    mmx32:     times 4 dw 32       ; rounding term for the (x + 32) >> 6 step

; Tables defined outside this file; indexed in 32-byte rows below.
cextern quant
cextern dequant

align 16

section .text

;======================================================
;
; void
; dct4x4_mmx(int16_t* data)
;
; In-place forward transform of the 4x4 block of int16
; values at data (four rows of 8 bytes each).
;
; Two identical passes are run; each one transposes the
; block and then applies the addsub and addsub2
; butterflies, so both dimensions are transformed and the
; block ends up back in its original orientation.
;
; In:    [esp + 4] = data (read and written with movq, so
;        no alignment is required); the caller cleans the
;        stack (plain ret).
; Clobb: eax, mm0-mm4. No emms is executed here, so the
;        MMX state is still live on return.
;
;======================================================

align 16

cglobal dct4x4_mmx
dct4x4_mmx:

    mov  eax, [esp + 4]  ; data
    movq mm0, [eax + 0]  ; row 0
    movq mm1, [eax + 8]  ; row 1
    movq mm2, [eax + 16] ; row 2
    movq mm3, [eax + 24] ; row 3

    ; ---- pass 1 ----
    transpose mm0, mm1, mm2, mm3, mm4 ; result rows in mm0, mm1, mm4, mm3

    addsub mm0, mm1, mm4, mm3, mm2
    ; s[0] = mm0, s[1] = mm1, s[2] = mm3, s[3] = mm2

    addsub2 mm0, mm1, mm3, mm2, mm4
    ; d[0] = mm0, d[1] = mm1, d[2] = mm4, d[3] = mm2

    ; ---- pass 2 ----
    transpose mm0, mm1, mm4, mm2, mm3 ; result rows in mm0, mm1, mm3, mm2

    addsub mm0, mm1, mm3, mm2, mm4
    ; s[0] = mm0, s[1] = mm1, s[2] = mm2, s[3] = mm4

    addsub2 mm0, mm1, mm2, mm4, mm3
    ; d[0] = mm0, d[1] = mm1, d[2] = mm3, d[3] = mm4

    movq [eax + 0], mm0
    movq [eax + 8], mm1
    movq [eax +16], mm3
    movq [eax +24], mm4

    ret

;======================================================
;
; void
; dct4x4dc_mmx(int16_t* data)
;
; In-place 4x4 add/subtract (Hadamard-style) transform of
; the int16 block at data, followed by (x + 1) >> 1 on
; every element.
;
; Two passes are run; each one transposes the block and
; then applies the addsub butterfly twice.
;
; In:    [esp + 4] = data (accessed with movq, so no
;        alignment is required); the caller cleans the
;        stack (plain ret).
; Clobb: eax, mm0-mm4. No emms is executed here, so the
;        MMX state is still live on return.
;
;======================================================

align 16

cglobal dct4x4dc_mmx
dct4x4dc_mmx:

    mov  eax, [esp + 4]  ; data
    movq mm0, [eax + 0]  ; row 0
    movq mm1, [eax + 8]  ; row 1
    movq mm2, [eax + 16] ; row 2
    movq mm3, [eax + 24] ; row 3

    ; ---- pass 1 ----
    transpose mm0, mm1, mm2, mm3, mm4 ; result rows in mm0, mm1, mm4, mm3

    addsub mm0, mm1, mm4, mm3, mm2
    ; s[0] = mm0, s[1] = mm1, s[2] = mm3, s[3] = mm2

    addsub mm0, mm2, mm3, mm1, mm4
    ; mm0 = s[0]+s[1], mm2 = s[3]+s[2], mm4 = s[0]-s[1], mm1 = s[3]-s[2]

    ; ---- pass 2 ----
    transpose mm0, mm2, mm4, mm1, mm3 ; result rows in mm0, mm2, mm3, mm1

    addsub mm0, mm2, mm3, mm1, mm4
    ; s[0] = mm0, s[1] = mm2, s[2] = mm1, s[3] = mm4

    addsub mm0, mm4, mm1, mm2, mm3
    ; mm0 = s[0]+s[1], mm4 = s[3]+s[2], mm3 = s[0]-s[1], mm2 = s[3]-s[2]

    ; ---- rounding: (x + 1) >> 1 ----
    movq mm1, [mmx1]

    paddw mm0, mm1
    paddw mm4, mm1
    paddw mm3, mm1
    paddw mm2, mm1

    psraw mm0, 1
    psraw mm4, 1
    psraw mm3, 1
    psraw mm2, 1

    movq [eax + 0], mm0
    movq [eax + 8], mm4
    movq [eax +16], mm3
    movq [eax +24], mm2

    ret

;======================================================
;
; void
; idct4x4_mmx(int16_t* data)
;
; In-place inverse transform of the 4x4 block of int16
; values at data, followed by (x + 32) >> 6 on every
; element.
;
; Two passes are run; each one transposes the block and
; then applies the idct_addsub2 and addsub butterflies.
;
; In:    [esp + 4] = data (accessed with movq, so no
;        alignment is required); the caller cleans the
;        stack (plain ret).
; Clobb: eax, mm0-mm4. No emms is executed here, so the
;        MMX state is still live on return.
;
;======================================================

align 16

cglobal idct4x4_mmx
idct4x4_mmx:

    mov  eax, [esp + 4]  ; data
    movq mm0, [eax + 0]  ; row 0
    movq mm1, [eax + 8]  ; row 1
    movq mm2, [eax + 16] ; row 2
    movq mm3, [eax + 24] ; row 3

    ; ---- pass 1 ----
    transpose mm0, mm1, mm2, mm3, mm4 ; result rows in mm0, mm1, mm4, mm3

    idct_addsub2 mm0, mm1, mm4, mm3, mm2
    ; s[0] = mm0, s[1] = mm2, s[2] = mm1, s[3] = mm4

    addsub mm0, mm2, mm1, mm4, mm3
    ; mm0 = s[0]+s[3], mm2 = s[1]+s[2], mm4 = s[1]-s[2], mm3 = s[0]-s[3]

    ; ---- pass 2 ----
    transpose mm0, mm2, mm4, mm3, mm1 ; result rows in mm0, mm2, mm1, mm3

    idct_addsub2 mm0, mm2, mm1, mm3, mm4
    ; s[0] = mm0, s[1] = mm4, s[2] = mm2, s[3] = mm1

    addsub mm0, mm4, mm2, mm1, mm3
    ; mm0 = s[0]+s[3], mm4 = s[1]+s[2], mm1 = s[1]-s[2], mm3 = s[0]-s[3]

    ; ---- rounding: (x + 32) >> 6 ----
    movq mm2, [mmx32]

    paddw mm0, mm2
    paddw mm4, mm2
    paddw mm1, mm2
    paddw mm3, mm2

    psraw mm0, 6
    psraw mm4, 6
    psraw mm1, 6
    psraw mm3, 6

    movq [eax + 0], mm0
    movq [eax + 8], mm4
    movq [eax +16], mm1
    movq [eax +24], mm3

    ret

;======================================================
;
; void
; idct4x4dc_mmx(int16_t* data)
;
; In-place 4x4 add/subtract (Hadamard-style) transform of
; the int16 block at data. Unlike dct4x4dc_mmx, no
; rounding or shift is applied to the result.
;
; Two passes are run; each one transposes the block and
; then applies the addsub butterfly twice.
;
; In:    [esp + 4] = data (accessed with movq, so no
;        alignment is required); the caller cleans the
;        stack (plain ret).
; Clobb: eax, mm0-mm4. No emms is executed here, so the
;        MMX state is still live on return.
;
;======================================================

align 16

cglobal idct4x4dc_mmx
idct4x4dc_mmx:

    mov  eax, [esp + 4]  ; data
    movq mm0, [eax + 0]  ; row 0
    movq mm1, [eax + 8]  ; row 1
    movq mm2, [eax + 16] ; row 2
    movq mm3, [eax + 24] ; row 3

    ; ---- pass 1 ----
    transpose mm0, mm1, mm2, mm3, mm4 ; result rows d[0..3] in mm0, mm1, mm4, mm3

    addsub mm0, mm1, mm3, mm4, mm2
    ; s[0] = mm0 = d[0]+d[2], s[1] = mm2 = d[0]-d[2]
    ; s[2] = mm4 = d[1]-d[3], s[3] = mm1 = d[1]+d[3]

    addsub mm0, mm2, mm4, mm1, mm3
    ; mm0 = s[0]+s[3], mm2 = s[1]+s[2], mm1 = s[1]-s[2], mm3 = s[0]-s[3]

    ; ---- pass 2 ----
    transpose mm0, mm2, mm1, mm3, mm4 ; result rows d[0..3] in mm0, mm2, mm4, mm3

    addsub mm0, mm2, mm3, mm4, mm1
    ; s[0] = mm0, s[1] = mm1, s[2] = mm4, s[3] = mm2

    addsub mm0, mm1, mm4, mm2, mm3
    ; mm0 = s[0]+s[3], mm1 = s[1]+s[2], mm2 = s[1]-s[2], mm3 = s[0]-s[3]

    movq [eax + 0], mm0
    movq [eax + 8], mm1
    movq [eax +16], mm2
    movq [eax +24], mm3

    ret

;======================================================
;
; void
; quant4x4_sse2(int16_t* data, const int32_t Qp, int32_t is_intra)
;
; In-place quantisation of the 16 int16 coefficients at
; data:
;     qbits = 15 + Qp / 6
;     mf    = row (Qp % 6) of quant, 32 bytes (16 words) per row
;     f     = (1 << qbits) / (is_intra ? 3 : 6)
;     positive x:  x =  ((x * mf[i] + f) >> qbits)
;     negative x:  x = -((-x * mf[i] + f) >> qbits)
;     zero     x:  stays zero
; The shifted 32-bit results are packed back to words with
; signed saturation.
;
; In:    [esp + 4] = data, [esp + 8] = Qp, [esp + 12] = is_intra;
;        the caller cleans the stack (plain ret).
;        data and the quant rows are accessed with movdqa and
;        must therefore be 16-byte aligned.
; Saved: ebx, esi, edi, ebp (pushed and restored).
; Clobb: eax, ecx, edx, xmm0-xmm7. Only SSE2 registers are
;        used, so the MMX/x87 state is left untouched.
;
;======================================================

; quant_8coef OFFSET: quantise the 8 coefficients at [edi + OFFSET] with the
; multipliers at [esi + OFFSET], in place.
;   Expects xmm6 = f in every dword, xmm7 = qbits (shift count).
;   Clobbers xmm0-xmm5.
%macro quant_8coef 1
    movdqa    xmm0, [edi + %1]        ; data
    movdqa    xmm1, [esi + %1]        ; quant

    ; > 0
    pxor      xmm4, xmm4
    movdqa    xmm2, xmm0              ; xmm2 = original data (kept for the < 0 half)
    pcmpgtw   xmm0, xmm4              ; word mask: data > 0
    movdqa    xmm4, xmm0
    pand      xmm0, xmm2              ; keep positive words, zero the rest
    movdqa    xmm3, xmm0
    pmullw    xmm0, xmm1              ; low part
    pmulhw    xmm3, xmm1              ; high part
    movdqa    xmm5, xmm0
    punpcklwd xmm0, xmm3              ; low 4 - 32 bits
    punpckhwd xmm5, xmm3              ; high 4 - 32 bits
    movdqa    xmm3, xmm4
    punpcklwd xmm4, xmm4              ; widen mask to dwords
    pand      xmm4, xmm6              ; f only in the selected lanes
    paddd     xmm0, xmm4              ; data * quant + f
    psrad     xmm0, xmm7              ; data * quant + f >> qbits
    punpckhwd xmm3, xmm3
    pand      xmm3, xmm6
    paddd     xmm5, xmm3              ; data * quant + f
    psrad     xmm5, xmm7              ; data * quant + f >> qbits
    packssdw  xmm0, xmm5              ; xmm0 = quantised positive lanes

    ; < 0
    pxor      xmm4, xmm4
    movdqa    xmm5, xmm2
    pcmpgtw   xmm4, xmm2              ; word mask: data < 0
    pand      xmm5, xmm4              ; keep negative words, zero the rest
    pmullw    xmm5, [sse2_neg1]       ; negate -> magnitudes
    movdqa    xmm3, xmm5
    pmullw    xmm5, xmm1
    pmulhw    xmm3, xmm1
    movdqa    xmm1, xmm5
    punpcklwd xmm5, xmm3
    punpckhwd xmm1, xmm3
    movdqa    xmm3, xmm4
    punpcklwd xmm4, xmm4
    pand      xmm4, xmm6
    paddd     xmm5, xmm4              ; -data * quant + f
    psrad     xmm5, xmm7
    punpckhwd xmm3, xmm3
    pand      xmm3, xmm6
    paddd     xmm1, xmm3
    psrad     xmm1, xmm7
    packssdw  xmm5, xmm1
    pmullw    xmm5, [sse2_neg1]       ; restore the sign

    por       xmm5, xmm0              ; lanes are disjoint: merge both halves
    movdqa    [edi + %1], xmm5
%endmacro

align 16

cglobal quant4x4_sse2
quant4x4_sse2:

    push ebx
    push esi
    push edi
    push ebp

    mov  edi, [esp + 4 + 16]  ; data
    mov  eax, [esp + 8 + 16]  ; qp
    cdq
    mov  ebp, [esp + 12 + 16] ; is_intra
    mov  ebx, 6

    idiv ebx
    add  eax, 15         ; qbits(eax) = 15 + qp / 6, mf_index(edx) = qp % 6
    mov  esi, edx
    shl  esi, 5          ; 32 bytes (16 words) per table row
    add  esi, quant      ; esi = &quant[mf_index]
    mov  ecx, eax        ; ecx = qbits

    neg  ebp             ; CF = (is_intra != 0)
    sbb  ebp, ebp        ; ebp = is_intra ? -1 : 0
    and  ebp, 0xfffffffd ; ebp = is_intra ? -3 : 0
    add  ebp, 6          ; ebp = is_intra ? 3 : 6

    mov  eax, 1
    shl  eax, cl         ; 1 << qbits
    cdq
    idiv ebp             ; eax = f = (1 << qbits) / (is_intra ? 3 : 6)

    ; eax = f, ecx = qbits, esi = quant[mf_index], edi = data

    movd      xmm6, eax
    movd      xmm7, ecx               ; shift count = qbits
    pshufd    xmm6, xmm6, 0           ; f broadcast to all four dwords

    quant_8coef 0                     ; coefficients 0..7
    quant_8coef 16                    ; coefficients 8..15

    pop ebp
    pop edi
    pop esi
    pop ebx
    ret

;======================================================
;
; void
; iquant4x4_sse2(int16_t* data, const int32_t Qp)
;
; In-place dequantisation of the 16 int16 coefficients at
; data:
;     qbits = Qp / 6
;     mf    = row (Qp % 6) of dequant, 32 bytes (16 words) per row
;     data[i] = (data[i] * mf[i]) << qbits   (low 16 bits kept)
;
; In:    [esp + 4] = data, [esp + 8] = Qp; the caller cleans
;        the stack (plain ret).
;        data and the dequant rows are used as aligned SSE2
;        memory operands and must be 16-byte aligned.
; Clobb: eax, ecx, edx, xmm0, xmm2, xmm7.
;
;======================================================

align 16

cglobal iquant4x4_sse2
iquant4x4_sse2:

    mov  eax, [esp + 8]  ; qp
    cdq
    mov  ecx, 6

    idiv ecx             ; qbits(eax) = qp / 6, mf_index(edx) = qp % 6
    mov  ecx, edx
    shl  ecx, 5          ; 32 bytes (16 words) per table row
    add  ecx, dequant    ; ecx = &dequant[mf_index]
    mov  edx, [esp + 4]  ; data

    ; eax = qbits, ecx = dequant[mf_index], edx = data

    movd    xmm7, eax           ; shift count = qbits

    movdqa  xmm0, [edx + 0]
    movdqa  xmm2, [edx + 16]

    pmullw  xmm0, [ecx + 0]     ; data * dequant (low 16 bits)
    pmullw  xmm2, [ecx + 16]

    ; Shifting left by qbits gives the same low 16 bits as multiplying by
    ; (1 << qbits); both forms yield 0 once the count exceeds 15.
    psllw   xmm0, xmm7
    psllw   xmm2, xmm7

    movdqa  [edx + 0], xmm0
    movdqa  [edx + 16], xmm2

    ret

?? 快捷鍵說明

復制代碼 Ctrl + C
搜索代碼 Ctrl + F
全屏模式 F11
切換主題 Ctrl + Shift + D
顯示快捷鍵 ?
增大字號 Ctrl + =
減小字號 Ctrl + -
亚洲欧美第一页_禁久久精品乱码_粉嫩av一区二区三区免费野_久草精品视频
日韩欧美国产不卡| 日韩欧美中文一区二区| 青草国产精品久久久久久| 欧美国产欧美亚州国产日韩mv天天看完整| 色婷婷综合在线| 国产在线看一区| 午夜精品久久久久影视| 中文字幕中文乱码欧美一区二区 | 欧美综合在线视频| 国产成人一区在线| 激情六月婷婷久久| 日产精品久久久久久久性色| 亚洲精品久久久久久国产精华液| 久久婷婷色综合| 日韩午夜在线影院| 欧美精品 国产精品| 91亚洲精品乱码久久久久久蜜桃| 国产精华液一区二区三区| 青青草伊人久久| 天天操天天干天天综合网| 国产精品久久久久久久久动漫| 久久久亚洲综合| 欧美xxxxxxxx| 精品日本一线二线三线不卡| 欧美二区三区91| 欧美电影一区二区三区| 欧美日韩一区久久| 欧美性猛片aaaaaaa做受| 一本色道久久综合狠狠躁的推荐| 成人免费不卡视频| 成人深夜视频在线观看| 大胆欧美人体老妇| 国产成人av网站| 国产成人综合在线播放| 国产乱子伦视频一区二区三区| 久久99精品国产| 国产乱一区二区| 丁香婷婷综合五月| 不卡视频在线看| 色婷婷综合久久久久中文一区二区 | 日韩欧美电影在线| 日韩小视频在线观看专区| 欧美一级精品大片| 26uuu亚洲综合色欧美 | 国产精品久久久久aaaa| 国产精品国产三级国产aⅴ中文| 国产欧美日产一区| 中文字幕中文乱码欧美一区二区 | 久久综合色综合88| 久久综合九色综合欧美亚洲| 国产亚洲欧美色| 国产精品久久久久久一区二区三区| 亚洲天天做日日做天天谢日日欢| 亚洲欧美国产高清| 日韩精品一二三四| 激情另类小说区图片区视频区| 国产精品18久久久久| av综合在线播放| 欧美日韩在线综合| 日韩精品综合一本久道在线视频| 久久久精品综合| 中文字幕一区av| 亚洲国产精品一区二区www | 91黄色免费版| 在线成人小视频| 久久久91精品国产一区二区精品| 中文一区二区完整视频在线观看 | 亚洲男人天堂av| 亚洲专区一二三| 蜜桃精品在线观看| 豆国产96在线|亚洲| 色综合天天综合狠狠| 91精品国产麻豆| 国产欧美在线观看一区| 亚洲综合丁香婷婷六月香| 精品一区二区影视| 99r精品视频| 欧美一级精品在线| 国产精品视频一二| 免费在线一区观看| 97久久精品人人做人人爽| 日韩午夜在线观看视频| 日韩一区在线看| 蜜臀av一区二区在线观看| 不卡av电影在线播放| 这里是久久伊人| 亚洲少妇中出一区| 黄页视频在线91| 欧美日韩一本到| 中文字幕精品三区| 蜜臀99久久精品久久久久久软件| 99久久精品免费看国产| 日韩欧美一区二区三区在线| 亚洲视频综合在线| 国产在线视频精品一区| 欧美日韩国产综合一区二区三区| 国产日韩欧美精品一区| 日本va欧美va精品| 日本精品一区二区三区高清| 国产午夜精品久久| 久久国内精品自在自线400部| 91麻豆国产福利在线观看| 久久久噜噜噜久噜久久综合| 午夜精品久久久久久久久| gogogo免费视频观看亚洲一| 亚洲精品在线观看网站| 亚洲不卡一区二区三区| www.色精品| 久久精品欧美日韩精品| 日韩电影免费在线观看网站| 色成年激情久久综合| 国产精品美女久久福利网站| 国产在线精品视频| 日韩视频永久免费| 日韩福利电影在线| 欧美群妇大交群中文字幕| 一区二区三区在线播| 91无套直看片红桃| 成人免费在线视频| 成人免费看黄yyy456| 久久九九久久九九| 国产一区欧美日韩| 欧美精品粉嫩高潮一区二区| 亚洲与欧洲av电影| 在线观看不卡一区| 亚洲综合免费观看高清完整版在线 | 91在线看国产| 国产精品三级av| 成人激情av网| 中文字幕在线一区免费| 粉嫩绯色av一区二区在线观看 | 欧美三级一区二区| 亚洲最大成人网4388xx| 91久久一区二区| 亚洲愉拍自拍另类高清精品| 欧美性受xxxx黑人xyx性爽| 一区二区三区在线视频观看58 | 在线中文字幕一区二区| 亚洲精品少妇30p| 欧美在线观看视频在线| 亚洲国产一区视频| 91精品国产乱| 国产一区二区按摩在线观看| 国产精品水嫩水嫩| 色天使久久综合网天天| 国产精品国产三级国产专播品爱网 | 欧美探花视频资源| 日韩福利电影在线| 欧美一区二区精品在线| 狠狠色丁香久久婷婷综合_中| 欧美xxxxxxxxx| av中文字幕在线不卡| 成人在线视频一区二区| 国产精品丝袜一区| 91在线视频网址| 亚洲18影院在线观看| 日韩美女一区二区三区| 国产精品99久久久久久似苏梦涵| 国产精品日韩成人| 91福利社在线观看| 蜜臀99久久精品久久久久久软件| 久久精品欧美日韩| 在线观看免费亚洲| 国内精品久久久久影院一蜜桃| 
中文字幕一区免费在线观看| 欧美日韩一区高清| 国产精品一级黄| 一区二区在线观看av| 5月丁香婷婷综合| 国产91丝袜在线18| 亚洲视频一区在线| 欧美va在线播放| 色哟哟一区二区在线观看| 蜜臀av性久久久久av蜜臀妖精| 国产精品三级视频| 欧美一区二区三区思思人| 国产经典欧美精品| 亚洲一二三四区不卡| 久久影音资源网| 91精品福利在线| 国产精选一区二区三区| 亚洲www啪成人一区二区麻豆| 国产欧美日韩在线| 欧美日韩成人在线一区| 高清在线成人网| 日韩精品福利网| 中文字幕一区二区不卡| 欧美成人在线直播| 欧美午夜一区二区| 成人福利在线看| 极品美女销魂一区二区三区免费 | 日本美女一区二区三区| 欧美国产日韩一二三区| 在线91免费看| 91蜜桃视频在线| 国产成人三级在线观看| 日韩不卡一二三区| 一区二区三区在线观看国产| 亚洲国产精品精华液2区45| 欧美一级黄色大片|