mirror of
https://codeberg.org/forgejo/forgejo.git
synced 2024-11-24 08:57:03 -05:00
154 lines
2.3 KiB
ArmAsm
154 lines
2.3 KiB
ArmAsm
|
// Copyright 2012 The Go Authors. All rights reserved.
|
||
|
// Use of this source code is governed by a BSD-style
|
||
|
// license that can be found in the LICENSE file.
|
||
|
|
||
|
// This code was translated into a form compatible with 6a from the public
|
||
|
// domain sources in SUPERCOP: http://bench.cr.yp.to/supercop.html
|
||
|
|
||
|
// +build amd64,!gccgo,!appengine
|
||
|
|
||
|
// func square(out, in *[5]uint64)
|
||
|
TEXT ·square(SB),7,$96-16
|
||
|
MOVQ out+0(FP), DI
|
||
|
MOVQ in+8(FP), SI
|
||
|
|
||
|
MOVQ SP,R11
|
||
|
MOVQ $31,CX
|
||
|
NOTQ CX
|
||
|
ANDQ CX,SP
|
||
|
ADDQ $32, SP
|
||
|
|
||
|
MOVQ R11,0(SP)
|
||
|
MOVQ R12,8(SP)
|
||
|
MOVQ R13,16(SP)
|
||
|
MOVQ R14,24(SP)
|
||
|
MOVQ R15,32(SP)
|
||
|
MOVQ BX,40(SP)
|
||
|
MOVQ BP,48(SP)
|
||
|
MOVQ 0(SI),AX
|
||
|
MULQ 0(SI)
|
||
|
MOVQ AX,CX
|
||
|
MOVQ DX,R8
|
||
|
MOVQ 0(SI),AX
|
||
|
SHLQ $1,AX
|
||
|
MULQ 8(SI)
|
||
|
MOVQ AX,R9
|
||
|
MOVQ DX,R10
|
||
|
MOVQ 0(SI),AX
|
||
|
SHLQ $1,AX
|
||
|
MULQ 16(SI)
|
||
|
MOVQ AX,R11
|
||
|
MOVQ DX,R12
|
||
|
MOVQ 0(SI),AX
|
||
|
SHLQ $1,AX
|
||
|
MULQ 24(SI)
|
||
|
MOVQ AX,R13
|
||
|
MOVQ DX,R14
|
||
|
MOVQ 0(SI),AX
|
||
|
SHLQ $1,AX
|
||
|
MULQ 32(SI)
|
||
|
MOVQ AX,R15
|
||
|
MOVQ DX,BX
|
||
|
MOVQ 8(SI),AX
|
||
|
MULQ 8(SI)
|
||
|
ADDQ AX,R11
|
||
|
ADCQ DX,R12
|
||
|
MOVQ 8(SI),AX
|
||
|
SHLQ $1,AX
|
||
|
MULQ 16(SI)
|
||
|
ADDQ AX,R13
|
||
|
ADCQ DX,R14
|
||
|
MOVQ 8(SI),AX
|
||
|
SHLQ $1,AX
|
||
|
MULQ 24(SI)
|
||
|
ADDQ AX,R15
|
||
|
ADCQ DX,BX
|
||
|
MOVQ 8(SI),DX
|
||
|
IMUL3Q $38,DX,AX
|
||
|
MULQ 32(SI)
|
||
|
ADDQ AX,CX
|
||
|
ADCQ DX,R8
|
||
|
MOVQ 16(SI),AX
|
||
|
MULQ 16(SI)
|
||
|
ADDQ AX,R15
|
||
|
ADCQ DX,BX
|
||
|
MOVQ 16(SI),DX
|
||
|
IMUL3Q $38,DX,AX
|
||
|
MULQ 24(SI)
|
||
|
ADDQ AX,CX
|
||
|
ADCQ DX,R8
|
||
|
MOVQ 16(SI),DX
|
||
|
IMUL3Q $38,DX,AX
|
||
|
MULQ 32(SI)
|
||
|
ADDQ AX,R9
|
||
|
ADCQ DX,R10
|
||
|
MOVQ 24(SI),DX
|
||
|
IMUL3Q $19,DX,AX
|
||
|
MULQ 24(SI)
|
||
|
ADDQ AX,R9
|
||
|
ADCQ DX,R10
|
||
|
MOVQ 24(SI),DX
|
||
|
IMUL3Q $38,DX,AX
|
||
|
MULQ 32(SI)
|
||
|
ADDQ AX,R11
|
||
|
ADCQ DX,R12
|
||
|
MOVQ 32(SI),DX
|
||
|
IMUL3Q $19,DX,AX
|
||
|
MULQ 32(SI)
|
||
|
ADDQ AX,R13
|
||
|
ADCQ DX,R14
|
||
|
MOVQ ·REDMASK51(SB),SI
|
||
|
SHLQ $13,R8:CX
|
||
|
ANDQ SI,CX
|
||
|
SHLQ $13,R10:R9
|
||
|
ANDQ SI,R9
|
||
|
ADDQ R8,R9
|
||
|
SHLQ $13,R12:R11
|
||
|
ANDQ SI,R11
|
||
|
ADDQ R10,R11
|
||
|
SHLQ $13,R14:R13
|
||
|
ANDQ SI,R13
|
||
|
ADDQ R12,R13
|
||
|
SHLQ $13,BX:R15
|
||
|
ANDQ SI,R15
|
||
|
ADDQ R14,R15
|
||
|
IMUL3Q $19,BX,DX
|
||
|
ADDQ DX,CX
|
||
|
MOVQ CX,DX
|
||
|
SHRQ $51,DX
|
||
|
ADDQ R9,DX
|
||
|
ANDQ SI,CX
|
||
|
MOVQ DX,R8
|
||
|
SHRQ $51,DX
|
||
|
ADDQ R11,DX
|
||
|
ANDQ SI,R8
|
||
|
MOVQ DX,R9
|
||
|
SHRQ $51,DX
|
||
|
ADDQ R13,DX
|
||
|
ANDQ SI,R9
|
||
|
MOVQ DX,AX
|
||
|
SHRQ $51,DX
|
||
|
ADDQ R15,DX
|
||
|
ANDQ SI,AX
|
||
|
MOVQ DX,R10
|
||
|
SHRQ $51,DX
|
||
|
IMUL3Q $19,DX,DX
|
||
|
ADDQ DX,CX
|
||
|
ANDQ SI,R10
|
||
|
MOVQ CX,0(DI)
|
||
|
MOVQ R8,8(DI)
|
||
|
MOVQ R9,16(DI)
|
||
|
MOVQ AX,24(DI)
|
||
|
MOVQ R10,32(DI)
|
||
|
MOVQ 0(SP),R11
|
||
|
MOVQ 8(SP),R12
|
||
|
MOVQ 16(SP),R13
|
||
|
MOVQ 24(SP),R14
|
||
|
MOVQ 32(SP),R15
|
||
|
MOVQ 40(SP),BX
|
||
|
MOVQ 48(SP),BP
|
||
|
MOVQ R11,SP
|
||
|
MOVQ DI,AX
|
||
|
MOVQ SI,DX
|
||
|
RET
|