133 lines
		
	
	
		
			2.0 KiB
		
	
	
	
		
			ArmAsm
		
	
	
	
	
	
		
		
			
		
	
	
			133 lines
		
	
	
		
			2.0 KiB
		
	
	
	
		
			ArmAsm
		
	
	
	
	
	
| 
								 | 
							
								// Copyright 2012 The Go Authors. All rights reserved.
							 | 
						||
| 
								 | 
							
								// Use of this source code is governed by a BSD-style
							 | 
						||
| 
								 | 
							
								// license that can be found in the LICENSE file.
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								// This code was translated into a form compatible with 6a from the public
							 | 
						||
| 
								 | 
							
								// domain sources in SUPERCOP: http://bench.cr.yp.to/supercop.html
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								// +build amd64,!gccgo,!appengine
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								#include "const_amd64.h"
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
								// func square(out, in *[5]uint64)
							 | 
						||
| 
								 | 
							
								TEXT ·square(SB),7,$0-16
							 | 
						||
| 
								 | 
							
									MOVQ out+0(FP), DI
							 | 
						||
| 
								 | 
							
									MOVQ in+8(FP), SI
							 | 
						||
| 
								 | 
							
								
							 | 
						||
| 
								 | 
							
									MOVQ 0(SI),AX
							 | 
						||
| 
								 | 
							
									MULQ 0(SI)
							 | 
						||
| 
								 | 
							
									MOVQ AX,CX
							 | 
						||
| 
								 | 
							
									MOVQ DX,R8
							 | 
						||
| 
								 | 
							
									MOVQ 0(SI),AX
							 | 
						||
| 
								 | 
							
									SHLQ $1,AX
							 | 
						||
| 
								 | 
							
									MULQ 8(SI)
							 | 
						||
| 
								 | 
							
									MOVQ AX,R9
							 | 
						||
| 
								 | 
							
									MOVQ DX,R10
							 | 
						||
| 
								 | 
							
									MOVQ 0(SI),AX
							 | 
						||
| 
								 | 
							
									SHLQ $1,AX
							 | 
						||
| 
								 | 
							
									MULQ 16(SI)
							 | 
						||
| 
								 | 
							
									MOVQ AX,R11
							 | 
						||
| 
								 | 
							
									MOVQ DX,R12
							 | 
						||
| 
								 | 
							
									MOVQ 0(SI),AX
							 | 
						||
| 
								 | 
							
									SHLQ $1,AX
							 | 
						||
| 
								 | 
							
									MULQ 24(SI)
							 | 
						||
| 
								 | 
							
									MOVQ AX,R13
							 | 
						||
| 
								 | 
							
									MOVQ DX,R14
							 | 
						||
| 
								 | 
							
									MOVQ 0(SI),AX
							 | 
						||
| 
								 | 
							
									SHLQ $1,AX
							 | 
						||
| 
								 | 
							
									MULQ 32(SI)
							 | 
						||
| 
								 | 
							
									MOVQ AX,R15
							 | 
						||
| 
								 | 
							
									MOVQ DX,BX
							 | 
						||
| 
								 | 
							
									MOVQ 8(SI),AX
							 | 
						||
| 
								 | 
							
									MULQ 8(SI)
							 | 
						||
| 
								 | 
							
									ADDQ AX,R11
							 | 
						||
| 
								 | 
							
									ADCQ DX,R12
							 | 
						||
| 
								 | 
							
									MOVQ 8(SI),AX
							 | 
						||
| 
								 | 
							
									SHLQ $1,AX
							 | 
						||
| 
								 | 
							
									MULQ 16(SI)
							 | 
						||
| 
								 | 
							
									ADDQ AX,R13
							 | 
						||
| 
								 | 
							
									ADCQ DX,R14
							 | 
						||
| 
								 | 
							
									MOVQ 8(SI),AX
							 | 
						||
| 
								 | 
							
									SHLQ $1,AX
							 | 
						||
| 
								 | 
							
									MULQ 24(SI)
							 | 
						||
| 
								 | 
							
									ADDQ AX,R15
							 | 
						||
| 
								 | 
							
									ADCQ DX,BX
							 | 
						||
| 
								 | 
							
									MOVQ 8(SI),DX
							 | 
						||
| 
								 | 
							
									IMUL3Q $38,DX,AX
							 | 
						||
| 
								 | 
							
									MULQ 32(SI)
							 | 
						||
| 
								 | 
							
									ADDQ AX,CX
							 | 
						||
| 
								 | 
							
									ADCQ DX,R8
							 | 
						||
| 
								 | 
							
									MOVQ 16(SI),AX
							 | 
						||
| 
								 | 
							
									MULQ 16(SI)
							 | 
						||
| 
								 | 
							
									ADDQ AX,R15
							 | 
						||
| 
								 | 
							
									ADCQ DX,BX
							 | 
						||
| 
								 | 
							
									MOVQ 16(SI),DX
							 | 
						||
| 
								 | 
							
									IMUL3Q $38,DX,AX
							 | 
						||
| 
								 | 
							
									MULQ 24(SI)
							 | 
						||
| 
								 | 
							
									ADDQ AX,CX
							 | 
						||
| 
								 | 
							
									ADCQ DX,R8
							 | 
						||
| 
								 | 
							
									MOVQ 16(SI),DX
							 | 
						||
| 
								 | 
							
									IMUL3Q $38,DX,AX
							 | 
						||
| 
								 | 
							
									MULQ 32(SI)
							 | 
						||
| 
								 | 
							
									ADDQ AX,R9
							 | 
						||
| 
								 | 
							
									ADCQ DX,R10
							 | 
						||
| 
								 | 
							
									MOVQ 24(SI),DX
							 | 
						||
| 
								 | 
							
									IMUL3Q $19,DX,AX
							 | 
						||
| 
								 | 
							
									MULQ 24(SI)
							 | 
						||
| 
								 | 
							
									ADDQ AX,R9
							 | 
						||
| 
								 | 
							
									ADCQ DX,R10
							 | 
						||
| 
								 | 
							
									MOVQ 24(SI),DX
							 | 
						||
| 
								 | 
							
									IMUL3Q $38,DX,AX
							 | 
						||
| 
								 | 
							
									MULQ 32(SI)
							 | 
						||
| 
								 | 
							
									ADDQ AX,R11
							 | 
						||
| 
								 | 
							
									ADCQ DX,R12
							 | 
						||
| 
								 | 
							
									MOVQ 32(SI),DX
							 | 
						||
| 
								 | 
							
									IMUL3Q $19,DX,AX
							 | 
						||
| 
								 | 
							
									MULQ 32(SI)
							 | 
						||
| 
								 | 
							
									ADDQ AX,R13
							 | 
						||
| 
								 | 
							
									ADCQ DX,R14
							 | 
						||
| 
								 | 
							
									MOVQ $REDMASK51,SI
							 | 
						||
| 
								 | 
							
									SHLQ $13,R8:CX
							 | 
						||
| 
								 | 
							
									ANDQ SI,CX
							 | 
						||
| 
								 | 
							
									SHLQ $13,R10:R9
							 | 
						||
| 
								 | 
							
									ANDQ SI,R9
							 | 
						||
| 
								 | 
							
									ADDQ R8,R9
							 | 
						||
| 
								 | 
							
									SHLQ $13,R12:R11
							 | 
						||
| 
								 | 
							
									ANDQ SI,R11
							 | 
						||
| 
								 | 
							
									ADDQ R10,R11
							 | 
						||
| 
								 | 
							
									SHLQ $13,R14:R13
							 | 
						||
| 
								 | 
							
									ANDQ SI,R13
							 | 
						||
| 
								 | 
							
									ADDQ R12,R13
							 | 
						||
| 
								 | 
							
									SHLQ $13,BX:R15
							 | 
						||
| 
								 | 
							
									ANDQ SI,R15
							 | 
						||
| 
								 | 
							
									ADDQ R14,R15
							 | 
						||
| 
								 | 
							
									IMUL3Q $19,BX,DX
							 | 
						||
| 
								 | 
							
									ADDQ DX,CX
							 | 
						||
| 
								 | 
							
									MOVQ CX,DX
							 | 
						||
| 
								 | 
							
									SHRQ $51,DX
							 | 
						||
| 
								 | 
							
									ADDQ R9,DX
							 | 
						||
| 
								 | 
							
									ANDQ SI,CX
							 | 
						||
| 
								 | 
							
									MOVQ DX,R8
							 | 
						||
| 
								 | 
							
									SHRQ $51,DX
							 | 
						||
| 
								 | 
							
									ADDQ R11,DX
							 | 
						||
| 
								 | 
							
									ANDQ SI,R8
							 | 
						||
| 
								 | 
							
									MOVQ DX,R9
							 | 
						||
| 
								 | 
							
									SHRQ $51,DX
							 | 
						||
| 
								 | 
							
									ADDQ R13,DX
							 | 
						||
| 
								 | 
							
									ANDQ SI,R9
							 | 
						||
| 
								 | 
							
									MOVQ DX,AX
							 | 
						||
| 
								 | 
							
									SHRQ $51,DX
							 | 
						||
| 
								 | 
							
									ADDQ R15,DX
							 | 
						||
| 
								 | 
							
									ANDQ SI,AX
							 | 
						||
| 
								 | 
							
									MOVQ DX,R10
							 | 
						||
| 
								 | 
							
									SHRQ $51,DX
							 | 
						||
| 
								 | 
							
									IMUL3Q $19,DX,DX
							 | 
						||
| 
								 | 
							
									ADDQ DX,CX
							 | 
						||
| 
								 | 
							
									ANDQ SI,R10
							 | 
						||
| 
								 | 
							
									MOVQ CX,0(DI)
							 | 
						||
| 
								 | 
							
									MOVQ R8,8(DI)
							 | 
						||
| 
								 | 
							
									MOVQ R9,16(DI)
							 | 
						||
| 
								 | 
							
									MOVQ AX,24(DI)
							 | 
						||
| 
								 | 
							
									MOVQ R10,32(DI)
							 | 
						||
| 
								 | 
							
									RET
							 |