diff options
| author | marha <marha@users.sourceforge.net> | 2010-03-30 12:36:28 +0000 | 
|---|---|---|
| committer | marha <marha@users.sourceforge.net> | 2010-03-30 12:36:28 +0000 | 
| commit | ff48c0d9098080b51ea12710029135916d117806 (patch) | |
| tree | 96e6af9caf170ba21a1027b24e306a07e27d7b75 /openssl/crypto/md5 | |
| parent | bb731f5ac92655c4860a41fa818a7a63005f8369 (diff) | |
| download | vcxsrv-ff48c0d9098080b51ea12710029135916d117806.tar.gz vcxsrv-ff48c0d9098080b51ea12710029135916d117806.tar.bz2 vcxsrv-ff48c0d9098080b51ea12710029135916d117806.zip | |
svn merge -r514:HEAD ^/branches/released .
Diffstat (limited to 'openssl/crypto/md5')
| -rw-r--r-- | openssl/crypto/md5/Makefile | 30 | ||||
| -rw-r--r-- | openssl/crypto/md5/asm/md5-586.pl | 3 | ||||
| -rw-r--r-- | openssl/crypto/md5/asm/md5-ia64.S | 992 | ||||
| -rw-r--r-- | openssl/crypto/md5/asm/md5-x86_64.pl | 156 | ||||
| -rw-r--r-- | openssl/crypto/md5/md5.h | 5 | ||||
| -rw-r--r-- | openssl/crypto/md5/md5_dgst.c | 11 | ||||
| -rw-r--r-- | openssl/crypto/md5/md5_locl.h | 2 | 
7 files changed, 1151 insertions, 48 deletions
| diff --git a/openssl/crypto/md5/Makefile b/openssl/crypto/md5/Makefile index 3c450fcfc..9858d53d3 100644 --- a/openssl/crypto/md5/Makefile +++ b/openssl/crypto/md5/Makefile @@ -38,21 +38,19 @@ top:  all:    lib  lib:    $(LIBOBJ) -	$(ARX) $(LIB) $(LIBOBJ) +	$(AR) $(LIB) $(LIBOBJ)  	$(RANLIB) $(LIB) || echo Never mind.  	@touch lib -# ELF -mx86-elf.s: asm/md5-586.pl ../perlasm/x86asm.pl -	(cd asm; $(PERL) md5-586.pl elf $(CFLAGS) > ../$@) -# COFF -mx86-cof.s: asm/md5-586.pl ../perlasm/x86asm.pl -	(cd asm; $(PERL) md5-586.pl coff $(CFLAGS) > ../$@) -# a.out -mx86-out.s: asm/md5-586.pl ../perlasm/x86asm.pl -	(cd asm; $(PERL) md5-586.pl a.out $(CFLAGS) > ../$@) +md5-586.s:	asm/md5-586.pl ../perlasm/x86asm.pl +	$(PERL) asm/md5-586.pl $(PERLASM_SCHEME) $(CFLAGS) > $@ -md5-x86_64.s:	asm/md5-x86_64.pl;	$(PERL) asm/md5-x86_64.pl $@ +md5-x86_64.s:	asm/md5-x86_64.pl +	$(PERL) asm/md5-x86_64.pl $(PERLASM_SCHEME) > $@ + +md5-ia64.s: asm/md5-ia64.S +	$(CC) $(CFLAGS) -E asm/md5-ia64.S | \ +	$(PERL) -ne 's/;\s+/;\n/g; print;' > $@  files:  	$(PERL) $(TOP)/util/files.pl Makefile >> $(TOP)/MINFO @@ -91,13 +89,9 @@ clean:  # DO NOT DELETE THIS LINE -- make depend depends on it. -md5_dgst.o: ../../include/openssl/bio.h ../../include/openssl/crypto.h -md5_dgst.o: ../../include/openssl/e_os2.h ../../include/openssl/err.h -md5_dgst.o: ../../include/openssl/fips.h ../../include/openssl/lhash.h -md5_dgst.o: ../../include/openssl/md5.h ../../include/openssl/opensslconf.h -md5_dgst.o: ../../include/openssl/opensslv.h ../../include/openssl/ossl_typ.h -md5_dgst.o: ../../include/openssl/safestack.h ../../include/openssl/stack.h -md5_dgst.o: ../../include/openssl/symhacks.h ../md32_common.h md5_dgst.c +md5_dgst.o: ../../include/openssl/e_os2.h ../../include/openssl/md5.h +md5_dgst.o: ../../include/openssl/opensslconf.h +md5_dgst.o: ../../include/openssl/opensslv.h ../md32_common.h md5_dgst.c  md5_dgst.o: md5_locl.h  md5_one.o: ../../include/openssl/crypto.h ../../include/openssl/e_os2.h  md5_one.o: ../../include/openssl/md5.h ../../include/openssl/opensslconf.h diff --git a/openssl/crypto/md5/asm/md5-586.pl b/openssl/crypto/md5/asm/md5-586.pl index 76ac235f7..6cb66bb49 100644 --- a/openssl/crypto/md5/asm/md5-586.pl +++ b/openssl/crypto/md5/asm/md5-586.pl @@ -7,7 +7,8 @@  $normal=0; -push(@INC,"perlasm","../../perlasm"); +$0 =~ m/(.*[\/\\])[^\/\\]+$/; $dir=$1; +push(@INC,"${dir}","${dir}../../perlasm");  require "x86asm.pl";  &asm_init($ARGV[0],$0); diff --git a/openssl/crypto/md5/asm/md5-ia64.S b/openssl/crypto/md5/asm/md5-ia64.S new file mode 100644 index 000000000..2f9818aec --- /dev/null +++ b/openssl/crypto/md5/asm/md5-ia64.S @@ -0,0 +1,992 @@ +/* Copyright (c) 2005 Hewlett-Packard Development Company, L.P. + +Permission is hereby granted, free of charge, to any person obtaining +a copy of this software and associated documentation files (the +"Software"), to deal in the Software without restriction, including +without limitation the rights to use, copy, modify, merge, publish, +distribute, sublicense, and/or sell copies of the Software, and to +permit persons to whom the Software is furnished to do so, subject to +the following conditions: + +The above copyright notice and this permission notice shall be +included in all copies or substantial portions of the Software. + +THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, +EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF +MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND +NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE +LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION +OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION +WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.  */ + +//	Common registers are assigned as follows: +// +//	COMMON +// +//	t0		Const Tbl Ptr	TPtr +//	t1		Round Constant	TRound +//	t4		Block residual	LenResid +//	t5		Residual Data	DTmp +// +//	{in,out}0	Block 0 Cycle	RotateM0 +//	{in,out}1	Block Value 12	M12 +//	{in,out}2	Block Value 8	M8 +//	{in,out}3	Block Value 4	M4 +//	{in,out}4	Block Value 0	M0 +//	{in,out}5	Block 1 Cycle	RotateM1 +//	{in,out}6	Block Value 13	M13 +//	{in,out}7	Block Value 9	M9 +//	{in,out}8	Block Value 5	M5 +//	{in,out}9	Block Value 1	M1 +//	{in,out}10	Block 2 Cycle	RotateM2 +//	{in,out}11	Block Value 14	M14 +//	{in,out}12	Block Value 10	M10 +//	{in,out}13	Block Value 6	M6 +//	{in,out}14	Block Value 2	M2 +//	{in,out}15	Block 3 Cycle	RotateM3 +//	{in,out}16	Block Value 15	M15 +//	{in,out}17	Block Value 11	M11 +//	{in,out}18	Block Value 7	M7 +//	{in,out}19	Block Value 3	M3 +//	{in,out}20	Scratch			Z +//	{in,out}21	Scratch			Y +//	{in,out}22	Scratch			X +//	{in,out}23	Scratch			W +//	{in,out}24	Digest A		A +//	{in,out}25	Digest B		B +//	{in,out}26	Digest C		C +//	{in,out}27	Digest D		D +//	{in,out}28	Active Data Ptr	DPtr +//	in28		Dummy Value		- +//	out28		Dummy Value		- +//	bt0			Coroutine Link	QUICK_RTN +// +///	These predicates are used for computing the padding block(s) and +///	are shared between the driver and digest co-routines +// +//	pt0			Extra Pad Block	pExtra +//	pt1			Load next word	pLoad +//	pt2			Skip next word	pSkip +//	pt3			Search for Pad	pNoPad +//	pt4			Pad Word 0		pPad0 +//	pt5			Pad Word 1		pPad1 +//	pt6			Pad Word 2		pPad2 +//	pt7			Pad Word 3		pPad3 + +#define	DTmp		r19 +#define	LenResid	r18 +#define	QUICK_RTN	b6 +#define	TPtr		r14 +#define	TRound		r15 +#define	pExtra		p6 +#define	pLoad		p7 +#define	pNoPad		p9 +#define	pPad0		p10 +#define	pPad1		p11 +#define	pPad2		p12 +#define	pPad3		p13 +#define	pSkip		p8 + +#define	A_		out24 +#define	B_		out25 +#define	C_		out26 +#define	D_		out27 +#define	DPtr_		out28 +#define	M0_		out4 +#define	M1_		out9 +#define	M10_		out12 +#define	M11_		out17 +#define	M12_		out1 +#define	M13_		out6 +#define	M14_		out11 +#define	M15_		out16 +#define	M2_		out14 +#define	M3_		out19 +#define	M4_		out3 +#define	M5_		out8 +#define	M6_		out13 +#define	M7_		out18 +#define	M8_		out2 +#define	M9_		out7 +#define	RotateM0_	out0 +#define	RotateM1_	out5 +#define	RotateM2_	out10 +#define	RotateM3_	out15 +#define	W_		out23 +#define	X_		out22 +#define	Y_		out21 +#define	Z_		out20 + +#define	A		in24 +#define	B		in25 +#define	C		in26 +#define	D		in27 +#define	DPtr		in28 +#define	M0		in4 +#define	M1		in9 +#define	M10		in12 +#define	M11		in17 +#define	M12		in1 +#define	M13		in6 +#define	M14		in11 +#define	M15		in16 +#define	M2		in14 +#define	M3		in19 +#define	M4		in3 +#define	M5		in8 +#define	M6		in13 +#define	M7		in18 +#define	M8		in2 +#define	M9		in7 +#define	RotateM0	in0 +#define	RotateM1	in5 +#define	RotateM2	in10 +#define	RotateM3	in15 +#define	W		in23 +#define	X		in22 +#define	Y		in21 +#define	Z		in20 + +/* register stack configuration for md5_block_asm_data_order(): */ +#define	MD5_NINP	3 +#define	MD5_NLOC	0 +#define MD5_NOUT	29 +#define MD5_NROT	0 + +/* register stack configuration for helpers: */ +#define	_NINPUTS	MD5_NOUT +#define	_NLOCALS	0 +#define _NOUTPUT	0 +#define	_NROTATE	24	/* this must be <= _NINPUTS */ + +#if defined(_HPUX_SOURCE) && !defined(_LP64) +#define	ADDP	addp4 +#else +#define	ADDP	add +#endif + +#if defined(_HPUX_SOURCE) || defined(B_ENDIAN) +#define HOST_IS_BIG_ENDIAN +#endif + +//	Macros for getting the left and right portions of little-endian words + +#define	GETLW(dst, src, align)	dep.z dst = src, 32 - 8 * align, 8 * align +#define	GETRW(dst, src, align)	extr.u dst = src, 8 * align, 32 - 8 * align + +//	MD5 driver +// +//		Reads an input block, then calls the digest block +//		subroutine and adds the results to the accumulated +//		digest.  It allocates 32 outs which the subroutine +//		uses as it's inputs and rotating +//		registers. Initializes the round constant pointer and +//		takes care of saving/restoring ar.lc +// +///	INPUT +// +//	in0		Context Ptr		CtxPtr0 +//	in1		Input Data Ptr		DPtrIn +//	in2		Integral Blocks		BlockCount +//	rp		Return Address		- +// +///	CODE +// +//	v2		Input Align		InAlign +//	t0		Shared w/digest		- +//	t1		Shared w/digest		- +//	t2		Shared w/digest		- +//	t3		Shared w/digest		- +//	t4		Shared w/digest		- +//	t5		Shared w/digest		- +//	t6		PFS Save		PFSSave +//	t7		ar.lc Save		LCSave +//	t8		Saved PR		PRSave +//	t9		2nd CtxPtr		CtxPtr1 +//	t10		Table Base		CTable +//	t11		Table[0]		CTable0 +//	t13		Accumulator A		AccumA +//	t14		Accumulator B		AccumB +//	t15		Accumulator C		AccumC +//	t16		Accumulator D		AccumD +//	pt0		Shared w/digest		- +//	pt1		Shared w/digest		- +//	pt2		Shared w/digest		- +//	pt3		Shared w/digest		- +//	pt4		Shared w/digest		- +//	pt5		Shared w/digest		- +//	pt6		Shared w/digest		- +//	pt7		Shared w/digest		- +//	pt8		Not Aligned		pOff +//	pt8		Blocks Left		pAgain + +#define	AccumA		r27 +#define	AccumB		r28 +#define	AccumC		r29 +#define	AccumD		r30 +#define	CTable		r24 +#define	CTable0		r25 +#define	CtxPtr0		in0 +#define	CtxPtr1		r23 +#define	DPtrIn		in1 +#define	BlockCount	in2 +#define	InAlign		r10 +#define	LCSave		r21 +#define	PFSSave		r20 +#define	PRSave		r22 +#define	pAgain		p63 +#define	pOff		p63 + +	.text + +/* md5_block_asm_data_order(MD5_CTX *c, const void *data, size_t num) + +     where: +      c: a pointer to a structure of this type: + +	   typedef struct MD5state_st +	     { +	       MD5_LONG A,B,C,D; +	       MD5_LONG Nl,Nh; +	       MD5_LONG data[MD5_LBLOCK]; +	       unsigned int num; +	     } +	   MD5_CTX; + +      data: a pointer to the input data (may be misaligned) +      num:  the number of 16-byte blocks to hash (i.e., the length +            of DATA is 16*NUM. + +   */ + +	.type	md5_block_asm_data_order, @function +	.global	md5_block_asm_data_order +	.align	32 +	.proc	md5_block_asm_data_order +md5_block_asm_data_order: +.md5_block: +	.prologue +{	.mmi +	.save	ar.pfs, PFSSave +	alloc	PFSSave = ar.pfs, MD5_NINP, MD5_NLOC, MD5_NOUT, MD5_NROT +	ADDP	CtxPtr1 = 8, CtxPtr0 +	mov	CTable = ip +} +{	.mmi +	ADDP	DPtrIn = 0, DPtrIn +	ADDP	CtxPtr0 = 0, CtxPtr0 +	.save	ar.lc, LCSave +	mov	LCSave = ar.lc +} +;; +{	.mmi +	add	CTable = .md5_tbl_data_order#-.md5_block#, CTable +	and	InAlign = 0x3, DPtrIn +} + +{	.mmi +	ld4	AccumA = [CtxPtr0], 4 +	ld4	AccumC = [CtxPtr1], 4 +	.save pr, PRSave +	mov	PRSave = pr +	.body +} +;; +{	.mmi +	ld4	AccumB = [CtxPtr0] +	ld4	AccumD = [CtxPtr1] +	dep	DPtr_ = 0, DPtrIn, 0, 2 +} ;; +#ifdef HOST_IS_BIG_ENDIAN +	rum	psr.be;;	// switch to little-endian +#endif +{	.mmb +	ld4	CTable0 = [CTable], 4 +	cmp.ne	pOff, p0 = 0, InAlign +(pOff)	br.cond.spnt.many .md5_unaligned +} ;; + +//	The FF load/compute loop rotates values three times, so that +//	loading into M12 here produces the M0 value, M13 -> M1, etc. + +.md5_block_loop0: +{	.mmi +	ld4	M12_ = [DPtr_], 4 +	mov	TPtr = CTable +	mov	TRound = CTable0 +} ;; +{	.mmi +	ld4	M13_ = [DPtr_], 4 +	mov	A_ = AccumA +	mov	B_ = AccumB +} ;; +{	.mmi +	ld4	M14_ = [DPtr_], 4 +	mov	C_ = AccumC +	mov	D_ = AccumD +} ;; +{	.mmb +	ld4	M15_ = [DPtr_], 4 +	add	BlockCount = -1, BlockCount +	br.call.sptk.many QUICK_RTN = md5_digest_block0 +} ;; + +//	Now, we add the new digest values and do some clean-up +//	before checking if there's another full block to process + +{	.mmi +	add	AccumA = AccumA, A_ +	add	AccumB = AccumB, B_ +	cmp.ne	pAgain, p0 = 0, BlockCount +} +{	.mib +	add	AccumC = AccumC, C_ +	add	AccumD = AccumD, D_ +(pAgain) br.cond.dptk.many .md5_block_loop0 +} ;; + +.md5_exit: +#ifdef HOST_IS_BIG_ENDIAN +	sum	psr.be;;	// switch back to big-endian mode +#endif +{	.mmi +	st4	[CtxPtr0] = AccumB, -4 +	st4	[CtxPtr1] = AccumD, -4 +	mov	pr = PRSave, 0x1ffff ;; +} +{	.mmi +	st4	[CtxPtr0] = AccumA +	st4	[CtxPtr1] = AccumC +	mov	ar.lc = LCSave +} ;; +{	.mib +	mov	ar.pfs = PFSSave +	br.ret.sptk.few	rp +} ;; + +#define	MD5UNALIGNED(offset)						\ +.md5_process##offset:							\ +{	.mib ;								\ +	nop	0x0	;						\ +	GETRW(DTmp, DTmp, offset) ;					\ +} ;;									\ +.md5_block_loop##offset:						\ +{	.mmi ;								\ +	ld4	Y_ = [DPtr_], 4 ;					\ +	mov	TPtr = CTable ;						\ +	mov	TRound = CTable0 ;					\ +} ;;									\ +{	.mmi ;								\ +	ld4	M13_ = [DPtr_], 4 ;					\ +	mov	A_ = AccumA ;						\ +	mov	B_ = AccumB ;						\ +} ;;									\ +{	.mii ;								\ +	ld4	M14_ = [DPtr_], 4 ;					\ +	GETLW(W_, Y_, offset) ;						\ +	mov	C_ = AccumC ;						\ +}									\ +{	.mmi ;								\ +	mov	D_ = AccumD ;;						\ +	or	M12_ = W_, DTmp ;					\ +	GETRW(DTmp, Y_, offset) ;					\ +}									\ +{	.mib ;								\ +	ld4	M15_ = [DPtr_], 4 ;					\ +	add	BlockCount = -1, BlockCount ;				\ +	br.call.sptk.many QUICK_RTN = md5_digest_block##offset;		\ +} ;;									\ +{	.mmi ;								\ +	add	AccumA = AccumA, A_ ;					\ +	add	AccumB = AccumB, B_ ;					\ +	cmp.ne	pAgain, p0 = 0, BlockCount ;				\ +}									\ +{	.mib ;								\ +	add	AccumC = AccumC, C_ ;					\ +	add	AccumD = AccumD, D_ ;					\ +(pAgain) br.cond.dptk.many .md5_block_loop##offset ;			\ +} ;;									\ +{	.mib ;								\ +	nop	0x0 ;							\ +	nop	0x0 ;							\ +	br.cond.sptk.many .md5_exit ;					\ +} ;; + +	.align	32 +.md5_unaligned: +// +//	Because variable shifts are expensive, we special case each of +//	the four alignements. In practice, this won't hurt too much +//	since only one working set of code will be loaded. +// +{	.mib +	ld4	DTmp = [DPtr_], 4 +	cmp.eq	pOff, p0 = 1, InAlign +(pOff)	br.cond.dpnt.many .md5_process1 +} ;; +{	.mib +	cmp.eq	pOff, p0 = 2, InAlign +	nop	0x0 +(pOff)	br.cond.dpnt.many .md5_process2 +} ;; +	MD5UNALIGNED(3) +	MD5UNALIGNED(1) +	MD5UNALIGNED(2) + +	.endp md5_block_asm_data_order + + +// MD5 Perform the F function and load +// +// Passed the first 4 words (M0 - M3) and initial (A, B, C, D) values, +// computes the FF() round of functions, then branches to the common +// digest code to finish up with GG(), HH, and II(). +// +// INPUT +// +// rp Return Address - +// +// CODE +// +// v0 PFS bit bucket PFS +// v1 Loop Trip Count LTrip +// pt0 Load next word pMore + +/* For F round: */ +#define LTrip	r9 +#define PFS	r8 +#define pMore	p6 + +/* For GHI rounds: */ +#define T	r9 +#define U	r10 +#define V	r11 + +#define COMPUTE(a, b, s, M, R)			\ +{						\ +	.mii ;					\ +	ld4 TRound = [TPtr], 4 ;		\ +	dep.z Y = Z, 32, 32 ;;			\ +	shrp Z = Z, Y, 64 - s ;			\ +} ;;						\ +{						\ +	.mmi ;					\ +	add a = Z, b ;				\ +	mov R = M ;				\ +	nop 0x0 ;				\ +} ;; + +#define LOOP(a, b, s, M, R, label)		\ +{	.mii ;					\ +	ld4 TRound = [TPtr], 4 ;		\ +	dep.z Y = Z, 32, 32 ;;			\ +	shrp Z = Z, Y, 64 - s ;			\ +} ;;						\ +{	.mib ;					\ +	add a = Z, b ;				\ +	mov R = M ;				\ +	br.ctop.sptk.many label ;		\ +} ;; + +// G(B, C, D) = (B & D) | (C & ~D) + +#define G(a, b, c, d, M)			\ +{	.mmi ;					\ +	add Z = M, TRound ;			\ +	and Y = b, d ;				\ +	andcm X = c, d ;			\ +} ;;						\ +{	.mii ;					\ +	add Z = Z, a ;				\ +	or Y = Y, X ;;				\ +	add Z = Z, Y ;				\ +} ;; + +// H(B, C, D) = B ^ C ^ D + +#define H(a, b, c, d, M)			\ +{	.mmi ;					\ +	add Z = M, TRound ;			\ +	xor Y = b, c ;				\ +	nop 0x0 ;				\ +} ;;						\ +{	.mii ;					\ +	add Z = Z, a ;				\ +	xor Y = Y, d ;;				\ +	add Z = Z, Y ;				\ +} ;; + +// I(B, C, D) = C ^ (B | ~D) +// +// However, since we have an andcm operator, we use the fact that +// +// Y ^ Z == ~Y ^ ~Z +// +// to rewrite the expression as +// +// I(B, C, D) = ~C ^ (~B & D) + +#define I(a, b, c, d, M)			\ +{	.mmi ;					\ +	add Z = M, TRound ;			\ +	andcm Y = d, b ;			\ +	andcm X = -1, c ;			\ +} ;;						\ +{	.mii ;					\ +	add Z = Z, a ;				\ +	xor Y = Y, X ;;				\ +	add Z = Z, Y ;				\ +} ;; + +#define GG4(label)				\ +	G(A, B, C, D, M0)			\ +	COMPUTE(A, B, 5, M0, RotateM0)		\ +	G(D, A, B, C, M1)			\ +	COMPUTE(D, A, 9, M1, RotateM1)		\ +	G(C, D, A, B, M2)			\ +	COMPUTE(C, D, 14, M2, RotateM2)		\ +	G(B, C, D, A, M3)			\ +	LOOP(B, C, 20, M3, RotateM3, label) + +#define HH4(label)				\ +	H(A, B, C, D, M0)			\ +	COMPUTE(A, B, 4, M0, RotateM0)		\ +	H(D, A, B, C, M1)			\ +	COMPUTE(D, A, 11, M1, RotateM1)		\ +	H(C, D, A, B, M2)			\ +	COMPUTE(C, D, 16, M2, RotateM2)		\ +	H(B, C, D, A, M3)			\ +	LOOP(B, C, 23, M3, RotateM3, label) + +#define II4(label)				\ +	I(A, B, C, D, M0)			\ +	COMPUTE(A, B, 6, M0, RotateM0)		\ +	I(D, A, B, C, M1)			\ +	COMPUTE(D, A, 10, M1, RotateM1)		\ +	I(C, D, A, B, M2)			\ +	COMPUTE(C, D, 15, M2, RotateM2)		\ +	I(B, C, D, A, M3)			\ +	LOOP(B, C, 21, M3, RotateM3, label) + +#define FFLOAD(a, b, c, d, M, N, s)		\ +{	.mii ;					\ +(pMore) ld4 N = [DPtr], 4 ;			\ +	add Z = M, TRound ;			\ +	and Y = c, b ;				\ +}						\ +{	.mmi ;					\ +	andcm X = d, b ;;			\ +	add Z = Z, a ;				\ +	or Y = Y, X ;				\ +} ;;						\ +{	.mii ;					\ +	ld4 TRound = [TPtr], 4 ;		\ +	add Z = Z, Y ;;				\ +	dep.z Y = Z, 32, 32 ;			\ +} ;;						\ +{	.mii ;					\ +	nop 0x0 ;				\ +	shrp Z = Z, Y, 64 - s ;;		\ +	add a = Z, b ;				\ +} ;; + +#define FFLOOP(a, b, c, d, M, N, s, dest)	\ +{	.mii ;					\ +(pMore)	ld4 N = [DPtr], 4 ;			\ +	add Z = M, TRound ;			\ +	and Y = c, b ;				\ +}						\ +{	.mmi ;					\ +	andcm X = d, b ;;			\ +	add Z = Z, a ;				\ +	or Y = Y, X ;				\ +} ;;						\ +{	.mii ;					\ +	ld4 TRound = [TPtr], 4 ;		\ +	add Z = Z, Y ;;				\ +	dep.z Y = Z, 32, 32 ;			\ +} ;;						\ +{	.mii ;					\ +	nop 0x0 ;				\ +	shrp Z = Z, Y, 64 - s ;;		\ +	add a = Z, b ;				\ +}						\ +{	.mib ;					\ +	cmp.ne pMore, p0 = 0, LTrip ;		\ +	add LTrip = -1, LTrip ;			\ +	br.ctop.dptk.many dest ;		\ +} ;; + +	.type md5_digest_block0, @function +	.align 32 + +	.proc md5_digest_block0 +	.prologue +md5_digest_block0: +	.altrp QUICK_RTN +	.body +{	.mmi +	alloc PFS = ar.pfs, _NINPUTS, _NLOCALS, _NOUTPUT, _NROTATE +	mov LTrip = 2 +	mov ar.lc = 3 +} ;; +{	.mii +	cmp.eq pMore, p0 = r0, r0 +	mov ar.ec = 0 +	nop 0x0 +} ;; + +.md5_FF_round0: +	FFLOAD(A, B, C, D, M12, RotateM0, 7) +	FFLOAD(D, A, B, C, M13, RotateM1, 12) +	FFLOAD(C, D, A, B, M14, RotateM2, 17) +	FFLOOP(B, C, D, A, M15, RotateM3, 22, .md5_FF_round0) +	// +	// !!! Fall through to md5_digest_GHI +	// +	.endp md5_digest_block0 + +	.type md5_digest_GHI, @function +	.align 32 + +	.proc md5_digest_GHI +	.prologue +	.regstk _NINPUTS, _NLOCALS, _NOUTPUT, _NROTATE +md5_digest_GHI: +	.altrp QUICK_RTN +	.body +// +// The following sequence shuffles the block counstants round for the +// next round: +// +// 0 1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 +// 1 6 11 0 5 10 14 4 9 14 3 8 13 2 7 12 +// +{	.mmi +	mov Z = M0 +	mov Y = M15 +	mov ar.lc = 3 +} +{	.mmi +	mov X = M2 +	mov W = M9 +	mov V = M4 +} ;; + +{	.mmi +	mov M0 = M1 +	mov M15 = M12 +	mov ar.ec = 1 +} +{	.mmi +	mov M2 = M11 +	mov M9 = M14 +	mov M4 = M5 +} ;; + +{	.mmi +	mov M1 = M6 +	mov M12 = M13 +	mov U = M3 +} +{	.mmi +	mov M11 = M8 +	mov M14 = M7 +	mov M5 = M10 +} ;; + +{	.mmi +	mov M6 = Y +	mov M13 = X +	mov M3 = Z +} +{	.mmi +	mov M8 = W +	mov M7 = V +	mov M10 = U +} ;; + +.md5_GG_round: +	GG4(.md5_GG_round) + +// The following sequence shuffles the block constants round for the +// next round: +// +// 1 6 11 0 5 10 14 4 9 14 3 8 13 2 7 12 +// 5 8 11 14 1 4 7 10 13 0 3 6 9 12 15 2 + +{	.mmi +	mov Z = M0 +	mov Y = M1 +	mov ar.lc = 3 +} +{	.mmi +	mov X = M3 +	mov W = M5 +	mov V = M6 +} ;; + +{	.mmi +	mov M0 = M4 +	mov M1 = M11 +	mov ar.ec = 1 +} +{	.mmi +	mov M3 = M9 +	mov U = M8 +	mov T = M13 +} ;; + +{	.mmi +	mov M4 = Z +	mov M11 = Y +	mov M5 = M7 +} +{	.mmi +	mov M6 = M14 +	mov M8 = M12 +	mov M13 = M15 +} ;; + +{	.mmi +	mov M7 = W +	mov M14 = V +	nop 0x0 +} +{	.mmi +	mov M9 = X +	mov M12 = U +	mov M15 = T +} ;; + +.md5_HH_round: +	HH4(.md5_HH_round) + +// The following sequence shuffles the block constants round for the +// next round: +// +// 5 8 11 14 1 4 7 10 13 0 3 6 9 12 15 2 +// 0 7 14 5 12 3 10 1 8 15 6 13 4 11 2 9 + +{	.mmi +	mov Z = M0 +	mov Y = M15 +	mov ar.lc = 3 +} +{	.mmi +	mov X = M10 +	mov W = M1 +	mov V = M4 +} ;; + +{	.mmi +	mov M0 = M9 +	mov M15 = M12 +	mov ar.ec = 1 +} +{	.mmi +	mov M10 = M11 +	mov M1 = M6 +	mov M4 = M13 +} ;; + +{	.mmi +	mov M9 = M14 +	mov M12 = M5 +	mov U = M3 +} +{	.mmi +	mov M11 = M8 +	mov M6 = M7 +	mov M13 = M2 +} ;; + +{	.mmi +	mov M14 = Y +	mov M5 = X +	mov M3 = Z +} +{	.mmi +	mov M8 = W +	mov M7 = V +	mov M2 = U +} ;; + +.md5_II_round: +	II4(.md5_II_round) + +{	.mib +	nop 0x0 +	nop 0x0 +	br.ret.sptk.many QUICK_RTN +} ;; + +	.endp md5_digest_GHI + +#define FFLOADU(a, b, c, d, M, P, N, s, offset)	\ +{	.mii ;					\ +(pMore) ld4 N = [DPtr], 4 ;			\ +	add Z = M, TRound ;			\ +	and Y = c, b ;				\ +}						\ +{	.mmi ;					\ +	andcm X = d, b ;;			\ +	add Z = Z, a ;				\ +	or Y = Y, X ;				\ +} ;;						\ +{	.mii ;					\ +	ld4 TRound = [TPtr], 4 ;		\ +	GETLW(W, P, offset) ;			\ +	add Z = Z, Y ;				\ +} ;;						\ +{	.mii ;					\ +	or W = W, DTmp ;			\ +	dep.z Y = Z, 32, 32 ;;			\ +	shrp Z = Z, Y, 64 - s ;			\ +} ;;						\ +{	.mii ;					\ +	add a = Z, b ;				\ +	GETRW(DTmp, P, offset) ;		\ +	mov P = W ;				\ +} ;; + +#define FFLOOPU(a, b, c, d, M, P, N, s, offset)		\ +{	.mii ;						\ +(pMore) ld4 N = [DPtr], 4 ;				\ +	add Z = M, TRound ;				\ +	and Y = c, b ;					\ +}							\ +{	.mmi ;						\ +	andcm X = d, b ;;				\ +	add Z = Z, a ;					\ +	or Y = Y, X ;					\ +} ;;							\ +{	.mii ;						\ +	ld4 TRound = [TPtr], 4 ;			\ +(pMore) GETLW(W, P, offset) 	;			\ +	add Z = Z, Y ;					\ +} ;;							\ +{	.mii ;						\ +(pMore) or W = W, DTmp ;				\ +	dep.z Y = Z, 32, 32 ;;				\ +	shrp Z = Z, Y, 64 - s ;				\ +} ;;							\ +{	.mii ;						\ +	add a = Z, b ;					\ +(pMore) GETRW(DTmp, P, offset) 	;			\ +(pMore) mov P = W ;					\ +}							\ +{	.mib ;						\ +	cmp.ne pMore, p0 = 0, LTrip ;			\ +	add LTrip = -1, LTrip ;				\ +	br.ctop.sptk.many .md5_FF_round##offset ;	\ +} ;; + +#define MD5FBLOCK(offset)						\ +	.type md5_digest_block##offset, @function ;			\ +									\ +	.align 32 ;							\ +	.proc md5_digest_block##offset ;				\ +	.prologue ;							\ +	.altrp QUICK_RTN ;						\ +	.body ;								\ +md5_digest_block##offset:						\ +{	.mmi ;								\ +	alloc PFS = ar.pfs, _NINPUTS, _NLOCALS, _NOUTPUT, _NROTATE ;	\ +	mov LTrip = 2 ;							\ +	mov ar.lc = 3 ;							\ +} ;;									\ +{	.mii ;								\ +	cmp.eq pMore, p0 = r0, r0 ;					\ +	mov ar.ec = 0 ;							\ +	nop 0x0 ;							\ +} ;;									\ +									\ +	.pred.rel "mutex", pLoad, pSkip ;				\ +.md5_FF_round##offset:							\ +	FFLOADU(A, B, C, D, M12, M13, RotateM0, 7, offset)		\ +	FFLOADU(D, A, B, C, M13, M14, RotateM1, 12, offset)		\ +	FFLOADU(C, D, A, B, M14, M15, RotateM2, 17, offset)		\ +	FFLOOPU(B, C, D, A, M15, RotateM0, RotateM3, 22, offset)	\ +									\ +{	.mib ;								\ +	nop 0x0 ;							\ +	nop 0x0 ;							\ +	br.cond.sptk.many md5_digest_GHI ;				\ +} ;;									\ +	.endp md5digestBlock ## offset + +MD5FBLOCK(1) +MD5FBLOCK(2) +MD5FBLOCK(3) + +	.align 64 +	.type md5_constants, @object +md5_constants: +.md5_tbl_data_order:			// To ensure little-endian data +					// order, code as bytes. +	data1 0x78, 0xa4, 0x6a, 0xd7	//     0 +	data1 0x56, 0xb7, 0xc7, 0xe8	//     1 +	data1 0xdb, 0x70, 0x20, 0x24	//     2 +	data1 0xee, 0xce, 0xbd, 0xc1	//     3 +	data1 0xaf, 0x0f, 0x7c, 0xf5	//     4 +	data1 0x2a, 0xc6, 0x87, 0x47	//     5 +	data1 0x13, 0x46, 0x30, 0xa8	//     6 +	data1 0x01, 0x95, 0x46, 0xfd	//     7 +	data1 0xd8, 0x98, 0x80, 0x69	//     8 +	data1 0xaf, 0xf7, 0x44, 0x8b	//     9 +	data1 0xb1, 0x5b, 0xff, 0xff	//    10 +	data1 0xbe, 0xd7, 0x5c, 0x89	//    11 +	data1 0x22, 0x11, 0x90, 0x6b	//    12 +	data1 0x93, 0x71, 0x98, 0xfd	//    13 +	data1 0x8e, 0x43, 0x79, 0xa6	//    14 +	data1 0x21, 0x08, 0xb4, 0x49	//    15 +	data1 0x62, 0x25, 0x1e, 0xf6	//    16 +	data1 0x40, 0xb3, 0x40, 0xc0	//    17 +	data1 0x51, 0x5a, 0x5e, 0x26	//    18 +	data1 0xaa, 0xc7, 0xb6, 0xe9	//    19 +	data1 0x5d, 0x10, 0x2f, 0xd6	//    20 +	data1 0x53, 0x14, 0x44, 0x02	//    21 +	data1 0x81, 0xe6, 0xa1, 0xd8	//    22 +	data1 0xc8, 0xfb, 0xd3, 0xe7	//    23 +	data1 0xe6, 0xcd, 0xe1, 0x21	//    24 +	data1 0xd6, 0x07, 0x37, 0xc3	//    25 +	data1 0x87, 0x0d, 0xd5, 0xf4	//    26 +	data1 0xed, 0x14, 0x5a, 0x45	//    27 +	data1 0x05, 0xe9, 0xe3, 0xa9	//    28 +	data1 0xf8, 0xa3, 0xef, 0xfc	//    29 +	data1 0xd9, 0x02, 0x6f, 0x67	//    30 +	data1 0x8a, 0x4c, 0x2a, 0x8d	//    31 +	data1 0x42, 0x39, 0xfa, 0xff	//    32 +	data1 0x81, 0xf6, 0x71, 0x87	//    33 +	data1 0x22, 0x61, 0x9d, 0x6d	//    34 +	data1 0x0c, 0x38, 0xe5, 0xfd	//    35 +	data1 0x44, 0xea, 0xbe, 0xa4	//    36 +	data1 0xa9, 0xcf, 0xde, 0x4b	//    37 +	data1 0x60, 0x4b, 0xbb, 0xf6	//    38 +	data1 0x70, 0xbc, 0xbf, 0xbe	//    39 +	data1 0xc6, 0x7e, 0x9b, 0x28	//    40 +	data1 0xfa, 0x27, 0xa1, 0xea	//    41 +	data1 0x85, 0x30, 0xef, 0xd4	//    42 +	data1 0x05, 0x1d, 0x88, 0x04	//    43 +	data1 0x39, 0xd0, 0xd4, 0xd9	//    44 +	data1 0xe5, 0x99, 0xdb, 0xe6	//    45 +	data1 0xf8, 0x7c, 0xa2, 0x1f	//    46 +	data1 0x65, 0x56, 0xac, 0xc4	//    47 +	data1 0x44, 0x22, 0x29, 0xf4	//    48 +	data1 0x97, 0xff, 0x2a, 0x43	//    49 +	data1 0xa7, 0x23, 0x94, 0xab	//    50 +	data1 0x39, 0xa0, 0x93, 0xfc	//    51 +	data1 0xc3, 0x59, 0x5b, 0x65	//    52 +	data1 0x92, 0xcc, 0x0c, 0x8f	//    53 +	data1 0x7d, 0xf4, 0xef, 0xff	//    54 +	data1 0xd1, 0x5d, 0x84, 0x85	//    55 +	data1 0x4f, 0x7e, 0xa8, 0x6f	//    56 +	data1 0xe0, 0xe6, 0x2c, 0xfe	//    57 +	data1 0x14, 0x43, 0x01, 0xa3	//    58 +	data1 0xa1, 0x11, 0x08, 0x4e	//    59 +	data1 0x82, 0x7e, 0x53, 0xf7	//    60 +	data1 0x35, 0xf2, 0x3a, 0xbd	//    61 +	data1 0xbb, 0xd2, 0xd7, 0x2a	//    62 +	data1 0x91, 0xd3, 0x86, 0xeb	//    63 +.size	md5_constants#,64*4 diff --git a/openssl/crypto/md5/asm/md5-x86_64.pl b/openssl/crypto/md5/asm/md5-x86_64.pl index 9a6fa6722..867885435 100644 --- a/openssl/crypto/md5/asm/md5-x86_64.pl +++ b/openssl/crypto/md5/asm/md5-x86_64.pl @@ -15,7 +15,7 @@ my $code;  #   dst = x + ((dst + F(x,y,z) + X[k] + T_i) <<< s)  #   %r10d = X[k_next]  #   %r11d = z' (copy of z for the next step) -# Each round1_step() takes about 5.71 clocks (9 instructions, 1.58 IPC) +# Each round1_step() takes about 5.3 clocks (9 instructions, 1.7 IPC)  sub round1_step  {      my ($pos, $dst, $x, $y, $z, $k_next, $T_i, $s) = @_; @@ -37,22 +37,26 @@ EOF  # round2_step() does:  #   dst = x + ((dst + G(x,y,z) + X[k] + T_i) <<< s)  #   %r10d = X[k_next] -#   %r11d = y' (copy of y for the next step) -# Each round2_step() takes about 6.22 clocks (9 instructions, 1.45 IPC) +#   %r11d = z' (copy of z for the next step) +#   %r12d = z' (copy of z for the next step) +# Each round2_step() takes about 5.4 clocks (11 instructions, 2.0 IPC)  sub round2_step  {      my ($pos, $dst, $x, $y, $z, $k_next, $T_i, $s) = @_;      $code .= " mov	1*4(%rsi),	%r10d		/* (NEXT STEP) X[1] */\n" if ($pos == -1); -    $code .= " mov	%ecx,		%r11d		/* (NEXT STEP) y' = %ecx */\n" if ($pos == -1); +    $code .= " mov	%edx,		%r11d		/* (NEXT STEP) z' = %edx */\n" if ($pos == -1); +    $code .= " mov	%edx,		%r12d		/* (NEXT STEP) z' = %edx */\n" if ($pos == -1);      $code .= <<EOF; -	xor	$x,		%r11d		/* x ^ ... */ +	not	%r11d				/* not z */  	lea	$T_i($dst,%r10d),$dst		/* Const + dst + ... */ -	and	$z,		%r11d		/* z & ... */ -	xor	$y,		%r11d		/* y ^ ... */ +	and	$x,		%r12d		/* x & z */ +	and	$y,		%r11d		/* y & (not z) */  	mov	$k_next*4(%rsi),%r10d		/* (NEXT STEP) X[$k_next] */ -	add	%r11d,		$dst		/* dst += ... */ +	or	%r11d,		%r12d		/* (y & (not z)) | (x & z) */ +	mov	$y,		%r11d		/* (NEXT STEP) z' = $y */ +	add	%r12d,		$dst		/* dst += ... */ +	mov	$y,		%r12d		/* (NEXT STEP) z' = $y */  	rol	\$$s,		$dst		/* dst <<< s */ -	mov	$x,		%r11d		/* (NEXT STEP) y' = $x */  	add	$x,		$dst		/* dst += x */  EOF  } @@ -61,7 +65,7 @@ EOF  #   dst = x + ((dst + H(x,y,z) + X[k] + T_i) <<< s)  #   %r10d = X[k_next]  #   %r11d = y' (copy of y for the next step) -# Each round3_step() takes about 4.26 clocks (8 instructions, 1.88 IPC) +# Each round3_step() takes about 4.2 clocks (8 instructions, 1.9 IPC)  sub round3_step  {      my ($pos, $dst, $x, $y, $z, $k_next, $T_i, $s) = @_; @@ -83,7 +87,7 @@ EOF  #   dst = x + ((dst + I(x,y,z) + X[k] + T_i) <<< s)  #   %r10d = X[k_next]  #   %r11d = not z' (copy of not z for the next step) -# Each round4_step() takes about 5.27 clocks (9 instructions, 1.71 IPC) +# Each round4_step() takes about 5.2 clocks (9 instructions, 1.7 IPC)  sub round4_step  {      my ($pos, $dst, $x, $y, $z, $k_next, $T_i, $s) = @_; @@ -104,8 +108,19 @@ sub round4_step  EOF  } -my $output = shift; -open STDOUT,"| $^X ../perlasm/x86_64-xlate.pl $output"; +my $flavour = shift; +my $output  = shift; +if ($flavour =~ /\./) { $output = $flavour; undef $flavour; } + +my $win64=0; $win64=1 if ($flavour =~ /[nm]asm|mingw64/ || $output =~ /\.asm$/); + +$0 =~ m/(.*[\/\\])[^\/\\]+$/; my $dir=$1; my $xlate; +( $xlate="${dir}x86_64-xlate.pl" and -f $xlate ) or +( $xlate="${dir}../../perlasm/x86_64-xlate.pl" and -f $xlate) or +die "can't locate x86_64-xlate.pl"; + +no warnings qw(uninitialized); +open STDOUT,"| $^X $xlate $flavour $output";  $code .= <<EOF;  .text @@ -116,8 +131,10 @@ $code .= <<EOF;  md5_block_asm_data_order:  	push	%rbp  	push	%rbx +	push	%r12  	push	%r14  	push	%r15 +.Lprologue:  	# rdi = arg #1 (ctx, MD5_CTX pointer)  	# rsi = arg #2 (ptr, data pointer) @@ -232,13 +249,120 @@ $code .= <<EOF;  	mov	%ecx,		2*4(%rbp)	# ctx->C = C  	mov	%edx,		3*4(%rbp)	# ctx->D = D +	mov	(%rsp),%r15 +	mov	8(%rsp),%r14 +	mov	16(%rsp),%r12 +	mov	24(%rsp),%rbx +	mov	32(%rsp),%rbp +	add	\$40,%rsp +.Lepilogue: +	ret +.size md5_block_asm_data_order,.-md5_block_asm_data_order +EOF + +# EXCEPTION_DISPOSITION handler (EXCEPTION_RECORD *rec,ULONG64 frame, +#		CONTEXT *context,DISPATCHER_CONTEXT *disp) +if ($win64) { +my $rec="%rcx"; +my $frame="%rdx"; +my $context="%r8"; +my $disp="%r9"; + +$code.=<<___; +.extern	__imp_RtlVirtualUnwind +.type	se_handler,\@abi-omnipotent +.align	16 +se_handler: +	push	%rsi +	push	%rdi +	push	%rbx +	push	%rbp +	push	%r12 +	push	%r13 +	push	%r14 +	push	%r15 +	pushfq +	sub	\$64,%rsp + +	mov	120($context),%rax	# pull context->Rax +	mov	248($context),%rbx	# pull context->Rip + +	lea	.Lprologue(%rip),%r10 +	cmp	%r10,%rbx		# context->Rip<.Lprologue +	jb	.Lin_prologue + +	mov	152($context),%rax	# pull context->Rsp + +	lea	.Lepilogue(%rip),%r10 +	cmp	%r10,%rbx		# context->Rip>=.Lepilogue +	jae	.Lin_prologue + +	lea	40(%rax),%rax + +	mov	-8(%rax),%rbp +	mov	-16(%rax),%rbx +	mov	-24(%rax),%r12 +	mov	-32(%rax),%r14 +	mov	-40(%rax),%r15 +	mov	%rbx,144($context)	# restore context->Rbx +	mov	%rbp,160($context)	# restore context->Rbp +	mov	%r12,216($context)	# restore context->R12 +	mov	%r14,232($context)	# restore context->R14 +	mov	%r15,240($context)	# restore context->R15 + +.Lin_prologue: +	mov	8(%rax),%rdi +	mov	16(%rax),%rsi +	mov	%rax,152($context)	# restore context->Rsp +	mov	%rsi,168($context)	# restore context->Rsi +	mov	%rdi,176($context)	# restore context->Rdi + +	mov	40($disp),%rdi		# disp->ContextRecord +	mov	$context,%rsi		# context +	mov	\$154,%ecx		# sizeof(CONTEXT) +	.long	0xa548f3fc		# cld; rep movsq + +	mov	$disp,%rsi +	xor	%rcx,%rcx		# arg1, UNW_FLAG_NHANDLER +	mov	8(%rsi),%rdx		# arg2, disp->ImageBase +	mov	0(%rsi),%r8		# arg3, disp->ControlPc +	mov	16(%rsi),%r9		# arg4, disp->FunctionEntry +	mov	40(%rsi),%r10		# disp->ContextRecord +	lea	56(%rsi),%r11		# &disp->HandlerData +	lea	24(%rsi),%r12		# &disp->EstablisherFrame +	mov	%r10,32(%rsp)		# arg5 +	mov	%r11,40(%rsp)		# arg6 +	mov	%r12,48(%rsp)		# arg7 +	mov	%rcx,56(%rsp)		# arg8, (NULL) +	call	*__imp_RtlVirtualUnwind(%rip) + +	mov	\$1,%eax		# ExceptionContinueSearch +	add	\$64,%rsp +	popfq  	pop	%r15  	pop	%r14 -	pop	%rbx +	pop	%r13 +	pop	%r12  	pop	%rbp +	pop	%rbx +	pop	%rdi +	pop	%rsi  	ret -.size md5_block_asm_data_order,.-md5_block_asm_data_order -EOF +.size	se_handler,.-se_handler + +.section	.pdata +.align	4 +	.rva	.LSEH_begin_md5_block_asm_data_order +	.rva	.LSEH_end_md5_block_asm_data_order +	.rva	.LSEH_info_md5_block_asm_data_order + +.section	.xdata +.align	8 +.LSEH_info_md5_block_asm_data_order: +	.byte	9,0,0,0 +	.rva	se_handler +___ +}  print $code; diff --git a/openssl/crypto/md5/md5.h b/openssl/crypto/md5/md5.h index 0761f84a2..4cbf84386 100644 --- a/openssl/crypto/md5/md5.h +++ b/openssl/crypto/md5/md5.h @@ -77,7 +77,7 @@ extern "C" {   * !!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!!   */ -#if defined(OPENSSL_SYS_WIN16) || defined(__LP32__) +#if defined(__LP32__)  #define MD5_LONG unsigned long  #elif defined(OPENSSL_SYS_CRAY) || defined(__ILP64__)  #define MD5_LONG unsigned long @@ -105,9 +105,6 @@ typedef struct MD5state_st  	unsigned int num;  	} MD5_CTX; -#ifdef OPENSSL_FIPS -int private_MD5_Init(MD5_CTX *c); -#endif  int MD5_Init(MD5_CTX *c);  int MD5_Update(MD5_CTX *c, const void *data, size_t len);  int MD5_Final(unsigned char *md, MD5_CTX *c); diff --git a/openssl/crypto/md5/md5_dgst.c b/openssl/crypto/md5/md5_dgst.c index 47bb9020e..beace632e 100644 --- a/openssl/crypto/md5/md5_dgst.c +++ b/openssl/crypto/md5/md5_dgst.c @@ -59,11 +59,6 @@  #include <stdio.h>  #include "md5_locl.h"  #include <openssl/opensslv.h> -#include <openssl/err.h> -#ifdef OPENSSL_FIPS -#include <openssl/fips.h> -#endif -  const char MD5_version[]="MD5" OPENSSL_VERSION_PTEXT; @@ -75,15 +70,13 @@ const char MD5_version[]="MD5" OPENSSL_VERSION_PTEXT;  #define INIT_DATA_C (unsigned long)0x98badcfeL  #define INIT_DATA_D (unsigned long)0x10325476L -FIPS_NON_FIPS_MD_Init(MD5) +int MD5_Init(MD5_CTX *c)  	{ +	memset (c,0,sizeof(*c));  	c->A=INIT_DATA_A;  	c->B=INIT_DATA_B;  	c->C=INIT_DATA_C;  	c->D=INIT_DATA_D; -	c->Nl=0; -	c->Nh=0; -	c->num=0;  	return 1;  	} diff --git a/openssl/crypto/md5/md5_locl.h b/openssl/crypto/md5/md5_locl.h index 84e81b960..968d57799 100644 --- a/openssl/crypto/md5/md5_locl.h +++ b/openssl/crypto/md5/md5_locl.h @@ -69,6 +69,8 @@  # if defined(__i386) || defined(__i386__) || defined(_M_IX86) || defined(__INTEL__) || \       defined(__x86_64) || defined(__x86_64__) || defined(_M_AMD64) || defined(_M_X64)  #  define md5_block_data_order md5_block_asm_data_order +# elif defined(__ia64) || defined(__ia64__) || defined(_M_IA64) +#  define md5_block_data_order md5_block_asm_data_order  # endif  #endif | 
