]> git.ipfire.org Git - thirdparty/openssl.git/blame - crypto/cast/asm/cast-586.pl
Also check for errors in x86_64-xlate.pl.
[thirdparty/openssl.git] / crypto / cast / asm / cast-586.pl
CommitLineData
e0a65194
RS
1#! /usr/bin/env perl
2# Copyright 1995-2016 The OpenSSL Project Authors. All Rights Reserved.
3#
a5024e06 4# Licensed under the Apache License 2.0 (the "License"). You may not use
e0a65194
RS
5# this file except in compliance with the License. You can obtain a copy
6# in the file LICENSE in the source distribution or at
7# https://www.openssl.org/source/license.html
8
58964a49 9
609b0852 10# This flag makes the inner loop one cycle longer, but generates
ae4af7a0
AP
11# code that runs 30% faster on the pentium pro/II, 44% faster
12# on PIII, while only 7% slower on the pentium.
13# By default, this flag is on.
58964a49
RE
14$ppro=1;
15
4d1f3f7a
DSH
# Capture the directory part of the script path ($0) into $dir, then add that
# directory and its ../../perlasm sibling to @INC so the two require
# statements below can locate x86asm.pl and cbc.pl.
16$0 =~ m/(.*[\/\\])[^\/\\]+$/; $dir=$1;
17push(@INC,"${dir}","${dir}../../perlasm");
58964a49
RE
18require "x86asm.pl";
19require "cbc.pl";
20
# The last command-line argument is popped and, when it is a true value,
# STDOUT is reopened onto a file of that name.
# NOTE(review): the result of open is not checked here, so a failed open is
# silent at this point.
1aa89a7a 21$output=pop and open STDOUT,">$output";
db198398 22
# asm_init receives the first remaining argument and a flag that is true when
# the last remaining argument is the string "386"; what it does with them is
# defined in x86asm.pl (not visible here).
e195c8a2 23&asm_init($ARGV[0],$ARGV[$#ARGV] eq "386");
58964a49
RE
24
# NOTE(review): $CAST_ROUNDS is not referenced anywhere else in this listing.
25$CAST_ROUNDS=16;
# Register names used by the generator subs below: $L/$R hold the two data
# words, $K the pointer loaded from the second function argument, and
# $tmp1..$tmp4 are scratch registers.
26$L="edi";
27$R="esi";
28$K="ebp";
29$tmp1="ecx";
30$tmp2="ebx";
31$tmp3="eax";
32$tmp4="edx";
# Symbol names of the four lookup tables indexed by E_CAST.
33$S1="CAST_S_table0";
34$S2="CAST_S_table1";
35$S3="CAST_S_table2";
36$S4="CAST_S_table3";
37
# Each list is passed flattened to E_CAST as ($OP1,$OP2,$OP3): $OP1 is the
# operation used for the key mix and the final table combine, $OP2 and $OP3
# are used for the two combines in between.
38@F1=("add","xor","sub");
39@F2=("xor","sub","add");
40@F3=("sub","add","xor");
41
# Emit the two block functions (second argument: 1 = encrypt round order,
# 0 = decrypt round order), then the CBC wrapper that refers to both by name.
# The numeric arguments to cbc are interpreted by cbc.pl (not visible here).
42&CAST_encrypt("CAST_encrypt",1);
43&CAST_encrypt("CAST_decrypt",0);
44&cbc("CAST_cbc_encrypt","CAST_encrypt","CAST_decrypt",1,4,5,3,-1,-1);
45
46&asm_finish();
47
# Closing STDOUT is checked so that a failure while flushing the generated
# output aborts the script with an error message.
a21314db 48close STDOUT or die "error closing STDOUT: $!";
db198398 49
649cdb7b
BL
# CAST_encrypt($name, $enc): emit one complete assembler function.
#
#   $name - function name handed to function_begin_B and function_end.
#   $enc  - true:  rounds are emitted in the order 0..15 (encryption);
#           false: rounds are emitted in the order 15..0 (decryption).
#
# The emitted function loads two 32-bit words through its first argument,
# runs them through the rounds generated by E_CAST using the pointer in its
# second argument, and stores the two words back through the first argument.
# A dword at offset 128 from the second argument (the "short key flag") makes
# the function skip rounds 12..15 when it is non-zero.
#
# NOTE(review): $S is passed to every E_CAST call but is never assigned in
# this listing; E_CAST does not read it.
50sub CAST_encrypt {
51 local($name,$enc)=@_;
58964a49 52
# Text handed to function_begin_B as its second argument; how it is used is
# defined in x86asm.pl (not visible here).
649cdb7b 53 local($win_ex)=<<"EOF";
58964a49
RE
54EXTERN _CAST_S_table0:DWORD
55EXTERN _CAST_S_table1:DWORD
56EXTERN _CAST_S_table2:DWORD
57EXTERN _CAST_S_table3:DWORD
58EOF
649cdb7b
BL
59 &main::external_label(
60 "CAST_S_table0",
61 "CAST_S_table1",
62 "CAST_S_table2",
63 "CAST_S_table3",
64 );
65
66 &function_begin_B($name,$win_ex);
67
68 &comment("");
69
# Four registers are pushed by hand; the two argument loads are interleaved
# between the pushes.
70 &push("ebp");
71 &push("ebx");
72 &mov($tmp2,&wparam(0));
73 &mov($K,&wparam(1));
74 &push("esi");
75 &push("edi");
76
77 &comment("Load the 2 words");
78 &mov($L,&DWP(0,$tmp2,"",0));
79 &mov($R,&DWP(4,$tmp2,"",0));
80
81 &comment('Get short key flag');
82 &mov($tmp3,&DWP(128,$K,"",0));
# Encrypt: keep the flag on the stack until after round 11, where it is
# popped and tested.  Decrypt: test it immediately and, when non-zero, jump
# over rounds 15..12 to the cast_dec_skip label.
83 if($enc) {
84 &push($tmp3);
85 } else {
86 &or($tmp3,$tmp3);
87 &jnz(&label('cast_dec_skip'));
88 }
89
# $tmp3 is cleared before the first round; E_CAST only clears it itself on
# the $ppro path.
90 &xor($tmp3, $tmp3);
91
92 # encrypting part
93
# Successive rounds swap the roles of $L and $R and cycle through the
# operation triples @F1, @F2, @F3.
94 if ($enc) {
95 &E_CAST( 0,$S,$L,$R,$K,@F1,$tmp1,$tmp2,$tmp3,$tmp4);
96 &E_CAST( 1,$S,$R,$L,$K,@F2,$tmp1,$tmp2,$tmp3,$tmp4);
97 &E_CAST( 2,$S,$L,$R,$K,@F3,$tmp1,$tmp2,$tmp3,$tmp4);
98 &E_CAST( 3,$S,$R,$L,$K,@F1,$tmp1,$tmp2,$tmp3,$tmp4);
99 &E_CAST( 4,$S,$L,$R,$K,@F2,$tmp1,$tmp2,$tmp3,$tmp4);
100 &E_CAST( 5,$S,$R,$L,$K,@F3,$tmp1,$tmp2,$tmp3,$tmp4);
101 &E_CAST( 6,$S,$L,$R,$K,@F1,$tmp1,$tmp2,$tmp3,$tmp4);
102 &E_CAST( 7,$S,$R,$L,$K,@F2,$tmp1,$tmp2,$tmp3,$tmp4);
103 &E_CAST( 8,$S,$L,$R,$K,@F3,$tmp1,$tmp2,$tmp3,$tmp4);
104 &E_CAST( 9,$S,$R,$L,$K,@F1,$tmp1,$tmp2,$tmp3,$tmp4);
105 &E_CAST(10,$S,$L,$R,$K,@F2,$tmp1,$tmp2,$tmp3,$tmp4);
106 &E_CAST(11,$S,$R,$L,$K,@F3,$tmp1,$tmp2,$tmp3,$tmp4);
107 &comment('test short key flag');
# This pop balances the push of the flag made before round 0.
108 &pop($tmp4);
109 &or($tmp4,$tmp4);
110 &jnz(&label('cast_enc_done'));
111 &E_CAST(12,$S,$L,$R,$K,@F1,$tmp1,$tmp2,$tmp3,$tmp4);
112 &E_CAST(13,$S,$R,$L,$K,@F2,$tmp1,$tmp2,$tmp3,$tmp4);
113 &E_CAST(14,$S,$L,$R,$K,@F3,$tmp1,$tmp2,$tmp3,$tmp4);
114 &E_CAST(15,$S,$R,$L,$K,@F1,$tmp1,$tmp2,$tmp3,$tmp4);
115 } else {
# Decryption: same rounds in reverse order, each round index paired with the
# same operation triple as in the encrypt branch.
116 &E_CAST(15,$S,$L,$R,$K,@F1,$tmp1,$tmp2,$tmp3,$tmp4);
117 &E_CAST(14,$S,$R,$L,$K,@F3,$tmp1,$tmp2,$tmp3,$tmp4);
118 &E_CAST(13,$S,$L,$R,$K,@F2,$tmp1,$tmp2,$tmp3,$tmp4);
119 &E_CAST(12,$S,$R,$L,$K,@F1,$tmp1,$tmp2,$tmp3,$tmp4);
120 &set_label('cast_dec_skip');
121 &E_CAST(11,$S,$L,$R,$K,@F3,$tmp1,$tmp2,$tmp3,$tmp4);
122 &E_CAST(10,$S,$R,$L,$K,@F2,$tmp1,$tmp2,$tmp3,$tmp4);
123 &E_CAST( 9,$S,$L,$R,$K,@F1,$tmp1,$tmp2,$tmp3,$tmp4);
124 &E_CAST( 8,$S,$R,$L,$K,@F3,$tmp1,$tmp2,$tmp3,$tmp4);
125 &E_CAST( 7,$S,$L,$R,$K,@F2,$tmp1,$tmp2,$tmp3,$tmp4);
126 &E_CAST( 6,$S,$R,$L,$K,@F1,$tmp1,$tmp2,$tmp3,$tmp4);
127 &E_CAST( 5,$S,$L,$R,$K,@F3,$tmp1,$tmp2,$tmp3,$tmp4);
128 &E_CAST( 4,$S,$R,$L,$K,@F2,$tmp1,$tmp2,$tmp3,$tmp4);
129 &E_CAST( 3,$S,$L,$R,$K,@F1,$tmp1,$tmp2,$tmp3,$tmp4);
130 &E_CAST( 2,$S,$R,$L,$K,@F3,$tmp1,$tmp2,$tmp3,$tmp4);
131 &E_CAST( 1,$S,$L,$R,$K,@F2,$tmp1,$tmp2,$tmp3,$tmp4);
132 &E_CAST( 0,$S,$R,$L,$K,@F1,$tmp1,$tmp2,$tmp3,$tmp4);
133 }
134
135 &set_label('cast_enc_done') if $enc;
136# Why the nop? - Ben 17/1/99
137 &nop();
# Reload the first argument and store the words in swapped positions relative
# to the load above: $L goes to offset 4 and $R to offset 0.
138 &mov($tmp3,&wparam(0));
139 &mov(&DWP(4,$tmp3,"",0),$L);
140 &mov(&DWP(0,$tmp3,"",0),$R);
141 &function_end($name);
142}
143
# E_CAST: emit the instructions for a single round.
#
#   $i             - round index; selects the pair of dwords at offsets $i*8
#                    and $i*8+4 from $K and is printed in the round comment.
#   $S             - accepted but not used in this body; the table symbols
#                    come from the file-level $S1..$S4.
#   $L, $R         - registers for the two data words; $R is read, $L is
#                    updated by the final xor.
#   $K             - register used as the base for the two per-round loads.
#   $OP1,$OP2,$OP3 - names of the three operations for this round; $OP1 is
#                    used twice (key mix and last table combine).
#   $tmp1..$tmp4   - scratch registers.
#
# Emitted computation: t = rotl(first_dword OP1 $R, low byte of second_dword);
# the four bytes of t index the tables named by $S1..$S4, the results are
# combined as ((T1 OP2 T2) OP3 T3) OP1 T4 and xor'ed into $L.
144sub E_CAST {
145 local($i,$S,$L,$R,$K,$OP1,$OP2,$OP3,$tmp1,$tmp2,$tmp3,$tmp4)=@_;
146 # Ri needs to have 16 pre added.
147
148 &comment("round $i");
149 &mov( $tmp4, &DWP($i*8,$K,"",1));
150
151 &mov( $tmp1, &DWP($i*8+4,$K,"",1));
# $OP1 holds a sub name, so &$OP1(...) calls the generator for that operation.
152 &$OP1( $tmp4, $R);
153
154 &rotl( $tmp4, &LB($tmp1));
155
# Extract two byte indexes from the low 16 bits of $tmp4: bits 8..15 into
# $tmp1 (A) and bits 0..7 into $tmp2 (B).  The $ppro variant clears $tmp1 and
# $tmp3 with xor before their low bytes are written.
156 if ($ppro) {
649cdb7b 157 &xor( $tmp1, $tmp1);
ae4af7a0 158 &mov( $tmp2, 0xff);
609b0852 159
649cdb7b 160 &movb( &LB($tmp1), &HB($tmp4)); # A
ae4af7a0 161 &and( $tmp2, $tmp4);
649cdb7b
BL
162
163 &shr( $tmp4, 16); #
164 &xor( $tmp3, $tmp3);
165 } else {
# NOTE(review): on this path $tmp1 and $tmp3 are not cleared before their low
# bytes are written.  $tmp1 still holds the dword loaded from $i*8+4 and
# $tmp3 relies on having been zeroed by the caller; presumably the upper 24
# bits of both are zero at this point -- confirm against the key schedule.
166 &mov( $tmp2, $tmp4); # B
167 &movb( &LB($tmp1), &HB($tmp4)); # A # BAD BAD BAD
609b0852 168
649cdb7b
BL
169 &shr( $tmp4, 16); #
170 &and( $tmp2, 0xff);
171 }
172
# After the shift by 16 the former upper half of $tmp4 is in its low 16 bits:
# bits 8..15 go into $tmp3 (C) and bits 0..7 stay in $tmp4 (D).
173 &movb( &LB($tmp3), &HB($tmp4)); # C # BAD BAD BAD
174 &and( $tmp4, 0xff); # D
175
# Table lookups with the byte indexes scaled by 4; the partial result is
# accumulated in $tmp1 and $tmp2 is reused for each further table value.
176 &mov( $tmp1, &DWP($S1,"",$tmp1,4));
177 &mov( $tmp2, &DWP($S2,"",$tmp2,4));
178
179 &$OP2( $tmp1, $tmp2);
180 &mov( $tmp2, &DWP($S3,"",$tmp3,4));
181
182 &$OP3( $tmp1, $tmp2);
183 &mov( $tmp2, &DWP($S4,"",$tmp4,4));
184
185 &$OP1( $tmp1, $tmp2);
186 # XXX
187
# Fold the round function result into the other data word.
188 &xor( $L, $tmp1);
189 # XXX
190}
2613c1fa 191