#! /usr/bin/env perl
# Copyright 2015-2022 The OpenSSL Project Authors. All Rights Reserved.
#
# Licensed under the Apache License 2.0 (the "License"). You may not use
# this file except in compliance with the License. You can obtain a copy
# in the file LICENSE in the source distribution or at
# https://www.openssl.org/source/license.html

# $output is the last argument if it looks like a file (it has an extension)
# $flavour is the first argument if it doesn't look like a file
$output = $#ARGV >= 0 && $ARGV[$#ARGV] =~ m|\.\w+$| ? pop : undef;
$flavour = $#ARGV >= 0 && $ARGV[0] !~ m|\.| ? shift : undef;

# Directory part of this script's path (including the trailing separator),
# or the empty string when the script was invoked without a directory.
$dir = ($0 =~ m/(.*[\/\\])[^\/\\]+$/) ? $1 : "";

# Look for arm-xlate.pl next to this script first, then in a perlasm/
# subdirectory; give up if neither file exists.
( $xlate="${dir}arm-xlate.pl" and -f $xlate ) or
( $xlate="${dir}perlasm/arm-xlate.pl" and -f $xlate) or
die "can't locate arm-xlate.pl";

# Everything printed to STDOUT from here on is piped into arm-xlate.pl, which
# is run with the same perl interpreter ($^X) and receives the flavour and the
# output file name as arguments.  The script path is quoted so that a
# directory name containing spaces does not split the command line.
open OUT,"| \"$^X\" \"$xlate\" $flavour \"$output\""
    or die "can't call $xlate: $!";
*STDOUT=*OUT;

# Assembly for the AArch64 helper routines, appended to $code as one heredoc.
#
# Contents, in order:
#   * _armv7_neon_probe, _armv8_{aes,sha1,sha256,pmull,sm4,sha512,eor3,sve,
#     sve2,sm3}_probe: each executes a single instruction belonging to the
#     named extension and returns.  How the caller detects that the
#     instruction is unsupported is not visible here (presumably by trapping
#     the resulting fault -- confirm against the C caller).
#   * _armv7_tick: returns a counter register in x0 (CNTPCT_EL0 when
#     __APPLE__ is defined, CNTVCT_EL0 otherwise).
#   * _armv8_cpuid_probe: returns midr_el1 in x0.
#   * OPENSSL_cleanse: stores zeros over x1 bytes starting at x0.  Lengths up
#     to 15 are cleared byte by byte; longer buffers are first advanced to an
#     8-byte boundary, then cleared 8 bytes at a time, with any tail handled
#     by the byte loop.
#   * CRYPTO_memcmp: ORs together the XOR of every byte pair from x0 and x1
#     over x2 bytes and returns 0 if the result is zero, 1 otherwise.  A
#     length of exactly 16 takes a dedicated path using two 64-bit loads per
#     buffer.
#   * _armv8_rng_probe: reads both the rndr and rndrrs system registers.
#
# The terminating ___ must stay at column 0, and the text must not contain
# unescaped \$ or \@ because the heredoc interpolates.
$code.=<<___;
#include "arm_arch.h"

.text
.arch	armv8-a+crypto

.align	5
.globl	_armv7_neon_probe
.type	_armv7_neon_probe,%function
_armv7_neon_probe:
	AARCH64_VALID_CALL_TARGET
	orr	v15.16b, v15.16b, v15.16b
	ret
.size	_armv7_neon_probe,.-_armv7_neon_probe

.globl	_armv7_tick
.type	_armv7_tick,%function
_armv7_tick:
	AARCH64_VALID_CALL_TARGET
#ifdef	__APPLE__
	mrs	x0, CNTPCT_EL0
#else
	mrs	x0, CNTVCT_EL0
#endif
	ret
.size	_armv7_tick,.-_armv7_tick

.globl	_armv8_aes_probe
.type	_armv8_aes_probe,%function
_armv8_aes_probe:
	AARCH64_VALID_CALL_TARGET
	aese	v0.16b, v0.16b
	ret
.size	_armv8_aes_probe,.-_armv8_aes_probe

.globl	_armv8_sha1_probe
.type	_armv8_sha1_probe,%function
_armv8_sha1_probe:
	AARCH64_VALID_CALL_TARGET
	sha1h	s0, s0
	ret
.size	_armv8_sha1_probe,.-_armv8_sha1_probe

.globl	_armv8_sha256_probe
.type	_armv8_sha256_probe,%function
_armv8_sha256_probe:
	AARCH64_VALID_CALL_TARGET
	sha256su0	v0.4s, v0.4s
	ret
.size	_armv8_sha256_probe,.-_armv8_sha256_probe

.globl	_armv8_pmull_probe
.type	_armv8_pmull_probe,%function
_armv8_pmull_probe:
	AARCH64_VALID_CALL_TARGET
	pmull	v0.1q, v0.1d, v0.1d
	ret
.size	_armv8_pmull_probe,.-_armv8_pmull_probe

.globl	_armv8_sm4_probe
.type	_armv8_sm4_probe,%function
_armv8_sm4_probe:
	AARCH64_VALID_CALL_TARGET
	.inst	0xcec08400	// sm4e	v0.4s, v0.4s
	ret
.size	_armv8_sm4_probe,.-_armv8_sm4_probe

.globl	_armv8_sha512_probe
.type	_armv8_sha512_probe,%function
_armv8_sha512_probe:
	AARCH64_VALID_CALL_TARGET
	.inst	0xcec08000	// sha512su0	v0.2d,v0.2d
	ret
.size	_armv8_sha512_probe,.-_armv8_sha512_probe

.globl	_armv8_eor3_probe
.type	_armv8_eor3_probe,%function
_armv8_eor3_probe:
	AARCH64_VALID_CALL_TARGET
	.inst	0xce010800	// eor3	v0.16b, v0.16b, v1.16b, v2.16b
	ret
.size	_armv8_eor3_probe,.-_armv8_eor3_probe

.globl	_armv8_sve_probe
.type	_armv8_sve_probe,%function
_armv8_sve_probe:
	AARCH64_VALID_CALL_TARGET
	.inst	0x04a03000	// eor z0.d,z0.d,z0.d
	ret
.size	_armv8_sve_probe,.-_armv8_sve_probe

.globl	_armv8_sve2_probe
.type	_armv8_sve2_probe,%function
_armv8_sve2_probe:
	AARCH64_VALID_CALL_TARGET
	.inst	0x04e03400	// xar z0.d,z0.d,z0.d
	ret
.size	_armv8_sve2_probe,.-_armv8_sve2_probe

.globl	_armv8_cpuid_probe
.type	_armv8_cpuid_probe,%function
_armv8_cpuid_probe:
	AARCH64_VALID_CALL_TARGET
	mrs	x0, midr_el1
	ret
.size	_armv8_cpuid_probe,.-_armv8_cpuid_probe

.globl	_armv8_sm3_probe
.type	_armv8_sm3_probe,%function
_armv8_sm3_probe:
	AARCH64_VALID_CALL_TARGET
	.inst	0xce63c004	// sm3partw1 v4.4s, v0.4s, v3.4s
	ret
.size	_armv8_sm3_probe,.-_armv8_sm3_probe

.globl	OPENSSL_cleanse
.type	OPENSSL_cleanse,%function
.align	5
OPENSSL_cleanse:
	AARCH64_VALID_CALL_TARGET
	cbz	x1,.Lret	// len==0?
	cmp	x1,#15
	b.hi	.Lot		// len>15
	nop
.Little:
	strb	wzr,[x0],#1	// store byte-by-byte
	subs	x1,x1,#1
	b.ne	.Little
.Lret:	ret

.align	4
.Lot:	tst	x0,#7
	b.eq	.Laligned	// inp is aligned
	strb	wzr,[x0],#1	// store byte-by-byte
	sub	x1,x1,#1
	b	.Lot

.align	4
.Laligned:
	str	xzr,[x0],#8	// store word-by-word
	sub	x1,x1,#8
	tst	x1,#-8
	b.ne	.Laligned	// len>=8
	cbnz	x1,.Little	// len!=0?
	ret
.size	OPENSSL_cleanse,.-OPENSSL_cleanse

.globl	CRYPTO_memcmp
.type	CRYPTO_memcmp,%function
.align	4
CRYPTO_memcmp:
	AARCH64_VALID_CALL_TARGET
	eor	w3,w3,w3
	cbz	x2,.Lno_data	// len==0?
	cmp	x2,#16
	b.ne	.Loop_cmp
	ldp	x8,x9,[x0]
	ldp	x10,x11,[x1]
	eor	x8,x8,x10
	eor	x9,x9,x11
	orr	x8,x8,x9
	mov	x0,#1
	cmp	x8,#0
	csel	x0,xzr,x0,eq
	ret

.align	4
.Loop_cmp:
	ldrb	w4,[x0],#1
	ldrb	w5,[x1],#1
	eor	w4,w4,w5
	orr	w3,w3,w4
	subs	x2,x2,#1
	b.ne	.Loop_cmp

.Lno_data:
	neg	w0,w3
	lsr	w0,w0,#31
	ret
.size	CRYPTO_memcmp,.-CRYPTO_memcmp

.globl	_armv8_rng_probe
.type	_armv8_rng_probe,%function
_armv8_rng_probe:
	AARCH64_VALID_CALL_TARGET
	mrs	x0, s3_3_c2_c4_0	// rndr
	mrs	x0, s3_3_c2_c4_1	// rndrrs
	ret
.size	_armv8_rng_probe,.-_armv8_rng_probe
___

# Build the assembly text for one buffer-filling random routine.
#
# Argument:
#   $rdop - "rndr" or "rndrrs".  It names the generated symbol
#           (OPENSSL_<rdop>_asm), makes the local labels unique, and selects
#           the system register that is read (s3_3_c2_c4_0 for rndr,
#           s3_3_c2_c4_1 for rndrrs).
#
# Returns the assembly as a string; nothing is printed.
# Dies if $rdop is not one of the two supported names, rather than silently
# emitting a routine that reads the rndrrs register under another name.
#
# Generated routine: x0 = buffer, x1 = byte count; returns in x0 the number of
# bytes written (tracked in x2).  Each loop iteration reads one 64-bit value
# into x3 and stops early if the Z flag is set afterwards (per the Arm
# architecture, a failed RNDR/RNDRRS read sets Z).  While at least 8 bytes
# remain the whole value is stored; a shorter tail is written one byte at a
# time, shifting x3 right by 8 after each byte.
sub gen_random {
    my ($rdop) = @_;

    my %reg_for = (
        rndr   => "s3_3_c2_c4_0",
        rndrrs => "s3_3_c2_c4_1",
    );
    die "gen_random: unsupported operation"
        unless defined $rdop && exists $reg_for{$rdop};
    my $rand_reg = $reg_for{$rdop};

    return <<___;
// Fill buffer with Randomly Generated Bytes
// inputs:  char * in x0 - Pointer to buffer
//          size_t in x1 - Number of bytes to write to buffer
// outputs: size_t in x0 - Number of bytes successfully written to buffer
.globl	OPENSSL_${rdop}_asm
.type	OPENSSL_${rdop}_asm,%function
.align	4
OPENSSL_${rdop}_asm:
	AARCH64_VALID_CALL_TARGET
	mov	x2,xzr
	mov	x3,xzr

.align	4
.Loop_${rdop}:
	cmp	x1,#0
	b.eq	.${rdop}_done
	mov	x3,xzr
	mrs	x3,$rand_reg
	b.eq	.${rdop}_done

	cmp	x1,#8
	b.lt	.Loop_single_byte_${rdop}

	str	x3,[x0]
	add	x0,x0,#8
	add	x2,x2,#8
	subs	x1,x1,#8
	b.ge	.Loop_${rdop}

.align	4
.Loop_single_byte_${rdop}:
	strb	w3,[x0]
	lsr	x3,x3,#8
	add	x2,x2,#1
	add	x0,x0,#1
	subs	x1,x1,#1
	b.gt	.Loop_single_byte_${rdop}

.align	4
.${rdop}_done:
	mov	x0,x2
	ret
.size	OPENSSL_${rdop}_asm,.-OPENSSL_${rdop}_asm
___
}

# Append the two random-number routines, one per supported operation.
$code .= gen_random("rndr");
$code .= gen_random("rndrrs");

# Emit the accumulated assembly.  The close is checked so that a failure to
# flush the output is reported instead of being silently lost.
print $code;
close STDOUT or die "error closing STDOUT: $!";