123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209 |
- #! /usr/bin/env perl
- # Copyright 2018-2021 The OpenSSL Project Authors. All Rights Reserved.
- #
- # Licensed under the Apache License 2.0 (the "License"). You may not use
- # this file except in compliance with the License. You can obtain a copy
- # in the file LICENSE in the source distribution or at
- # https://www.openssl.org/source/license.html
- package OpenSSL::ParseC;
- use strict;
- use warnings;
- use Exporter;
- use vars qw($VERSION @ISA @EXPORT @EXPORT_OK %EXPORT_TAGS);
- $VERSION = "0.9";
- @ISA = qw(Exporter);
- @EXPORT = qw(parse);
- # Global handler data
- my @preprocessor_conds; # A list of simple preprocessor conditions,
- # each item being a list of macros defined
- # or not defined.
- # Handler helpers
- sub all_conds {
- return map { ( @$_ ) } @preprocessor_conds;
- }
- # A list of handlers that will look at a "complete" string and try to
- # figure out what to make of it.
- # Each handler is a hash with the following keys:
- #
- # regexp a regexp to compare the "complete" string with.
- # checker a function that does a more complex comparison.
- # Use this instead of regexp if that isn't enough.
- # massager massages the "complete" string into an array with
- # the following elements:
- #
- # [0] String that needs further processing (this
- # applies to typedefs of structs), or empty.
- # [1] The name of what was found.
- # [2] A character that denotes what type of thing
- # this is: 'F' for function, 'S' for struct,
- # 'T' for typedef, 'M' for macro, 'V' for
- # variable.
- # [3] Return type (only for type 'F' and 'V')
- # [4] Value (for type 'M') or signature (for type 'F',
- # 'V', 'T' or 'S')
- # [5...] The list of preprocessor conditions this is
- # found in, as in checks for macro definitions
- # (stored as the macro's name) or the absence
- # of definition (stored as the macro's name
- # prefixed with a '!'
- #
- # If the massager returns an empty list, it means the
- # "complete" string has side effects but should otherwise
- # be ignored.
- # If the massager is undefined, the "complete" string
- # should be ignored.
- my @opensslcpphandlers = (
- ##################################################################
- # OpenSSL CPP specials
- #
- # These are used to convert certain pre-precessor expressions into
- # others that @cpphandlers have a better chance to understand.
- # This changes any OPENSSL_NO_DEPRECATED_x_y[_z] check to a check of
- # OPENSSL_NO_DEPRECATEDIN_x_y[_z]. That's due to <openssl/macros.h>
- # creating OPENSSL_NO_DEPRECATED_x_y[_z], but the ordinals files using
- # DEPRECATEDIN_x_y[_z].
- { regexp => qr/#if(def|ndef) OPENSSL_NO_DEPRECATED_(\d+_\d+(?:_\d+)?)$/,
- massager => sub {
- return (<<"EOF");
- #if$1 OPENSSL_NO_DEPRECATEDIN_$2
- EOF
- }
- }
- );
- my @cpphandlers = (
- ##################################################################
- # CPP stuff
- { regexp => qr/#ifdef ?(.*)/,
- massager => sub {
- my %opts;
- if (ref($_[$#_]) eq "HASH") {
- %opts = %{$_[$#_]};
- pop @_;
- }
- push @preprocessor_conds, [ $1 ];
- print STDERR "DEBUG[",$opts{debug_type},"]: preprocessor level: ", scalar(@preprocessor_conds), "\n"
- if $opts{debug};
- return ();
- },
- },
- { regexp => qr/#ifndef ?(.*)/,
- massager => sub {
- my %opts;
- if (ref($_[$#_]) eq "HASH") {
- %opts = %{$_[$#_]};
- pop @_;
- }
- push @preprocessor_conds, [ '!'.$1 ];
- print STDERR "DEBUG[",$opts{debug_type},"]: preprocessor level: ", scalar(@preprocessor_conds), "\n"
- if $opts{debug};
- return ();
- },
- },
- { regexp => qr/#if (0|1)/,
- massager => sub {
- my %opts;
- if (ref($_[$#_]) eq "HASH") {
- %opts = %{$_[$#_]};
- pop @_;
- }
- if ($1 eq "1") {
- push @preprocessor_conds, [ "TRUE" ];
- } else {
- push @preprocessor_conds, [ "!TRUE" ];
- }
- print STDERR "DEBUG[",$opts{debug_type},"]: preprocessor level: ", scalar(@preprocessor_conds), "\n"
- if $opts{debug};
- return ();
- },
- },
- { regexp => qr/#if ?(.*)/,
- massager => sub {
- my %opts;
- if (ref($_[$#_]) eq "HASH") {
- %opts = %{$_[$#_]};
- pop @_;
- }
- my @results = ();
- my $conds = $1;
- if ($conds =~ m|^defined<<<\(([^\)]*)\)>>>(.*)$|) {
- push @results, $1; # Handle the simple case
- my $rest = $2;
- my $re = qr/^(?:\|\|defined<<<\([^\)]*\)>>>)*$/;
- print STDERR "DEBUG[",$opts{debug_type},"]: Matching '$rest' with '$re'\n"
- if $opts{debug};
- if ($rest =~ m/$re/) {
- my @rest = split /\|\|/, $rest;
- shift @rest;
- foreach (@rest) {
- m|^defined<<<\(([^\)]*)\)>>>$|;
- die "Something wrong...$opts{PLACE}" if $1 eq "";
- push @results, $1;
- }
- } else {
- $conds =~ s/<<<|>>>//g;
- warn "Warning: complicated #if expression(1): $conds$opts{PLACE}"
- if $opts{warnings};
- }
- } elsif ($conds =~ m|^!defined<<<\(([^\)]*)\)>>>(.*)$|) {
- push @results, '!'.$1; # Handle the simple case
- my $rest = $2;
- my $re = qr/^(?:\&\&!defined<<<\([^\)]*\)>>>)*$/;
- print STDERR "DEBUG[",$opts{debug_type},"]: Matching '$rest' with '$re'\n"
- if $opts{debug};
- if ($rest =~ m/$re/) {
- my @rest = split /\&\&/, $rest;
- shift @rest;
- foreach (@rest) {
- m|^!defined<<<\(([^\)]*)\)>>>$|;
- die "Something wrong...$opts{PLACE}" if $1 eq "";
- push @results, '!'.$1;
- }
- } else {
- $conds =~ s/<<<|>>>//g;
- warn "Warning: complicated #if expression(2): $conds$opts{PLACE}"
- if $opts{warnings};
- }
- } else {
- $conds =~ s/<<<|>>>//g;
- warn "Warning: complicated #if expression(3): $conds$opts{PLACE}"
- if $opts{warnings};
- }
- print STDERR "DEBUG[",$opts{debug_type},"]: Added preprocessor conds: '", join("', '", @results), "'\n"
- if $opts{debug};
- push @preprocessor_conds, [ @results ];
- print STDERR "DEBUG[",$opts{debug_type},"]: preprocessor level: ", scalar(@preprocessor_conds), "\n"
- if $opts{debug};
- return ();
- },
- },
- { regexp => qr/#elif (.*)/,
- massager => sub {
- my %opts;
- if (ref($_[$#_]) eq "HASH") {
- %opts = %{$_[$#_]};
- pop @_;
- }
- die "An #elif without corresponding condition$opts{PLACE}"
- if !@preprocessor_conds;
- pop @preprocessor_conds;
- print STDERR "DEBUG[",$opts{debug_type},"]: preprocessor level: ", scalar(@preprocessor_conds), "\n"
- if $opts{debug};
- return (<<"EOF");
- #if $1
- EOF
- },
- },
- { regexp => qr/#else/,
- massager => sub {
- my %opts;
- if (ref($_[$#_]) eq "HASH") {
- %opts = %{$_[$#_]};
- pop @_;
- }
- die "An #else without corresponding condition$opts{PLACE}"
- if !@preprocessor_conds;
- # Invert all conditions on the last level
- my $stuff = pop @preprocessor_conds;
- push @preprocessor_conds, [
- map { m|^!(.*)$| ? $1 : '!'.$_ } @$stuff
- ];
- print STDERR "DEBUG[",$opts{debug_type},"]: preprocessor level: ", scalar(@preprocessor_conds), "\n"
- if $opts{debug};
- return ();
- },
- },
- { regexp => qr/#endif ?/,
- massager => sub {
- my %opts;
- if (ref($_[$#_]) eq "HASH") {
- %opts = %{$_[$#_]};
- pop @_;
- }
- die "An #endif without corresponding condition$opts{PLACE}"
- if !@preprocessor_conds;
- pop @preprocessor_conds;
- print STDERR "DEBUG[",$opts{debug_type},"]: preprocessor level: ", scalar(@preprocessor_conds), "\n"
- if $opts{debug};
- return ();
- },
- },
- { regexp => qr/#define ([[:alpha:]_]\w*)(<<<\(.*?\)>>>)?( (.*))?/,
- massager => sub {
- my $name = $1;
- my $params = $2;
- my $spaceval = $3||"";
- my $val = $4||"";
- return ("",
- $1, 'M', "", $params ? "$name$params$spaceval" : $val,
- all_conds()); }
- },
- { regexp => qr/#.*/,
- massager => sub { return (); }
- },
- );
- my @opensslchandlers = (
- ##################################################################
- # OpenSSL C specials
- #
- # They are really preprocessor stuff, but they look like C stuff
- # to this parser. All of these do replacements, anything else is
- # an error.
- #####
- # Deprecated stuff, by OpenSSL release.
- # OSSL_DEPRECATEDIN_x_y[_z] is simply ignored. Such declarations are
- # supposed to be guarded with an '#ifdef OPENSSL_NO_DEPRECATED_x_y[_z]'
- { regexp => qr/OSSL_DEPRECATEDIN_\d+_\d+(?:_\d+)?\s+(.*)/,
- massager => sub { return $1; },
- },
- { regexp => qr/(.*?)\s+OSSL_DEPRECATEDIN_\d+_\d+(?:_\d+)?\s+(.*)/,
- massager => sub { return "$1 $2"; },
- },
- #####
- # Core stuff
- # OSSL_CORE_MAKE_FUNC is a macro to create the necessary data and inline
- # function the libcrypto<->provider interface
- { regexp => qr/OSSL_CORE_MAKE_FUNC<<<\((.*?),(.*?),(.*?)\)>>>/,
- massager => sub {
- return (<<"EOF");
- typedef $1 OSSL_FUNC_$2_fn$3;
- static ossl_inline OSSL_FUNC_$2_fn *OSSL_FUNC_$2(const OSSL_DISPATCH *opf);
- EOF
- },
- },
- #####
- # LHASH stuff
- # LHASH_OF(foo) is used as a type, but the chandlers won't take it
- # gracefully, so we expand it here.
- { regexp => qr/(.*)\bLHASH_OF<<<\((.*?)\)>>>(.*)/,
- massager => sub { return ("$1struct lhash_st_$2$3"); }
- },
- { regexp => qr/DEFINE_LHASH_OF(?:_INTERNAL|_EX)?<<<\((.*)\)>>>/,
- massager => sub {
- return (<<"EOF");
- static ossl_inline LHASH_OF($1) * lh_$1_new(unsigned long (*hfn)(const $1 *),
- int (*cfn)(const $1 *, const $1 *));
- static ossl_inline void lh_$1_free(LHASH_OF($1) *lh);
- static ossl_inline $1 *lh_$1_insert(LHASH_OF($1) *lh, $1 *d);
- static ossl_inline $1 *lh_$1_delete(LHASH_OF($1) *lh, const $1 *d);
- static ossl_inline $1 *lh_$1_retrieve(LHASH_OF($1) *lh, const $1 *d);
- static ossl_inline int lh_$1_error(LHASH_OF($1) *lh);
- static ossl_inline unsigned long lh_$1_num_items(LHASH_OF($1) *lh);
- static ossl_inline void lh_$1_node_stats_bio(const LHASH_OF($1) *lh, BIO *out);
- static ossl_inline void lh_$1_node_usage_stats_bio(const LHASH_OF($1) *lh,
- BIO *out);
- static ossl_inline void lh_$1_stats_bio(const LHASH_OF($1) *lh, BIO *out);
- static ossl_inline unsigned long lh_$1_get_down_load(LHASH_OF($1) *lh);
- static ossl_inline void lh_$1_set_down_load(LHASH_OF($1) *lh, unsigned long dl);
- static ossl_inline void lh_$1_doall(LHASH_OF($1) *lh, void (*doall)($1 *));
- LHASH_OF($1)
- EOF
- }
- },
- #####
- # STACK stuff
- # STACK_OF(foo) is used as a type, but the chandlers won't take it
- # gracefully, so we expand it here.
- { regexp => qr/(.*)\bSTACK_OF<<<\((.*?)\)>>>(.*)/,
- massager => sub { return ("$1struct stack_st_$2$3"); }
- },
- # { regexp => qr/(.*)\bSTACK_OF\((.*?)\)(.*)/,
- # massager => sub {
- # my $before = $1;
- # my $stack_of = "struct stack_st_$2";
- # my $after = $3;
- # if ($after =~ m|^\w|) { $after = " ".$after; }
- # return ("$before$stack_of$after");
- # }
- # },
- { regexp => qr/SKM_DEFINE_STACK_OF<<<\((.*),\s*(.*),\s*(.*)\)>>>/,
- massager => sub {
- return (<<"EOF");
- STACK_OF($1);
- typedef int (*sk_$1_compfunc)(const $3 * const *a, const $3 *const *b);
- typedef void (*sk_$1_freefunc)($3 *a);
- typedef $3 * (*sk_$1_copyfunc)(const $3 *a);
- static ossl_inline int sk_$1_num(const STACK_OF($1) *sk);
- static ossl_inline $2 *sk_$1_value(const STACK_OF($1) *sk, int idx);
- static ossl_inline STACK_OF($1) *sk_$1_new(sk_$1_compfunc compare);
- static ossl_inline STACK_OF($1) *sk_$1_new_null(void);
- static ossl_inline STACK_OF($1) *sk_$1_new_reserve(sk_$1_compfunc compare,
- int n);
- static ossl_inline int sk_$1_reserve(STACK_OF($1) *sk, int n);
- static ossl_inline void sk_$1_free(STACK_OF($1) *sk);
- static ossl_inline void sk_$1_zero(STACK_OF($1) *sk);
- static ossl_inline $2 *sk_$1_delete(STACK_OF($1) *sk, int i);
- static ossl_inline $2 *sk_$1_delete_ptr(STACK_OF($1) *sk, $2 *ptr);
- static ossl_inline int sk_$1_push(STACK_OF($1) *sk, $2 *ptr);
- static ossl_inline int sk_$1_unshift(STACK_OF($1) *sk, $2 *ptr);
- static ossl_inline $2 *sk_$1_pop(STACK_OF($1) *sk);
- static ossl_inline $2 *sk_$1_shift(STACK_OF($1) *sk);
- static ossl_inline void sk_$1_pop_free(STACK_OF($1) *sk,
- sk_$1_freefunc freefunc);
- static ossl_inline int sk_$1_insert(STACK_OF($1) *sk, $2 *ptr, int idx);
- static ossl_inline $2 *sk_$1_set(STACK_OF($1) *sk, int idx, $2 *ptr);
- static ossl_inline int sk_$1_find(STACK_OF($1) *sk, $2 *ptr);
- static ossl_inline int sk_$1_find_ex(STACK_OF($1) *sk, $2 *ptr);
- static ossl_inline void sk_$1_sort(STACK_OF($1) *sk);
- static ossl_inline int sk_$1_is_sorted(const STACK_OF($1) *sk);
- static ossl_inline STACK_OF($1) * sk_$1_dup(const STACK_OF($1) *sk);
- static ossl_inline STACK_OF($1) *sk_$1_deep_copy(const STACK_OF($1) *sk,
- sk_$1_copyfunc copyfunc,
- sk_$1_freefunc freefunc);
- static ossl_inline sk_$1_compfunc sk_$1_set_cmp_func(STACK_OF($1) *sk,
- sk_$1_compfunc compare);
- EOF
- }
- },
- { regexp => qr/SKM_DEFINE_STACK_OF_INTERNAL<<<\((.*),\s*(.*),\s*(.*)\)>>>/,
- massager => sub {
- return (<<"EOF");
- STACK_OF($1);
- typedef int (*sk_$1_compfunc)(const $3 * const *a, const $3 *const *b);
- typedef void (*sk_$1_freefunc)($3 *a);
- typedef $3 * (*sk_$1_copyfunc)(const $3 *a);
- static ossl_unused ossl_inline $2 *ossl_check_$1_type($2 *ptr);
- static ossl_unused ossl_inline const OPENSSL_STACK *ossl_check_const_$1_sk_type(const STACK_OF($1) *sk);
- static ossl_unused ossl_inline OPENSSL_sk_compfunc ossl_check_$1_compfunc_type(sk_$1_compfunc cmp);
- static ossl_unused ossl_inline OPENSSL_sk_copyfunc ossl_check_$1_copyfunc_type(sk_$1_copyfunc cpy);
- static ossl_unused ossl_inline OPENSSL_sk_freefunc ossl_check_$1_freefunc_type(sk_$1_freefunc fr);
- EOF
- }
- },
- { regexp => qr/DEFINE_SPECIAL_STACK_OF<<<\((.*),\s*(.*)\)>>>/,
- massager => sub { return ("SKM_DEFINE_STACK_OF($1,$2,$2)"); },
- },
- { regexp => qr/DEFINE_STACK_OF<<<\((.*)\)>>>/,
- massager => sub { return ("SKM_DEFINE_STACK_OF($1,$1,$1)"); },
- },
- { regexp => qr/DEFINE_SPECIAL_STACK_OF_CONST<<<\((.*),\s*(.*)\)>>>/,
- massager => sub { return ("SKM_DEFINE_STACK_OF($1,const $2,$2)"); },
- },
- { regexp => qr/DEFINE_STACK_OF_CONST<<<\((.*)\)>>>/,
- massager => sub { return ("SKM_DEFINE_STACK_OF($1,const $1,$1)"); },
- },
- #####
- # ASN1 stuff
- { regexp => qr/DECLARE_ASN1_ITEM<<<\((.*)\)>>>/,
- massager => sub {
- return (<<"EOF");
- const ASN1_ITEM *$1_it(void);
- EOF
- },
- },
- { regexp => qr/DECLARE_ASN1_ENCODE_FUNCTIONS_only<<<\((.*),\s*(.*)\)>>>/,
- massager => sub {
- return (<<"EOF");
- int d2i_$2(void);
- int i2d_$2(void);
- EOF
- },
- },
- { regexp => qr/DECLARE_ASN1_ENCODE_FUNCTIONS<<<\((.*),\s*(.*),\s*(.*)\)>>>/,
- massager => sub {
- return (<<"EOF");
- int d2i_$3(void);
- int i2d_$3(void);
- DECLARE_ASN1_ITEM($2)
- EOF
- },
- },
- { regexp => qr/DECLARE_ASN1_ENCODE_FUNCTIONS_name<<<\((.*),\s*(.*)\)>>>/,
- massager => sub {
- return (<<"EOF");
- int d2i_$2(void);
- int i2d_$2(void);
- DECLARE_ASN1_ITEM($2)
- EOF
- },
- },
- { regexp => qr/DECLARE_ASN1_ALLOC_FUNCTIONS_name<<<\((.*),\s*(.*)\)>>>/,
- massager => sub {
- return (<<"EOF");
- int $2_free(void);
- int $2_new(void);
- EOF
- },
- },
- { regexp => qr/DECLARE_ASN1_ALLOC_FUNCTIONS<<<\((.*)\)>>>/,
- massager => sub {
- return (<<"EOF");
- int $1_free(void);
- int $1_new(void);
- EOF
- },
- },
- { regexp => qr/DECLARE_ASN1_FUNCTIONS_name<<<\((.*),\s*(.*)\)>>>/,
- massager => sub {
- return (<<"EOF");
- int d2i_$2(void);
- int i2d_$2(void);
- int $2_free(void);
- int $2_new(void);
- DECLARE_ASN1_ITEM($2)
- EOF
- },
- },
- { regexp => qr/DECLARE_ASN1_FUNCTIONS<<<\((.*)\)>>>/,
- massager => sub { return (<<"EOF");
- int d2i_$1(void);
- int i2d_$1(void);
- int $1_free(void);
- int $1_new(void);
- DECLARE_ASN1_ITEM($1)
- EOF
- }
- },
- { regexp => qr/DECLARE_ASN1_NDEF_FUNCTION<<<\((.*)\)>>>/,
- massager => sub {
- return (<<"EOF");
- int i2d_$1_NDEF(void);
- EOF
- }
- },
- { regexp => qr/DECLARE_ASN1_PRINT_FUNCTION<<<\((.*)\)>>>/,
- massager => sub {
- return (<<"EOF");
- int $1_print_ctx(void);
- EOF
- }
- },
- { regexp => qr/DECLARE_ASN1_PRINT_FUNCTION_name<<<\((.*),\s*(.*)\)>>>/,
- massager => sub {
- return (<<"EOF");
- int $2_print_ctx(void);
- EOF
- }
- },
- { regexp => qr/DECLARE_ASN1_SET_OF<<<\((.*)\)>>>/,
- massager => sub { return (); }
- },
- { regexp => qr/DECLARE_ASN1_DUP_FUNCTION<<<\((.*)\)>>>/,
- massager => sub {
- return (<<"EOF");
- int $1_dup(void);
- EOF
- }
- },
- { regexp => qr/DECLARE_ASN1_DUP_FUNCTION_name<<<\((.*),\s*(.*)\)>>>/,
- massager => sub {
- return (<<"EOF");
- int $2_dup(void);
- EOF
- }
- },
- # Universal translator of attributed PEM declarators
- { regexp => qr/
- DECLARE_ASN1
- (_ENCODE_FUNCTIONS_only|_ENCODE_FUNCTIONS|_ENCODE_FUNCTIONS_name
- |_ALLOC_FUNCTIONS_name|_ALLOC_FUNCTIONS|_FUNCTIONS_name|_FUNCTIONS
- |_NDEF_FUNCTION|_PRINT_FUNCTION|_PRINT_FUNCTION_name
- |_DUP_FUNCTION|_DUP_FUNCTION_name)
- _attr
- <<<\(\s*OSSL_DEPRECATEDIN_(.*?)\s*,(.*?)\)>>>
- /x,
- massager => sub { return (<<"EOF");
- DECLARE_ASN1$1($3)
- EOF
- },
- },
- { regexp => qr/DECLARE_PKCS12_SET_OF<<<\((.*)\)>>>/,
- massager => sub { return (); }
- },
- #####
- # PEM stuff
- { regexp => qr/DECLARE_PEM(?|_rw|_rw_cb|_rw_const)<<<\((.*?),.*\)>>>/,
- massager => sub { return (<<"EOF");
- #ifndef OPENSSL_NO_STDIO
- int PEM_read_$1(void);
- int PEM_write_$1(void);
- #endif
- int PEM_read_bio_$1(void);
- int PEM_write_bio_$1(void);
- EOF
- },
- },
- { regexp => qr/DECLARE_PEM(?|_rw|_rw_cb|_rw_const)_ex<<<\((.*?),.*\)>>>/,
- massager => sub { return (<<"EOF");
- #ifndef OPENSSL_NO_STDIO
- int PEM_read_$1(void);
- int PEM_write_$1(void);
- int PEM_read_$1_ex(void);
- int PEM_write_$1_ex(void);
- #endif
- int PEM_read_bio_$1(void);
- int PEM_write_bio_$1(void);
- int PEM_read_bio_$1_ex(void);
- int PEM_write_bio_$1_ex(void);
- EOF
- },
- },
- { regexp => qr/DECLARE_PEM(?|_write|_write_cb|_write_const)<<<\((.*?),.*\)>>>/,
- massager => sub { return (<<"EOF");
- #ifndef OPENSSL_NO_STDIO
- int PEM_write_$1(void);
- #endif
- int PEM_write_bio_$1(void);
- EOF
- },
- },
- { regexp => qr/DECLARE_PEM(?|_write|_write_cb|_write_const)_ex<<<\((.*?),.*\)>>>/,
- massager => sub { return (<<"EOF");
- #ifndef OPENSSL_NO_STDIO
- int PEM_write_$1(void);
- int PEM_write_$1_ex(void);
- #endif
- int PEM_write_bio_$1(void);
- int PEM_write_bio_$1_ex(void);
- EOF
- },
- },
- { regexp => qr/DECLARE_PEM(?|_read|_read_cb)<<<\((.*?),.*\)>>>/,
- massager => sub { return (<<"EOF");
- #ifndef OPENSSL_NO_STDIO
- int PEM_read_$1(void);
- #endif
- int PEM_read_bio_$1(void);
- EOF
- },
- },
- { regexp => qr/DECLARE_PEM(?|_read|_read_cb)_ex<<<\((.*?),.*\)>>>/,
- massager => sub { return (<<"EOF");
- #ifndef OPENSSL_NO_STDIO
- int PEM_read_$1(void);
- int PEM_read_$1_ex(void);
- #endif
- int PEM_read_bio_$1(void);
- int PEM_read_bio_$1_ex(void);
- EOF
- },
- },
- # Universal translator of attributed PEM declarators
- { regexp => qr/
- DECLARE_PEM
- ((?:_rw|_rw_cb|_rw_const|_write|_write_cb|_write_const|_read|_read_cb)
- (?:_ex)?)
- _attr
- <<<\(\s*OSSL_DEPRECATEDIN_(.*?)\s*,(.*?)\)>>>
- /x,
- massager => sub { return (<<"EOF");
- DECLARE_PEM$1($3)
- EOF
- },
- },
- # OpenSSL's declaration of externs with possible export linkage
- # (really only relevant on Windows)
- { regexp => qr/OPENSSL_(?:EXPORT|EXTERN)/,
- massager => sub { return ("extern"); }
- },
- # Spurious stuff found in the OpenSSL headers
- # Usually, these are just macros that expand to, well, something
- { regexp => qr/__NDK_FPABI__/,
- massager => sub { return (); }
- },
- );
- my $anoncnt = 0;
- my @chandlers = (
- ##################################################################
- # C stuff
- # extern "C" of individual items
- # Note that the main parse function has a special hack for 'extern "C" {'
- # which can't be done in handlers
- # We simply ignore it.
- { regexp => qr/^extern "C" (.*(?:;|>>>))/,
- massager => sub { return ($1); },
- },
- # any other extern is just ignored
- { regexp => qr/^\s* # Any spaces before
- extern # The keyword we look for
- \b # word to non-word boundary
- .* # Anything after
- ;
- /x,
- massager => sub { return (); },
- },
- # union, struct and enum definitions
- # Because this one might appear a little everywhere within type
- # definitions, we take it out and replace it with just
- # 'union|struct|enum name' while registering it.
- # This makes use of the parser trick to surround the outer braces
- # with <<< and >>>
- { regexp => qr/(.*) # Anything before ($1)
- \b # word to non-word boundary
- (union|struct|enum) # The word used ($2)
- (?:\s([[:alpha:]_]\w*))? # Struct or enum name ($3)
- <<<(\{.*?\})>>> # Struct or enum definition ($4)
- (.*) # Anything after ($5)
- ;
- /x,
- massager => sub {
- my $before = $1;
- my $word = $2;
- my $name = $3
- || sprintf("__anon%03d", ++$anoncnt); # Anonymous struct
- my $definition = $4;
- my $after = $5;
- my $type = $word eq "struct" ? 'S' : 'E';
- if ($before ne "" || $after ne ";") {
- if ($after =~ m|^\w|) { $after = " ".$after; }
- return ("$before$word $name$after;",
- "$word $name", $type, "", "$word$definition", all_conds());
- }
- # If there was no before nor after, make the return much simple
- return ("", "$word $name", $type, "", "$word$definition", all_conds());
- }
- },
- # Named struct and enum forward declarations
- # We really just ignore them, but we need to parse them or the variable
- # declaration handler further down will think it's a variable declaration.
- { regexp => qr/^(union|struct|enum) ([[:alpha:]_]\w*);/,
- massager => sub { return (); }
- },
- # Function returning function pointer declaration
- # This sort of declaration may have a body (inline functions, for example)
- { regexp => qr/(?:(typedef)\s?)? # Possible typedef ($1)
- ((?:\w|\*|\s)*?) # Return type ($2)
- \s? # Possible space
- <<<\(\*
- ([[:alpha:]_]\w*) # Function name ($3)
- (\(.*\)) # Parameters ($4)
- \)>>>
- <<<(\(.*\))>>> # F.p. parameters ($5)
- (?:<<<\{.*\}>>>|;) # Body or semicolon
- /x,
- massager => sub {
- return ("", $3, 'T', "", "$2(*$4)$5", all_conds())
- if defined $1;
- return ("", $3, 'F', "$2(*)$5", "$2(*$4)$5", all_conds()); }
- },
- # Function pointer declaration, or typedef thereof
- # This sort of declaration never has a function body
- { regexp => qr/(?:(typedef)\s?)? # Possible typedef ($1)
- ((?:\w|\*|\s)*?) # Return type ($2)
- <<<\(\*([[:alpha:]_]\w*)\)>>> # T.d. or var name ($3)
- <<<(\(.*\))>>> # F.p. parameters ($4)
- ;
- /x,
- massager => sub {
- return ("", $3, 'T', "", "$2(*)$4", all_conds())
- if defined $1;
- return ("", $3, 'V', "$2(*)$4", "$2(*)$4", all_conds());
- },
- },
- # Function declaration, or typedef thereof
- # This sort of declaration may have a body (inline functions, for example)
- { regexp => qr/(?:(typedef)\s?)? # Possible typedef ($1)
- ((?:\w|\*|\s)*?) # Return type ($2)
- \s? # Possible space
- ([[:alpha:]_]\w*) # Function name ($3)
- <<<(\(.*\))>>> # Parameters ($4)
- (?:<<<\{.*\}>>>|;) # Body or semicolon
- /x,
- massager => sub {
- return ("", $3, 'T', "", "$2$4", all_conds())
- if defined $1;
- return ("", $3, 'F', $2, "$2$4", all_conds());
- },
- },
- # Variable declaration, including arrays, or typedef thereof
- { regexp => qr/(?:(typedef)\s?)? # Possible typedef ($1)
- ((?:\w|\*|\s)*?) # Type ($2)
- \s? # Possible space
- ([[:alpha:]_]\w*) # Variable name ($3)
- ((?:<<<\[[^\]]*\]>>>)*) # Possible array declaration ($4)
- ;
- /x,
- massager => sub {
- return ("", $3, 'T', "", $2.($4||""), all_conds())
- if defined $1;
- return ("", $3, 'V', $2.($4||""), $2.($4||""), all_conds());
- },
- },
- );
- # End handlers are almost the same as handlers, except they are run through
- # ONCE when the input has been parsed through. These are used to check for
- # remaining stuff, such as an unfinished #ifdef and stuff like that that the
- # main parser can't check on its own.
- my @endhandlers = (
- { massager => sub {
- my %opts = %{$_[0]};
- die "Unfinished preprocessor conditions levels: ",scalar(@preprocessor_conds),($opts{filename} ? " in file ".$opts{filename}: ""),$opts{PLACE}
- if @preprocessor_conds;
- }
- }
- );
- # takes a list of strings that can each contain one or several lines of code
- # also takes a hash of options as last argument.
- #
- # returns a list of hashes with information:
- #
- # name name of the thing
- # type type, see the massage handler function
- # returntype return type of functions and variables
- # value value for macros, signature for functions, variables
- # and structs
- # conds preprocessor conditions (array ref)
- sub parse {
- my %opts;
- if (ref($_[$#_]) eq "HASH") {
- %opts = %{$_[$#_]};
- pop @_;
- }
- my %state = (
- in_extern_C => 0, # An exception to parenthesis processing.
- cpp_parens => [], # A list of ending parens and braces found in
- # preprocessor directives
- c_parens => [], # A list of ending parens and braces found in
- # C statements
- in_string => "", # empty string when outside a string, otherwise
- # "'" or '"' depending on the starting quote.
- in_comment => "", # empty string when outside a comment, otherwise
- # "/*" or "//" depending on the type of comment
- # found. The latter will never be multiline
- # NOTE: in_string and in_comment will never be
- # true (in perl semantics) at the same time.
- current_line => 0,
- );
- my @result = ();
- my $normalized_line = ""; # $input_line, but normalized. In essence, this
- # means that ALL whitespace is removed unless
- # it absolutely has to be present, and in that
- # case, there's only one space.
- # The cases where a space needs to stay present
- # are:
- # 1. between words
- # 2. between words and number
- # 3. after the first word of a preprocessor
- # directive.
- # 4. for the #define directive, between the macro
- # name/args and its value, so we end up with:
- # #define FOO val
- # #define BAR(x) something(x)
- my $collected_stmt = ""; # Where we're building up a C line until it's a
- # complete definition/declaration, as determined
- # by any handler being capable of matching it.
- # We use $_ shamelessly when looking through @lines.
- # In case we find a \ at the end, we keep filling it up with more lines.
- $_ = undef;
- foreach my $line (@_) {
- # split tries to be smart when a string ends with the thing we split on
- $line .= "\n" unless $line =~ m|\R$|;
- $line .= "#";
- # We use ¦undef¦ as a marker for a new line from the file.
- # Since we convert one line to several and unshift that into @lines,
- # that's the only safe way we have to track the original lines
- my @lines = map { ( undef, $_ ) } split m|\R|, $line;
- # Remember that extra # we added above? Now we remove it
- pop @lines;
- pop @lines; # Don't forget the undef
- while (@lines) {
- if (!defined($lines[0])) {
- shift @lines;
- $state{current_line}++;
- if (!defined($_)) {
- $opts{PLACE} = " at ".$opts{filename}." line ".$state{current_line}."\n";
- $opts{PLACE2} = $opts{filename}.":".$state{current_line};
- }
- next;
- }
- $_ = "" unless defined $_;
- $_ .= shift @lines;
- if (m|\\$|) {
- $_ = $`;
- next;
- }
- if ($opts{debug}) {
- print STDERR "DEBUG:----------------------------\n";
- print STDERR "DEBUG: \$_ = '$_'\n";
- }
- ##########################################################
- # Now that we have a full line, let's process through it
- while(1) {
- unless ($state{in_comment}) {
- # Begin with checking if the current $normalized_line
- # contains a preprocessor directive
- # This is only done if we're not inside a comment and
- # if it's a preprocessor directive and it's finished.
- if ($normalized_line =~ m|^#| && $_ eq "") {
- print STDERR "DEBUG[OPENSSL CPP]: \$normalized_line = '$normalized_line'\n"
- if $opts{debug};
- $opts{debug_type} = "OPENSSL CPP";
- my @r = ( _run_handlers($normalized_line,
- @opensslcpphandlers,
- \%opts) );
- if (shift @r) {
- # Checking if there are lines to inject.
- if (@r) {
- @r = split $/, (pop @r).$_;
- print STDERR "DEBUG[OPENSSL CPP]: injecting '", join("', '", @r),"'\n"
- if $opts{debug} && @r;
- @lines = ( @r, @lines );
- $_ = "";
- }
- } else {
- print STDERR "DEBUG[CPP]: \$normalized_line = '$normalized_line'\n"
- if $opts{debug};
- $opts{debug_type} = "CPP";
- my @r = ( _run_handlers($normalized_line,
- @cpphandlers,
- \%opts) );
- if (shift @r) {
- if (ref($r[0]) eq "HASH") {
- push @result, shift @r;
- }
- # Now, check if there are lines to inject.
- # Really, this should never happen, it IS a
- # preprocessor directive after all...
- if (@r) {
- @r = split $/, pop @r;
- print STDERR "DEBUG[CPP]: injecting '", join("', '", @r),"'\n"
- if $opts{debug} && @r;
- @lines = ( @r, @lines );
- $_ = "";
- }
- }
- }
- # Note: we simply ignore all directives that no
- # handler matches
- $normalized_line = "";
- }
- # If the two strings end and start with a character that
- # shouldn't get concatenated, add a space
- my $space =
- ($collected_stmt =~ m/(?:"|')$/
- || ($collected_stmt =~ m/(?:\w|\d)$/
- && $normalized_line =~ m/^(?:\w|\d)/)) ? " " : "";
- # Now, unless we're building up a preprocessor directive or
- # are in the middle of a string, or the parens et al aren't
- # balanced up yet, let's try and see if there's a OpenSSL
- # or C handler that can make sense of what we have so far.
- if ( $normalized_line !~ m|^#|
- && ($collected_stmt ne "" || $normalized_line ne "")
- && ! @{$state{c_parens}}
- && ! $state{in_string} ) {
- if ($opts{debug}) {
- print STDERR "DEBUG[OPENSSL C]: \$collected_stmt = '$collected_stmt'\n";
- print STDERR "DEBUG[OPENSSL C]: \$normalized_line = '$normalized_line'\n";
- }
- $opts{debug_type} = "OPENSSL C";
- my @r = ( _run_handlers($collected_stmt
- .$space
- .$normalized_line,
- @opensslchandlers,
- \%opts) );
- if (shift @r) {
- # Checking if there are lines to inject.
- if (@r) {
- @r = split $/, (pop @r).$_;
- print STDERR "DEBUG[OPENSSL]: injecting '", join("', '", @r),"'\n"
- if $opts{debug} && @r;
- @lines = ( @r, @lines );
- $_ = "";
- }
- $normalized_line = "";
- $collected_stmt = "";
- } else {
- if ($opts{debug}) {
- print STDERR "DEBUG[C]: \$collected_stmt = '$collected_stmt'\n";
- print STDERR "DEBUG[C]: \$normalized_line = '$normalized_line'\n";
- }
- $opts{debug_type} = "C";
- my @r = ( _run_handlers($collected_stmt
- .$space
- .$normalized_line,
- @chandlers,
- \%opts) );
- if (shift @r) {
- if (ref($r[0]) eq "HASH") {
- push @result, shift @r;
- }
- # Checking if there are lines to inject.
- if (@r) {
- @r = split $/, (pop @r).$_;
- print STDERR "DEBUG[C]: injecting '", join("', '", @r),"'\n"
- if $opts{debug} && @r;
- @lines = ( @r, @lines );
- $_ = "";
- }
- $normalized_line = "";
- $collected_stmt = "";
- }
- }
- }
- if ($_ eq "") {
- $collected_stmt .= $space.$normalized_line;
- $normalized_line = "";
- }
- }
- if ($_ eq "") {
- $_ = undef;
- last;
- }
- # Take care of inside string first.
- if ($state{in_string}) {
- if (m/ (?:^|(?<!\\)) # Make sure it's not escaped
- $state{in_string} # Look for matching quote
- /x) {
- $normalized_line .= $`.$&;
- $state{in_string} = "";
- $_ = $';
- next;
- } else {
- die "Unfinished string without continuation found$opts{PLACE}\n";
- }
- }
- # ... or inside comments, whichever happens to apply
- elsif ($state{in_comment}) {
- # This should never happen
- die "Something went seriously wrong, multiline //???$opts{PLACE}\n"
- if ($state{in_comment} eq "//");
- # A note: comments are simply discarded.
- if (m/ (?:^|(?<!\\)) # Make sure it's not escaped
- \*\/ # Look for C comment end
- /x) {
- $state{in_comment} = "";
- $_ = $';
- print STDERR "DEBUG: Found end of comment, followed by '$_'\n"
- if $opts{debug};
- next;
- } else {
- $_ = "";
- next;
- }
- }
- # At this point, it's safe to remove leading whites, but
- # we need to be careful with some preprocessor lines
- if (m|^\s+|) {
- my $rest = $';
- my $space = "";
- $space = " "
- if ($normalized_line =~ m/^
- \#define\s\w(?:\w|\d)*(?:<<<\([^\)]*\)>>>)?
- | \#[a-z]+
- $/x);
- print STDERR "DEBUG: Processing leading spaces: \$normalized_line = '$normalized_line', \$space = '$space', \$rest = '$rest'\n"
- if $opts{debug};
- $_ = $space.$rest;
- }
- my $parens =
- $normalized_line =~ m|^#| ? 'cpp_parens' : 'c_parens';
- (my $paren_singular = $parens) =~ s|s$||;
- # Now check for specific tokens, and if they are parens,
- # check them against $state{$parens}. Note that we surround
- # the outermost parens with extra "<<<" and ">>>". Those
- # are for the benefit of handlers who to need to detect
- # them, and they will be removed from the final output.
- if (m|^[\{\[\(]|) {
- my $body = $&;
- $_ = $';
- if (!@{$state{$parens}}) {
- if ("$normalized_line$body" =~ m|^extern "C"\{$|) {
- $state{in_extern_C} = 1;
- print STDERR "DEBUG: found start of 'extern \"C\"' ($normalized_line$body)\n"
- if $opts{debug};
- $normalized_line = "";
- } else {
- $normalized_line .= "<<<".$body;
- }
- } else {
- $normalized_line .= $body;
- }
- if ($normalized_line ne "") {
- print STDERR "DEBUG: found $paren_singular start '$body'\n"
- if $opts{debug};
- $body =~ tr|\{\[\(|\}\]\)|;
- print STDERR "DEBUG: pushing $paren_singular end '$body'\n"
- if $opts{debug};
- push @{$state{$parens}}, $body;
- }
- } elsif (m|^[\}\]\)]|) {
- $_ = $';
- if (!@{$state{$parens}}
- && $& eq '}' && $state{in_extern_C}) {
- print STDERR "DEBUG: found end of 'extern \"C\"'\n"
- if $opts{debug};
- $state{in_extern_C} = 0;
- } else {
- print STDERR "DEBUG: Trying to match '$&' against '"
- ,join("', '", @{$state{$parens}})
- ,"'\n"
- if $opts{debug};
- die "Unmatched parentheses$opts{PLACE}\n"
- unless (@{$state{$parens}}
- && pop @{$state{$parens}} eq $&);
- if (!@{$state{$parens}}) {
- $normalized_line .= $&.">>>";
- } else {
- $normalized_line .= $&;
- }
- }
- } elsif (m|^["']|) { # string start
- my $body = $&;
- $_ = $';
- # We want to separate strings from \w and \d with one space.
- $normalized_line .= " " if $normalized_line =~ m/(\w|\d)$/;
- $normalized_line .= $body;
- $state{in_string} = $body;
- } elsif (m|^\/\*|) { # C style comment
- print STDERR "DEBUG: found start of C style comment\n"
- if $opts{debug};
- $state{in_comment} = $&;
- $_ = $';
- } elsif (m|^\/\/|) { # C++ style comment
- print STDERR "DEBUG: found C++ style comment\n"
- if $opts{debug};
- $_ = ""; # (just discard it entirely)
- } elsif (m/^ (?| (?: 0[xX][[:xdigit:]]+ | 0[bB][01]+ | [0-9]+ )
- (?i: U | L | UL | LL | ULL )?
- | [0-9]+\.[0-9]+(?:[eE][\-\+]\d+)? (?i: F | L)?
- ) /x) {
- print STDERR "DEBUG: Processing numbers: \$normalized_line = '$normalized_line', \$& = '$&', \$' = '$''\n"
- if $opts{debug};
- $normalized_line .= $&;
- $_ = $';
- } elsif (m/^[[:alpha:]_]\w*/) {
- my $body = $&;
- my $rest = $';
- my $space = "";
- # Now, only add a space if it's needed to separate
- # two \w characters, and we also surround strings with
- # a space. In this case, that's if $normalized_line ends
- # with a \w, \d, " or '.
- $space = " "
- if ($normalized_line =~ m/("|')$/
- || ($normalized_line =~ m/(\w|\d)$/
- && $body =~ m/^(\w|\d)/));
- print STDERR "DEBUG: Processing words: \$normalized_line = '$normalized_line', \$space = '$space', \$body = '$body', \$rest = '$rest'\n"
- if $opts{debug};
- $normalized_line .= $space.$body;
- $_ = $rest;
- } elsif (m|^(?:\\)?.|) { # Catch-all
- $normalized_line .= $&;
- $_ = $';
- }
- }
- }
- }
- foreach my $handler (@endhandlers) {
- if ($handler->{massager}) {
- $handler->{massager}->(\%opts);
- }
- }
- return @result;
- }
- # arg1: line to check
- # arg2...: handlers to check
- # return undef when no handler matched
- sub _run_handlers {
- my %opts;
- if (ref($_[$#_]) eq "HASH") {
- %opts = %{$_[$#_]};
- pop @_;
- }
- my $line = shift;
- my @handlers = @_;
- foreach my $handler (@handlers) {
- if ($handler->{regexp}
- && $line =~ m|^$handler->{regexp}$|) {
- if ($handler->{massager}) {
- if ($opts{debug}) {
- print STDERR "DEBUG[",$opts{debug_type},"]: Trying to handle '$line'\n";
- print STDERR "DEBUG[",$opts{debug_type},"]: (matches /\^",$handler->{regexp},"\$/)\n";
- }
- my $saved_line = $line;
- my @massaged =
- map { s/(<<<|>>>)//g; $_ }
- $handler->{massager}->($saved_line, \%opts);
- print STDERR "DEBUG[",$opts{debug_type},"]: Got back '"
- , join("', '", @massaged), "'\n"
- if $opts{debug};
- # Because we may get back new lines to be
- # injected before whatever else that follows,
- # and the injected stuff might include
- # preprocessor lines, we need to inject them
- # in @lines and set $_ to the empty string to
- # break out from the inner loops
- my $injected_lines = shift @massaged || "";
- if (@massaged) {
- return (1,
- {
- name => shift @massaged,
- type => shift @massaged,
- returntype => shift @massaged,
- value => shift @massaged,
- conds => [ @massaged ]
- },
- $injected_lines
- );
- } else {
- print STDERR "DEBUG[",$opts{debug_type},"]: (ignore, possible side effects)\n"
- if $opts{debug} && $injected_lines eq "";
- return (1, $injected_lines);
- }
- }
- return (1);
- }
- }
- return (0);
- }
|