grpc 0.12.0 → 0.13.0.pre1.1
Sign up to get free protection for your applications and to get access to all the features.
Potentially problematic release.
This version of grpc might be problematic. Click here for more details.
- checksums.yaml +4 -4
- data/Makefile +5707 -22222
- data/include/grpc/byte_buffer.h +2 -83
- data/include/grpc/census.h +191 -121
- data/include/grpc/compression.h +14 -38
- data/include/grpc/grpc.h +88 -434
- data/include/grpc/grpc_security.h +76 -46
- data/include/grpc/grpc_zookeeper.h +1 -1
- data/include/grpc/impl/codegen/alloc.h +74 -0
- data/include/grpc/impl/codegen/atm.h +92 -0
- data/include/grpc/impl/codegen/atm_gcc_atomic.h +72 -0
- data/include/grpc/impl/codegen/atm_gcc_sync.h +87 -0
- data/include/grpc/impl/codegen/atm_win32.h +125 -0
- data/include/grpc/impl/codegen/byte_buffer.h +121 -0
- data/include/grpc/impl/codegen/compression_types.h +73 -0
- data/include/grpc/impl/codegen/connectivity_state.h +59 -0
- data/include/grpc/impl/codegen/grpc_types.h +373 -0
- data/include/grpc/impl/codegen/log.h +110 -0
- data/include/grpc/impl/codegen/port_platform.h +362 -0
- data/include/grpc/impl/codegen/propagation_bits.h +67 -0
- data/include/grpc/impl/codegen/slice.h +182 -0
- data/include/grpc/impl/codegen/slice_buffer.h +105 -0
- data/include/grpc/impl/codegen/status.h +163 -0
- data/include/grpc/impl/codegen/sync.h +316 -0
- data/include/grpc/impl/codegen/sync_generic.h +55 -0
- data/{src/core/census/context.h → include/grpc/impl/codegen/sync_posix.h} +11 -11
- data/include/grpc/impl/codegen/sync_win32.h +49 -0
- data/include/grpc/impl/codegen/time.h +132 -0
- data/include/grpc/status.h +2 -126
- data/include/grpc/support/alloc.h +2 -35
- data/include/grpc/support/atm.h +2 -55
- data/include/grpc/support/atm_gcc_atomic.h +5 -38
- data/include/grpc/support/atm_gcc_sync.h +2 -50
- data/include/grpc/support/atm_win32.h +2 -88
- data/include/grpc/support/avl.h +7 -7
- data/include/grpc/support/cmdline.h +15 -13
- data/include/grpc/support/cpu.h +5 -3
- data/include/grpc/support/histogram.h +23 -20
- data/include/grpc/support/host_port.h +5 -3
- data/include/grpc/support/log.h +2 -71
- data/include/grpc/support/log_win32.h +2 -2
- data/include/grpc/support/port_platform.h +2 -319
- data/include/grpc/support/slice.h +2 -145
- data/include/grpc/support/slice_buffer.h +2 -65
- data/include/grpc/support/string_util.h +3 -3
- data/include/grpc/support/subprocess.h +8 -6
- data/include/grpc/support/sync.h +2 -278
- data/include/grpc/support/sync_generic.h +2 -18
- data/include/grpc/support/sync_posix.h +2 -10
- data/include/grpc/support/sync_win32.h +2 -12
- data/include/grpc/support/thd.h +11 -11
- data/include/grpc/support/time.h +2 -91
- data/include/grpc/support/tls.h +1 -1
- data/include/grpc/support/tls_gcc.h +1 -1
- data/include/grpc/support/tls_msvc.h +1 -1
- data/include/grpc/support/tls_pthread.h +2 -2
- data/src/boringssl/err_data.c +1252 -0
- data/src/core/census/context.c +492 -8
- data/src/core/census/grpc_filter.c +3 -3
- data/src/core/census/initialize.c +4 -7
- data/src/core/census/operation.c +2 -2
- data/src/core/census/placeholders.c +109 -0
- data/src/core/census/rpc_metric_id.h +6 -6
- data/src/core/census/tracing.c +1 -1
- data/src/core/channel/channel_args.c +4 -3
- data/src/core/channel/channel_stack.c +1 -1
- data/src/core/channel/client_channel.c +18 -14
- data/src/core/channel/client_uchannel.c +3 -3
- data/src/core/channel/compress_filter.c +8 -8
- data/src/core/channel/http_client_filter.c +2 -2
- data/src/core/channel/http_server_filter.c +9 -9
- data/src/core/channel/subchannel_call_holder.c +12 -10
- data/src/core/client_config/lb_policies/pick_first.c +49 -31
- data/src/core/client_config/lb_policies/round_robin.c +7 -7
- data/src/core/client_config/resolvers/dns_resolver.c +3 -3
- data/src/core/client_config/resolvers/sockaddr_resolver.c +5 -5
- data/src/core/client_config/subchannel.c +36 -25
- data/src/core/compression/algorithm.c +3 -3
- data/src/core/httpcli/format_request.c +1 -1
- data/src/core/httpcli/httpcli.c +5 -5
- data/src/core/httpcli/httpcli_security_connector.c +2 -3
- data/src/core/httpcli/parser.c +7 -7
- data/src/core/httpcli/parser.h +1 -1
- data/src/core/iomgr/closure.c +7 -7
- data/src/core/iomgr/closure.h +6 -5
- data/src/core/iomgr/exec_ctx.c +12 -8
- data/src/core/iomgr/exec_ctx.h +12 -5
- data/src/core/iomgr/executor.c +4 -4
- data/src/core/iomgr/executor.h +2 -2
- data/src/core/iomgr/fd_posix.c +28 -17
- data/src/core/iomgr/fd_posix.h +7 -4
- data/src/core/iomgr/iocp_windows.c +6 -8
- data/src/core/iomgr/pollset_multipoller_with_epoll.c +70 -5
- data/src/core/iomgr/pollset_multipoller_with_poll_posix.c +4 -2
- data/src/core/iomgr/pollset_posix.c +15 -15
- data/src/core/iomgr/pollset_posix.h +4 -2
- data/src/core/iomgr/pollset_windows.c +3 -12
- data/src/core/iomgr/resolve_address_posix.c +2 -2
- data/src/core/iomgr/resolve_address_windows.c +2 -2
- data/src/core/iomgr/sockaddr_utils.c +6 -6
- data/src/core/iomgr/sockaddr_win32.h +1 -6
- data/src/core/iomgr/tcp_client_posix.c +7 -7
- data/src/core/iomgr/tcp_client_windows.c +4 -4
- data/src/core/iomgr/tcp_posix.c +14 -8
- data/src/core/iomgr/tcp_posix.h +7 -1
- data/src/core/iomgr/tcp_server.h +40 -20
- data/src/core/iomgr/tcp_server_posix.c +106 -49
- data/src/core/iomgr/tcp_server_windows.c +98 -49
- data/src/core/iomgr/tcp_windows.c +11 -15
- data/src/core/iomgr/timer.c +8 -8
- data/src/core/iomgr/timer.h +1 -1
- data/src/core/iomgr/timer_heap.c +10 -10
- data/src/core/iomgr/timer_heap.h +2 -2
- data/src/core/iomgr/udp_server.c +2 -12
- data/src/core/iomgr/udp_server.h +1 -9
- data/src/core/iomgr/workqueue.h +2 -4
- data/src/core/iomgr/workqueue_posix.c +3 -3
- data/src/core/json/json_reader.c +11 -12
- data/src/core/json/json_reader.h +4 -4
- data/src/core/json/json_string.c +19 -19
- data/src/core/json/json_writer.c +7 -9
- data/src/core/profiling/basic_timers.c +1 -1
- data/src/core/security/base64.c +9 -9
- data/src/core/security/client_auth_filter.c +4 -4
- data/src/core/security/credentials.c +5 -5
- data/src/core/security/google_default_credentials.c +3 -3
- data/src/core/security/handshake.c +6 -5
- data/src/core/security/json_token.c +13 -7
- data/src/core/security/jwt_verifier.c +3 -2
- data/src/core/security/secure_endpoint.c +16 -16
- data/src/core/security/security_connector.c +47 -17
- data/src/core/security/security_connector.h +5 -5
- data/src/core/security/server_auth_filter.c +3 -3
- data/src/core/security/server_secure_chttp2.c +30 -31
- data/src/core/statistics/census_interface.h +2 -2
- data/src/core/statistics/census_rpc_stats.h +3 -3
- data/src/core/support/alloc.c +1 -1
- data/src/core/support/cpu_posix.c +2 -2
- data/src/core/support/env_linux.c +12 -2
- data/src/core/support/env_win32.c +15 -7
- data/src/core/support/histogram.c +5 -5
- data/src/core/support/log_posix.c +1 -1
- data/src/core/support/log_win32.c +4 -3
- data/src/core/support/murmur_hash.c +11 -11
- data/src/core/support/murmur_hash.h +1 -1
- data/src/core/support/slice.c +11 -11
- data/src/core/support/slice_buffer.c +6 -6
- data/src/core/support/stack_lockfree.c +20 -10
- data/src/core/support/string.c +15 -15
- data/src/core/support/string.h +5 -5
- data/src/core/support/string_win32.c +5 -5
- data/src/core/support/subprocess_windows.c +141 -0
- data/src/core/support/sync.c +4 -4
- data/src/core/support/sync_posix.c +2 -2
- data/src/core/support/sync_win32.c +10 -5
- data/src/core/support/time.c +29 -29
- data/src/core/support/time_posix.c +15 -6
- data/src/core/support/time_precise.c +2 -2
- data/src/core/support/time_win32.c +18 -9
- data/src/core/support/tls_pthread.c +1 -1
- data/src/core/support/wrap_memcpy.c +53 -0
- data/src/core/surface/alarm.c +83 -0
- data/src/core/surface/byte_buffer_reader.c +1 -1
- data/src/core/surface/call.c +78 -69
- data/src/core/surface/call.h +2 -2
- data/src/core/surface/call_test_only.h +2 -2
- data/src/core/surface/channel.c +9 -9
- data/src/core/surface/channel.h +1 -1
- data/src/core/surface/channel_connectivity.c +3 -3
- data/src/core/surface/channel_create.c +3 -3
- data/src/core/surface/channel_ping.c +2 -2
- data/src/core/surface/completion_queue.c +11 -12
- data/src/core/surface/completion_queue.h +1 -1
- data/src/core/surface/init.c +7 -5
- data/src/core/surface/lame_client.c +3 -3
- data/src/core/surface/secure_channel_create.c +3 -3
- data/src/core/surface/server.c +28 -28
- data/src/core/surface/server_chttp2.c +8 -8
- data/src/core/surface/server_create.c +1 -4
- data/src/core/surface/validate_metadata.c +3 -3
- data/src/core/surface/version.c +2 -2
- data/src/core/transport/byte_stream.c +8 -6
- data/src/core/transport/byte_stream.h +6 -5
- data/src/core/transport/chttp2/bin_encoder.c +29 -29
- data/src/core/transport/chttp2/frame_data.c +29 -26
- data/src/core/transport/chttp2/frame_data.h +6 -6
- data/src/core/transport/chttp2/frame_goaway.c +30 -30
- data/src/core/transport/chttp2/frame_goaway.h +6 -6
- data/src/core/transport/chttp2/frame_ping.c +6 -6
- data/src/core/transport/chttp2/frame_ping.h +5 -5
- data/src/core/transport/chttp2/frame_rst_stream.c +18 -19
- data/src/core/transport/chttp2/frame_rst_stream.h +4 -4
- data/src/core/transport/chttp2/frame_settings.c +30 -30
- data/src/core/transport/chttp2/frame_settings.h +13 -13
- data/src/core/transport/chttp2/frame_window_update.c +17 -18
- data/src/core/transport/chttp2/frame_window_update.h +5 -7
- data/src/core/transport/chttp2/hpack_encoder.c +69 -73
- data/src/core/transport/chttp2/hpack_encoder.h +16 -16
- data/src/core/transport/chttp2/hpack_parser.c +167 -167
- data/src/core/transport/chttp2/hpack_parser.h +16 -16
- data/src/core/transport/chttp2/hpack_table.c +13 -13
- data/src/core/transport/chttp2/hpack_table.h +11 -11
- data/src/core/transport/chttp2/internal.h +97 -86
- data/src/core/transport/chttp2/parsing.c +25 -25
- data/src/core/transport/chttp2/stream_lists.c +26 -3
- data/src/core/transport/chttp2/stream_map.c +13 -14
- data/src/core/transport/chttp2/stream_map.h +6 -7
- data/src/core/transport/chttp2/timeout_encoding.c +19 -16
- data/src/core/transport/chttp2/varint.c +8 -9
- data/src/core/transport/chttp2/varint.h +7 -8
- data/src/core/transport/chttp2/writing.c +26 -23
- data/src/core/transport/chttp2_transport.c +133 -92
- data/src/core/transport/connectivity_state.c +6 -6
- data/src/core/transport/metadata.c +18 -18
- data/src/core/transport/metadata.h +5 -5
- data/src/core/transport/static_metadata.c +15 -16
- data/src/core/transport/static_metadata.h +5 -5
- data/src/core/transport/transport.c +5 -5
- data/src/core/transport/transport.h +14 -1
- data/src/core/tsi/fake_transport_security.c +7 -7
- data/src/core/tsi/ssl_transport_security.c +6 -4
- data/src/core/tsi/ssl_types.h +55 -0
- data/src/ruby/ext/grpc/extconf.rb +51 -14
- data/src/ruby/ext/grpc/rb_byte_buffer.c +3 -1
- data/src/ruby/ext/grpc/rb_call.c +6 -3
- data/src/ruby/ext/grpc/rb_call_credentials.c +4 -0
- data/src/ruby/ext/grpc/rb_channel.c +4 -2
- data/src/ruby/ext/grpc/rb_channel_args.c +3 -1
- data/src/ruby/ext/grpc/rb_channel_credentials.c +3 -1
- data/src/ruby/ext/grpc/rb_completion_queue.c +3 -1
- data/src/ruby/ext/grpc/rb_event_thread.c +5 -0
- data/src/ruby/ext/grpc/rb_grpc.c +11 -3
- data/src/ruby/ext/grpc/rb_grpc_imports.generated.c +560 -0
- data/src/ruby/ext/grpc/rb_grpc_imports.generated.h +843 -0
- data/src/ruby/ext/grpc/rb_loader.c +72 -0
- data/src/ruby/ext/grpc/rb_loader.h +40 -0
- data/src/ruby/ext/grpc/rb_server.c +3 -1
- data/src/ruby/ext/grpc/rb_server_credentials.c +4 -2
- data/src/ruby/lib/grpc/generic/bidi_call.rb +1 -1
- data/src/ruby/lib/grpc/generic/rpc_desc.rb +1 -1
- data/src/ruby/lib/grpc/generic/rpc_server.rb +1 -1
- data/src/ruby/lib/grpc/grpc.rb +34 -0
- data/src/ruby/lib/grpc/version.rb +1 -1
- data/src/ruby/spec/pb/health/checker_spec.rb +1 -1
- data/third_party/boringssl/crypto/aes/aes.c +1142 -0
- data/third_party/boringssl/crypto/aes/internal.h +87 -0
- data/third_party/boringssl/crypto/aes/mode_wrappers.c +108 -0
- data/third_party/boringssl/crypto/asn1/a_bitstr.c +255 -0
- data/third_party/boringssl/crypto/asn1/a_bool.c +112 -0
- data/third_party/boringssl/crypto/asn1/a_bytes.c +317 -0
- data/third_party/boringssl/crypto/asn1/a_d2i_fp.c +286 -0
- data/third_party/boringssl/crypto/asn1/a_dup.c +103 -0
- data/third_party/boringssl/crypto/asn1/a_enum.c +183 -0
- data/third_party/boringssl/crypto/asn1/a_gentm.c +255 -0
- data/third_party/boringssl/crypto/asn1/a_i2d_fp.c +154 -0
- data/third_party/boringssl/crypto/asn1/a_int.c +456 -0
- data/third_party/boringssl/crypto/asn1/a_mbstr.c +390 -0
- data/third_party/boringssl/crypto/asn1/a_object.c +412 -0
- data/third_party/boringssl/crypto/asn1/a_octet.c +70 -0
- data/third_party/boringssl/crypto/asn1/a_print.c +119 -0
- data/third_party/boringssl/crypto/asn1/a_strnid.c +286 -0
- data/third_party/boringssl/crypto/asn1/a_time.c +221 -0
- data/third_party/boringssl/crypto/asn1/a_type.c +160 -0
- data/third_party/boringssl/crypto/asn1/a_utctm.c +342 -0
- data/third_party/boringssl/crypto/asn1/a_utf8.c +210 -0
- data/third_party/boringssl/crypto/asn1/asn1_lib.c +510 -0
- data/third_party/boringssl/crypto/asn1/asn1_locl.h +73 -0
- data/third_party/boringssl/crypto/asn1/asn1_par.c +444 -0
- data/third_party/boringssl/crypto/asn1/asn_pack.c +104 -0
- data/third_party/boringssl/crypto/asn1/bio_asn1.c +496 -0
- data/third_party/boringssl/crypto/asn1/bio_ndef.c +254 -0
- data/third_party/boringssl/crypto/asn1/f_enum.c +206 -0
- data/third_party/boringssl/crypto/asn1/f_int.c +210 -0
- data/third_party/boringssl/crypto/asn1/f_string.c +204 -0
- data/third_party/boringssl/crypto/asn1/t_bitst.c +102 -0
- data/third_party/boringssl/crypto/asn1/t_pkey.c +112 -0
- data/third_party/boringssl/crypto/asn1/tasn_dec.c +1342 -0
- data/third_party/boringssl/crypto/asn1/tasn_enc.c +695 -0
- data/third_party/boringssl/crypto/asn1/tasn_fre.c +264 -0
- data/third_party/boringssl/crypto/asn1/tasn_new.c +398 -0
- data/third_party/boringssl/crypto/asn1/tasn_prn.c +642 -0
- data/third_party/boringssl/crypto/asn1/tasn_typ.c +137 -0
- data/third_party/boringssl/crypto/asn1/tasn_utl.c +266 -0
- data/third_party/boringssl/crypto/asn1/x_bignum.c +143 -0
- data/third_party/boringssl/crypto/asn1/x_long.c +182 -0
- data/third_party/boringssl/crypto/base64/base64.c +478 -0
- data/third_party/boringssl/crypto/bio/bio.c +608 -0
- data/third_party/boringssl/crypto/bio/bio_mem.c +327 -0
- data/third_party/boringssl/crypto/bio/buffer.c +496 -0
- data/third_party/boringssl/crypto/bio/connect.c +544 -0
- data/third_party/boringssl/crypto/bio/fd.c +270 -0
- data/third_party/boringssl/crypto/bio/file.c +349 -0
- data/third_party/boringssl/crypto/bio/hexdump.c +192 -0
- data/third_party/boringssl/crypto/bio/internal.h +108 -0
- data/third_party/boringssl/crypto/bio/pair.c +803 -0
- data/third_party/boringssl/crypto/bio/printf.c +119 -0
- data/third_party/boringssl/crypto/bio/socket.c +195 -0
- data/third_party/boringssl/crypto/bio/socket_helper.c +113 -0
- data/third_party/boringssl/crypto/bn/add.c +377 -0
- data/third_party/boringssl/crypto/bn/asm/x86_64-gcc.c +599 -0
- data/third_party/boringssl/crypto/bn/bn.c +341 -0
- data/third_party/boringssl/crypto/bn/bn_asn1.c +93 -0
- data/third_party/boringssl/crypto/bn/cmp.c +200 -0
- data/third_party/boringssl/crypto/bn/convert.c +597 -0
- data/third_party/boringssl/crypto/bn/ctx.c +311 -0
- data/third_party/boringssl/crypto/bn/div.c +625 -0
- data/third_party/boringssl/crypto/bn/exponentiation.c +1544 -0
- data/third_party/boringssl/crypto/bn/gcd.c +711 -0
- data/third_party/boringssl/crypto/bn/generic.c +1019 -0
- data/third_party/boringssl/crypto/bn/internal.h +294 -0
- data/third_party/boringssl/crypto/bn/kronecker.c +175 -0
- data/third_party/boringssl/crypto/bn/montgomery.c +561 -0
- data/third_party/boringssl/crypto/bn/mul.c +888 -0
- data/third_party/boringssl/crypto/bn/prime.c +845 -0
- data/third_party/boringssl/crypto/bn/random.c +326 -0
- data/third_party/boringssl/crypto/bn/rsaz_exp.c +326 -0
- data/third_party/boringssl/crypto/bn/rsaz_exp.h +56 -0
- data/third_party/boringssl/crypto/bn/shift.c +299 -0
- data/third_party/boringssl/crypto/bn/sqrt.c +505 -0
- data/third_party/boringssl/crypto/buf/buf.c +235 -0
- data/third_party/boringssl/crypto/bytestring/ber.c +221 -0
- data/third_party/boringssl/crypto/bytestring/cbb.c +411 -0
- data/third_party/boringssl/crypto/bytestring/cbs.c +415 -0
- data/third_party/boringssl/crypto/bytestring/internal.h +46 -0
- data/third_party/boringssl/crypto/chacha/chacha_generic.c +140 -0
- data/third_party/boringssl/crypto/chacha/chacha_vec.c +323 -0
- data/third_party/boringssl/crypto/cipher/aead.c +167 -0
- data/third_party/boringssl/crypto/cipher/cipher.c +652 -0
- data/third_party/boringssl/crypto/cipher/derive_key.c +154 -0
- data/third_party/boringssl/crypto/cipher/e_aes.c +1767 -0
- data/third_party/boringssl/crypto/cipher/e_chacha20poly1305.c +311 -0
- data/third_party/boringssl/crypto/cipher/e_des.c +207 -0
- data/third_party/boringssl/crypto/cipher/e_null.c +85 -0
- data/third_party/boringssl/crypto/cipher/e_rc2.c +443 -0
- data/third_party/boringssl/crypto/cipher/e_rc4.c +87 -0
- data/third_party/boringssl/crypto/cipher/e_ssl3.c +463 -0
- data/third_party/boringssl/crypto/cipher/e_tls.c +673 -0
- data/third_party/boringssl/crypto/cipher/internal.h +164 -0
- data/third_party/boringssl/crypto/cipher/tls_cbc.c +495 -0
- data/third_party/boringssl/crypto/cmac/cmac.c +239 -0
- data/third_party/boringssl/crypto/conf/conf.c +778 -0
- data/third_party/boringssl/crypto/conf/conf_def.h +127 -0
- data/third_party/boringssl/crypto/conf/internal.h +31 -0
- data/third_party/boringssl/crypto/cpu-arm.c +199 -0
- data/third_party/boringssl/crypto/cpu-intel.c +261 -0
- data/third_party/boringssl/crypto/crypto.c +140 -0
- data/third_party/boringssl/crypto/curve25519/curve25519.c +4897 -0
- data/third_party/boringssl/crypto/des/des.c +771 -0
- data/third_party/boringssl/crypto/des/internal.h +212 -0
- data/third_party/boringssl/crypto/dh/check.c +180 -0
- data/third_party/boringssl/crypto/dh/dh.c +463 -0
- data/third_party/boringssl/crypto/dh/dh_asn1.c +84 -0
- data/third_party/boringssl/crypto/dh/internal.h +80 -0
- data/third_party/boringssl/crypto/dh/params.c +301 -0
- data/third_party/boringssl/crypto/digest/digest.c +248 -0
- data/third_party/boringssl/crypto/digest/digests.c +321 -0
- data/third_party/boringssl/crypto/digest/internal.h +112 -0
- data/third_party/boringssl/crypto/digest/md32_common.h +322 -0
- data/third_party/boringssl/crypto/directory.h +66 -0
- data/third_party/boringssl/crypto/directory_posix.c +108 -0
- data/third_party/boringssl/crypto/directory_win.c +144 -0
- data/third_party/boringssl/crypto/dsa/dsa.c +908 -0
- data/third_party/boringssl/crypto/dsa/dsa_asn1.c +150 -0
- data/third_party/boringssl/crypto/dsa/internal.h +78 -0
- data/third_party/boringssl/crypto/ec/ec.c +889 -0
- data/third_party/boringssl/crypto/ec/ec_asn1.c +586 -0
- data/third_party/boringssl/crypto/ec/ec_key.c +482 -0
- data/third_party/boringssl/crypto/ec/ec_montgomery.c +280 -0
- data/third_party/boringssl/crypto/ec/internal.h +318 -0
- data/third_party/boringssl/crypto/ec/oct.c +416 -0
- data/third_party/boringssl/crypto/ec/p224-64.c +1305 -0
- data/third_party/boringssl/crypto/ec/p256-64.c +1878 -0
- data/third_party/boringssl/crypto/ec/p256-x86_64-table.h +9548 -0
- data/third_party/boringssl/crypto/ec/p256-x86_64.c +596 -0
- data/third_party/boringssl/crypto/ec/simple.c +1313 -0
- data/third_party/boringssl/crypto/ec/util-64.c +183 -0
- data/third_party/boringssl/crypto/ec/wnaf.c +449 -0
- data/third_party/boringssl/crypto/ecdh/ecdh.c +153 -0
- data/third_party/boringssl/crypto/ecdsa/ecdsa.c +496 -0
- data/third_party/boringssl/crypto/ecdsa/ecdsa_asn1.c +240 -0
- data/third_party/boringssl/crypto/engine/engine.c +96 -0
- data/third_party/boringssl/crypto/err/err.c +756 -0
- data/third_party/boringssl/crypto/evp/algorithm.c +153 -0
- data/third_party/boringssl/crypto/evp/digestsign.c +159 -0
- data/third_party/boringssl/crypto/evp/evp.c +411 -0
- data/third_party/boringssl/crypto/evp/evp_asn1.c +179 -0
- data/third_party/boringssl/crypto/evp/evp_ctx.c +477 -0
- data/third_party/boringssl/crypto/evp/internal.h +278 -0
- data/third_party/boringssl/crypto/evp/p_dsa_asn1.c +588 -0
- data/third_party/boringssl/crypto/evp/p_ec.c +283 -0
- data/third_party/boringssl/crypto/evp/p_ec_asn1.c +562 -0
- data/third_party/boringssl/crypto/evp/p_rsa.c +596 -0
- data/third_party/boringssl/crypto/evp/p_rsa_asn1.c +737 -0
- data/third_party/boringssl/crypto/evp/pbkdf.c +151 -0
- data/third_party/boringssl/crypto/evp/sign.c +151 -0
- data/third_party/boringssl/crypto/ex_data.c +294 -0
- data/third_party/boringssl/crypto/hkdf/hkdf.c +89 -0
- data/third_party/boringssl/crypto/hmac/hmac.c +213 -0
- data/third_party/boringssl/crypto/internal.h +532 -0
- data/third_party/boringssl/crypto/lhash/lhash.c +346 -0
- data/third_party/boringssl/crypto/md4/md4.c +225 -0
- data/third_party/boringssl/crypto/md5/md5.c +275 -0
- data/third_party/boringssl/crypto/mem.c +200 -0
- data/third_party/boringssl/crypto/modes/cbc.c +216 -0
- data/third_party/boringssl/crypto/modes/cfb.c +231 -0
- data/third_party/boringssl/crypto/modes/ctr.c +226 -0
- data/third_party/boringssl/crypto/modes/gcm.c +1252 -0
- data/third_party/boringssl/crypto/modes/internal.h +370 -0
- data/third_party/boringssl/crypto/modes/ofb.c +108 -0
- data/third_party/boringssl/crypto/obj/obj.c +664 -0
- data/third_party/boringssl/crypto/obj/obj_dat.h +5257 -0
- data/third_party/boringssl/crypto/obj/obj_xref.c +124 -0
- data/third_party/boringssl/crypto/obj/obj_xref.h +96 -0
- data/third_party/boringssl/crypto/pem/pem_all.c +281 -0
- data/third_party/boringssl/crypto/pem/pem_info.c +404 -0
- data/third_party/boringssl/crypto/pem/pem_lib.c +835 -0
- data/third_party/boringssl/crypto/pem/pem_oth.c +89 -0
- data/third_party/boringssl/crypto/pem/pem_pk8.c +244 -0
- data/third_party/boringssl/crypto/pem/pem_pkey.c +312 -0
- data/third_party/boringssl/crypto/pem/pem_x509.c +65 -0
- data/third_party/boringssl/crypto/pem/pem_xaux.c +66 -0
- data/third_party/boringssl/crypto/pkcs8/internal.h +83 -0
- data/third_party/boringssl/crypto/pkcs8/p5_pbe.c +150 -0
- data/third_party/boringssl/crypto/pkcs8/p5_pbev2.c +440 -0
- data/third_party/boringssl/crypto/pkcs8/p8_pkey.c +85 -0
- data/third_party/boringssl/crypto/pkcs8/pkcs8.c +1217 -0
- data/third_party/boringssl/crypto/poly1305/poly1305.c +331 -0
- data/third_party/boringssl/crypto/poly1305/poly1305_arm.c +301 -0
- data/third_party/boringssl/crypto/poly1305/poly1305_vec.c +892 -0
- data/third_party/boringssl/crypto/rand/internal.h +32 -0
- data/third_party/boringssl/crypto/rand/rand.c +239 -0
- data/third_party/boringssl/crypto/rand/urandom.c +223 -0
- data/third_party/boringssl/crypto/rand/windows.c +56 -0
- data/third_party/boringssl/crypto/rc4/rc4.c +283 -0
- data/third_party/boringssl/crypto/refcount_c11.c +67 -0
- data/third_party/boringssl/crypto/refcount_lock.c +53 -0
- data/third_party/boringssl/crypto/rsa/blinding.c +462 -0
- data/third_party/boringssl/crypto/rsa/internal.h +164 -0
- data/third_party/boringssl/crypto/rsa/padding.c +711 -0
- data/third_party/boringssl/crypto/rsa/rsa.c +808 -0
- data/third_party/boringssl/crypto/rsa/rsa_asn1.c +473 -0
- data/third_party/boringssl/crypto/rsa/rsa_impl.c +1138 -0
- data/third_party/boringssl/crypto/sha/sha1.c +337 -0
- data/third_party/boringssl/crypto/sha/sha256.c +327 -0
- data/third_party/boringssl/crypto/sha/sha512.c +607 -0
- data/third_party/boringssl/crypto/stack/stack.c +386 -0
- data/third_party/boringssl/crypto/test/scoped_types.h +137 -0
- data/third_party/boringssl/crypto/test/test_util.h +35 -0
- data/third_party/boringssl/crypto/thread.c +101 -0
- data/third_party/boringssl/crypto/thread_none.c +55 -0
- data/third_party/boringssl/crypto/thread_pthread.c +167 -0
- data/third_party/boringssl/crypto/thread_win.c +282 -0
- data/third_party/boringssl/crypto/time_support.c +212 -0
- data/third_party/boringssl/crypto/x509/a_digest.c +97 -0
- data/third_party/boringssl/crypto/x509/a_sign.c +136 -0
- data/third_party/boringssl/crypto/x509/a_strex.c +564 -0
- data/third_party/boringssl/crypto/x509/a_verify.c +133 -0
- data/third_party/boringssl/crypto/x509/asn1_gen.c +873 -0
- data/third_party/boringssl/crypto/x509/by_dir.c +491 -0
- data/third_party/boringssl/crypto/x509/by_file.c +295 -0
- data/third_party/boringssl/crypto/x509/charmap.h +15 -0
- data/third_party/boringssl/crypto/x509/i2d_pr.c +84 -0
- data/third_party/boringssl/crypto/x509/pkcs7.c +353 -0
- data/third_party/boringssl/crypto/x509/t_crl.c +129 -0
- data/third_party/boringssl/crypto/x509/t_req.c +246 -0
- data/third_party/boringssl/crypto/x509/t_x509.c +500 -0
- data/third_party/boringssl/crypto/x509/t_x509a.c +109 -0
- data/third_party/boringssl/crypto/x509/vpm_int.h +70 -0
- data/third_party/boringssl/crypto/x509/x509.c +152 -0
- data/third_party/boringssl/crypto/x509/x509_att.c +353 -0
- data/third_party/boringssl/crypto/x509/x509_cmp.c +490 -0
- data/third_party/boringssl/crypto/x509/x509_d2.c +105 -0
- data/third_party/boringssl/crypto/x509/x509_def.c +88 -0
- data/third_party/boringssl/crypto/x509/x509_ext.c +206 -0
- data/third_party/boringssl/crypto/x509/x509_lu.c +738 -0
- data/third_party/boringssl/crypto/x509/x509_obj.c +191 -0
- data/third_party/boringssl/crypto/x509/x509_r2x.c +113 -0
- data/third_party/boringssl/crypto/x509/x509_req.c +315 -0
- data/third_party/boringssl/crypto/x509/x509_set.c +154 -0
- data/third_party/boringssl/crypto/x509/x509_trs.c +304 -0
- data/third_party/boringssl/crypto/x509/x509_txt.c +209 -0
- data/third_party/boringssl/crypto/x509/x509_v3.c +271 -0
- data/third_party/boringssl/crypto/x509/x509_vfy.c +2456 -0
- data/third_party/boringssl/crypto/x509/x509_vpm.c +672 -0
- data/third_party/boringssl/crypto/x509/x509cset.c +172 -0
- data/third_party/boringssl/crypto/x509/x509name.c +381 -0
- data/third_party/boringssl/crypto/x509/x509rset.c +80 -0
- data/third_party/boringssl/crypto/x509/x509spki.c +135 -0
- data/third_party/boringssl/crypto/x509/x509type.c +128 -0
- data/third_party/boringssl/crypto/x509/x_algor.c +154 -0
- data/third_party/boringssl/crypto/x509/x_all.c +547 -0
- data/third_party/boringssl/crypto/x509/x_attrib.c +117 -0
- data/third_party/boringssl/crypto/x509/x_crl.c +560 -0
- data/third_party/boringssl/crypto/x509/x_exten.c +75 -0
- data/third_party/boringssl/crypto/x509/x_info.c +95 -0
- data/third_party/boringssl/crypto/x509/x_name.c +538 -0
- data/third_party/boringssl/crypto/x509/x_pkey.c +100 -0
- data/third_party/boringssl/crypto/x509/x_pubkey.c +384 -0
- data/third_party/boringssl/crypto/x509/x_req.c +112 -0
- data/third_party/boringssl/crypto/x509/x_sig.c +69 -0
- data/third_party/boringssl/crypto/x509/x_spki.c +78 -0
- data/third_party/boringssl/crypto/x509/x_val.c +69 -0
- data/third_party/boringssl/crypto/x509/x_x509.c +227 -0
- data/third_party/boringssl/crypto/x509/x_x509a.c +197 -0
- data/third_party/boringssl/crypto/x509v3/ext_dat.h +129 -0
- data/third_party/boringssl/crypto/x509v3/pcy_cache.c +299 -0
- data/third_party/boringssl/crypto/x509v3/pcy_data.c +137 -0
- data/third_party/boringssl/crypto/x509v3/pcy_int.h +212 -0
- data/third_party/boringssl/crypto/x509v3/pcy_lib.c +165 -0
- data/third_party/boringssl/crypto/x509v3/pcy_map.c +133 -0
- data/third_party/boringssl/crypto/x509v3/pcy_node.c +197 -0
- data/third_party/boringssl/crypto/x509v3/pcy_tree.c +876 -0
- data/third_party/boringssl/crypto/x509v3/v3_akey.c +212 -0
- data/third_party/boringssl/crypto/x509v3/v3_akeya.c +71 -0
- data/third_party/boringssl/crypto/x509v3/v3_alt.c +622 -0
- data/third_party/boringssl/crypto/x509v3/v3_bcons.c +126 -0
- data/third_party/boringssl/crypto/x509v3/v3_bitst.c +141 -0
- data/third_party/boringssl/crypto/x509v3/v3_conf.c +459 -0
- data/third_party/boringssl/crypto/x509v3/v3_cpols.c +475 -0
- data/third_party/boringssl/crypto/x509v3/v3_crld.c +616 -0
- data/third_party/boringssl/crypto/x509v3/v3_enum.c +98 -0
- data/third_party/boringssl/crypto/x509v3/v3_extku.c +145 -0
- data/third_party/boringssl/crypto/x509v3/v3_genn.c +252 -0
- data/third_party/boringssl/crypto/x509v3/v3_ia5.c +117 -0
- data/third_party/boringssl/crypto/x509v3/v3_info.c +200 -0
- data/third_party/boringssl/crypto/x509v3/v3_int.c +87 -0
- data/third_party/boringssl/crypto/x509v3/v3_lib.c +335 -0
- data/third_party/boringssl/crypto/x509v3/v3_ncons.c +510 -0
- data/third_party/boringssl/crypto/x509v3/v3_pci.c +335 -0
- data/third_party/boringssl/crypto/x509v3/v3_pcia.c +56 -0
- data/third_party/boringssl/crypto/x509v3/v3_pcons.c +142 -0
- data/third_party/boringssl/crypto/x509v3/v3_pku.c +109 -0
- data/third_party/boringssl/crypto/x509v3/v3_pmaps.c +156 -0
- data/third_party/boringssl/crypto/x509v3/v3_prn.c +207 -0
- data/third_party/boringssl/crypto/x509v3/v3_purp.c +805 -0
- data/third_party/boringssl/crypto/x509v3/v3_skey.c +148 -0
- data/third_party/boringssl/crypto/x509v3/v3_sxnet.c +266 -0
- data/third_party/boringssl/crypto/x509v3/v3_utl.c +1322 -0
- data/third_party/boringssl/include/openssl/aead.h +346 -0
- data/third_party/boringssl/include/openssl/aes.h +158 -0
- data/third_party/boringssl/include/openssl/arm_arch.h +127 -0
- data/third_party/boringssl/include/openssl/asn1.h +1168 -0
- data/third_party/boringssl/include/openssl/asn1_mac.h +75 -0
- data/third_party/boringssl/include/openssl/asn1t.h +906 -0
- data/third_party/boringssl/include/openssl/base.h +261 -0
- data/third_party/boringssl/include/openssl/base64.h +184 -0
- data/third_party/boringssl/include/openssl/bio.h +902 -0
- data/third_party/boringssl/include/openssl/blowfish.h +93 -0
- data/third_party/boringssl/include/openssl/bn.h +885 -0
- data/third_party/boringssl/include/openssl/buf.h +118 -0
- data/third_party/boringssl/include/openssl/buffer.h +18 -0
- data/third_party/boringssl/include/openssl/bytestring.h +360 -0
- data/third_party/boringssl/include/openssl/cast.h +96 -0
- data/third_party/boringssl/include/openssl/chacha.h +37 -0
- data/third_party/boringssl/include/openssl/cipher.h +571 -0
- data/third_party/boringssl/include/openssl/cmac.h +76 -0
- data/third_party/boringssl/include/openssl/conf.h +145 -0
- data/third_party/boringssl/include/openssl/cpu.h +184 -0
- data/third_party/boringssl/include/openssl/crypto.h +68 -0
- data/third_party/boringssl/include/openssl/curve25519.h +88 -0
- data/third_party/boringssl/include/openssl/des.h +177 -0
- data/third_party/boringssl/include/openssl/dh.h +238 -0
- data/third_party/boringssl/include/openssl/digest.h +258 -0
- data/third_party/boringssl/include/openssl/dsa.h +343 -0
- data/third_party/boringssl/include/openssl/dtls1.h +16 -0
- data/third_party/boringssl/include/openssl/ec.h +355 -0
- data/third_party/boringssl/include/openssl/ec_key.h +280 -0
- data/third_party/boringssl/include/openssl/ecdh.h +102 -0
- data/third_party/boringssl/include/openssl/ecdsa.h +206 -0
- data/third_party/boringssl/include/openssl/engine.h +98 -0
- data/third_party/boringssl/include/openssl/err.h +487 -0
- data/third_party/boringssl/include/openssl/evp.h +750 -0
- data/third_party/boringssl/include/openssl/ex_data.h +213 -0
- data/third_party/boringssl/include/openssl/hkdf.h +44 -0
- data/third_party/boringssl/include/openssl/hmac.h +160 -0
- data/third_party/boringssl/include/openssl/lhash.h +192 -0
- data/third_party/boringssl/include/openssl/lhash_macros.h +132 -0
- data/third_party/boringssl/include/openssl/md4.h +102 -0
- data/third_party/boringssl/include/openssl/md5.h +107 -0
- data/third_party/boringssl/include/openssl/mem.h +140 -0
- data/third_party/boringssl/include/openssl/obj.h +198 -0
- data/third_party/boringssl/include/openssl/obj_mac.h +4140 -0
- data/third_party/boringssl/include/openssl/objects.h +18 -0
- data/third_party/boringssl/include/openssl/opensslfeatures.h +60 -0
- data/third_party/boringssl/include/openssl/opensslv.h +18 -0
- data/third_party/boringssl/include/openssl/ossl_typ.h +18 -0
- data/third_party/boringssl/include/openssl/pem.h +521 -0
- data/third_party/boringssl/include/openssl/pkcs12.h +18 -0
- data/third_party/boringssl/include/openssl/pkcs7.h +16 -0
- data/third_party/boringssl/include/openssl/pkcs8.h +220 -0
- data/third_party/boringssl/include/openssl/poly1305.h +51 -0
- data/third_party/boringssl/include/openssl/pqueue.h +146 -0
- data/third_party/boringssl/include/openssl/rand.h +113 -0
- data/third_party/boringssl/include/openssl/rc4.h +90 -0
- data/third_party/boringssl/include/openssl/rsa.h +637 -0
- data/third_party/boringssl/include/openssl/safestack.h +16 -0
- data/third_party/boringssl/include/openssl/sha.h +256 -0
- data/third_party/boringssl/include/openssl/srtp.h +18 -0
- data/third_party/boringssl/include/openssl/ssl.h +4466 -0
- data/third_party/boringssl/include/openssl/ssl3.h +441 -0
- data/third_party/boringssl/include/openssl/stack.h +298 -0
- data/third_party/boringssl/include/openssl/stack_macros.h +4190 -0
- data/third_party/boringssl/include/openssl/thread.h +173 -0
- data/third_party/boringssl/include/openssl/time_support.h +90 -0
- data/third_party/boringssl/include/openssl/tls1.h +653 -0
- data/third_party/boringssl/include/openssl/type_check.h +91 -0
- data/third_party/boringssl/include/openssl/x509.h +1258 -0
- data/third_party/boringssl/include/openssl/x509_vfy.h +611 -0
- data/third_party/boringssl/include/openssl/x509v3.h +798 -0
- data/third_party/boringssl/ssl/custom_extensions.c +257 -0
- data/third_party/boringssl/ssl/d1_both.c +880 -0
- data/third_party/boringssl/ssl/d1_clnt.c +566 -0
- data/third_party/boringssl/ssl/d1_lib.c +340 -0
- data/third_party/boringssl/ssl/d1_meth.c +130 -0
- data/third_party/boringssl/ssl/d1_pkt.c +578 -0
- data/third_party/boringssl/ssl/d1_srtp.c +234 -0
- data/third_party/boringssl/ssl/d1_srvr.c +485 -0
- data/third_party/boringssl/ssl/dtls_record.c +308 -0
- data/third_party/boringssl/ssl/internal.h +1276 -0
- data/third_party/boringssl/ssl/pqueue/pqueue.c +197 -0
- data/third_party/boringssl/ssl/s3_both.c +571 -0
- data/third_party/boringssl/ssl/s3_clnt.c +2241 -0
- data/third_party/boringssl/ssl/s3_enc.c +494 -0
- data/third_party/boringssl/ssl/s3_lib.c +587 -0
- data/third_party/boringssl/ssl/s3_meth.c +166 -0
- data/third_party/boringssl/ssl/s3_pkt.c +732 -0
- data/third_party/boringssl/ssl/s3_srvr.c +2536 -0
- data/third_party/boringssl/ssl/ssl_aead_ctx.c +300 -0
- data/third_party/boringssl/ssl/ssl_asn1.c +718 -0
- data/third_party/boringssl/ssl/ssl_buffer.c +319 -0
- data/third_party/boringssl/ssl/ssl_cert.c +539 -0
- data/third_party/boringssl/ssl/ssl_cipher.c +2003 -0
- data/third_party/boringssl/ssl/ssl_file.c +633 -0
- data/third_party/boringssl/ssl/ssl_lib.c +2653 -0
- data/third_party/boringssl/ssl/ssl_rsa.c +423 -0
- data/third_party/boringssl/ssl/ssl_session.c +764 -0
- data/third_party/boringssl/ssl/ssl_stat.c +591 -0
- data/third_party/boringssl/ssl/t1_enc.c +708 -0
- data/third_party/boringssl/ssl/t1_lib.c +2905 -0
- data/third_party/boringssl/ssl/test/async_bio.h +45 -0
- data/third_party/boringssl/ssl/test/packeted_bio.h +44 -0
- data/third_party/boringssl/ssl/test/scoped_types.h +28 -0
- data/third_party/boringssl/ssl/test/test_config.h +108 -0
- data/third_party/boringssl/ssl/tls_record.c +342 -0
- data/third_party/zlib/adler32.c +179 -0
- data/third_party/zlib/compress.c +80 -0
- data/third_party/zlib/crc32.c +425 -0
- data/third_party/zlib/crc32.h +441 -0
- data/third_party/zlib/deflate.c +1967 -0
- data/third_party/zlib/deflate.h +346 -0
- data/third_party/zlib/gzclose.c +25 -0
- data/third_party/zlib/gzguts.h +209 -0
- data/third_party/zlib/gzlib.c +634 -0
- data/third_party/zlib/gzread.c +594 -0
- data/third_party/zlib/gzwrite.c +577 -0
- data/third_party/zlib/infback.c +640 -0
- data/third_party/zlib/inffast.c +340 -0
- data/third_party/zlib/inffast.h +11 -0
- data/third_party/zlib/inffixed.h +94 -0
- data/third_party/zlib/inflate.c +1512 -0
- data/third_party/zlib/inflate.h +122 -0
- data/third_party/zlib/inftrees.c +306 -0
- data/third_party/zlib/inftrees.h +62 -0
- data/third_party/zlib/trees.c +1226 -0
- data/third_party/zlib/trees.h +128 -0
- data/third_party/zlib/uncompr.c +59 -0
- data/third_party/zlib/zconf.h +511 -0
- data/third_party/zlib/zlib.h +1768 -0
- data/third_party/zlib/zutil.c +324 -0
- data/third_party/zlib/zutil.h +253 -0
- metadata +492 -25
- data/Rakefile +0 -63
- data/src/ruby/lib/grpc/grpc.so +0 -0
@@ -0,0 +1,892 @@
|
|
1
|
+
/* Copyright (c) 2014, Google Inc.
|
2
|
+
*
|
3
|
+
* Permission to use, copy, modify, and/or distribute this software for any
|
4
|
+
* purpose with or without fee is hereby granted, provided that the above
|
5
|
+
* copyright notice and this permission notice appear in all copies.
|
6
|
+
*
|
7
|
+
* THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
|
8
|
+
* WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
|
9
|
+
* MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY
|
10
|
+
* SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
|
11
|
+
* WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION
|
12
|
+
* OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN
|
13
|
+
* CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. */
|
14
|
+
|
15
|
+
/* This implementation of poly1305 is by Andrew Moon
|
16
|
+
* (https://github.com/floodyberry/poly1305-donna) and released as public
|
17
|
+
* domain. It implements SIMD vectorization based on the algorithm described in
|
18
|
+
* http://cr.yp.to/papers.html#neoncrypto. Unrolled to 2 powers, i.e. 64 byte
|
19
|
+
* block size */
|
20
|
+
|
21
|
+
#include <openssl/poly1305.h>
|
22
|
+
|
23
|
+
|
24
|
+
#if !defined(OPENSSL_WINDOWS) && defined(OPENSSL_X86_64)
|
25
|
+
|
26
|
+
#include <emmintrin.h>
|
27
|
+
|
28
|
+
/* Requests a minimum alignment of x bytes for the declared object (GCC/Clang
 * attribute syntax). The constant tables below use ALIGN(16) and are read
 * with _mm_load_si128. */
#define ALIGN(x) __attribute__((aligned(x)))
|
29
|
+
/* inline is not a keyword in C89. */
|
30
|
+
#define INLINE
|
31
|
+
/* Reads the 8 bytes at m as a uint64_t in native byte order, which is
 * little-endian on the x86-64 targets this file is compiled for. The bytes are
 * only read, so the cast keeps them const. */
#define U8TO64_LE(m) (*(const uint64_t *)(m))
|
32
|
+
/* Reads the 4 bytes at m as a uint32_t in native byte order, which is
 * little-endian on the x86-64 targets this file is compiled for. The bytes are
 * only read, so the cast keeps them const. */
#define U8TO32_LE(m) (*(const uint32_t *)(m))
|
33
|
+
/* Stores the 64-bit value v at m in native byte order (little-endian on
 * x86-64). Both v and the whole expansion are parenthesized so the macro acts
 * as one assignment expression wherever it appears; without that,
 * U64TO8_LE(p, x) == y would store the result of x == y. */
#define U64TO8_LE(m, v) (*(uint64_t *)(m) = (v))
|
34
|
+
|
35
|
+
/* Short alias for the 128-bit SSE2 integer vector type from <emmintrin.h>. */
typedef __m128i xmmi;
|
36
|
+
/* 128-bit unsigned integer (compiler extension); holds the 64x64-bit products
 * formed by the scalar helpers below. */
typedef unsigned __int128 uint128_t;
|
37
|
+
|
38
|
+
/* Loaded as MMASK: keeps the low 26 bits of each 64-bit lane, i.e. one 26-bit
 * limb per lane. */
static const uint32_t ALIGN(16) poly1305_x64_sse2_message_mask[4] = {
|
39
|
+
(1 << 26) - 1, 0, (1 << 26) - 1, 0};
|
40
|
+
/* Loaded as FIVE: the value 5 in the low 32 bits of each 64-bit lane, used as
 * a _mm_mul_epu32 multiplier. */
static const uint32_t ALIGN(16) poly1305_x64_sse2_5[4] = {5, 0, 5, 0};
|
41
|
+
/* Loaded as HIBIT: bit 24 set in each 64-bit lane. It is OR-ed into the top
 * limb of every 16-byte block; that limb starts at bit 104 of the block, so
 * this is bit 128 (1 << 128) of the block value. */
static const uint32_t ALIGN(16) poly1305_x64_sse2_1shl128[4] = {(1 << 24), 0,
|
42
|
+
(1 << 24), 0};
|
43
|
+
|
44
|
+
/* Returns a + b as a 128-bit value (wraps modulo 2^128). */
static uint128_t INLINE add128(uint128_t a, uint128_t b) {
  uint128_t sum = a;
  sum += b;
  return sum;
}
|
45
|
+
|
46
|
+
/* Returns a + b, with the 64-bit b widened to 128 bits first. */
static uint128_t INLINE add128_64(uint128_t a, uint64_t b) {
  const uint128_t widened = b;
  return a + widened;
}
|
47
|
+
|
48
|
+
/* Returns the full 128-bit product of two 64-bit values. */
static uint128_t INLINE mul64x64_128(uint64_t a, uint64_t b) {
  uint128_t product = a;
  product *= b;
  return product;
}
|
51
|
+
|
52
|
+
/* Returns the low 64 bits of a. */
static uint64_t INLINE lo128(uint128_t a) {
  const uint64_t low = (uint64_t)a;
  return low;
}
|
53
|
+
|
54
|
+
/* Returns the low 64 bits of v shifted right by |shift| bits. */
static uint64_t INLINE shr128(uint128_t v, const int shift) {
  const uint128_t shifted = v >> shift;
  return (uint64_t)shifted;
}
|
57
|
+
|
58
|
+
/* Treats hi:lo as one 128-bit value, shifts it right by |shift| bits and
 * returns the low 64 bits of the result. */
static uint64_t INLINE shr128_pair(uint64_t hi, uint64_t lo, const int shift) {
  uint128_t wide = hi;
  wide <<= 64;
  wide |= lo;
  wide >>= shift;
  return (uint64_t)wide;
}
|
61
|
+
|
62
|
+
/* One precomputed power of r in vector form. R20..R24 hold its five 26-bit
 * limbs, each replicated into both 64-bit lanes, and S21..S24 hold 5 * R21..R24
 * (see poly1305_first_block). Each member is a union so the same 16 bytes can
 * be accessed as a vector, as two 64-bit words or as four 32-bit words; the
 * odd 32-bit words (d[1], d[3]) of R20..R24 in P[1] are reused as scratch
 * storage for r and the pad by CRYPTO_poly1305_init. */
typedef struct poly1305_power_t {
|
63
|
+
union {
|
64
|
+
xmmi v; /* whole 128-bit vector */
|
65
|
+
uint64_t u[2]; /* the two 64-bit lanes */
|
66
|
+
uint32_t d[4]; /* the four 32-bit words */
|
67
|
+
} R20, R21, R22, R23, R24, S21, S22, S23, S24;
|
68
|
+
} poly1305_power;
|
69
|
+
|
70
|
+
/* Working state of the SSE2 implementation. It is placed at a 64-byte aligned
 * address inside the caller's opaque poly1305_state by
 * poly1305_aligned_state. */
typedef struct poly1305_state_internal_t {
|
71
|
+
poly1305_power P[2]; /* 288 bytes, top 32 bit halves unused = 144
|
72
|
+
bytes of free storage */
|
73
|
+
union {
|
74
|
+
xmmi H[5]; /* 80 bytes */
|
75
|
+
uint64_t HH[10]; /* scalar view of H; poly1305_combine writes HH[0..2] */
|
76
|
+
};
|
77
|
+
/* uint64_t r0,r1,r2; [24 bytes] */
|
78
|
+
/* uint64_t pad0,pad1; [16 bytes] */
|
79
|
+
uint64_t started; /* 8 bytes; set to 1 by CRYPTO_poly1305_update once
                     poly1305_first_block has run */
|
80
|
+
uint64_t leftover; /* 8 bytes; number of input bytes currently held in
                      buffer */
|
81
|
+
uint8_t buffer[64]; /* 64 bytes */
|
82
|
+
} poly1305_state_internal; /* 448 bytes total + 63 bytes for
|
83
|
+
alignment = 511 bytes raw */
|
84
|
+
|
85
|
+
/* Returns the internal state stored inside the caller's opaque |state|
 * buffer: the first 64-byte aligned address at or after |state|. The address
 * is rounded up in uintptr_t, with a mask of the same width, rather than via
 * uint64_t and a sign-extended int mask. */
static poly1305_state_internal INLINE *poly1305_aligned_state(
    poly1305_state *state) {
  const uintptr_t addr = (uintptr_t)state;
  return (poly1305_state_internal *)((addr + 63) & ~(uintptr_t)63);
}
|
89
|
+
|
90
|
+
/* copy 0-63 bytes */
|
91
|
+
/* Copies |bytes| & 63 bytes from |src| to |dst|; the callers visible in this
 * file always pass fewer than 64 bytes.
 *
 * A plain byte loop replaces the previous chain of 32/16/8/4/2/1-byte stores.
 * That version subtracted pointers into unrelated objects, wrote through
 * uint64_t/uint32_t/uint16_t pointers derived from a uint8_t buffer with no
 * alignment guarantee, and cast away const on |src|. The copy is only used
 * for partial blocks, and compilers lower this loop to a block copy. */
static void poly1305_block_copy(uint8_t *dst, const uint8_t *src,
                                size_t bytes) {
  const size_t count = bytes & 63;
  size_t i;

  for (i = 0; i < count; i++) {
    dst[i] = src[i];
  }
}
|
121
|
+
|
122
|
+
/* zero 0-15 bytes */
|
123
|
+
/* Writes |bytes| & 15 zero bytes starting at |dst|.
 *
 * A plain byte loop replaces the previous 8/4/2/1-byte stores, which wrote
 * through uint64_t/uint32_t/uint16_t pointers derived from a uint8_t buffer
 * with no alignment guarantee. */
static void poly1305_block_zero(uint8_t *dst, size_t bytes) {
  const size_t count = bytes & 15;
  size_t i;

  for (i = 0; i < count; i++) {
    dst[i] = 0;
  }
}
|
140
|
+
|
141
|
+
/* Returns the smaller of a and b. */
static size_t INLINE poly1305_min(size_t a, size_t b) {
  if (b <= a) {
    return b;
  }
  return a;
}
|
144
|
+
|
145
|
+
/* Prepares |state| for a new MAC computation keyed with the 32-byte |key|.
 *
 * The first 16 key bytes are clamped into r, held as three limbs, and the last
 * 16 bytes are kept as the pad. Both are stashed in the odd 32-bit words of
 * st->P[1], which the vector code does not use. The accumulator H and the
 * bookkeeping fields are cleared. */
void CRYPTO_poly1305_init(poly1305_state *state, const uint8_t key[32]) {
  poly1305_state_internal *const st = poly1305_aligned_state(state);
  poly1305_power *const stash = &st->P[1];
  const uint64_t key_lo = U8TO64_LE(key + 0);
  const uint64_t key_hi = U8TO64_LE(key + 8);
  /* clamped r, split across three limbs */
  const uint64_t r0 = key_lo & 0xffc0fffffff;
  const uint64_t r1 = ((key_lo >> 44) | (key_hi << 20)) & 0xfffffc0ffff;
  const uint64_t r2 = (key_hi >> 24) & 0x00ffffffc0f;
  size_t limb;

  /* r goes into the spare words of R20..R22 */
  stash->R20.d[1] = (uint32_t)r0;
  stash->R20.d[3] = (uint32_t)(r0 >> 32);
  stash->R21.d[1] = (uint32_t)r1;
  stash->R21.d[3] = (uint32_t)(r1 >> 32);
  stash->R22.d[1] = (uint32_t)r2;
  stash->R22.d[3] = (uint32_t)(r2 >> 32);

  /* the pad goes into the spare words of R23..R24 */
  stash->R23.d[1] = U8TO32_LE(key + 16);
  stash->R23.d[3] = U8TO32_LE(key + 20);
  stash->R24.d[1] = U8TO32_LE(key + 24);
  stash->R24.d[3] = U8TO32_LE(key + 28);

  /* accumulator starts at zero */
  for (limb = 0; limb < 5; limb++) {
    st->H[limb] = _mm_setzero_si128();
  }

  st->started = 0;
  st->leftover = 0;
}
|
186
|
+
|
187
|
+
/* Starts the vectorized computation from the first 32 bytes at |m|.
 *
 * Using the r stashed in st->P[1] by CRYPTO_poly1305_init, this computes r^2
 * into st->P[1] and r^4 into st->P[0] as five 26-bit limbs replicated across
 * both lanes, plus the 5x multiples S21..S24. It then puts r and the pad back
 * into the spare words of P[1] and loads the two 16-byte blocks at |m| into
 * the two lanes of st->H, with the 2^128 bit set on each. */
static void poly1305_first_block(poly1305_state_internal *st,
                                 const uint8_t *m) {
  const xmmi MMASK =
      _mm_load_si128((const xmmi *)poly1305_x64_sse2_message_mask);
  const xmmi FIVE = _mm_load_si128((const xmmi *)poly1305_x64_sse2_5);
  const xmmi HIBIT = _mm_load_si128((const xmmi *)poly1305_x64_sse2_1shl128);
  xmmi T5, T6;
  poly1305_power *p;
  uint128_t d[3];
  uint64_t r0, r1, r2;
  uint64_t r20, r21, r22, s22;
  uint64_t pad0, pad1;
  uint64_t c;
  uint64_t i;

  /* pull out stored info */
  p = &st->P[1];

  r0 = ((uint64_t)p->R20.d[3] << 32) | (uint64_t)p->R20.d[1];
  r1 = ((uint64_t)p->R21.d[3] << 32) | (uint64_t)p->R21.d[1];
  r2 = ((uint64_t)p->R22.d[3] << 32) | (uint64_t)p->R22.d[1];
  pad0 = ((uint64_t)p->R23.d[3] << 32) | (uint64_t)p->R23.d[1];
  pad1 = ((uint64_t)p->R24.d[3] << 32) | (uint64_t)p->R24.d[1];

  /* compute powers r^2,r^4 */
  r20 = r0;
  r21 = r1;
  r22 = r2;
  for (i = 0; i < 2; i++) {
    /* The first pass writes r^2 to P[1], the second writes r^4 to P[0]. The
     * slot is indexed directly so that no pointer before the start of st->P
     * is ever formed. */
    p = &st->P[1 - i];

    /* square (r20, r21, r22), limbs of 44/44/42 bits */
    s22 = r22 * (5 << 2);

    d[0] = add128(mul64x64_128(r20, r20), mul64x64_128(r21 * 2, s22));
    d[1] = add128(mul64x64_128(r22, s22), mul64x64_128(r20 * 2, r21));
    d[2] = add128(mul64x64_128(r21, r21), mul64x64_128(r22 * 2, r20));

    r20 = lo128(d[0]) & 0xfffffffffff;
    c = shr128(d[0], 44);
    d[1] = add128_64(d[1], c);
    r21 = lo128(d[1]) & 0xfffffffffff;
    c = shr128(d[1], 44);
    d[2] = add128_64(d[2], c);
    r22 = lo128(d[2]) & 0x3ffffffffff;
    c = shr128(d[2], 42);
    r20 += c * 5;
    c = (r20 >> 44);
    r20 = r20 & 0xfffffffffff;
    r21 += c;

    /* re-split into five 26-bit limbs, replicated into both 64-bit lanes */
    p->R20.v = _mm_shuffle_epi32(_mm_cvtsi32_si128((uint32_t)(r20)&0x3ffffff),
                                 _MM_SHUFFLE(1, 0, 1, 0));
    p->R21.v = _mm_shuffle_epi32(
        _mm_cvtsi32_si128((uint32_t)((r20 >> 26) | (r21 << 18)) & 0x3ffffff),
        _MM_SHUFFLE(1, 0, 1, 0));
    p->R22.v =
        _mm_shuffle_epi32(_mm_cvtsi32_si128((uint32_t)((r21 >> 8)) & 0x3ffffff),
                          _MM_SHUFFLE(1, 0, 1, 0));
    p->R23.v = _mm_shuffle_epi32(
        _mm_cvtsi32_si128((uint32_t)((r21 >> 34) | (r22 << 10)) & 0x3ffffff),
        _MM_SHUFFLE(1, 0, 1, 0));
    p->R24.v = _mm_shuffle_epi32(_mm_cvtsi32_si128((uint32_t)((r22 >> 16))),
                                 _MM_SHUFFLE(1, 0, 1, 0));
    p->S21.v = _mm_mul_epu32(p->R21.v, FIVE);
    p->S22.v = _mm_mul_epu32(p->R22.v, FIVE);
    p->S23.v = _mm_mul_epu32(p->R23.v, FIVE);
    p->S24.v = _mm_mul_epu32(p->R24.v, FIVE);
  }

  /* put saved info back */
  p = &st->P[1];
  p->R20.d[1] = (uint32_t)(r0);
  p->R20.d[3] = (uint32_t)(r0 >> 32);
  p->R21.d[1] = (uint32_t)(r1);
  p->R21.d[3] = (uint32_t)(r1 >> 32);
  p->R22.d[1] = (uint32_t)(r2);
  p->R22.d[3] = (uint32_t)(r2 >> 32);
  p->R23.d[1] = (uint32_t)(pad0);
  p->R23.d[3] = (uint32_t)(pad0 >> 32);
  p->R24.d[1] = (uint32_t)(pad1);
  p->R24.d[3] = (uint32_t)(pad1 >> 32);

  /* H = [Mx,My] */
  T5 = _mm_unpacklo_epi64(_mm_loadl_epi64((const xmmi *)(m + 0)),
                          _mm_loadl_epi64((const xmmi *)(m + 16)));
  T6 = _mm_unpacklo_epi64(_mm_loadl_epi64((const xmmi *)(m + 8)),
                          _mm_loadl_epi64((const xmmi *)(m + 24)));
  st->H[0] = _mm_and_si128(MMASK, T5);
  st->H[1] = _mm_and_si128(MMASK, _mm_srli_epi64(T5, 26));
  T5 = _mm_or_si128(_mm_srli_epi64(T5, 52), _mm_slli_epi64(T6, 12));
  st->H[2] = _mm_and_si128(MMASK, T5);
  st->H[3] = _mm_and_si128(MMASK, _mm_srli_epi64(T5, 26));
  st->H[4] = _mm_or_si128(_mm_srli_epi64(T6, 40), HIBIT);
}
|
279
|
+
|
280
|
+
/* Absorbs every whole 64-byte chunk of |m| into the two-lane accumulator
 * st->H; a trailing remainder shorter than 64 bytes is ignored.
 *
 * Each iteration computes H = H*[r^4,r^4] + [Mx,My]*[r^2,r^2] + [Mx,My], where
 * the first [Mx,My] is the 16-byte block pair at m+0/m+16 and the second is
 * the pair at m+32/m+48, followed by a partial carry reduction back to 26-bit
 * limbs. It relies on the powers written to st->P by poly1305_first_block.
 *
 * The table and message loads cast to const xmmi * because the data is only
 * read and the intrinsics take pointers to const. */
static void poly1305_blocks(poly1305_state_internal *st, const uint8_t *m,
                            size_t bytes) {
  const xmmi MMASK =
      _mm_load_si128((const xmmi *)poly1305_x64_sse2_message_mask);
  const xmmi FIVE = _mm_load_si128((const xmmi *)poly1305_x64_sse2_5);
  const xmmi HIBIT = _mm_load_si128((const xmmi *)poly1305_x64_sse2_1shl128);

  poly1305_power *p;
  xmmi H0, H1, H2, H3, H4;
  xmmi T0, T1, T2, T3, T4, T5, T6;
  xmmi M0, M1, M2, M3, M4;
  xmmi C1, C2;

  H0 = st->H[0];
  H1 = st->H[1];
  H2 = st->H[2];
  H3 = st->H[3];
  H4 = st->H[4];

  while (bytes >= 64) {
    /* H *= [r^4,r^4] */
    p = &st->P[0];
    T0 = _mm_mul_epu32(H0, p->R20.v);
    T1 = _mm_mul_epu32(H0, p->R21.v);
    T2 = _mm_mul_epu32(H0, p->R22.v);
    T3 = _mm_mul_epu32(H0, p->R23.v);
    T4 = _mm_mul_epu32(H0, p->R24.v);
    T5 = _mm_mul_epu32(H1, p->S24.v);
    T6 = _mm_mul_epu32(H1, p->R20.v);
    T0 = _mm_add_epi64(T0, T5);
    T1 = _mm_add_epi64(T1, T6);
    T5 = _mm_mul_epu32(H2, p->S23.v);
    T6 = _mm_mul_epu32(H2, p->S24.v);
    T0 = _mm_add_epi64(T0, T5);
    T1 = _mm_add_epi64(T1, T6);
    T5 = _mm_mul_epu32(H3, p->S22.v);
    T6 = _mm_mul_epu32(H3, p->S23.v);
    T0 = _mm_add_epi64(T0, T5);
    T1 = _mm_add_epi64(T1, T6);
    T5 = _mm_mul_epu32(H4, p->S21.v);
    T6 = _mm_mul_epu32(H4, p->S22.v);
    T0 = _mm_add_epi64(T0, T5);
    T1 = _mm_add_epi64(T1, T6);
    T5 = _mm_mul_epu32(H1, p->R21.v);
    T6 = _mm_mul_epu32(H1, p->R22.v);
    T2 = _mm_add_epi64(T2, T5);
    T3 = _mm_add_epi64(T3, T6);
    T5 = _mm_mul_epu32(H2, p->R20.v);
    T6 = _mm_mul_epu32(H2, p->R21.v);
    T2 = _mm_add_epi64(T2, T5);
    T3 = _mm_add_epi64(T3, T6);
    T5 = _mm_mul_epu32(H3, p->S24.v);
    T6 = _mm_mul_epu32(H3, p->R20.v);
    T2 = _mm_add_epi64(T2, T5);
    T3 = _mm_add_epi64(T3, T6);
    T5 = _mm_mul_epu32(H4, p->S23.v);
    T6 = _mm_mul_epu32(H4, p->S24.v);
    T2 = _mm_add_epi64(T2, T5);
    T3 = _mm_add_epi64(T3, T6);
    T5 = _mm_mul_epu32(H1, p->R23.v);
    T4 = _mm_add_epi64(T4, T5);
    T5 = _mm_mul_epu32(H2, p->R22.v);
    T4 = _mm_add_epi64(T4, T5);
    T5 = _mm_mul_epu32(H3, p->R21.v);
    T4 = _mm_add_epi64(T4, T5);
    T5 = _mm_mul_epu32(H4, p->R20.v);
    T4 = _mm_add_epi64(T4, T5);

    /* H += [Mx,My]*[r^2,r^2] */
    T5 = _mm_unpacklo_epi64(_mm_loadl_epi64((const xmmi *)(m + 0)),
                            _mm_loadl_epi64((const xmmi *)(m + 16)));
    T6 = _mm_unpacklo_epi64(_mm_loadl_epi64((const xmmi *)(m + 8)),
                            _mm_loadl_epi64((const xmmi *)(m + 24)));
    M0 = _mm_and_si128(MMASK, T5);
    M1 = _mm_and_si128(MMASK, _mm_srli_epi64(T5, 26));
    T5 = _mm_or_si128(_mm_srli_epi64(T5, 52), _mm_slli_epi64(T6, 12));
    M2 = _mm_and_si128(MMASK, T5);
    M3 = _mm_and_si128(MMASK, _mm_srli_epi64(T5, 26));
    M4 = _mm_or_si128(_mm_srli_epi64(T6, 40), HIBIT);

    p = &st->P[1];
    T5 = _mm_mul_epu32(M0, p->R20.v);
    T6 = _mm_mul_epu32(M0, p->R21.v);
    T0 = _mm_add_epi64(T0, T5);
    T1 = _mm_add_epi64(T1, T6);
    T5 = _mm_mul_epu32(M1, p->S24.v);
    T6 = _mm_mul_epu32(M1, p->R20.v);
    T0 = _mm_add_epi64(T0, T5);
    T1 = _mm_add_epi64(T1, T6);
    T5 = _mm_mul_epu32(M2, p->S23.v);
    T6 = _mm_mul_epu32(M2, p->S24.v);
    T0 = _mm_add_epi64(T0, T5);
    T1 = _mm_add_epi64(T1, T6);
    T5 = _mm_mul_epu32(M3, p->S22.v);
    T6 = _mm_mul_epu32(M3, p->S23.v);
    T0 = _mm_add_epi64(T0, T5);
    T1 = _mm_add_epi64(T1, T6);
    T5 = _mm_mul_epu32(M4, p->S21.v);
    T6 = _mm_mul_epu32(M4, p->S22.v);
    T0 = _mm_add_epi64(T0, T5);
    T1 = _mm_add_epi64(T1, T6);
    T5 = _mm_mul_epu32(M0, p->R22.v);
    T6 = _mm_mul_epu32(M0, p->R23.v);
    T2 = _mm_add_epi64(T2, T5);
    T3 = _mm_add_epi64(T3, T6);
    T5 = _mm_mul_epu32(M1, p->R21.v);
    T6 = _mm_mul_epu32(M1, p->R22.v);
    T2 = _mm_add_epi64(T2, T5);
    T3 = _mm_add_epi64(T3, T6);
    T5 = _mm_mul_epu32(M2, p->R20.v);
    T6 = _mm_mul_epu32(M2, p->R21.v);
    T2 = _mm_add_epi64(T2, T5);
    T3 = _mm_add_epi64(T3, T6);
    T5 = _mm_mul_epu32(M3, p->S24.v);
    T6 = _mm_mul_epu32(M3, p->R20.v);
    T2 = _mm_add_epi64(T2, T5);
    T3 = _mm_add_epi64(T3, T6);
    T5 = _mm_mul_epu32(M4, p->S23.v);
    T6 = _mm_mul_epu32(M4, p->S24.v);
    T2 = _mm_add_epi64(T2, T5);
    T3 = _mm_add_epi64(T3, T6);
    T5 = _mm_mul_epu32(M0, p->R24.v);
    T4 = _mm_add_epi64(T4, T5);
    T5 = _mm_mul_epu32(M1, p->R23.v);
    T4 = _mm_add_epi64(T4, T5);
    T5 = _mm_mul_epu32(M2, p->R22.v);
    T4 = _mm_add_epi64(T4, T5);
    T5 = _mm_mul_epu32(M3, p->R21.v);
    T4 = _mm_add_epi64(T4, T5);
    T5 = _mm_mul_epu32(M4, p->R20.v);
    T4 = _mm_add_epi64(T4, T5);

    /* H += [Mx,My] */
    T5 = _mm_unpacklo_epi64(_mm_loadl_epi64((const xmmi *)(m + 32)),
                            _mm_loadl_epi64((const xmmi *)(m + 48)));
    T6 = _mm_unpacklo_epi64(_mm_loadl_epi64((const xmmi *)(m + 40)),
                            _mm_loadl_epi64((const xmmi *)(m + 56)));
    M0 = _mm_and_si128(MMASK, T5);
    M1 = _mm_and_si128(MMASK, _mm_srli_epi64(T5, 26));
    T5 = _mm_or_si128(_mm_srli_epi64(T5, 52), _mm_slli_epi64(T6, 12));
    M2 = _mm_and_si128(MMASK, T5);
    M3 = _mm_and_si128(MMASK, _mm_srli_epi64(T5, 26));
    M4 = _mm_or_si128(_mm_srli_epi64(T6, 40), HIBIT);

    T0 = _mm_add_epi64(T0, M0);
    T1 = _mm_add_epi64(T1, M1);
    T2 = _mm_add_epi64(T2, M2);
    T3 = _mm_add_epi64(T3, M3);
    T4 = _mm_add_epi64(T4, M4);

    /* reduce */
    C1 = _mm_srli_epi64(T0, 26);
    C2 = _mm_srli_epi64(T3, 26);
    T0 = _mm_and_si128(T0, MMASK);
    T3 = _mm_and_si128(T3, MMASK);
    T1 = _mm_add_epi64(T1, C1);
    T4 = _mm_add_epi64(T4, C2);
    C1 = _mm_srli_epi64(T1, 26);
    C2 = _mm_srli_epi64(T4, 26);
    T1 = _mm_and_si128(T1, MMASK);
    T4 = _mm_and_si128(T4, MMASK);
    T2 = _mm_add_epi64(T2, C1);
    T0 = _mm_add_epi64(T0, _mm_mul_epu32(C2, FIVE));
    C1 = _mm_srli_epi64(T2, 26);
    C2 = _mm_srli_epi64(T0, 26);
    T2 = _mm_and_si128(T2, MMASK);
    T0 = _mm_and_si128(T0, MMASK);
    T3 = _mm_add_epi64(T3, C1);
    T1 = _mm_add_epi64(T1, C2);
    C1 = _mm_srli_epi64(T3, 26);
    T3 = _mm_and_si128(T3, MMASK);
    T4 = _mm_add_epi64(T4, C1);

    /* H = (H*[r^4,r^4] + [Mx,My]*[r^2,r^2] + [Mx,My]) */
    H0 = T0;
    H1 = T1;
    H2 = T2;
    H3 = T3;
    H4 = T4;

    m += 64;
    bytes -= 64;
  }

  st->H[0] = H0;
  st->H[1] = H1;
  st->H[2] = H2;
  st->H[3] = H3;
  st->H[4] = H4;
}
|
469
|
+
|
470
|
+
/* Collapses the two-lane vector accumulator into a single scalar value.
 *
 * If |bytes| >= 32, one more pair of 16-byte blocks is absorbed from |m| first
 * (H = H*[r^2,r^2] + [Mx,My]). The second lane of the powers in st->P[1] is
 * then overwritten with r, rebuilt from the words stashed by
 * CRYPTO_poly1305_init, so that P[1] holds [r^2,r]. H is multiplied by that,
 * the two lanes are added, carries are propagated, and the result is stored
 * in st->HH[0..2] as limbs of 44, 44 and 42 bits.
 *
 * Returns the number of bytes of |m| consumed: 32 or 0.
 *
 * The table and message loads cast to const xmmi * because the data is only
 * read and the intrinsics take pointers to const. */
static size_t poly1305_combine(poly1305_state_internal *st, const uint8_t *m,
                               size_t bytes) {
  const xmmi MMASK =
      _mm_load_si128((const xmmi *)poly1305_x64_sse2_message_mask);
  const xmmi HIBIT = _mm_load_si128((const xmmi *)poly1305_x64_sse2_1shl128);
  const xmmi FIVE = _mm_load_si128((const xmmi *)poly1305_x64_sse2_5);

  poly1305_power *p;
  xmmi H0, H1, H2, H3, H4;
  xmmi M0, M1, M2, M3, M4;
  xmmi T0, T1, T2, T3, T4, T5, T6;
  xmmi C1, C2;

  uint64_t r0, r1, r2;
  uint64_t t0, t1, t2, t3, t4;
  uint64_t c;
  size_t consumed = 0;

  H0 = st->H[0];
  H1 = st->H[1];
  H2 = st->H[2];
  H3 = st->H[3];
  H4 = st->H[4];

  /* p = [r^2,r^2] */
  p = &st->P[1];

  if (bytes >= 32) {
    /* H *= [r^2,r^2] */
    T0 = _mm_mul_epu32(H0, p->R20.v);
    T1 = _mm_mul_epu32(H0, p->R21.v);
    T2 = _mm_mul_epu32(H0, p->R22.v);
    T3 = _mm_mul_epu32(H0, p->R23.v);
    T4 = _mm_mul_epu32(H0, p->R24.v);
    T5 = _mm_mul_epu32(H1, p->S24.v);
    T6 = _mm_mul_epu32(H1, p->R20.v);
    T0 = _mm_add_epi64(T0, T5);
    T1 = _mm_add_epi64(T1, T6);
    T5 = _mm_mul_epu32(H2, p->S23.v);
    T6 = _mm_mul_epu32(H2, p->S24.v);
    T0 = _mm_add_epi64(T0, T5);
    T1 = _mm_add_epi64(T1, T6);
    T5 = _mm_mul_epu32(H3, p->S22.v);
    T6 = _mm_mul_epu32(H3, p->S23.v);
    T0 = _mm_add_epi64(T0, T5);
    T1 = _mm_add_epi64(T1, T6);
    T5 = _mm_mul_epu32(H4, p->S21.v);
    T6 = _mm_mul_epu32(H4, p->S22.v);
    T0 = _mm_add_epi64(T0, T5);
    T1 = _mm_add_epi64(T1, T6);
    T5 = _mm_mul_epu32(H1, p->R21.v);
    T6 = _mm_mul_epu32(H1, p->R22.v);
    T2 = _mm_add_epi64(T2, T5);
    T3 = _mm_add_epi64(T3, T6);
    T5 = _mm_mul_epu32(H2, p->R20.v);
    T6 = _mm_mul_epu32(H2, p->R21.v);
    T2 = _mm_add_epi64(T2, T5);
    T3 = _mm_add_epi64(T3, T6);
    T5 = _mm_mul_epu32(H3, p->S24.v);
    T6 = _mm_mul_epu32(H3, p->R20.v);
    T2 = _mm_add_epi64(T2, T5);
    T3 = _mm_add_epi64(T3, T6);
    T5 = _mm_mul_epu32(H4, p->S23.v);
    T6 = _mm_mul_epu32(H4, p->S24.v);
    T2 = _mm_add_epi64(T2, T5);
    T3 = _mm_add_epi64(T3, T6);
    T5 = _mm_mul_epu32(H1, p->R23.v);
    T4 = _mm_add_epi64(T4, T5);
    T5 = _mm_mul_epu32(H2, p->R22.v);
    T4 = _mm_add_epi64(T4, T5);
    T5 = _mm_mul_epu32(H3, p->R21.v);
    T4 = _mm_add_epi64(T4, T5);
    T5 = _mm_mul_epu32(H4, p->R20.v);
    T4 = _mm_add_epi64(T4, T5);

    /* H += [Mx,My] */
    T5 = _mm_unpacklo_epi64(_mm_loadl_epi64((const xmmi *)(m + 0)),
                            _mm_loadl_epi64((const xmmi *)(m + 16)));
    T6 = _mm_unpacklo_epi64(_mm_loadl_epi64((const xmmi *)(m + 8)),
                            _mm_loadl_epi64((const xmmi *)(m + 24)));
    M0 = _mm_and_si128(MMASK, T5);
    M1 = _mm_and_si128(MMASK, _mm_srli_epi64(T5, 26));
    T5 = _mm_or_si128(_mm_srli_epi64(T5, 52), _mm_slli_epi64(T6, 12));
    M2 = _mm_and_si128(MMASK, T5);
    M3 = _mm_and_si128(MMASK, _mm_srli_epi64(T5, 26));
    M4 = _mm_or_si128(_mm_srli_epi64(T6, 40), HIBIT);

    T0 = _mm_add_epi64(T0, M0);
    T1 = _mm_add_epi64(T1, M1);
    T2 = _mm_add_epi64(T2, M2);
    T3 = _mm_add_epi64(T3, M3);
    T4 = _mm_add_epi64(T4, M4);

    /* reduce */
    C1 = _mm_srli_epi64(T0, 26);
    C2 = _mm_srli_epi64(T3, 26);
    T0 = _mm_and_si128(T0, MMASK);
    T3 = _mm_and_si128(T3, MMASK);
    T1 = _mm_add_epi64(T1, C1);
    T4 = _mm_add_epi64(T4, C2);
    C1 = _mm_srli_epi64(T1, 26);
    C2 = _mm_srli_epi64(T4, 26);
    T1 = _mm_and_si128(T1, MMASK);
    T4 = _mm_and_si128(T4, MMASK);
    T2 = _mm_add_epi64(T2, C1);
    T0 = _mm_add_epi64(T0, _mm_mul_epu32(C2, FIVE));
    C1 = _mm_srli_epi64(T2, 26);
    C2 = _mm_srli_epi64(T0, 26);
    T2 = _mm_and_si128(T2, MMASK);
    T0 = _mm_and_si128(T0, MMASK);
    T3 = _mm_add_epi64(T3, C1);
    T1 = _mm_add_epi64(T1, C2);
    C1 = _mm_srli_epi64(T3, 26);
    T3 = _mm_and_si128(T3, MMASK);
    T4 = _mm_add_epi64(T4, C1);

    /* H = (H*[r^2,r^2] + [Mx,My]) */
    H0 = T0;
    H1 = T1;
    H2 = T2;
    H3 = T3;
    H4 = T4;

    consumed = 32;
  }

  /* finalize, H *= [r^2,r] */
  r0 = ((uint64_t)p->R20.d[3] << 32) | (uint64_t)p->R20.d[1];
  r1 = ((uint64_t)p->R21.d[3] << 32) | (uint64_t)p->R21.d[1];
  r2 = ((uint64_t)p->R22.d[3] << 32) | (uint64_t)p->R22.d[1];

  /* overwrite the second lane (word d[2]) of each limb with r */
  p->R20.d[2] = (uint32_t)(r0)&0x3ffffff;
  p->R21.d[2] = (uint32_t)((r0 >> 26) | (r1 << 18)) & 0x3ffffff;
  p->R22.d[2] = (uint32_t)((r1 >> 8)) & 0x3ffffff;
  p->R23.d[2] = (uint32_t)((r1 >> 34) | (r2 << 10)) & 0x3ffffff;
  p->R24.d[2] = (uint32_t)((r2 >> 16));
  p->S21.d[2] = p->R21.d[2] * 5;
  p->S22.d[2] = p->R22.d[2] * 5;
  p->S23.d[2] = p->R23.d[2] * 5;
  p->S24.d[2] = p->R24.d[2] * 5;

  /* H *= [r^2,r] */
  T0 = _mm_mul_epu32(H0, p->R20.v);
  T1 = _mm_mul_epu32(H0, p->R21.v);
  T2 = _mm_mul_epu32(H0, p->R22.v);
  T3 = _mm_mul_epu32(H0, p->R23.v);
  T4 = _mm_mul_epu32(H0, p->R24.v);
  T5 = _mm_mul_epu32(H1, p->S24.v);
  T6 = _mm_mul_epu32(H1, p->R20.v);
  T0 = _mm_add_epi64(T0, T5);
  T1 = _mm_add_epi64(T1, T6);
  T5 = _mm_mul_epu32(H2, p->S23.v);
  T6 = _mm_mul_epu32(H2, p->S24.v);
  T0 = _mm_add_epi64(T0, T5);
  T1 = _mm_add_epi64(T1, T6);
  T5 = _mm_mul_epu32(H3, p->S22.v);
  T6 = _mm_mul_epu32(H3, p->S23.v);
  T0 = _mm_add_epi64(T0, T5);
  T1 = _mm_add_epi64(T1, T6);
  T5 = _mm_mul_epu32(H4, p->S21.v);
  T6 = _mm_mul_epu32(H4, p->S22.v);
  T0 = _mm_add_epi64(T0, T5);
  T1 = _mm_add_epi64(T1, T6);
  T5 = _mm_mul_epu32(H1, p->R21.v);
  T6 = _mm_mul_epu32(H1, p->R22.v);
  T2 = _mm_add_epi64(T2, T5);
  T3 = _mm_add_epi64(T3, T6);
  T5 = _mm_mul_epu32(H2, p->R20.v);
  T6 = _mm_mul_epu32(H2, p->R21.v);
  T2 = _mm_add_epi64(T2, T5);
  T3 = _mm_add_epi64(T3, T6);
  T5 = _mm_mul_epu32(H3, p->S24.v);
  T6 = _mm_mul_epu32(H3, p->R20.v);
  T2 = _mm_add_epi64(T2, T5);
  T3 = _mm_add_epi64(T3, T6);
  T5 = _mm_mul_epu32(H4, p->S23.v);
  T6 = _mm_mul_epu32(H4, p->S24.v);
  T2 = _mm_add_epi64(T2, T5);
  T3 = _mm_add_epi64(T3, T6);
  T5 = _mm_mul_epu32(H1, p->R23.v);
  T4 = _mm_add_epi64(T4, T5);
  T5 = _mm_mul_epu32(H2, p->R22.v);
  T4 = _mm_add_epi64(T4, T5);
  T5 = _mm_mul_epu32(H3, p->R21.v);
  T4 = _mm_add_epi64(T4, T5);
  T5 = _mm_mul_epu32(H4, p->R20.v);
  T4 = _mm_add_epi64(T4, T5);

  C1 = _mm_srli_epi64(T0, 26);
  C2 = _mm_srli_epi64(T3, 26);
  T0 = _mm_and_si128(T0, MMASK);
  T3 = _mm_and_si128(T3, MMASK);
  T1 = _mm_add_epi64(T1, C1);
  T4 = _mm_add_epi64(T4, C2);
  C1 = _mm_srli_epi64(T1, 26);
  C2 = _mm_srli_epi64(T4, 26);
  T1 = _mm_and_si128(T1, MMASK);
  T4 = _mm_and_si128(T4, MMASK);
  T2 = _mm_add_epi64(T2, C1);
  T0 = _mm_add_epi64(T0, _mm_mul_epu32(C2, FIVE));
  C1 = _mm_srli_epi64(T2, 26);
  C2 = _mm_srli_epi64(T0, 26);
  T2 = _mm_and_si128(T2, MMASK);
  T0 = _mm_and_si128(T0, MMASK);
  T3 = _mm_add_epi64(T3, C1);
  T1 = _mm_add_epi64(T1, C2);
  C1 = _mm_srli_epi64(T3, 26);
  T3 = _mm_and_si128(T3, MMASK);
  T4 = _mm_add_epi64(T4, C1);

  /* H = H[0]+H[1] */
  H0 = _mm_add_epi64(T0, _mm_srli_si128(T0, 8));
  H1 = _mm_add_epi64(T1, _mm_srli_si128(T1, 8));
  H2 = _mm_add_epi64(T2, _mm_srli_si128(T2, 8));
  H3 = _mm_add_epi64(T3, _mm_srli_si128(T3, 8));
  H4 = _mm_add_epi64(T4, _mm_srli_si128(T4, 8));

  /* scalar carry chain over the five 26-bit limbs */
  t0 = _mm_cvtsi128_si32(H0);
  c = (t0 >> 26);
  t0 &= 0x3ffffff;
  t1 = _mm_cvtsi128_si32(H1) + c;
  c = (t1 >> 26);
  t1 &= 0x3ffffff;
  t2 = _mm_cvtsi128_si32(H2) + c;
  c = (t2 >> 26);
  t2 &= 0x3ffffff;
  t3 = _mm_cvtsi128_si32(H3) + c;
  c = (t3 >> 26);
  t3 &= 0x3ffffff;
  t4 = _mm_cvtsi128_si32(H4) + c;
  c = (t4 >> 26);
  t4 &= 0x3ffffff;
  t0 = t0 + (c * 5);
  c = (t0 >> 26);
  t0 &= 0x3ffffff;
  t1 = t1 + c;

  /* repack as 44/44/42-bit limbs */
  st->HH[0] = ((t0) | (t1 << 26)) & 0xfffffffffffull;
  st->HH[1] = ((t1 >> 18) | (t2 << 8) | (t3 << 34)) & 0xfffffffffffull;
  st->HH[2] = ((t3 >> 10) | (t4 << 16)) & 0x3ffffffffffull;

  return consumed;
}
|
712
|
+
|
713
|
+
/* CRYPTO_poly1305_update absorbs |bytes| bytes starting at |m| into |state|.
 *
 * Until the state is marked started, input is gathered in st->buffer and the
 * first 32 bytes are handed to poly1305_first_block. After that, input is fed
 * to poly1305_blocks in multiples of 64 bytes and any tail shorter than 64
 * bytes is kept in st->buffer (tracked by st->leftover) for a later call.
 *
 * A call with |bytes| == 0 is a no-op; |m| is not touched in that case and
 * may be NULL. */
void CRYPTO_poly1305_update(poly1305_state *state, const uint8_t *m,
                            size_t bytes) {
  poly1305_state_internal *st = poly1305_aligned_state(state);
  size_t want;

  /* An empty update falls through the code below without modifying the
   * state, so returning early is equivalent. It also keeps a NULL |m| away
   * from the pointer arithmetic further down, which C leaves undefined for a
   * null pointer even when the offset is zero. */
  if (bytes == 0) {
    return;
  }

  /* need at least 32 initial bytes to start the accelerated branch */
  if (!st->started) {
    if ((st->leftover == 0) && (bytes > 32)) {
      /* Nothing buffered and strictly more than 32 bytes on hand: start
       * directly from the caller's data. */
      poly1305_first_block(st, m);
      m += 32;
      bytes -= 32;
    } else {
      /* Top the buffer up towards 32 bytes. */
      want = poly1305_min(32 - st->leftover, bytes);
      poly1305_block_copy(st->buffer + st->leftover, m, want);
      bytes -= want;
      m += want;
      st->leftover += want;
      /* Stay un-started while the buffer is short, or while the buffered
       * bytes are all the input seen so far. */
      if ((st->leftover < 32) || (bytes == 0)) {
        return;
      }
      poly1305_first_block(st, st->buffer);
      st->leftover = 0;
    }
    st->started = 1;
  }

  /* handle leftover: complete a buffered partial 64-byte chunk first */
  if (st->leftover) {
    want = poly1305_min(64 - st->leftover, bytes);
    poly1305_block_copy(st->buffer + st->leftover, m, want);
    bytes -= want;
    m += want;
    st->leftover += want;
    if (st->leftover < 64) {
      return;
    }
    poly1305_blocks(st, st->buffer, 64);
    st->leftover = 0;
  }

  /* process 64 byte blocks straight from the caller's buffer */
  if (bytes >= 64) {
    want = (bytes & ~63);
    poly1305_blocks(st, m, want);
    m += want;
    bytes -= want;
  }

  /* stash the remaining tail (fewer than 64 bytes) for the next call */
  if (bytes) {
    poly1305_block_copy(st->buffer + st->leftover, m, bytes);
    st->leftover += bytes;
  }
}
|
766
|
+
|
767
|
+
/* CRYPTO_poly1305_finish absorbs whatever input is still buffered in |state|
 * and writes the resulting 16-byte value to |mac|.
 *
 * The tail is handled with scalar arithmetic on three limbs (44, 44 and 42
 * bits wide, as fixed by the masks used below). */
void CRYPTO_poly1305_finish(poly1305_state *state, uint8_t mac[16]) {
  poly1305_state_internal *st = poly1305_aligned_state(state);
  const uint64_t mask44 = 0xfffffffffff;
  const uint64_t mask42 = 0x3ffffffffff;
  size_t remaining = st->leftover;
  uint8_t *block = st->buffer;
  poly1305_power *p;
  uint128_t d0, d1, d2;
  uint64_t h0, h1, h2;
  uint64_t r0, r1, r2, s1, s2;
  uint64_t t0, t1;
  uint64_t g0, g1, g2;
  uint64_t c, use_g, use_h;

  /* Once the state has been started, poly1305_combine is asked to fold the
   * running accumulators (and possibly some buffered bytes) into st->HH; it
   * reports how many buffered bytes it consumed. */
  if (st->started) {
    size_t consumed = poly1305_combine(st, block, remaining);
    remaining -= consumed;
    block += consumed;
  }

  /* st->HH is either zero or holds the combined result */
  h0 = st->HH[0];
  h1 = st->HH[1];
  h2 = st->HH[2];

  /* The multiplier limbs are read from lanes 1 and 3 of R20..R22 in st->P[1];
   * s1/s2 are r1/r2 scaled by 20 (= 5 << 2). */
  p = &st->P[1];
  r0 = ((uint64_t)p->R20.d[3] << 32) | (uint64_t)p->R20.d[1];
  r1 = ((uint64_t)p->R21.d[3] << 32) | (uint64_t)p->R21.d[1];
  r2 = ((uint64_t)p->R22.d[3] << 32) | (uint64_t)p->R22.d[1];
  s1 = r1 * (5 << 2);
  s2 = r2 * (5 << 2);

  /* One iteration per 16-byte block; a trailing partial block is padded in
   * place inside the state's buffer and then processed like any other. */
  while (remaining != 0) {
    uint64_t hibit;

    if (remaining >= 16) {
      /* full block: add the marker bit (bit 40 of the top limb) */
      hibit = (uint64_t)1 << 40;
    } else {
      /* final bytes: append a 1 byte, zero-fill to 16, no marker bit */
      block[remaining++] = 1;
      poly1305_block_zero(block + remaining, 16 - remaining);
      remaining = 16;
      hibit = 0;
    }

    /* h += block, split into 44/44/40(+marker) bit pieces */
    t0 = U8TO64_LE(block + 0);
    t1 = U8TO64_LE(block + 8);
    h0 += t0 & mask44;
    t0 = shr128_pair(t1, t0, 44);
    h1 += t0 & mask44;
    h2 += (t1 >> 24) | hibit;

    /* h *= r, as three 128-bit column sums */
    d0 = add128(add128(mul64x64_128(h0, r0), mul64x64_128(h1, s2)),
                mul64x64_128(h2, s1));
    d1 = add128(add128(mul64x64_128(h0, r1), mul64x64_128(h1, r0)),
                mul64x64_128(h2, s2));
    d2 = add128(add128(mul64x64_128(h0, r2), mul64x64_128(h1, r1)),
                mul64x64_128(h2, r0));

    /* carry the columns back down into limbs; the top carry wraps to the
     * bottom limb multiplied by 5 */
    h0 = lo128(d0) & mask44;
    c = shr128(d0, 44);
    d1 = add128_64(d1, c);
    h1 = lo128(d1) & mask44;
    c = shr128(d1, 44);
    d2 = add128_64(d2, c);
    h2 = lo128(d2) & mask42;
    c = shr128(d2, 42);
    h0 += c * 5;

    block += 16;
    remaining -= 16;
  }

  /* one more carry pass over h */
  c = (h0 >> 44);
  h0 &= mask44;
  h1 += c;
  c = (h1 >> 44);
  h1 &= mask44;
  h2 += c;
  c = (h2 >> 42);
  h2 &= mask42;
  h0 += c * 5;

  /* g = h + 5 - 2^130 */
  g0 = h0 + 5;
  c = (g0 >> 44);
  g0 &= mask44;
  g1 = h1 + c;
  c = (g1 >> 44);
  g1 &= mask44;
  g2 = h2 + c - ((uint64_t)1 << 42);

  /* Branch-free select: use_g is all ones when g2 did not wrap below zero
   * (top bit clear), in which case g replaces h; otherwise h is kept. */
  use_g = (g2 >> 63) - 1;
  use_h = ~use_g;
  h0 = (h0 & use_h) | (g0 & use_g);
  h1 = (h1 & use_h) | (g1 & use_g);
  h2 = (h2 & use_h) | (g2 & use_g);

  /* pad: a 128-bit value read from R23/R24 of st->P[1], added limb-wise */
  t0 = ((uint64_t)p->R23.d[3] << 32) | (uint64_t)p->R23.d[1];
  t1 = ((uint64_t)p->R24.d[3] << 32) | (uint64_t)p->R24.d[1];
  h0 += (t0 & mask44);
  c = (h0 >> 44);
  h0 &= mask44;
  t0 = shr128_pair(t1, t0, 44);
  h1 += (t0 & mask44) + c;
  c = (h1 >> 44);
  h1 &= mask44;
  t1 = (t1 >> 24);
  h2 += (t1) + c;

  /* repack the limbs into two little-endian 64-bit words */
  U64TO8_LE(mac + 0, ((h0) | (h1 << 44)));
  U64TO8_LE(mac + 8, ((h1 >> 20) | (h2 << 24)));
}
|
891
|
+
|
892
|
+
#endif /* !OPENSSL_WINDOWS && OPENSSL_X86_64 */
|