grpc 0.12.0 → 0.13.0.pre1.1
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of grpc might be problematic. Click here for more details.
 - checksums.yaml +4 -4
 - data/Makefile +5707 -22222
 - data/include/grpc/byte_buffer.h +2 -83
 - data/include/grpc/census.h +191 -121
 - data/include/grpc/compression.h +14 -38
 - data/include/grpc/grpc.h +88 -434
 - data/include/grpc/grpc_security.h +76 -46
 - data/include/grpc/grpc_zookeeper.h +1 -1
 - data/include/grpc/impl/codegen/alloc.h +74 -0
 - data/include/grpc/impl/codegen/atm.h +92 -0
 - data/include/grpc/impl/codegen/atm_gcc_atomic.h +72 -0
 - data/include/grpc/impl/codegen/atm_gcc_sync.h +87 -0
 - data/include/grpc/impl/codegen/atm_win32.h +125 -0
 - data/include/grpc/impl/codegen/byte_buffer.h +121 -0
 - data/include/grpc/impl/codegen/compression_types.h +73 -0
 - data/include/grpc/impl/codegen/connectivity_state.h +59 -0
 - data/include/grpc/impl/codegen/grpc_types.h +373 -0
 - data/include/grpc/impl/codegen/log.h +110 -0
 - data/include/grpc/impl/codegen/port_platform.h +362 -0
 - data/include/grpc/impl/codegen/propagation_bits.h +67 -0
 - data/include/grpc/impl/codegen/slice.h +182 -0
 - data/include/grpc/impl/codegen/slice_buffer.h +105 -0
 - data/include/grpc/impl/codegen/status.h +163 -0
 - data/include/grpc/impl/codegen/sync.h +316 -0
 - data/include/grpc/impl/codegen/sync_generic.h +55 -0
 - data/{src/core/census/context.h → include/grpc/impl/codegen/sync_posix.h} +11 -11
 - data/include/grpc/impl/codegen/sync_win32.h +49 -0
 - data/include/grpc/impl/codegen/time.h +132 -0
 - data/include/grpc/status.h +2 -126
 - data/include/grpc/support/alloc.h +2 -35
 - data/include/grpc/support/atm.h +2 -55
 - data/include/grpc/support/atm_gcc_atomic.h +5 -38
 - data/include/grpc/support/atm_gcc_sync.h +2 -50
 - data/include/grpc/support/atm_win32.h +2 -88
 - data/include/grpc/support/avl.h +7 -7
 - data/include/grpc/support/cmdline.h +15 -13
 - data/include/grpc/support/cpu.h +5 -3
 - data/include/grpc/support/histogram.h +23 -20
 - data/include/grpc/support/host_port.h +5 -3
 - data/include/grpc/support/log.h +2 -71
 - data/include/grpc/support/log_win32.h +2 -2
 - data/include/grpc/support/port_platform.h +2 -319
 - data/include/grpc/support/slice.h +2 -145
 - data/include/grpc/support/slice_buffer.h +2 -65
 - data/include/grpc/support/string_util.h +3 -3
 - data/include/grpc/support/subprocess.h +8 -6
 - data/include/grpc/support/sync.h +2 -278
 - data/include/grpc/support/sync_generic.h +2 -18
 - data/include/grpc/support/sync_posix.h +2 -10
 - data/include/grpc/support/sync_win32.h +2 -12
 - data/include/grpc/support/thd.h +11 -11
 - data/include/grpc/support/time.h +2 -91
 - data/include/grpc/support/tls.h +1 -1
 - data/include/grpc/support/tls_gcc.h +1 -1
 - data/include/grpc/support/tls_msvc.h +1 -1
 - data/include/grpc/support/tls_pthread.h +2 -2
 - data/src/boringssl/err_data.c +1252 -0
 - data/src/core/census/context.c +492 -8
 - data/src/core/census/grpc_filter.c +3 -3
 - data/src/core/census/initialize.c +4 -7
 - data/src/core/census/operation.c +2 -2
 - data/src/core/census/placeholders.c +109 -0
 - data/src/core/census/rpc_metric_id.h +6 -6
 - data/src/core/census/tracing.c +1 -1
 - data/src/core/channel/channel_args.c +4 -3
 - data/src/core/channel/channel_stack.c +1 -1
 - data/src/core/channel/client_channel.c +18 -14
 - data/src/core/channel/client_uchannel.c +3 -3
 - data/src/core/channel/compress_filter.c +8 -8
 - data/src/core/channel/http_client_filter.c +2 -2
 - data/src/core/channel/http_server_filter.c +9 -9
 - data/src/core/channel/subchannel_call_holder.c +12 -10
 - data/src/core/client_config/lb_policies/pick_first.c +49 -31
 - data/src/core/client_config/lb_policies/round_robin.c +7 -7
 - data/src/core/client_config/resolvers/dns_resolver.c +3 -3
 - data/src/core/client_config/resolvers/sockaddr_resolver.c +5 -5
 - data/src/core/client_config/subchannel.c +36 -25
 - data/src/core/compression/algorithm.c +3 -3
 - data/src/core/httpcli/format_request.c +1 -1
 - data/src/core/httpcli/httpcli.c +5 -5
 - data/src/core/httpcli/httpcli_security_connector.c +2 -3
 - data/src/core/httpcli/parser.c +7 -7
 - data/src/core/httpcli/parser.h +1 -1
 - data/src/core/iomgr/closure.c +7 -7
 - data/src/core/iomgr/closure.h +6 -5
 - data/src/core/iomgr/exec_ctx.c +12 -8
 - data/src/core/iomgr/exec_ctx.h +12 -5
 - data/src/core/iomgr/executor.c +4 -4
 - data/src/core/iomgr/executor.h +2 -2
 - data/src/core/iomgr/fd_posix.c +28 -17
 - data/src/core/iomgr/fd_posix.h +7 -4
 - data/src/core/iomgr/iocp_windows.c +6 -8
 - data/src/core/iomgr/pollset_multipoller_with_epoll.c +70 -5
 - data/src/core/iomgr/pollset_multipoller_with_poll_posix.c +4 -2
 - data/src/core/iomgr/pollset_posix.c +15 -15
 - data/src/core/iomgr/pollset_posix.h +4 -2
 - data/src/core/iomgr/pollset_windows.c +3 -12
 - data/src/core/iomgr/resolve_address_posix.c +2 -2
 - data/src/core/iomgr/resolve_address_windows.c +2 -2
 - data/src/core/iomgr/sockaddr_utils.c +6 -6
 - data/src/core/iomgr/sockaddr_win32.h +1 -6
 - data/src/core/iomgr/tcp_client_posix.c +7 -7
 - data/src/core/iomgr/tcp_client_windows.c +4 -4
 - data/src/core/iomgr/tcp_posix.c +14 -8
 - data/src/core/iomgr/tcp_posix.h +7 -1
 - data/src/core/iomgr/tcp_server.h +40 -20
 - data/src/core/iomgr/tcp_server_posix.c +106 -49
 - data/src/core/iomgr/tcp_server_windows.c +98 -49
 - data/src/core/iomgr/tcp_windows.c +11 -15
 - data/src/core/iomgr/timer.c +8 -8
 - data/src/core/iomgr/timer.h +1 -1
 - data/src/core/iomgr/timer_heap.c +10 -10
 - data/src/core/iomgr/timer_heap.h +2 -2
 - data/src/core/iomgr/udp_server.c +2 -12
 - data/src/core/iomgr/udp_server.h +1 -9
 - data/src/core/iomgr/workqueue.h +2 -4
 - data/src/core/iomgr/workqueue_posix.c +3 -3
 - data/src/core/json/json_reader.c +11 -12
 - data/src/core/json/json_reader.h +4 -4
 - data/src/core/json/json_string.c +19 -19
 - data/src/core/json/json_writer.c +7 -9
 - data/src/core/profiling/basic_timers.c +1 -1
 - data/src/core/security/base64.c +9 -9
 - data/src/core/security/client_auth_filter.c +4 -4
 - data/src/core/security/credentials.c +5 -5
 - data/src/core/security/google_default_credentials.c +3 -3
 - data/src/core/security/handshake.c +6 -5
 - data/src/core/security/json_token.c +13 -7
 - data/src/core/security/jwt_verifier.c +3 -2
 - data/src/core/security/secure_endpoint.c +16 -16
 - data/src/core/security/security_connector.c +47 -17
 - data/src/core/security/security_connector.h +5 -5
 - data/src/core/security/server_auth_filter.c +3 -3
 - data/src/core/security/server_secure_chttp2.c +30 -31
 - data/src/core/statistics/census_interface.h +2 -2
 - data/src/core/statistics/census_rpc_stats.h +3 -3
 - data/src/core/support/alloc.c +1 -1
 - data/src/core/support/cpu_posix.c +2 -2
 - data/src/core/support/env_linux.c +12 -2
 - data/src/core/support/env_win32.c +15 -7
 - data/src/core/support/histogram.c +5 -5
 - data/src/core/support/log_posix.c +1 -1
 - data/src/core/support/log_win32.c +4 -3
 - data/src/core/support/murmur_hash.c +11 -11
 - data/src/core/support/murmur_hash.h +1 -1
 - data/src/core/support/slice.c +11 -11
 - data/src/core/support/slice_buffer.c +6 -6
 - data/src/core/support/stack_lockfree.c +20 -10
 - data/src/core/support/string.c +15 -15
 - data/src/core/support/string.h +5 -5
 - data/src/core/support/string_win32.c +5 -5
 - data/src/core/support/subprocess_windows.c +141 -0
 - data/src/core/support/sync.c +4 -4
 - data/src/core/support/sync_posix.c +2 -2
 - data/src/core/support/sync_win32.c +10 -5
 - data/src/core/support/time.c +29 -29
 - data/src/core/support/time_posix.c +15 -6
 - data/src/core/support/time_precise.c +2 -2
 - data/src/core/support/time_win32.c +18 -9
 - data/src/core/support/tls_pthread.c +1 -1
 - data/src/core/support/wrap_memcpy.c +53 -0
 - data/src/core/surface/alarm.c +83 -0
 - data/src/core/surface/byte_buffer_reader.c +1 -1
 - data/src/core/surface/call.c +78 -69
 - data/src/core/surface/call.h +2 -2
 - data/src/core/surface/call_test_only.h +2 -2
 - data/src/core/surface/channel.c +9 -9
 - data/src/core/surface/channel.h +1 -1
 - data/src/core/surface/channel_connectivity.c +3 -3
 - data/src/core/surface/channel_create.c +3 -3
 - data/src/core/surface/channel_ping.c +2 -2
 - data/src/core/surface/completion_queue.c +11 -12
 - data/src/core/surface/completion_queue.h +1 -1
 - data/src/core/surface/init.c +7 -5
 - data/src/core/surface/lame_client.c +3 -3
 - data/src/core/surface/secure_channel_create.c +3 -3
 - data/src/core/surface/server.c +28 -28
 - data/src/core/surface/server_chttp2.c +8 -8
 - data/src/core/surface/server_create.c +1 -4
 - data/src/core/surface/validate_metadata.c +3 -3
 - data/src/core/surface/version.c +2 -2
 - data/src/core/transport/byte_stream.c +8 -6
 - data/src/core/transport/byte_stream.h +6 -5
 - data/src/core/transport/chttp2/bin_encoder.c +29 -29
 - data/src/core/transport/chttp2/frame_data.c +29 -26
 - data/src/core/transport/chttp2/frame_data.h +6 -6
 - data/src/core/transport/chttp2/frame_goaway.c +30 -30
 - data/src/core/transport/chttp2/frame_goaway.h +6 -6
 - data/src/core/transport/chttp2/frame_ping.c +6 -6
 - data/src/core/transport/chttp2/frame_ping.h +5 -5
 - data/src/core/transport/chttp2/frame_rst_stream.c +18 -19
 - data/src/core/transport/chttp2/frame_rst_stream.h +4 -4
 - data/src/core/transport/chttp2/frame_settings.c +30 -30
 - data/src/core/transport/chttp2/frame_settings.h +13 -13
 - data/src/core/transport/chttp2/frame_window_update.c +17 -18
 - data/src/core/transport/chttp2/frame_window_update.h +5 -7
 - data/src/core/transport/chttp2/hpack_encoder.c +69 -73
 - data/src/core/transport/chttp2/hpack_encoder.h +16 -16
 - data/src/core/transport/chttp2/hpack_parser.c +167 -167
 - data/src/core/transport/chttp2/hpack_parser.h +16 -16
 - data/src/core/transport/chttp2/hpack_table.c +13 -13
 - data/src/core/transport/chttp2/hpack_table.h +11 -11
 - data/src/core/transport/chttp2/internal.h +97 -86
 - data/src/core/transport/chttp2/parsing.c +25 -25
 - data/src/core/transport/chttp2/stream_lists.c +26 -3
 - data/src/core/transport/chttp2/stream_map.c +13 -14
 - data/src/core/transport/chttp2/stream_map.h +6 -7
 - data/src/core/transport/chttp2/timeout_encoding.c +19 -16
 - data/src/core/transport/chttp2/varint.c +8 -9
 - data/src/core/transport/chttp2/varint.h +7 -8
 - data/src/core/transport/chttp2/writing.c +26 -23
 - data/src/core/transport/chttp2_transport.c +133 -92
 - data/src/core/transport/connectivity_state.c +6 -6
 - data/src/core/transport/metadata.c +18 -18
 - data/src/core/transport/metadata.h +5 -5
 - data/src/core/transport/static_metadata.c +15 -16
 - data/src/core/transport/static_metadata.h +5 -5
 - data/src/core/transport/transport.c +5 -5
 - data/src/core/transport/transport.h +14 -1
 - data/src/core/tsi/fake_transport_security.c +7 -7
 - data/src/core/tsi/ssl_transport_security.c +6 -4
 - data/src/core/tsi/ssl_types.h +55 -0
 - data/src/ruby/ext/grpc/extconf.rb +51 -14
 - data/src/ruby/ext/grpc/rb_byte_buffer.c +3 -1
 - data/src/ruby/ext/grpc/rb_call.c +6 -3
 - data/src/ruby/ext/grpc/rb_call_credentials.c +4 -0
 - data/src/ruby/ext/grpc/rb_channel.c +4 -2
 - data/src/ruby/ext/grpc/rb_channel_args.c +3 -1
 - data/src/ruby/ext/grpc/rb_channel_credentials.c +3 -1
 - data/src/ruby/ext/grpc/rb_completion_queue.c +3 -1
 - data/src/ruby/ext/grpc/rb_event_thread.c +5 -0
 - data/src/ruby/ext/grpc/rb_grpc.c +11 -3
 - data/src/ruby/ext/grpc/rb_grpc_imports.generated.c +560 -0
 - data/src/ruby/ext/grpc/rb_grpc_imports.generated.h +843 -0
 - data/src/ruby/ext/grpc/rb_loader.c +72 -0
 - data/src/ruby/ext/grpc/rb_loader.h +40 -0
 - data/src/ruby/ext/grpc/rb_server.c +3 -1
 - data/src/ruby/ext/grpc/rb_server_credentials.c +4 -2
 - data/src/ruby/lib/grpc/generic/bidi_call.rb +1 -1
 - data/src/ruby/lib/grpc/generic/rpc_desc.rb +1 -1
 - data/src/ruby/lib/grpc/generic/rpc_server.rb +1 -1
 - data/src/ruby/lib/grpc/grpc.rb +34 -0
 - data/src/ruby/lib/grpc/version.rb +1 -1
 - data/src/ruby/spec/pb/health/checker_spec.rb +1 -1
 - data/third_party/boringssl/crypto/aes/aes.c +1142 -0
 - data/third_party/boringssl/crypto/aes/internal.h +87 -0
 - data/third_party/boringssl/crypto/aes/mode_wrappers.c +108 -0
 - data/third_party/boringssl/crypto/asn1/a_bitstr.c +255 -0
 - data/third_party/boringssl/crypto/asn1/a_bool.c +112 -0
 - data/third_party/boringssl/crypto/asn1/a_bytes.c +317 -0
 - data/third_party/boringssl/crypto/asn1/a_d2i_fp.c +286 -0
 - data/third_party/boringssl/crypto/asn1/a_dup.c +103 -0
 - data/third_party/boringssl/crypto/asn1/a_enum.c +183 -0
 - data/third_party/boringssl/crypto/asn1/a_gentm.c +255 -0
 - data/third_party/boringssl/crypto/asn1/a_i2d_fp.c +154 -0
 - data/third_party/boringssl/crypto/asn1/a_int.c +456 -0
 - data/third_party/boringssl/crypto/asn1/a_mbstr.c +390 -0
 - data/third_party/boringssl/crypto/asn1/a_object.c +412 -0
 - data/third_party/boringssl/crypto/asn1/a_octet.c +70 -0
 - data/third_party/boringssl/crypto/asn1/a_print.c +119 -0
 - data/third_party/boringssl/crypto/asn1/a_strnid.c +286 -0
 - data/third_party/boringssl/crypto/asn1/a_time.c +221 -0
 - data/third_party/boringssl/crypto/asn1/a_type.c +160 -0
 - data/third_party/boringssl/crypto/asn1/a_utctm.c +342 -0
 - data/third_party/boringssl/crypto/asn1/a_utf8.c +210 -0
 - data/third_party/boringssl/crypto/asn1/asn1_lib.c +510 -0
 - data/third_party/boringssl/crypto/asn1/asn1_locl.h +73 -0
 - data/third_party/boringssl/crypto/asn1/asn1_par.c +444 -0
 - data/third_party/boringssl/crypto/asn1/asn_pack.c +104 -0
 - data/third_party/boringssl/crypto/asn1/bio_asn1.c +496 -0
 - data/third_party/boringssl/crypto/asn1/bio_ndef.c +254 -0
 - data/third_party/boringssl/crypto/asn1/f_enum.c +206 -0
 - data/third_party/boringssl/crypto/asn1/f_int.c +210 -0
 - data/third_party/boringssl/crypto/asn1/f_string.c +204 -0
 - data/third_party/boringssl/crypto/asn1/t_bitst.c +102 -0
 - data/third_party/boringssl/crypto/asn1/t_pkey.c +112 -0
 - data/third_party/boringssl/crypto/asn1/tasn_dec.c +1342 -0
 - data/third_party/boringssl/crypto/asn1/tasn_enc.c +695 -0
 - data/third_party/boringssl/crypto/asn1/tasn_fre.c +264 -0
 - data/third_party/boringssl/crypto/asn1/tasn_new.c +398 -0
 - data/third_party/boringssl/crypto/asn1/tasn_prn.c +642 -0
 - data/third_party/boringssl/crypto/asn1/tasn_typ.c +137 -0
 - data/third_party/boringssl/crypto/asn1/tasn_utl.c +266 -0
 - data/third_party/boringssl/crypto/asn1/x_bignum.c +143 -0
 - data/third_party/boringssl/crypto/asn1/x_long.c +182 -0
 - data/third_party/boringssl/crypto/base64/base64.c +478 -0
 - data/third_party/boringssl/crypto/bio/bio.c +608 -0
 - data/third_party/boringssl/crypto/bio/bio_mem.c +327 -0
 - data/third_party/boringssl/crypto/bio/buffer.c +496 -0
 - data/third_party/boringssl/crypto/bio/connect.c +544 -0
 - data/third_party/boringssl/crypto/bio/fd.c +270 -0
 - data/third_party/boringssl/crypto/bio/file.c +349 -0
 - data/third_party/boringssl/crypto/bio/hexdump.c +192 -0
 - data/third_party/boringssl/crypto/bio/internal.h +108 -0
 - data/third_party/boringssl/crypto/bio/pair.c +803 -0
 - data/third_party/boringssl/crypto/bio/printf.c +119 -0
 - data/third_party/boringssl/crypto/bio/socket.c +195 -0
 - data/third_party/boringssl/crypto/bio/socket_helper.c +113 -0
 - data/third_party/boringssl/crypto/bn/add.c +377 -0
 - data/third_party/boringssl/crypto/bn/asm/x86_64-gcc.c +599 -0
 - data/third_party/boringssl/crypto/bn/bn.c +341 -0
 - data/third_party/boringssl/crypto/bn/bn_asn1.c +93 -0
 - data/third_party/boringssl/crypto/bn/cmp.c +200 -0
 - data/third_party/boringssl/crypto/bn/convert.c +597 -0
 - data/third_party/boringssl/crypto/bn/ctx.c +311 -0
 - data/third_party/boringssl/crypto/bn/div.c +625 -0
 - data/third_party/boringssl/crypto/bn/exponentiation.c +1544 -0
 - data/third_party/boringssl/crypto/bn/gcd.c +711 -0
 - data/third_party/boringssl/crypto/bn/generic.c +1019 -0
 - data/third_party/boringssl/crypto/bn/internal.h +294 -0
 - data/third_party/boringssl/crypto/bn/kronecker.c +175 -0
 - data/third_party/boringssl/crypto/bn/montgomery.c +561 -0
 - data/third_party/boringssl/crypto/bn/mul.c +888 -0
 - data/third_party/boringssl/crypto/bn/prime.c +845 -0
 - data/third_party/boringssl/crypto/bn/random.c +326 -0
 - data/third_party/boringssl/crypto/bn/rsaz_exp.c +326 -0
 - data/third_party/boringssl/crypto/bn/rsaz_exp.h +56 -0
 - data/third_party/boringssl/crypto/bn/shift.c +299 -0
 - data/third_party/boringssl/crypto/bn/sqrt.c +505 -0
 - data/third_party/boringssl/crypto/buf/buf.c +235 -0
 - data/third_party/boringssl/crypto/bytestring/ber.c +221 -0
 - data/third_party/boringssl/crypto/bytestring/cbb.c +411 -0
 - data/third_party/boringssl/crypto/bytestring/cbs.c +415 -0
 - data/third_party/boringssl/crypto/bytestring/internal.h +46 -0
 - data/third_party/boringssl/crypto/chacha/chacha_generic.c +140 -0
 - data/third_party/boringssl/crypto/chacha/chacha_vec.c +323 -0
 - data/third_party/boringssl/crypto/cipher/aead.c +167 -0
 - data/third_party/boringssl/crypto/cipher/cipher.c +652 -0
 - data/third_party/boringssl/crypto/cipher/derive_key.c +154 -0
 - data/third_party/boringssl/crypto/cipher/e_aes.c +1767 -0
 - data/third_party/boringssl/crypto/cipher/e_chacha20poly1305.c +311 -0
 - data/third_party/boringssl/crypto/cipher/e_des.c +207 -0
 - data/third_party/boringssl/crypto/cipher/e_null.c +85 -0
 - data/third_party/boringssl/crypto/cipher/e_rc2.c +443 -0
 - data/third_party/boringssl/crypto/cipher/e_rc4.c +87 -0
 - data/third_party/boringssl/crypto/cipher/e_ssl3.c +463 -0
 - data/third_party/boringssl/crypto/cipher/e_tls.c +673 -0
 - data/third_party/boringssl/crypto/cipher/internal.h +164 -0
 - data/third_party/boringssl/crypto/cipher/tls_cbc.c +495 -0
 - data/third_party/boringssl/crypto/cmac/cmac.c +239 -0
 - data/third_party/boringssl/crypto/conf/conf.c +778 -0
 - data/third_party/boringssl/crypto/conf/conf_def.h +127 -0
 - data/third_party/boringssl/crypto/conf/internal.h +31 -0
 - data/third_party/boringssl/crypto/cpu-arm.c +199 -0
 - data/third_party/boringssl/crypto/cpu-intel.c +261 -0
 - data/third_party/boringssl/crypto/crypto.c +140 -0
 - data/third_party/boringssl/crypto/curve25519/curve25519.c +4897 -0
 - data/third_party/boringssl/crypto/des/des.c +771 -0
 - data/third_party/boringssl/crypto/des/internal.h +212 -0
 - data/third_party/boringssl/crypto/dh/check.c +180 -0
 - data/third_party/boringssl/crypto/dh/dh.c +463 -0
 - data/third_party/boringssl/crypto/dh/dh_asn1.c +84 -0
 - data/third_party/boringssl/crypto/dh/internal.h +80 -0
 - data/third_party/boringssl/crypto/dh/params.c +301 -0
 - data/third_party/boringssl/crypto/digest/digest.c +248 -0
 - data/third_party/boringssl/crypto/digest/digests.c +321 -0
 - data/third_party/boringssl/crypto/digest/internal.h +112 -0
 - data/third_party/boringssl/crypto/digest/md32_common.h +322 -0
 - data/third_party/boringssl/crypto/directory.h +66 -0
 - data/third_party/boringssl/crypto/directory_posix.c +108 -0
 - data/third_party/boringssl/crypto/directory_win.c +144 -0
 - data/third_party/boringssl/crypto/dsa/dsa.c +908 -0
 - data/third_party/boringssl/crypto/dsa/dsa_asn1.c +150 -0
 - data/third_party/boringssl/crypto/dsa/internal.h +78 -0
 - data/third_party/boringssl/crypto/ec/ec.c +889 -0
 - data/third_party/boringssl/crypto/ec/ec_asn1.c +586 -0
 - data/third_party/boringssl/crypto/ec/ec_key.c +482 -0
 - data/third_party/boringssl/crypto/ec/ec_montgomery.c +280 -0
 - data/third_party/boringssl/crypto/ec/internal.h +318 -0
 - data/third_party/boringssl/crypto/ec/oct.c +416 -0
 - data/third_party/boringssl/crypto/ec/p224-64.c +1305 -0
 - data/third_party/boringssl/crypto/ec/p256-64.c +1878 -0
 - data/third_party/boringssl/crypto/ec/p256-x86_64-table.h +9548 -0
 - data/third_party/boringssl/crypto/ec/p256-x86_64.c +596 -0
 - data/third_party/boringssl/crypto/ec/simple.c +1313 -0
 - data/third_party/boringssl/crypto/ec/util-64.c +183 -0
 - data/third_party/boringssl/crypto/ec/wnaf.c +449 -0
 - data/third_party/boringssl/crypto/ecdh/ecdh.c +153 -0
 - data/third_party/boringssl/crypto/ecdsa/ecdsa.c +496 -0
 - data/third_party/boringssl/crypto/ecdsa/ecdsa_asn1.c +240 -0
 - data/third_party/boringssl/crypto/engine/engine.c +96 -0
 - data/third_party/boringssl/crypto/err/err.c +756 -0
 - data/third_party/boringssl/crypto/evp/algorithm.c +153 -0
 - data/third_party/boringssl/crypto/evp/digestsign.c +159 -0
 - data/third_party/boringssl/crypto/evp/evp.c +411 -0
 - data/third_party/boringssl/crypto/evp/evp_asn1.c +179 -0
 - data/third_party/boringssl/crypto/evp/evp_ctx.c +477 -0
 - data/third_party/boringssl/crypto/evp/internal.h +278 -0
 - data/third_party/boringssl/crypto/evp/p_dsa_asn1.c +588 -0
 - data/third_party/boringssl/crypto/evp/p_ec.c +283 -0
 - data/third_party/boringssl/crypto/evp/p_ec_asn1.c +562 -0
 - data/third_party/boringssl/crypto/evp/p_rsa.c +596 -0
 - data/third_party/boringssl/crypto/evp/p_rsa_asn1.c +737 -0
 - data/third_party/boringssl/crypto/evp/pbkdf.c +151 -0
 - data/third_party/boringssl/crypto/evp/sign.c +151 -0
 - data/third_party/boringssl/crypto/ex_data.c +294 -0
 - data/third_party/boringssl/crypto/hkdf/hkdf.c +89 -0
 - data/third_party/boringssl/crypto/hmac/hmac.c +213 -0
 - data/third_party/boringssl/crypto/internal.h +532 -0
 - data/third_party/boringssl/crypto/lhash/lhash.c +346 -0
 - data/third_party/boringssl/crypto/md4/md4.c +225 -0
 - data/third_party/boringssl/crypto/md5/md5.c +275 -0
 - data/third_party/boringssl/crypto/mem.c +200 -0
 - data/third_party/boringssl/crypto/modes/cbc.c +216 -0
 - data/third_party/boringssl/crypto/modes/cfb.c +231 -0
 - data/third_party/boringssl/crypto/modes/ctr.c +226 -0
 - data/third_party/boringssl/crypto/modes/gcm.c +1252 -0
 - data/third_party/boringssl/crypto/modes/internal.h +370 -0
 - data/third_party/boringssl/crypto/modes/ofb.c +108 -0
 - data/third_party/boringssl/crypto/obj/obj.c +664 -0
 - data/third_party/boringssl/crypto/obj/obj_dat.h +5257 -0
 - data/third_party/boringssl/crypto/obj/obj_xref.c +124 -0
 - data/third_party/boringssl/crypto/obj/obj_xref.h +96 -0
 - data/third_party/boringssl/crypto/pem/pem_all.c +281 -0
 - data/third_party/boringssl/crypto/pem/pem_info.c +404 -0
 - data/third_party/boringssl/crypto/pem/pem_lib.c +835 -0
 - data/third_party/boringssl/crypto/pem/pem_oth.c +89 -0
 - data/third_party/boringssl/crypto/pem/pem_pk8.c +244 -0
 - data/third_party/boringssl/crypto/pem/pem_pkey.c +312 -0
 - data/third_party/boringssl/crypto/pem/pem_x509.c +65 -0
 - data/third_party/boringssl/crypto/pem/pem_xaux.c +66 -0
 - data/third_party/boringssl/crypto/pkcs8/internal.h +83 -0
 - data/third_party/boringssl/crypto/pkcs8/p5_pbe.c +150 -0
 - data/third_party/boringssl/crypto/pkcs8/p5_pbev2.c +440 -0
 - data/third_party/boringssl/crypto/pkcs8/p8_pkey.c +85 -0
 - data/third_party/boringssl/crypto/pkcs8/pkcs8.c +1217 -0
 - data/third_party/boringssl/crypto/poly1305/poly1305.c +331 -0
 - data/third_party/boringssl/crypto/poly1305/poly1305_arm.c +301 -0
 - data/third_party/boringssl/crypto/poly1305/poly1305_vec.c +892 -0
 - data/third_party/boringssl/crypto/rand/internal.h +32 -0
 - data/third_party/boringssl/crypto/rand/rand.c +239 -0
 - data/third_party/boringssl/crypto/rand/urandom.c +223 -0
 - data/third_party/boringssl/crypto/rand/windows.c +56 -0
 - data/third_party/boringssl/crypto/rc4/rc4.c +283 -0
 - data/third_party/boringssl/crypto/refcount_c11.c +67 -0
 - data/third_party/boringssl/crypto/refcount_lock.c +53 -0
 - data/third_party/boringssl/crypto/rsa/blinding.c +462 -0
 - data/third_party/boringssl/crypto/rsa/internal.h +164 -0
 - data/third_party/boringssl/crypto/rsa/padding.c +711 -0
 - data/third_party/boringssl/crypto/rsa/rsa.c +808 -0
 - data/third_party/boringssl/crypto/rsa/rsa_asn1.c +473 -0
 - data/third_party/boringssl/crypto/rsa/rsa_impl.c +1138 -0
 - data/third_party/boringssl/crypto/sha/sha1.c +337 -0
 - data/third_party/boringssl/crypto/sha/sha256.c +327 -0
 - data/third_party/boringssl/crypto/sha/sha512.c +607 -0
 - data/third_party/boringssl/crypto/stack/stack.c +386 -0
 - data/third_party/boringssl/crypto/test/scoped_types.h +137 -0
 - data/third_party/boringssl/crypto/test/test_util.h +35 -0
 - data/third_party/boringssl/crypto/thread.c +101 -0
 - data/third_party/boringssl/crypto/thread_none.c +55 -0
 - data/third_party/boringssl/crypto/thread_pthread.c +167 -0
 - data/third_party/boringssl/crypto/thread_win.c +282 -0
 - data/third_party/boringssl/crypto/time_support.c +212 -0
 - data/third_party/boringssl/crypto/x509/a_digest.c +97 -0
 - data/third_party/boringssl/crypto/x509/a_sign.c +136 -0
 - data/third_party/boringssl/crypto/x509/a_strex.c +564 -0
 - data/third_party/boringssl/crypto/x509/a_verify.c +133 -0
 - data/third_party/boringssl/crypto/x509/asn1_gen.c +873 -0
 - data/third_party/boringssl/crypto/x509/by_dir.c +491 -0
 - data/third_party/boringssl/crypto/x509/by_file.c +295 -0
 - data/third_party/boringssl/crypto/x509/charmap.h +15 -0
 - data/third_party/boringssl/crypto/x509/i2d_pr.c +84 -0
 - data/third_party/boringssl/crypto/x509/pkcs7.c +353 -0
 - data/third_party/boringssl/crypto/x509/t_crl.c +129 -0
 - data/third_party/boringssl/crypto/x509/t_req.c +246 -0
 - data/third_party/boringssl/crypto/x509/t_x509.c +500 -0
 - data/third_party/boringssl/crypto/x509/t_x509a.c +109 -0
 - data/third_party/boringssl/crypto/x509/vpm_int.h +70 -0
 - data/third_party/boringssl/crypto/x509/x509.c +152 -0
 - data/third_party/boringssl/crypto/x509/x509_att.c +353 -0
 - data/third_party/boringssl/crypto/x509/x509_cmp.c +490 -0
 - data/third_party/boringssl/crypto/x509/x509_d2.c +105 -0
 - data/third_party/boringssl/crypto/x509/x509_def.c +88 -0
 - data/third_party/boringssl/crypto/x509/x509_ext.c +206 -0
 - data/third_party/boringssl/crypto/x509/x509_lu.c +738 -0
 - data/third_party/boringssl/crypto/x509/x509_obj.c +191 -0
 - data/third_party/boringssl/crypto/x509/x509_r2x.c +113 -0
 - data/third_party/boringssl/crypto/x509/x509_req.c +315 -0
 - data/third_party/boringssl/crypto/x509/x509_set.c +154 -0
 - data/third_party/boringssl/crypto/x509/x509_trs.c +304 -0
 - data/third_party/boringssl/crypto/x509/x509_txt.c +209 -0
 - data/third_party/boringssl/crypto/x509/x509_v3.c +271 -0
 - data/third_party/boringssl/crypto/x509/x509_vfy.c +2456 -0
 - data/third_party/boringssl/crypto/x509/x509_vpm.c +672 -0
 - data/third_party/boringssl/crypto/x509/x509cset.c +172 -0
 - data/third_party/boringssl/crypto/x509/x509name.c +381 -0
 - data/third_party/boringssl/crypto/x509/x509rset.c +80 -0
 - data/third_party/boringssl/crypto/x509/x509spki.c +135 -0
 - data/third_party/boringssl/crypto/x509/x509type.c +128 -0
 - data/third_party/boringssl/crypto/x509/x_algor.c +154 -0
 - data/third_party/boringssl/crypto/x509/x_all.c +547 -0
 - data/third_party/boringssl/crypto/x509/x_attrib.c +117 -0
 - data/third_party/boringssl/crypto/x509/x_crl.c +560 -0
 - data/third_party/boringssl/crypto/x509/x_exten.c +75 -0
 - data/third_party/boringssl/crypto/x509/x_info.c +95 -0
 - data/third_party/boringssl/crypto/x509/x_name.c +538 -0
 - data/third_party/boringssl/crypto/x509/x_pkey.c +100 -0
 - data/third_party/boringssl/crypto/x509/x_pubkey.c +384 -0
 - data/third_party/boringssl/crypto/x509/x_req.c +112 -0
 - data/third_party/boringssl/crypto/x509/x_sig.c +69 -0
 - data/third_party/boringssl/crypto/x509/x_spki.c +78 -0
 - data/third_party/boringssl/crypto/x509/x_val.c +69 -0
 - data/third_party/boringssl/crypto/x509/x_x509.c +227 -0
 - data/third_party/boringssl/crypto/x509/x_x509a.c +197 -0
 - data/third_party/boringssl/crypto/x509v3/ext_dat.h +129 -0
 - data/third_party/boringssl/crypto/x509v3/pcy_cache.c +299 -0
 - data/third_party/boringssl/crypto/x509v3/pcy_data.c +137 -0
 - data/third_party/boringssl/crypto/x509v3/pcy_int.h +212 -0
 - data/third_party/boringssl/crypto/x509v3/pcy_lib.c +165 -0
 - data/third_party/boringssl/crypto/x509v3/pcy_map.c +133 -0
 - data/third_party/boringssl/crypto/x509v3/pcy_node.c +197 -0
 - data/third_party/boringssl/crypto/x509v3/pcy_tree.c +876 -0
 - data/third_party/boringssl/crypto/x509v3/v3_akey.c +212 -0
 - data/third_party/boringssl/crypto/x509v3/v3_akeya.c +71 -0
 - data/third_party/boringssl/crypto/x509v3/v3_alt.c +622 -0
 - data/third_party/boringssl/crypto/x509v3/v3_bcons.c +126 -0
 - data/third_party/boringssl/crypto/x509v3/v3_bitst.c +141 -0
 - data/third_party/boringssl/crypto/x509v3/v3_conf.c +459 -0
 - data/third_party/boringssl/crypto/x509v3/v3_cpols.c +475 -0
 - data/third_party/boringssl/crypto/x509v3/v3_crld.c +616 -0
 - data/third_party/boringssl/crypto/x509v3/v3_enum.c +98 -0
 - data/third_party/boringssl/crypto/x509v3/v3_extku.c +145 -0
 - data/third_party/boringssl/crypto/x509v3/v3_genn.c +252 -0
 - data/third_party/boringssl/crypto/x509v3/v3_ia5.c +117 -0
 - data/third_party/boringssl/crypto/x509v3/v3_info.c +200 -0
 - data/third_party/boringssl/crypto/x509v3/v3_int.c +87 -0
 - data/third_party/boringssl/crypto/x509v3/v3_lib.c +335 -0
 - data/third_party/boringssl/crypto/x509v3/v3_ncons.c +510 -0
 - data/third_party/boringssl/crypto/x509v3/v3_pci.c +335 -0
 - data/third_party/boringssl/crypto/x509v3/v3_pcia.c +56 -0
 - data/third_party/boringssl/crypto/x509v3/v3_pcons.c +142 -0
 - data/third_party/boringssl/crypto/x509v3/v3_pku.c +109 -0
 - data/third_party/boringssl/crypto/x509v3/v3_pmaps.c +156 -0
 - data/third_party/boringssl/crypto/x509v3/v3_prn.c +207 -0
 - data/third_party/boringssl/crypto/x509v3/v3_purp.c +805 -0
 - data/third_party/boringssl/crypto/x509v3/v3_skey.c +148 -0
 - data/third_party/boringssl/crypto/x509v3/v3_sxnet.c +266 -0
 - data/third_party/boringssl/crypto/x509v3/v3_utl.c +1322 -0
 - data/third_party/boringssl/include/openssl/aead.h +346 -0
 - data/third_party/boringssl/include/openssl/aes.h +158 -0
 - data/third_party/boringssl/include/openssl/arm_arch.h +127 -0
 - data/third_party/boringssl/include/openssl/asn1.h +1168 -0
 - data/third_party/boringssl/include/openssl/asn1_mac.h +75 -0
 - data/third_party/boringssl/include/openssl/asn1t.h +906 -0
 - data/third_party/boringssl/include/openssl/base.h +261 -0
 - data/third_party/boringssl/include/openssl/base64.h +184 -0
 - data/third_party/boringssl/include/openssl/bio.h +902 -0
 - data/third_party/boringssl/include/openssl/blowfish.h +93 -0
 - data/third_party/boringssl/include/openssl/bn.h +885 -0
 - data/third_party/boringssl/include/openssl/buf.h +118 -0
 - data/third_party/boringssl/include/openssl/buffer.h +18 -0
 - data/third_party/boringssl/include/openssl/bytestring.h +360 -0
 - data/third_party/boringssl/include/openssl/cast.h +96 -0
 - data/third_party/boringssl/include/openssl/chacha.h +37 -0
 - data/third_party/boringssl/include/openssl/cipher.h +571 -0
 - data/third_party/boringssl/include/openssl/cmac.h +76 -0
 - data/third_party/boringssl/include/openssl/conf.h +145 -0
 - data/third_party/boringssl/include/openssl/cpu.h +184 -0
 - data/third_party/boringssl/include/openssl/crypto.h +68 -0
 - data/third_party/boringssl/include/openssl/curve25519.h +88 -0
 - data/third_party/boringssl/include/openssl/des.h +177 -0
 - data/third_party/boringssl/include/openssl/dh.h +238 -0
 - data/third_party/boringssl/include/openssl/digest.h +258 -0
 - data/third_party/boringssl/include/openssl/dsa.h +343 -0
 - data/third_party/boringssl/include/openssl/dtls1.h +16 -0
 - data/third_party/boringssl/include/openssl/ec.h +355 -0
 - data/third_party/boringssl/include/openssl/ec_key.h +280 -0
 - data/third_party/boringssl/include/openssl/ecdh.h +102 -0
 - data/third_party/boringssl/include/openssl/ecdsa.h +206 -0
 - data/third_party/boringssl/include/openssl/engine.h +98 -0
 - data/third_party/boringssl/include/openssl/err.h +487 -0
 - data/third_party/boringssl/include/openssl/evp.h +750 -0
 - data/third_party/boringssl/include/openssl/ex_data.h +213 -0
 - data/third_party/boringssl/include/openssl/hkdf.h +44 -0
 - data/third_party/boringssl/include/openssl/hmac.h +160 -0
 - data/third_party/boringssl/include/openssl/lhash.h +192 -0
 - data/third_party/boringssl/include/openssl/lhash_macros.h +132 -0
 - data/third_party/boringssl/include/openssl/md4.h +102 -0
 - data/third_party/boringssl/include/openssl/md5.h +107 -0
 - data/third_party/boringssl/include/openssl/mem.h +140 -0
 - data/third_party/boringssl/include/openssl/obj.h +198 -0
 - data/third_party/boringssl/include/openssl/obj_mac.h +4140 -0
 - data/third_party/boringssl/include/openssl/objects.h +18 -0
 - data/third_party/boringssl/include/openssl/opensslfeatures.h +60 -0
 - data/third_party/boringssl/include/openssl/opensslv.h +18 -0
 - data/third_party/boringssl/include/openssl/ossl_typ.h +18 -0
 - data/third_party/boringssl/include/openssl/pem.h +521 -0
 - data/third_party/boringssl/include/openssl/pkcs12.h +18 -0
 - data/third_party/boringssl/include/openssl/pkcs7.h +16 -0
 - data/third_party/boringssl/include/openssl/pkcs8.h +220 -0
 - data/third_party/boringssl/include/openssl/poly1305.h +51 -0
 - data/third_party/boringssl/include/openssl/pqueue.h +146 -0
 - data/third_party/boringssl/include/openssl/rand.h +113 -0
 - data/third_party/boringssl/include/openssl/rc4.h +90 -0
 - data/third_party/boringssl/include/openssl/rsa.h +637 -0
 - data/third_party/boringssl/include/openssl/safestack.h +16 -0
 - data/third_party/boringssl/include/openssl/sha.h +256 -0
 - data/third_party/boringssl/include/openssl/srtp.h +18 -0
 - data/third_party/boringssl/include/openssl/ssl.h +4466 -0
 - data/third_party/boringssl/include/openssl/ssl3.h +441 -0
 - data/third_party/boringssl/include/openssl/stack.h +298 -0
 - data/third_party/boringssl/include/openssl/stack_macros.h +4190 -0
 - data/third_party/boringssl/include/openssl/thread.h +173 -0
 - data/third_party/boringssl/include/openssl/time_support.h +90 -0
 - data/third_party/boringssl/include/openssl/tls1.h +653 -0
 - data/third_party/boringssl/include/openssl/type_check.h +91 -0
 - data/third_party/boringssl/include/openssl/x509.h +1258 -0
 - data/third_party/boringssl/include/openssl/x509_vfy.h +611 -0
 - data/third_party/boringssl/include/openssl/x509v3.h +798 -0
 - data/third_party/boringssl/ssl/custom_extensions.c +257 -0
 - data/third_party/boringssl/ssl/d1_both.c +880 -0
 - data/third_party/boringssl/ssl/d1_clnt.c +566 -0
 - data/third_party/boringssl/ssl/d1_lib.c +340 -0
 - data/third_party/boringssl/ssl/d1_meth.c +130 -0
 - data/third_party/boringssl/ssl/d1_pkt.c +578 -0
 - data/third_party/boringssl/ssl/d1_srtp.c +234 -0
 - data/third_party/boringssl/ssl/d1_srvr.c +485 -0
 - data/third_party/boringssl/ssl/dtls_record.c +308 -0
 - data/third_party/boringssl/ssl/internal.h +1276 -0
 - data/third_party/boringssl/ssl/pqueue/pqueue.c +197 -0
 - data/third_party/boringssl/ssl/s3_both.c +571 -0
 - data/third_party/boringssl/ssl/s3_clnt.c +2241 -0
 - data/third_party/boringssl/ssl/s3_enc.c +494 -0
 - data/third_party/boringssl/ssl/s3_lib.c +587 -0
 - data/third_party/boringssl/ssl/s3_meth.c +166 -0
 - data/third_party/boringssl/ssl/s3_pkt.c +732 -0
 - data/third_party/boringssl/ssl/s3_srvr.c +2536 -0
 - data/third_party/boringssl/ssl/ssl_aead_ctx.c +300 -0
 - data/third_party/boringssl/ssl/ssl_asn1.c +718 -0
 - data/third_party/boringssl/ssl/ssl_buffer.c +319 -0
 - data/third_party/boringssl/ssl/ssl_cert.c +539 -0
 - data/third_party/boringssl/ssl/ssl_cipher.c +2003 -0
 - data/third_party/boringssl/ssl/ssl_file.c +633 -0
 - data/third_party/boringssl/ssl/ssl_lib.c +2653 -0
 - data/third_party/boringssl/ssl/ssl_rsa.c +423 -0
 - data/third_party/boringssl/ssl/ssl_session.c +764 -0
 - data/third_party/boringssl/ssl/ssl_stat.c +591 -0
 - data/third_party/boringssl/ssl/t1_enc.c +708 -0
 - data/third_party/boringssl/ssl/t1_lib.c +2905 -0
 - data/third_party/boringssl/ssl/test/async_bio.h +45 -0
 - data/third_party/boringssl/ssl/test/packeted_bio.h +44 -0
 - data/third_party/boringssl/ssl/test/scoped_types.h +28 -0
 - data/third_party/boringssl/ssl/test/test_config.h +108 -0
 - data/third_party/boringssl/ssl/tls_record.c +342 -0
 - data/third_party/zlib/adler32.c +179 -0
 - data/third_party/zlib/compress.c +80 -0
 - data/third_party/zlib/crc32.c +425 -0
 - data/third_party/zlib/crc32.h +441 -0
 - data/third_party/zlib/deflate.c +1967 -0
 - data/third_party/zlib/deflate.h +346 -0
 - data/third_party/zlib/gzclose.c +25 -0
 - data/third_party/zlib/gzguts.h +209 -0
 - data/third_party/zlib/gzlib.c +634 -0
 - data/third_party/zlib/gzread.c +594 -0
 - data/third_party/zlib/gzwrite.c +577 -0
 - data/third_party/zlib/infback.c +640 -0
 - data/third_party/zlib/inffast.c +340 -0
 - data/third_party/zlib/inffast.h +11 -0
 - data/third_party/zlib/inffixed.h +94 -0
 - data/third_party/zlib/inflate.c +1512 -0
 - data/third_party/zlib/inflate.h +122 -0
 - data/third_party/zlib/inftrees.c +306 -0
 - data/third_party/zlib/inftrees.h +62 -0
 - data/third_party/zlib/trees.c +1226 -0
 - data/third_party/zlib/trees.h +128 -0
 - data/third_party/zlib/uncompr.c +59 -0
 - data/third_party/zlib/zconf.h +511 -0
 - data/third_party/zlib/zlib.h +1768 -0
 - data/third_party/zlib/zutil.c +324 -0
 - data/third_party/zlib/zutil.h +253 -0
 - metadata +492 -25
 - data/Rakefile +0 -63
 - data/src/ruby/lib/grpc/grpc.so +0 -0
 
| 
         @@ -0,0 +1,892 @@ 
     | 
|
| 
      
 1 
     | 
    
         
            +
            /* Copyright (c) 2014, Google Inc.
         
     | 
| 
      
 2 
     | 
    
         
            +
             *
         
     | 
| 
      
 3 
     | 
    
         
            +
             * Permission to use, copy, modify, and/or distribute this software for any
         
     | 
| 
      
 4 
     | 
    
         
            +
             * purpose with or without fee is hereby granted, provided that the above
         
     | 
| 
      
 5 
     | 
    
         
            +
             * copyright notice and this permission notice appear in all copies.
         
     | 
| 
      
 6 
     | 
    
         
            +
             *
         
     | 
| 
      
 7 
     | 
    
         
            +
             * THE SOFTWARE IS PROVIDED "AS IS" AND THE AUTHOR DISCLAIMS ALL WARRANTIES
         
     | 
| 
      
 8 
     | 
    
         
            +
             * WITH REGARD TO THIS SOFTWARE INCLUDING ALL IMPLIED WARRANTIES OF
         
     | 
| 
      
 9 
     | 
    
         
            +
             * MERCHANTABILITY AND FITNESS. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY
         
     | 
| 
      
 10 
     | 
    
         
            +
             * SPECIAL, DIRECT, INDIRECT, OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES
         
     | 
| 
      
 11 
     | 
    
         
            +
             * WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN AN ACTION
         
     | 
| 
      
 12 
     | 
    
         
            +
             * OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, ARISING OUT OF OR IN
         
     | 
| 
      
 13 
     | 
    
         
            +
             * CONNECTION WITH THE USE OR PERFORMANCE OF THIS SOFTWARE. */
         
     | 
| 
      
 14 
     | 
    
         
            +
             
     | 
| 
      
 15 
     | 
    
         
            +
            /* This implementation of poly1305 is by Andrew Moon
         
     | 
| 
      
 16 
     | 
    
         
            +
             * (https://github.com/floodyberry/poly1305-donna) and released as public
         
     | 
| 
      
 17 
     | 
    
         
            +
             * domain. It implements SIMD vectorization based on the algorithm described in
         
     | 
| 
      
 18 
     | 
    
         
            +
             * http://cr.yp.to/papers.html#neoncrypto. Unrolled to 2 powers, i.e. 64 byte
         
     | 
| 
      
 19 
     | 
    
         
            +
             * block size */
         
     | 
| 
      
 20 
     | 
    
         
            +
             
     | 
| 
      
 21 
     | 
    
         
            +
            #include <openssl/poly1305.h>
         
     | 
| 
      
 22 
     | 
    
         
            +
             
     | 
| 
      
 23 
     | 
    
         
            +
             
     | 
| 
      
 24 
     | 
    
         
            +
            #if !defined(OPENSSL_WINDOWS) && defined(OPENSSL_X86_64)
         
     | 
| 
      
 25 
     | 
    
         
            +
             
     | 
| 
      
 26 
     | 
    
         
            +
            #include <emmintrin.h>
         
     | 
| 
      
 27 
     | 
    
         
            +
             
     | 
| 
      
 28 
     | 
    
         
            +
            /* Requests x-byte alignment for the declaration it is attached to, using
             * the GCC/Clang attribute syntax. */
            #define ALIGN(x) __attribute__((aligned(x)))
         
     | 
| 
      
 29 
     | 
    
         
            +
            /* inline is not a keyword in C89. */
         
     | 
| 
      
 30 
     | 
    
         
            +
            /* Expands to nothing, so functions marked INLINE are plain static
             * functions. */
            #define INLINE 
         
     | 
| 
      
 31 
     | 
    
         
            +
            /* Reads a uint64_t directly from address m through a pointer cast; no byte
             * swapping or alignment handling is performed. */
            #define U8TO64_LE(m) (*(uint64_t *)(m))
         
     | 
| 
      
 32 
     | 
    
         
            +
            /* Reads a uint32_t directly from address m through a pointer cast; no byte
             * swapping or alignment handling is performed. */
            #define U8TO32_LE(m) (*(uint32_t *)(m))
         
     | 
| 
      
 33 
     | 
    
         
            +
            /* Stores the 64-bit value v at address m through a pointer cast (native
             * byte order; this file is only built for x86-64). Both the value and the
             * whole assignment are parenthesized so the macro stays a single expression
             * even when it is used inside a larger one. */
            #define U64TO8_LE(m, v) (*(uint64_t *)(m) = (v))
         
     | 
| 
      
 34 
     | 
    
         
            +
             
     | 
| 
      
 35 
     | 
    
         
            +
            /* Short alias for the SSE2 128-bit integer vector type. */
            typedef __m128i xmmi;
         
     | 
| 
      
 36 
     | 
    
         
            +
            /* 128-bit unsigned integer, built on the compiler's __int128 extension. */
            typedef unsigned __int128 uint128_t;
         
     | 
| 
      
 37 
     | 
    
         
            +
             
     | 
| 
      
 38 
     | 
    
         
            +
            /* 26-bit mask (0x3ffffff) in 32-bit elements 0 and 2; elements 1 and 3 are
             * zero. */
            static const uint32_t ALIGN(16) poly1305_x64_sse2_message_mask[4] = {
                0x3ffffff, 0, 0x3ffffff, 0};
         
     | 
| 
      
 40 
     | 
    
         
            +
            /* The constant 5 in 32-bit elements 0 and 2; elements 1 and 3 are zero. */
            static const uint32_t ALIGN(16) poly1305_x64_sse2_5[4] = {5, 0, 5, 0};
         
     | 
| 
      
 41 
     | 
    
         
            +
            /* The value 1 << 24 (0x1000000) in 32-bit elements 0 and 2; elements 1 and
             * 3 are zero. NOTE(review): going by the name, this is presumably bit 128
             * of a block expressed in the top 26-bit limb -- confirm against the
             * callers. */
            static const uint32_t ALIGN(16) poly1305_x64_sse2_1shl128[4] = {
                0x1000000, 0, 0x1000000, 0};
         
     | 
| 
      
 43 
     | 
    
         
            +
             
     | 
| 
      
 44 
     | 
    
         
            +
            /* Returns a + b; the sum wraps modulo 2^128. */
            static uint128_t INLINE add128(uint128_t a, uint128_t b) {
              const uint128_t sum = a + b;
              return sum;
            }
         
     | 
| 
      
 45 
     | 
    
         
            +
             
     | 
| 
      
 46 
     | 
    
         
            +
            /* Returns a + b, with the 64-bit |b| widened to 128 bits before the add. */
            static uint128_t INLINE add128_64(uint128_t a, uint64_t b) {
              const uint128_t widened = b;
              return a + widened;
            }
         
     | 
| 
      
 47 
     | 
    
         
            +
             
     | 
| 
      
 48 
     | 
    
         
            +
            /* Returns the full 128-bit product of the two 64-bit operands. */
            static uint128_t INLINE mul64x64_128(uint64_t a, uint64_t b) {
              uint128_t product = a;
              product *= b;
              return product;
            }
         
     | 
| 
      
 51 
     | 
    
         
            +
             
     | 
| 
      
 52 
     | 
    
         
            +
            /* Returns the low 64 bits of |a|. */
            static uint64_t INLINE lo128(uint128_t a) {
              const uint64_t low = (uint64_t)a;
              return low;
            }
         
     | 
| 
      
 53 
     | 
    
         
            +
             
     | 
| 
      
 54 
     | 
    
         
            +
            /* Shifts |v| right by |shift| bits and returns the low 64 bits of the
             * result. */
            static uint64_t INLINE shr128(uint128_t v, const int shift) {
              const uint128_t shifted = v >> shift;
              return (uint64_t)shifted;
            }
         
     | 
| 
      
 57 
     | 
    
         
            +
             
     | 
| 
      
 58 
     | 
    
         
            +
            /* Treats |hi|:|lo| as one 128-bit value, shifts it right by |shift| bits
             * and returns the low 64 bits of the result. */
            static uint64_t INLINE shr128_pair(uint64_t hi, uint64_t lo, const int shift) {
              uint128_t joined = hi;
              joined <<= 64;
              joined |= lo;
              return (uint64_t)(joined >> shift);
            }
         
     | 
| 
      
 61 
     | 
    
         
            +
             
     | 
| 
      
 62 
     | 
    
         
            +
            typedef struct poly1305_power_t {
         
     | 
| 
      
 63 
     | 
    
         
            +
              union {
         
     | 
| 
      
 64 
     | 
    
         
            +
                xmmi v;
         
     | 
| 
      
 65 
     | 
    
         
            +
                uint64_t u[2];
         
     | 
| 
      
 66 
     | 
    
         
            +
                uint32_t d[4];
         
     | 
| 
      
 67 
     | 
    
         
            +
              } R20, R21, R22, R23, R24, S21, S22, S23, S24;
         
     | 
| 
      
 68 
     | 
    
         
            +
            } poly1305_power;
         
     | 
| 
      
 69 
     | 
    
         
            +
             
     | 
| 
      
 70 
     | 
    
         
            +
            typedef struct poly1305_state_internal_t {
         
     | 
| 
      
 71 
     | 
    
         
            +
              poly1305_power P[2]; /* 288 bytes, top 32 bit halves unused = 144
         
     | 
| 
      
 72 
     | 
    
         
            +
                                      bytes of free storage */
         
     | 
| 
      
 73 
     | 
    
         
            +
              union {
         
     | 
| 
      
 74 
     | 
    
         
            +
                xmmi H[5]; /*  80 bytes  */
         
     | 
| 
      
 75 
     | 
    
         
            +
                uint64_t HH[10];
         
     | 
| 
      
 76 
     | 
    
         
            +
              };
         
     | 
| 
      
 77 
     | 
    
         
            +
              /* uint64_t r0,r1,r2;       [24 bytes] */
         
     | 
| 
      
 78 
     | 
    
         
            +
              /* uint64_t pad0,pad1;      [16 bytes] */
         
     | 
| 
      
 79 
     | 
    
         
            +
              uint64_t started;        /*   8 bytes  */
         
     | 
| 
      
 80 
     | 
    
         
            +
              uint64_t leftover;       /*   8 bytes  */
         
     | 
| 
      
 81 
     | 
    
         
            +
              uint8_t buffer[64];      /*  64 bytes  */
         
     | 
| 
      
 82 
     | 
    
         
            +
            } poly1305_state_internal; /* 448 bytes total + 63 bytes for
         
     | 
| 
      
 83 
     | 
    
         
            +
                                          alignment = 511 bytes raw */
         
     | 
| 
      
 84 
     | 
    
         
            +
             
     | 
| 
      
 85 
     | 
    
         
            +
            /* Rounds the address of |state| up to the next multiple of 64 and returns
             * it as the internal state; an already aligned address is returned
             * unchanged. */
            static poly1305_state_internal INLINE *poly1305_aligned_state(
                poly1305_state *state) {
              const uint64_t align_mask = 63;
              uint64_t addr = (uint64_t)state;

              addr = (addr + align_mask) & ~align_mask;
              return (poly1305_state_internal *)addr;
            }
         
     | 
| 
      
 89 
     | 
    
         
            +
             
     | 
| 
      
 90 
     | 
    
         
            +
            /* copy 0-63 bytes */
         
     | 
| 
      
 91 
     | 
    
         
            +
            static void INLINE
         
     | 
| 
      
 92 
     | 
    
         
            +
            poly1305_block_copy(uint8_t *dst, const uint8_t *src, size_t bytes) {
         
     | 
| 
      
 93 
     | 
    
         
            +
              size_t offset = src - dst;
         
     | 
| 
      
 94 
     | 
    
         
            +
              if (bytes & 32) {
         
     | 
| 
      
 95 
     | 
    
         
            +
                _mm_storeu_si128((xmmi *)(dst + 0),
         
     | 
| 
      
 96 
     | 
    
         
            +
                                 _mm_loadu_si128((xmmi *)(dst + offset + 0)));
         
     | 
| 
      
 97 
     | 
    
         
            +
                _mm_storeu_si128((xmmi *)(dst + 16),
         
     | 
| 
      
 98 
     | 
    
         
            +
                                 _mm_loadu_si128((xmmi *)(dst + offset + 16)));
         
     | 
| 
      
 99 
     | 
    
         
            +
                dst += 32;
         
     | 
| 
      
 100 
     | 
    
         
            +
              }
         
     | 
| 
      
 101 
     | 
    
         
            +
              if (bytes & 16) {
         
     | 
| 
      
 102 
     | 
    
         
            +
                _mm_storeu_si128((xmmi *)dst, _mm_loadu_si128((xmmi *)(dst + offset)));
         
     | 
| 
      
 103 
     | 
    
         
            +
                dst += 16;
         
     | 
| 
      
 104 
     | 
    
         
            +
              }
         
     | 
| 
      
 105 
     | 
    
         
            +
              if (bytes & 8) {
         
     | 
| 
      
 106 
     | 
    
         
            +
                *(uint64_t *)dst = *(uint64_t *)(dst + offset);
         
     | 
| 
      
 107 
     | 
    
         
            +
                dst += 8;
         
     | 
| 
      
 108 
     | 
    
         
            +
              }
         
     | 
| 
      
 109 
     | 
    
         
            +
              if (bytes & 4) {
         
     | 
| 
      
 110 
     | 
    
         
            +
                *(uint32_t *)dst = *(uint32_t *)(dst + offset);
         
     | 
| 
      
 111 
     | 
    
         
            +
                dst += 4;
         
     | 
| 
      
 112 
     | 
    
         
            +
              }
         
     | 
| 
      
 113 
     | 
    
         
            +
              if (bytes & 2) {
         
     | 
| 
      
 114 
     | 
    
         
            +
                *(uint16_t *)dst = *(uint16_t *)(dst + offset);
         
     | 
| 
      
 115 
     | 
    
         
            +
                dst += 2;
         
     | 
| 
      
 116 
     | 
    
         
            +
              }
         
     | 
| 
      
 117 
     | 
    
         
            +
              if (bytes & 1) {
         
     | 
| 
      
 118 
     | 
    
         
            +
                *(uint8_t *)dst = *(uint8_t *)(dst + offset);
         
     | 
| 
      
 119 
     | 
    
         
            +
              }
         
     | 
| 
      
 120 
     | 
    
         
            +
            }
         
     | 
| 
      
 121 
     | 
    
         
            +
             
     | 
| 
      
 122 
     | 
    
         
            +
            /* zero 0-15 bytes */
         
     | 
| 
      
 123 
     | 
    
         
            +
            static void INLINE poly1305_block_zero(uint8_t *dst, size_t bytes) {
         
     | 
| 
      
 124 
     | 
    
         
            +
              if (bytes & 8) {
         
     | 
| 
      
 125 
     | 
    
         
            +
                *(uint64_t *)dst = 0;
         
     | 
| 
      
 126 
     | 
    
         
            +
                dst += 8;
         
     | 
| 
      
 127 
     | 
    
         
            +
              }
         
     | 
| 
      
 128 
     | 
    
         
            +
              if (bytes & 4) {
         
     | 
| 
      
 129 
     | 
    
         
            +
                *(uint32_t *)dst = 0;
         
     | 
| 
      
 130 
     | 
    
         
            +
                dst += 4;
         
     | 
| 
      
 131 
     | 
    
         
            +
              }
         
     | 
| 
      
 132 
     | 
    
         
            +
              if (bytes & 2) {
         
     | 
| 
      
 133 
     | 
    
         
            +
                *(uint16_t *)dst = 0;
         
     | 
| 
      
 134 
     | 
    
         
            +
                dst += 2;
         
     | 
| 
      
 135 
     | 
    
         
            +
              }
         
     | 
| 
      
 136 
     | 
    
         
            +
              if (bytes & 1) {
         
     | 
| 
      
 137 
     | 
    
         
            +
                *(uint8_t *)dst = 0;
         
     | 
| 
      
 138 
     | 
    
         
            +
              }
         
     | 
| 
      
 139 
     | 
    
         
            +
            }
         
     | 
| 
      
 140 
     | 
    
         
            +
             
     | 
| 
      
 141 
     | 
    
         
            +
            /* Returns the smaller of |a| and |b| (|b| when they are equal). */
            static size_t INLINE poly1305_min(size_t a, size_t b) {
              if (a < b) {
                return a;
              }
              return b;
            }
         
     | 
| 
      
 144 
     | 
    
         
            +
             
     | 
| 
      
 145 
     | 
    
         
            +
            /* Prepares |state| for a new MAC computation with the 32-byte |key|.
             *
             * The first 16 key bytes are masked ("clamped") and split into three limbs
             * taken at bit offsets 0, 44 and 88. The last 16 key bytes are kept as the
             * pad. Both are parked in the odd 32-bit words of st->P[1]. The accumulator
             * H is zeroed and the |started| and |leftover| fields are reset to 0. */
            void CRYPTO_poly1305_init(poly1305_state *state, const uint8_t key[32]) {
              poly1305_state_internal *st = poly1305_aligned_state(state);
              poly1305_power *slot = &st->P[1];
              uint64_t key_lo, key_hi;
              uint64_t limb0, limb1, limb2;
              size_t i;

              /* clamp key */
              key_lo = U8TO64_LE(key + 0);
              key_hi = U8TO64_LE(key + 8);
              limb0 = key_lo & 0xffc0fffffff;
              limb1 = ((key_lo >> 44) | (key_hi << 20)) & 0xfffffc0ffff;
              limb2 = (key_hi >> 24) & 0x00ffffffc0f;

              /* r goes into the otherwise unused odd words of st->P[1] */
              slot->R20.d[1] = (uint32_t)limb0;
              slot->R20.d[3] = (uint32_t)(limb0 >> 32);
              slot->R21.d[1] = (uint32_t)limb1;
              slot->R21.d[3] = (uint32_t)(limb1 >> 32);
              slot->R22.d[1] = (uint32_t)limb2;
              slot->R22.d[3] = (uint32_t)(limb2 >> 32);

              /* pad: key bytes 16..31, one 32-bit word at a time */
              slot->R23.d[1] = U8TO32_LE(key + 16);
              slot->R23.d[3] = U8TO32_LE(key + 20);
              slot->R24.d[1] = U8TO32_LE(key + 24);
              slot->R24.d[3] = U8TO32_LE(key + 28);

              /* H = 0 */
              for (i = 0; i < 5; i++) {
                st->H[i] = _mm_setzero_si128();
              }

              st->started = 0;
              st->leftover = 0;
            }
         
     | 
| 
      
 186 
     | 
    
         
            +
             
     | 
| 
      
 187 
     | 
    
         
            +
            static void poly1305_first_block(poly1305_state_internal *st,
         
     | 
| 
      
 188 
     | 
    
         
            +
                                             const uint8_t *m) {
         
     | 
| 
      
 189 
     | 
    
         
            +
              const xmmi MMASK = _mm_load_si128((xmmi *)poly1305_x64_sse2_message_mask);
         
     | 
| 
      
 190 
     | 
    
         
            +
              const xmmi FIVE = _mm_load_si128((xmmi *)poly1305_x64_sse2_5);
         
     | 
| 
      
 191 
     | 
    
         
            +
              const xmmi HIBIT = _mm_load_si128((xmmi *)poly1305_x64_sse2_1shl128);
         
     | 
| 
      
 192 
     | 
    
         
            +
              xmmi T5, T6;
         
     | 
| 
      
 193 
     | 
    
         
            +
              poly1305_power *p;
         
     | 
| 
      
 194 
     | 
    
         
            +
              uint128_t d[3];
         
     | 
| 
      
 195 
     | 
    
         
            +
              uint64_t r0, r1, r2;
         
     | 
| 
      
 196 
     | 
    
         
            +
              uint64_t r20, r21, r22, s22;
         
     | 
| 
      
 197 
     | 
    
         
            +
              uint64_t pad0, pad1;
         
     | 
| 
      
 198 
     | 
    
         
            +
              uint64_t c;
         
     | 
| 
      
 199 
     | 
    
         
            +
              uint64_t i;
         
     | 
| 
      
 200 
     | 
    
         
            +
             
     | 
| 
      
 201 
     | 
    
         
            +
              /* pull out stored info */
         
     | 
| 
      
 202 
     | 
    
         
            +
              p = &st->P[1];
         
     | 
| 
      
 203 
     | 
    
         
            +
             
     | 
| 
      
 204 
     | 
    
         
            +
              r0 = ((uint64_t)p->R20.d[3] << 32) | (uint64_t)p->R20.d[1];
         
     | 
| 
      
 205 
     | 
    
         
            +
              r1 = ((uint64_t)p->R21.d[3] << 32) | (uint64_t)p->R21.d[1];
         
     | 
| 
      
 206 
     | 
    
         
            +
              r2 = ((uint64_t)p->R22.d[3] << 32) | (uint64_t)p->R22.d[1];
         
     | 
| 
      
 207 
     | 
    
         
            +
              pad0 = ((uint64_t)p->R23.d[3] << 32) | (uint64_t)p->R23.d[1];
         
     | 
| 
      
 208 
     | 
    
         
            +
              pad1 = ((uint64_t)p->R24.d[3] << 32) | (uint64_t)p->R24.d[1];
         
     | 
| 
      
 209 
     | 
    
         
            +
             
     | 
| 
      
 210 
     | 
    
         
            +
              /* compute powers r^2,r^4 */
         
     | 
| 
      
 211 
     | 
    
         
            +
              r20 = r0;
         
     | 
| 
      
 212 
     | 
    
         
            +
              r21 = r1;
         
     | 
| 
      
 213 
     | 
    
         
            +
              r22 = r2;
         
     | 
| 
      
 214 
     | 
    
         
            +
              for (i = 0; i < 2; i++) {
         
     | 
| 
      
 215 
     | 
    
         
            +
                s22 = r22 * (5 << 2);
         
     | 
| 
      
 216 
     | 
    
         
            +
             
     | 
| 
      
 217 
     | 
    
         
            +
                d[0] = add128(mul64x64_128(r20, r20), mul64x64_128(r21 * 2, s22));
         
     | 
| 
      
 218 
     | 
    
         
            +
                d[1] = add128(mul64x64_128(r22, s22), mul64x64_128(r20 * 2, r21));
         
     | 
| 
      
 219 
     | 
    
         
            +
                d[2] = add128(mul64x64_128(r21, r21), mul64x64_128(r22 * 2, r20));
         
     | 
| 
      
 220 
     | 
    
         
            +
             
     | 
| 
      
 221 
     | 
    
         
            +
                r20 = lo128(d[0]) & 0xfffffffffff;
         
     | 
| 
      
 222 
     | 
    
         
            +
                c = shr128(d[0], 44);
         
     | 
| 
      
 223 
     | 
    
         
            +
                d[1] = add128_64(d[1], c);
         
     | 
| 
      
 224 
     | 
    
         
            +
                r21 = lo128(d[1]) & 0xfffffffffff;
         
     | 
| 
      
 225 
     | 
    
         
            +
                c = shr128(d[1], 44);
         
     | 
| 
      
 226 
     | 
    
         
            +
                d[2] = add128_64(d[2], c);
         
     | 
| 
      
 227 
     | 
    
         
            +
                r22 = lo128(d[2]) & 0x3ffffffffff;
         
     | 
| 
      
 228 
     | 
    
         
            +
                c = shr128(d[2], 42);
         
     | 
| 
      
 229 
     | 
    
         
            +
                r20 += c * 5;
         
     | 
| 
      
 230 
     | 
    
         
            +
                c = (r20 >> 44);
         
     | 
| 
      
 231 
     | 
    
         
            +
                r20 = r20 & 0xfffffffffff;
         
     | 
| 
      
 232 
     | 
    
         
            +
                r21 += c;
         
     | 
| 
      
 233 
     | 
    
         
            +
             
     | 
| 
      
 234 
     | 
    
         
            +
                p->R20.v = _mm_shuffle_epi32(_mm_cvtsi32_si128((uint32_t)(r20)&0x3ffffff),
         
     | 
| 
      
 235 
     | 
    
         
            +
                                             _MM_SHUFFLE(1, 0, 1, 0));
         
     | 
| 
      
 236 
     | 
    
         
            +
                p->R21.v = _mm_shuffle_epi32(
         
     | 
| 
      
 237 
     | 
    
         
            +
                    _mm_cvtsi32_si128((uint32_t)((r20 >> 26) | (r21 << 18)) & 0x3ffffff),
         
     | 
| 
      
 238 
     | 
    
         
            +
                    _MM_SHUFFLE(1, 0, 1, 0));
         
     | 
| 
      
 239 
     | 
    
         
            +
                p->R22.v =
         
     | 
| 
      
 240 
     | 
    
         
            +
                    _mm_shuffle_epi32(_mm_cvtsi32_si128((uint32_t)((r21 >> 8)) & 0x3ffffff),
         
     | 
| 
      
 241 
     | 
    
         
            +
                                      _MM_SHUFFLE(1, 0, 1, 0));
         
     | 
| 
      
 242 
     | 
    
         
            +
                p->R23.v = _mm_shuffle_epi32(
         
     | 
| 
      
 243 
     | 
    
         
            +
                    _mm_cvtsi32_si128((uint32_t)((r21 >> 34) | (r22 << 10)) & 0x3ffffff),
         
     | 
| 
      
 244 
     | 
    
         
            +
                    _MM_SHUFFLE(1, 0, 1, 0));
         
     | 
| 
      
 245 
     | 
    
         
            +
                p->R24.v = _mm_shuffle_epi32(_mm_cvtsi32_si128((uint32_t)((r22 >> 16))),
         
     | 
| 
      
 246 
     | 
    
         
            +
                                             _MM_SHUFFLE(1, 0, 1, 0));
         
     | 
| 
      
 247 
     | 
    
         
            +
                p->S21.v = _mm_mul_epu32(p->R21.v, FIVE);
         
     | 
| 
      
 248 
     | 
    
         
            +
                p->S22.v = _mm_mul_epu32(p->R22.v, FIVE);
         
     | 
| 
      
 249 
     | 
    
         
            +
                p->S23.v = _mm_mul_epu32(p->R23.v, FIVE);
         
     | 
| 
      
 250 
     | 
    
         
            +
                p->S24.v = _mm_mul_epu32(p->R24.v, FIVE);
         
     | 
| 
      
 251 
     | 
    
         
            +
                p--;
         
     | 
| 
      
 252 
     | 
    
         
            +
              }
         
     | 
| 
      
 253 
     | 
    
         
            +
             
     | 
| 
      
 254 
     | 
    
         
            +
              /* put saved info back */
         
     | 
| 
      
 255 
     | 
    
         
            +
              p = &st->P[1];
         
     | 
| 
      
 256 
     | 
    
         
            +
              p->R20.d[1] = (uint32_t)(r0);
         
     | 
| 
      
 257 
     | 
    
         
            +
              p->R20.d[3] = (uint32_t)(r0 >> 32);
         
     | 
| 
      
 258 
     | 
    
         
            +
              p->R21.d[1] = (uint32_t)(r1);
         
     | 
| 
      
 259 
     | 
    
         
            +
              p->R21.d[3] = (uint32_t)(r1 >> 32);
         
     | 
| 
      
 260 
     | 
    
         
            +
              p->R22.d[1] = (uint32_t)(r2);
         
     | 
| 
      
 261 
     | 
    
         
            +
              p->R22.d[3] = (uint32_t)(r2 >> 32);
         
     | 
| 
      
 262 
     | 
    
         
            +
              p->R23.d[1] = (uint32_t)(pad0);
         
     | 
| 
      
 263 
     | 
    
         
            +
              p->R23.d[3] = (uint32_t)(pad0 >> 32);
         
     | 
| 
      
 264 
     | 
    
         
            +
              p->R24.d[1] = (uint32_t)(pad1);
         
     | 
| 
      
 265 
     | 
    
         
            +
              p->R24.d[3] = (uint32_t)(pad1 >> 32);
         
     | 
| 
      
 266 
     | 
    
         
            +
             
     | 
| 
      
 267 
     | 
    
         
            +
              /* H = [Mx,My] */
         
     | 
| 
      
 268 
     | 
    
         
            +
              T5 = _mm_unpacklo_epi64(_mm_loadl_epi64((xmmi *)(m + 0)),
         
     | 
| 
      
 269 
     | 
    
         
            +
                                      _mm_loadl_epi64((xmmi *)(m + 16)));
         
     | 
| 
      
 270 
     | 
    
         
            +
              T6 = _mm_unpacklo_epi64(_mm_loadl_epi64((xmmi *)(m + 8)),
         
     | 
| 
      
 271 
     | 
    
         
            +
                                      _mm_loadl_epi64((xmmi *)(m + 24)));
         
     | 
| 
      
 272 
     | 
    
         
            +
              st->H[0] = _mm_and_si128(MMASK, T5);
         
     | 
| 
      
 273 
     | 
    
         
            +
              st->H[1] = _mm_and_si128(MMASK, _mm_srli_epi64(T5, 26));
         
     | 
| 
      
 274 
     | 
    
         
            +
              T5 = _mm_or_si128(_mm_srli_epi64(T5, 52), _mm_slli_epi64(T6, 12));
         
     | 
| 
      
 275 
     | 
    
         
            +
              st->H[2] = _mm_and_si128(MMASK, T5);
         
     | 
| 
      
 276 
     | 
    
         
            +
              st->H[3] = _mm_and_si128(MMASK, _mm_srli_epi64(T5, 26));
         
     | 
| 
      
 277 
     | 
    
         
            +
              st->H[4] = _mm_or_si128(_mm_srli_epi64(T6, 40), HIBIT);
         
     | 
| 
      
 278 
     | 
    
         
            +
            }
         
     | 
| 
      
 279 
     | 
    
         
            +
             
     | 
| 
      
 280 
     | 
    
         
            +
            /*
             * Absorb message data into the two-lane accumulator st->H, 64 bytes (four
             * 16-byte blocks) per loop iteration.
             *
             * Each xmmi value holds two 64-bit lanes; every limb of the accumulator,
             * message and key powers lives in the low 32 bits of a lane so that
             * _mm_mul_epu32 yields two independent 64-bit products.
             *
             * Per iteration, following the original step comments:
             *   H = H * [r^4,r^4] + [Mx,My] * [r^2,r^2] + [Mx,My]
             * where the first [Mx,My] is read from m[0..31] and the second from
             * m[32..63].  st->P[0] supplies the table used for the "r^4" step and
             * st->P[1] the table used for the "r^2" step.  In those tables the S2x
             * entries are the R2x entries multiplied by FIVE (see the power-table
             * setup earlier in this file); they carry the wrap-around terms of the
             * limb product.
             *
             * st    - internal state; st->H is read on entry and written back on exit,
             *         st->P[0] and st->P[1] are only read.
             * m     - message bytes; only read (unaligned 8-byte loads).
             * bytes - number of bytes available at m.  Only whole 64-byte groups are
             *         consumed; any remainder (< 64 bytes) is left untouched and is not
             *         reported back, so the caller must account for it itself.
             *
             * NOTE(review): MMASK is presumably the 26-bit limb mask and HIBIT the
             * 2^128 padding bit expressed in limb 4 -- both tables are defined outside
             * this block; confirm against their definitions.  _mm_load_si128 requires
             * those tables to be 16-byte aligned.
             */
            static void poly1305_blocks(poly1305_state_internal *st, const uint8_t *m,
                                        size_t bytes) {
              /* The constant tables and the message are only read, so keep the const
               * qualifier in the casts (both load intrinsics take `__m128i const *`). */
              const xmmi MMASK =
                  _mm_load_si128((const xmmi *)poly1305_x64_sse2_message_mask);
              const xmmi FIVE = _mm_load_si128((const xmmi *)poly1305_x64_sse2_5);
              const xmmi HIBIT = _mm_load_si128((const xmmi *)poly1305_x64_sse2_1shl128);

              poly1305_power *p;
              xmmi H0, H1, H2, H3, H4;
              xmmi T0, T1, T2, T3, T4, T5, T6;
              xmmi M0, M1, M2, M3, M4;
              xmmi C1, C2;

              /* Work on local copies of the accumulator limbs; stored back at the end. */
              H0 = st->H[0];
              H1 = st->H[1];
              H2 = st->H[2];
              H3 = st->H[3];
              H4 = st->H[4];

              while (bytes >= 64) {
                /* H *= [r^4,r^4] */
                p = &st->P[0];
                T0 = _mm_mul_epu32(H0, p->R20.v);
                T1 = _mm_mul_epu32(H0, p->R21.v);
                T2 = _mm_mul_epu32(H0, p->R22.v);
                T3 = _mm_mul_epu32(H0, p->R23.v);
                T4 = _mm_mul_epu32(H0, p->R24.v);
                T5 = _mm_mul_epu32(H1, p->S24.v);
                T6 = _mm_mul_epu32(H1, p->R20.v);
                T0 = _mm_add_epi64(T0, T5);
                T1 = _mm_add_epi64(T1, T6);
                T5 = _mm_mul_epu32(H2, p->S23.v);
                T6 = _mm_mul_epu32(H2, p->S24.v);
                T0 = _mm_add_epi64(T0, T5);
                T1 = _mm_add_epi64(T1, T6);
                T5 = _mm_mul_epu32(H3, p->S22.v);
                T6 = _mm_mul_epu32(H3, p->S23.v);
                T0 = _mm_add_epi64(T0, T5);
                T1 = _mm_add_epi64(T1, T6);
                T5 = _mm_mul_epu32(H4, p->S21.v);
                T6 = _mm_mul_epu32(H4, p->S22.v);
                T0 = _mm_add_epi64(T0, T5);
                T1 = _mm_add_epi64(T1, T6);
                T5 = _mm_mul_epu32(H1, p->R21.v);
                T6 = _mm_mul_epu32(H1, p->R22.v);
                T2 = _mm_add_epi64(T2, T5);
                T3 = _mm_add_epi64(T3, T6);
                T5 = _mm_mul_epu32(H2, p->R20.v);
                T6 = _mm_mul_epu32(H2, p->R21.v);
                T2 = _mm_add_epi64(T2, T5);
                T3 = _mm_add_epi64(T3, T6);
                T5 = _mm_mul_epu32(H3, p->S24.v);
                T6 = _mm_mul_epu32(H3, p->R20.v);
                T2 = _mm_add_epi64(T2, T5);
                T3 = _mm_add_epi64(T3, T6);
                T5 = _mm_mul_epu32(H4, p->S23.v);
                T6 = _mm_mul_epu32(H4, p->S24.v);
                T2 = _mm_add_epi64(T2, T5);
                T3 = _mm_add_epi64(T3, T6);
                T5 = _mm_mul_epu32(H1, p->R23.v);
                T4 = _mm_add_epi64(T4, T5);
                T5 = _mm_mul_epu32(H2, p->R22.v);
                T4 = _mm_add_epi64(T4, T5);
                T5 = _mm_mul_epu32(H3, p->R21.v);
                T4 = _mm_add_epi64(T4, T5);
                T5 = _mm_mul_epu32(H4, p->R20.v);
                T4 = _mm_add_epi64(T4, T5);

                /* H += [Mx,My]*[r^2,r^2] */
                /* Lane 0 takes the block at m[0..15], lane 1 the block at m[16..31]:
                 * T5 holds the low 8 bytes of each block, T6 the high 8 bytes. */
                T5 = _mm_unpacklo_epi64(_mm_loadl_epi64((const xmmi *)(m + 0)),
                                        _mm_loadl_epi64((const xmmi *)(m + 16)));
                T6 = _mm_unpacklo_epi64(_mm_loadl_epi64((const xmmi *)(m + 8)),
                                        _mm_loadl_epi64((const xmmi *)(m + 24)));
                /* Split each 128-bit block into five limbs at bit offsets
                 * 0, 26, 52, 78 and 104; HIBIT is OR-ed into the top limb. */
                M0 = _mm_and_si128(MMASK, T5);
                M1 = _mm_and_si128(MMASK, _mm_srli_epi64(T5, 26));
                T5 = _mm_or_si128(_mm_srli_epi64(T5, 52), _mm_slli_epi64(T6, 12));
                M2 = _mm_and_si128(MMASK, T5);
                M3 = _mm_and_si128(MMASK, _mm_srli_epi64(T5, 26));
                M4 = _mm_or_si128(_mm_srli_epi64(T6, 40), HIBIT);

                p = &st->P[1];
                T5 = _mm_mul_epu32(M0, p->R20.v);
                T6 = _mm_mul_epu32(M0, p->R21.v);
                T0 = _mm_add_epi64(T0, T5);
                T1 = _mm_add_epi64(T1, T6);
                T5 = _mm_mul_epu32(M1, p->S24.v);
                T6 = _mm_mul_epu32(M1, p->R20.v);
                T0 = _mm_add_epi64(T0, T5);
                T1 = _mm_add_epi64(T1, T6);
                T5 = _mm_mul_epu32(M2, p->S23.v);
                T6 = _mm_mul_epu32(M2, p->S24.v);
                T0 = _mm_add_epi64(T0, T5);
                T1 = _mm_add_epi64(T1, T6);
                T5 = _mm_mul_epu32(M3, p->S22.v);
                T6 = _mm_mul_epu32(M3, p->S23.v);
                T0 = _mm_add_epi64(T0, T5);
                T1 = _mm_add_epi64(T1, T6);
                T5 = _mm_mul_epu32(M4, p->S21.v);
                T6 = _mm_mul_epu32(M4, p->S22.v);
                T0 = _mm_add_epi64(T0, T5);
                T1 = _mm_add_epi64(T1, T6);
                T5 = _mm_mul_epu32(M0, p->R22.v);
                T6 = _mm_mul_epu32(M0, p->R23.v);
                T2 = _mm_add_epi64(T2, T5);
                T3 = _mm_add_epi64(T3, T6);
                T5 = _mm_mul_epu32(M1, p->R21.v);
                T6 = _mm_mul_epu32(M1, p->R22.v);
                T2 = _mm_add_epi64(T2, T5);
                T3 = _mm_add_epi64(T3, T6);
                T5 = _mm_mul_epu32(M2, p->R20.v);
                T6 = _mm_mul_epu32(M2, p->R21.v);
                T2 = _mm_add_epi64(T2, T5);
                T3 = _mm_add_epi64(T3, T6);
                T5 = _mm_mul_epu32(M3, p->S24.v);
                T6 = _mm_mul_epu32(M3, p->R20.v);
                T2 = _mm_add_epi64(T2, T5);
                T3 = _mm_add_epi64(T3, T6);
                T5 = _mm_mul_epu32(M4, p->S23.v);
                T6 = _mm_mul_epu32(M4, p->S24.v);
                T2 = _mm_add_epi64(T2, T5);
                T3 = _mm_add_epi64(T3, T6);
                T5 = _mm_mul_epu32(M0, p->R24.v);
                T4 = _mm_add_epi64(T4, T5);
                T5 = _mm_mul_epu32(M1, p->R23.v);
                T4 = _mm_add_epi64(T4, T5);
                T5 = _mm_mul_epu32(M2, p->R22.v);
                T4 = _mm_add_epi64(T4, T5);
                T5 = _mm_mul_epu32(M3, p->R21.v);
                T4 = _mm_add_epi64(T4, T5);
                T5 = _mm_mul_epu32(M4, p->R20.v);
                T4 = _mm_add_epi64(T4, T5);

                /* H += [Mx,My] */
                /* Same limb split as above, for the blocks at m[32..47] (lane 0)
                 * and m[48..63] (lane 1); these are added without a multiply. */
                T5 = _mm_unpacklo_epi64(_mm_loadl_epi64((const xmmi *)(m + 32)),
                                        _mm_loadl_epi64((const xmmi *)(m + 48)));
                T6 = _mm_unpacklo_epi64(_mm_loadl_epi64((const xmmi *)(m + 40)),
                                        _mm_loadl_epi64((const xmmi *)(m + 56)));
                M0 = _mm_and_si128(MMASK, T5);
                M1 = _mm_and_si128(MMASK, _mm_srli_epi64(T5, 26));
                T5 = _mm_or_si128(_mm_srli_epi64(T5, 52), _mm_slli_epi64(T6, 12));
                M2 = _mm_and_si128(MMASK, T5);
                M3 = _mm_and_si128(MMASK, _mm_srli_epi64(T5, 26));
                M4 = _mm_or_si128(_mm_srli_epi64(T6, 40), HIBIT);

                T0 = _mm_add_epi64(T0, M0);
                T1 = _mm_add_epi64(T1, M1);
                T2 = _mm_add_epi64(T2, M2);
                T3 = _mm_add_epi64(T3, M3);
                T4 = _mm_add_epi64(T4, M4);

                /* reduce */
                /* Two interleaved carry chains (T0->T1->T2->T3->T4 and
                 * T3->T4->T0->T1).  The carry out of the top limb T4 is multiplied
                 * by FIVE before being added to T0. */
                C1 = _mm_srli_epi64(T0, 26);
                C2 = _mm_srli_epi64(T3, 26);
                T0 = _mm_and_si128(T0, MMASK);
                T3 = _mm_and_si128(T3, MMASK);
                T1 = _mm_add_epi64(T1, C1);
                T4 = _mm_add_epi64(T4, C2);
                C1 = _mm_srli_epi64(T1, 26);
                C2 = _mm_srli_epi64(T4, 26);
                T1 = _mm_and_si128(T1, MMASK);
                T4 = _mm_and_si128(T4, MMASK);
                T2 = _mm_add_epi64(T2, C1);
                T0 = _mm_add_epi64(T0, _mm_mul_epu32(C2, FIVE));
                C1 = _mm_srli_epi64(T2, 26);
                C2 = _mm_srli_epi64(T0, 26);
                T2 = _mm_and_si128(T2, MMASK);
                T0 = _mm_and_si128(T0, MMASK);
                T3 = _mm_add_epi64(T3, C1);
                T1 = _mm_add_epi64(T1, C2);
                C1 = _mm_srli_epi64(T3, 26);
                T3 = _mm_and_si128(T3, MMASK);
                T4 = _mm_add_epi64(T4, C1);

                /* H = (H*[r^4,r^4] + [Mx,My]*[r^2,r^2] + [Mx,My]) */
                H0 = T0;
                H1 = T1;
                H2 = T2;
                H3 = T3;
                H4 = T4;

                m += 64;
                bytes -= 64;
              }

              /* Publish the updated accumulator. */
              st->H[0] = H0;
              st->H[1] = H1;
              st->H[2] = H2;
              st->H[3] = H3;
              st->H[4] = H4;
            }
         
     | 
| 
      
 469 
     | 
    
         
            +
             
     | 
| 
      
 470 
     | 
    
         
            +
            static size_t poly1305_combine(poly1305_state_internal *st, const uint8_t *m,
         
     | 
| 
      
 471 
     | 
    
         
            +
                                           size_t bytes) {
         
     | 
| 
      
 472 
     | 
    
         
            +
              const xmmi MMASK = _mm_load_si128((xmmi *)poly1305_x64_sse2_message_mask);
         
     | 
| 
      
 473 
     | 
    
         
            +
              const xmmi HIBIT = _mm_load_si128((xmmi *)poly1305_x64_sse2_1shl128);
         
     | 
| 
      
 474 
     | 
    
         
            +
              const xmmi FIVE = _mm_load_si128((xmmi *)poly1305_x64_sse2_5);
         
     | 
| 
      
 475 
     | 
    
         
            +
             
     | 
| 
      
 476 
     | 
    
         
            +
              poly1305_power *p;
         
     | 
| 
      
 477 
     | 
    
         
            +
              xmmi H0, H1, H2, H3, H4;
         
     | 
| 
      
 478 
     | 
    
         
            +
              xmmi M0, M1, M2, M3, M4;
         
     | 
| 
      
 479 
     | 
    
         
            +
              xmmi T0, T1, T2, T3, T4, T5, T6;
         
     | 
| 
      
 480 
     | 
    
         
            +
              xmmi C1, C2;
         
     | 
| 
      
 481 
     | 
    
         
            +
             
     | 
| 
      
 482 
     | 
    
         
            +
              uint64_t r0, r1, r2;
         
     | 
| 
      
 483 
     | 
    
         
            +
              uint64_t t0, t1, t2, t3, t4;
         
     | 
| 
      
 484 
     | 
    
         
            +
              uint64_t c;
         
     | 
| 
      
 485 
     | 
    
         
            +
              size_t consumed = 0;
         
     | 
| 
      
 486 
     | 
    
         
            +
             
     | 
| 
      
 487 
     | 
    
         
            +
              H0 = st->H[0];
         
     | 
| 
      
 488 
     | 
    
         
            +
              H1 = st->H[1];
         
     | 
| 
      
 489 
     | 
    
         
            +
              H2 = st->H[2];
         
     | 
| 
      
 490 
     | 
    
         
            +
              H3 = st->H[3];
         
     | 
| 
      
 491 
     | 
    
         
            +
              H4 = st->H[4];
         
     | 
| 
      
 492 
     | 
    
         
            +
             
     | 
| 
      
 493 
     | 
    
         
            +
              /* p = [r^2,r^2] */
         
     | 
| 
      
 494 
     | 
    
         
            +
              p = &st->P[1];
         
     | 
| 
      
 495 
     | 
    
         
            +
             
     | 
| 
      
 496 
     | 
    
         
            +
              if (bytes >= 32) {
         
     | 
| 
      
 497 
     | 
    
         
            +
                /* H *= [r^2,r^2] */
         
     | 
| 
      
 498 
     | 
    
         
            +
                T0 = _mm_mul_epu32(H0, p->R20.v);
         
     | 
| 
      
 499 
     | 
    
         
            +
                T1 = _mm_mul_epu32(H0, p->R21.v);
         
     | 
| 
      
 500 
     | 
    
         
            +
                T2 = _mm_mul_epu32(H0, p->R22.v);
         
     | 
| 
      
 501 
     | 
    
         
            +
                T3 = _mm_mul_epu32(H0, p->R23.v);
         
     | 
| 
      
 502 
     | 
    
         
            +
                T4 = _mm_mul_epu32(H0, p->R24.v);
         
     | 
| 
      
 503 
     | 
    
         
            +
                T5 = _mm_mul_epu32(H1, p->S24.v);
         
     | 
| 
      
 504 
     | 
    
         
            +
                T6 = _mm_mul_epu32(H1, p->R20.v);
         
     | 
| 
      
 505 
     | 
    
         
            +
                T0 = _mm_add_epi64(T0, T5);
         
     | 
| 
      
 506 
     | 
    
         
            +
                T1 = _mm_add_epi64(T1, T6);
         
     | 
| 
      
 507 
     | 
    
         
            +
                T5 = _mm_mul_epu32(H2, p->S23.v);
         
     | 
| 
      
 508 
     | 
    
         
            +
                T6 = _mm_mul_epu32(H2, p->S24.v);
         
     | 
| 
      
 509 
     | 
    
         
            +
                T0 = _mm_add_epi64(T0, T5);
         
     | 
| 
      
 510 
     | 
    
         
            +
                T1 = _mm_add_epi64(T1, T6);
         
     | 
| 
      
 511 
     | 
    
         
            +
                T5 = _mm_mul_epu32(H3, p->S22.v);
         
     | 
| 
      
 512 
     | 
    
         
            +
                T6 = _mm_mul_epu32(H3, p->S23.v);
         
     | 
| 
      
 513 
     | 
    
         
            +
                T0 = _mm_add_epi64(T0, T5);
         
     | 
| 
      
 514 
     | 
    
         
            +
                T1 = _mm_add_epi64(T1, T6);
         
     | 
| 
      
 515 
     | 
    
         
            +
                T5 = _mm_mul_epu32(H4, p->S21.v);
         
     | 
| 
      
 516 
     | 
    
         
            +
                T6 = _mm_mul_epu32(H4, p->S22.v);
         
     | 
| 
      
 517 
     | 
    
         
            +
                T0 = _mm_add_epi64(T0, T5);
         
     | 
| 
      
 518 
     | 
    
         
            +
                T1 = _mm_add_epi64(T1, T6);
         
     | 
| 
      
 519 
     | 
    
         
            +
                T5 = _mm_mul_epu32(H1, p->R21.v);
         
     | 
| 
      
 520 
     | 
    
         
            +
                T6 = _mm_mul_epu32(H1, p->R22.v);
         
     | 
| 
      
 521 
     | 
    
         
            +
                T2 = _mm_add_epi64(T2, T5);
         
     | 
| 
      
 522 
     | 
    
         
            +
                T3 = _mm_add_epi64(T3, T6);
         
     | 
| 
      
 523 
     | 
    
         
            +
                T5 = _mm_mul_epu32(H2, p->R20.v);
         
     | 
| 
      
 524 
     | 
    
         
            +
                T6 = _mm_mul_epu32(H2, p->R21.v);
         
     | 
| 
      
 525 
     | 
    
         
            +
                T2 = _mm_add_epi64(T2, T5);
         
     | 
| 
      
 526 
     | 
    
         
            +
                T3 = _mm_add_epi64(T3, T6);
         
     | 
| 
      
 527 
     | 
    
         
            +
                T5 = _mm_mul_epu32(H3, p->S24.v);
         
     | 
| 
      
 528 
     | 
    
         
            +
                T6 = _mm_mul_epu32(H3, p->R20.v);
         
     | 
| 
      
 529 
     | 
    
         
            +
                T2 = _mm_add_epi64(T2, T5);
         
     | 
| 
      
 530 
     | 
    
         
            +
                T3 = _mm_add_epi64(T3, T6);
         
     | 
| 
      
 531 
     | 
    
         
            +
                T5 = _mm_mul_epu32(H4, p->S23.v);
         
     | 
| 
      
 532 
     | 
    
         
            +
                T6 = _mm_mul_epu32(H4, p->S24.v);
         
     | 
| 
      
 533 
     | 
    
         
            +
                T2 = _mm_add_epi64(T2, T5);
         
     | 
| 
      
 534 
     | 
    
         
            +
                T3 = _mm_add_epi64(T3, T6);
         
     | 
| 
      
 535 
     | 
    
         
            +
                T5 = _mm_mul_epu32(H1, p->R23.v);
         
     | 
| 
      
 536 
     | 
    
         
            +
                T4 = _mm_add_epi64(T4, T5);
         
     | 
| 
      
 537 
     | 
    
         
            +
                T5 = _mm_mul_epu32(H2, p->R22.v);
         
     | 
| 
      
 538 
     | 
    
         
            +
                T4 = _mm_add_epi64(T4, T5);
         
     | 
| 
      
 539 
     | 
    
         
            +
                T5 = _mm_mul_epu32(H3, p->R21.v);
         
     | 
| 
      
 540 
     | 
    
         
            +
                T4 = _mm_add_epi64(T4, T5);
         
     | 
| 
      
 541 
     | 
    
         
            +
                T5 = _mm_mul_epu32(H4, p->R20.v);
         
     | 
| 
      
 542 
     | 
    
         
            +
                T4 = _mm_add_epi64(T4, T5);
         
     | 
| 
      
 543 
     | 
    
         
            +
             
     | 
| 
      
 544 
     | 
    
         
            +
                /* H += [Mx,My] */
         
     | 
| 
      
 545 
     | 
    
         
            +
                T5 = _mm_unpacklo_epi64(_mm_loadl_epi64((xmmi *)(m + 0)),
         
     | 
| 
      
 546 
     | 
    
         
            +
                                        _mm_loadl_epi64((xmmi *)(m + 16)));
         
     | 
| 
      
 547 
     | 
    
         
            +
                T6 = _mm_unpacklo_epi64(_mm_loadl_epi64((xmmi *)(m + 8)),
         
     | 
| 
      
 548 
     | 
    
         
            +
                                        _mm_loadl_epi64((xmmi *)(m + 24)));
         
     | 
| 
      
 549 
     | 
    
         
            +
                M0 = _mm_and_si128(MMASK, T5);
         
     | 
| 
      
 550 
     | 
    
         
            +
                M1 = _mm_and_si128(MMASK, _mm_srli_epi64(T5, 26));
         
     | 
| 
      
 551 
     | 
    
         
            +
                T5 = _mm_or_si128(_mm_srli_epi64(T5, 52), _mm_slli_epi64(T6, 12));
         
     | 
| 
      
 552 
     | 
    
         
            +
                M2 = _mm_and_si128(MMASK, T5);
         
     | 
| 
      
 553 
     | 
    
         
            +
                M3 = _mm_and_si128(MMASK, _mm_srli_epi64(T5, 26));
         
     | 
| 
      
 554 
     | 
    
         
            +
                M4 = _mm_or_si128(_mm_srli_epi64(T6, 40), HIBIT);
         
     | 
| 
      
 555 
     | 
    
         
            +
             
     | 
| 
      
 556 
     | 
    
         
            +
                T0 = _mm_add_epi64(T0, M0);
         
     | 
| 
      
 557 
     | 
    
         
            +
                T1 = _mm_add_epi64(T1, M1);
         
     | 
| 
      
 558 
     | 
    
         
            +
                T2 = _mm_add_epi64(T2, M2);
         
     | 
| 
      
 559 
     | 
    
         
            +
                T3 = _mm_add_epi64(T3, M3);
         
     | 
| 
      
 560 
     | 
    
         
            +
                T4 = _mm_add_epi64(T4, M4);
         
     | 
| 
      
 561 
     | 
    
         
            +
             
     | 
| 
      
 562 
     | 
    
         
            +
                /* reduce */
         
     | 
| 
      
 563 
     | 
    
         
            +
                C1 = _mm_srli_epi64(T0, 26);
         
     | 
| 
      
 564 
     | 
    
         
            +
                C2 = _mm_srli_epi64(T3, 26);
         
     | 
| 
      
 565 
     | 
    
         
            +
                T0 = _mm_and_si128(T0, MMASK);
         
     | 
| 
      
 566 
     | 
    
         
            +
                T3 = _mm_and_si128(T3, MMASK);
         
     | 
| 
      
 567 
     | 
    
         
            +
                T1 = _mm_add_epi64(T1, C1);
         
     | 
| 
      
 568 
     | 
    
         
            +
                T4 = _mm_add_epi64(T4, C2);
         
     | 
| 
      
 569 
     | 
    
         
            +
                C1 = _mm_srli_epi64(T1, 26);
         
     | 
| 
      
 570 
     | 
    
         
            +
                C2 = _mm_srli_epi64(T4, 26);
         
     | 
| 
      
 571 
     | 
    
         
            +
                T1 = _mm_and_si128(T1, MMASK);
         
     | 
| 
      
 572 
     | 
    
         
            +
                T4 = _mm_and_si128(T4, MMASK);
         
     | 
| 
      
 573 
     | 
    
         
            +
                T2 = _mm_add_epi64(T2, C1);
         
     | 
| 
      
 574 
     | 
    
         
            +
                T0 = _mm_add_epi64(T0, _mm_mul_epu32(C2, FIVE));
         
     | 
| 
      
 575 
     | 
    
         
            +
                C1 = _mm_srli_epi64(T2, 26);
         
     | 
| 
      
 576 
     | 
    
         
            +
                C2 = _mm_srli_epi64(T0, 26);
         
     | 
| 
      
 577 
     | 
    
         
            +
                T2 = _mm_and_si128(T2, MMASK);
         
     | 
| 
      
 578 
     | 
    
         
            +
                T0 = _mm_and_si128(T0, MMASK);
         
     | 
| 
      
 579 
     | 
    
         
            +
                T3 = _mm_add_epi64(T3, C1);
         
     | 
| 
      
 580 
     | 
    
         
            +
                T1 = _mm_add_epi64(T1, C2);
         
     | 
| 
      
 581 
     | 
    
         
            +
                C1 = _mm_srli_epi64(T3, 26);
         
     | 
| 
      
 582 
     | 
    
         
            +
                T3 = _mm_and_si128(T3, MMASK);
         
     | 
| 
      
 583 
     | 
    
         
            +
                T4 = _mm_add_epi64(T4, C1);
         
     | 
| 
      
 584 
     | 
    
         
            +
             
     | 
| 
      
 585 
     | 
    
         
            +
                /* H = (H*[r^2,r^2] + [Mx,My]) */
         
     | 
| 
      
 586 
     | 
    
         
            +
                H0 = T0;
         
     | 
| 
      
 587 
     | 
    
         
            +
                H1 = T1;
         
     | 
| 
      
 588 
     | 
    
         
            +
                H2 = T2;
         
     | 
| 
      
 589 
     | 
    
         
            +
                H3 = T3;
         
     | 
| 
      
 590 
     | 
    
         
            +
                H4 = T4;
         
     | 
| 
      
 591 
     | 
    
         
            +
             
     | 
| 
      
 592 
     | 
    
         
            +
                consumed = 32;
         
     | 
| 
      
 593 
     | 
    
         
            +
              }
         
     | 
| 
      
 594 
     | 
    
         
            +
             
     | 
| 
      
 595 
     | 
    
         
            +
              /* finalize, H *= [r^2,r] */
         
     | 
| 
      
 596 
     | 
    
         
            +
              r0 = ((uint64_t)p->R20.d[3] << 32) | (uint64_t)p->R20.d[1];
         
     | 
| 
      
 597 
     | 
    
         
            +
              r1 = ((uint64_t)p->R21.d[3] << 32) | (uint64_t)p->R21.d[1];
         
     | 
| 
      
 598 
     | 
    
         
            +
              r2 = ((uint64_t)p->R22.d[3] << 32) | (uint64_t)p->R22.d[1];
         
     | 
| 
      
 599 
     | 
    
         
            +
             
     | 
| 
      
 600 
     | 
    
         
            +
              p->R20.d[2] = (uint32_t)(r0)&0x3ffffff;
         
     | 
| 
      
 601 
     | 
    
         
            +
              p->R21.d[2] = (uint32_t)((r0 >> 26) | (r1 << 18)) & 0x3ffffff;
         
     | 
| 
      
 602 
     | 
    
         
            +
              p->R22.d[2] = (uint32_t)((r1 >> 8)) & 0x3ffffff;
         
     | 
| 
      
 603 
     | 
    
         
            +
              p->R23.d[2] = (uint32_t)((r1 >> 34) | (r2 << 10)) & 0x3ffffff;
         
     | 
| 
      
 604 
     | 
    
         
            +
              p->R24.d[2] = (uint32_t)((r2 >> 16));
         
     | 
| 
      
 605 
     | 
    
         
            +
              p->S21.d[2] = p->R21.d[2] * 5;
         
     | 
| 
      
 606 
     | 
    
         
            +
              p->S22.d[2] = p->R22.d[2] * 5;
         
     | 
| 
      
 607 
     | 
    
         
            +
              p->S23.d[2] = p->R23.d[2] * 5;
         
     | 
| 
      
 608 
     | 
    
         
            +
              p->S24.d[2] = p->R24.d[2] * 5;
         
     | 
| 
      
 609 
     | 
    
         
            +
             
     | 
| 
      
 610 
     | 
    
         
            +
              /* H *= [r^2,r] */
         
     | 
| 
      
 611 
     | 
    
         
            +
              T0 = _mm_mul_epu32(H0, p->R20.v);
         
     | 
| 
      
 612 
     | 
    
         
            +
              T1 = _mm_mul_epu32(H0, p->R21.v);
         
     | 
| 
      
 613 
     | 
    
         
            +
              T2 = _mm_mul_epu32(H0, p->R22.v);
         
     | 
| 
      
 614 
     | 
    
         
            +
              T3 = _mm_mul_epu32(H0, p->R23.v);
         
     | 
| 
      
 615 
     | 
    
         
            +
              T4 = _mm_mul_epu32(H0, p->R24.v);
         
     | 
| 
      
 616 
     | 
    
         
            +
              T5 = _mm_mul_epu32(H1, p->S24.v);
         
     | 
| 
      
 617 
     | 
    
         
            +
              T6 = _mm_mul_epu32(H1, p->R20.v);
         
     | 
| 
      
 618 
     | 
    
         
            +
              T0 = _mm_add_epi64(T0, T5);
         
     | 
| 
      
 619 
     | 
    
         
            +
              T1 = _mm_add_epi64(T1, T6);
         
     | 
| 
      
 620 
     | 
    
         
            +
              T5 = _mm_mul_epu32(H2, p->S23.v);
         
     | 
| 
      
 621 
     | 
    
         
            +
              T6 = _mm_mul_epu32(H2, p->S24.v);
         
     | 
| 
      
 622 
     | 
    
         
            +
              T0 = _mm_add_epi64(T0, T5);
         
     | 
| 
      
 623 
     | 
    
         
            +
              T1 = _mm_add_epi64(T1, T6);
         
     | 
| 
      
 624 
     | 
    
         
            +
              T5 = _mm_mul_epu32(H3, p->S22.v);
         
     | 
| 
      
 625 
     | 
    
         
            +
              T6 = _mm_mul_epu32(H3, p->S23.v);
         
     | 
| 
      
 626 
     | 
    
         
            +
              T0 = _mm_add_epi64(T0, T5);
         
     | 
| 
      
 627 
     | 
    
         
            +
              T1 = _mm_add_epi64(T1, T6);
         
     | 
| 
      
 628 
     | 
    
         
            +
              T5 = _mm_mul_epu32(H4, p->S21.v);
         
     | 
| 
      
 629 
     | 
    
         
            +
              T6 = _mm_mul_epu32(H4, p->S22.v);
         
     | 
| 
      
 630 
     | 
    
         
            +
              T0 = _mm_add_epi64(T0, T5);
         
     | 
| 
      
 631 
     | 
    
         
            +
              T1 = _mm_add_epi64(T1, T6);
         
     | 
| 
      
 632 
     | 
    
         
            +
              T5 = _mm_mul_epu32(H1, p->R21.v);
         
     | 
| 
      
 633 
     | 
    
         
            +
              T6 = _mm_mul_epu32(H1, p->R22.v);
         
     | 
| 
      
 634 
     | 
    
         
            +
              T2 = _mm_add_epi64(T2, T5);
         
     | 
| 
      
 635 
     | 
    
         
            +
              T3 = _mm_add_epi64(T3, T6);
         
     | 
| 
      
 636 
     | 
    
         
            +
              T5 = _mm_mul_epu32(H2, p->R20.v);
         
     | 
| 
      
 637 
     | 
    
         
            +
              T6 = _mm_mul_epu32(H2, p->R21.v);
         
     | 
| 
      
 638 
     | 
    
         
            +
              T2 = _mm_add_epi64(T2, T5);
         
     | 
| 
      
 639 
     | 
    
         
            +
              T3 = _mm_add_epi64(T3, T6);
         
     | 
| 
      
 640 
     | 
    
         
            +
              T5 = _mm_mul_epu32(H3, p->S24.v);
         
     | 
| 
      
 641 
     | 
    
         
            +
              T6 = _mm_mul_epu32(H3, p->R20.v);
         
     | 
| 
      
 642 
     | 
    
         
            +
              T2 = _mm_add_epi64(T2, T5);
         
     | 
| 
      
 643 
     | 
    
         
            +
              T3 = _mm_add_epi64(T3, T6);
         
     | 
| 
      
 644 
     | 
    
         
            +
              T5 = _mm_mul_epu32(H4, p->S23.v);
         
     | 
| 
      
 645 
     | 
    
         
            +
              T6 = _mm_mul_epu32(H4, p->S24.v);
         
     | 
| 
      
 646 
     | 
    
         
            +
              T2 = _mm_add_epi64(T2, T5);
         
     | 
| 
      
 647 
     | 
    
         
            +
              T3 = _mm_add_epi64(T3, T6);
         
     | 
| 
      
 648 
     | 
    
         
            +
              T5 = _mm_mul_epu32(H1, p->R23.v);
         
     | 
| 
      
 649 
     | 
    
         
            +
              T4 = _mm_add_epi64(T4, T5);
         
     | 
| 
      
 650 
     | 
    
         
            +
              T5 = _mm_mul_epu32(H2, p->R22.v);
         
     | 
| 
      
 651 
     | 
    
         
            +
              T4 = _mm_add_epi64(T4, T5);
         
     | 
| 
      
 652 
     | 
    
         
            +
              T5 = _mm_mul_epu32(H3, p->R21.v);
         
     | 
| 
      
 653 
     | 
    
         
            +
              T4 = _mm_add_epi64(T4, T5);
         
     | 
| 
      
 654 
     | 
    
         
            +
              T5 = _mm_mul_epu32(H4, p->R20.v);
         
     | 
| 
      
 655 
     | 
    
         
            +
              T4 = _mm_add_epi64(T4, T5);
         
     | 
| 
      
 656 
     | 
    
         
            +
             
     | 
| 
      
 657 
     | 
    
         
            +
              C1 = _mm_srli_epi64(T0, 26);
         
     | 
| 
      
 658 
     | 
    
         
            +
              C2 = _mm_srli_epi64(T3, 26);
         
     | 
| 
      
 659 
     | 
    
         
            +
              T0 = _mm_and_si128(T0, MMASK);
         
     | 
| 
      
 660 
     | 
    
         
            +
              T3 = _mm_and_si128(T3, MMASK);
         
     | 
| 
      
 661 
     | 
    
         
            +
              T1 = _mm_add_epi64(T1, C1);
         
     | 
| 
      
 662 
     | 
    
         
            +
              T4 = _mm_add_epi64(T4, C2);
         
     | 
| 
      
 663 
     | 
    
         
            +
              C1 = _mm_srli_epi64(T1, 26);
         
     | 
| 
      
 664 
     | 
    
         
            +
              C2 = _mm_srli_epi64(T4, 26);
         
     | 
| 
      
 665 
     | 
    
         
            +
              T1 = _mm_and_si128(T1, MMASK);
         
     | 
| 
      
 666 
     | 
    
         
            +
              T4 = _mm_and_si128(T4, MMASK);
         
     | 
| 
      
 667 
     | 
    
         
            +
              T2 = _mm_add_epi64(T2, C1);
         
     | 
| 
      
 668 
     | 
    
         
            +
              T0 = _mm_add_epi64(T0, _mm_mul_epu32(C2, FIVE));
         
     | 
| 
      
 669 
     | 
    
         
            +
              C1 = _mm_srli_epi64(T2, 26);
         
     | 
| 
      
 670 
     | 
    
         
            +
              C2 = _mm_srli_epi64(T0, 26);
         
     | 
| 
      
 671 
     | 
    
         
            +
              T2 = _mm_and_si128(T2, MMASK);
         
     | 
| 
      
 672 
     | 
    
         
            +
              T0 = _mm_and_si128(T0, MMASK);
         
     | 
| 
      
 673 
     | 
    
         
            +
              T3 = _mm_add_epi64(T3, C1);
         
     | 
| 
      
 674 
     | 
    
         
            +
              T1 = _mm_add_epi64(T1, C2);
         
     | 
| 
      
 675 
     | 
    
         
            +
              C1 = _mm_srli_epi64(T3, 26);
         
     | 
| 
      
 676 
     | 
    
         
            +
              T3 = _mm_and_si128(T3, MMASK);
         
     | 
| 
      
 677 
     | 
    
         
            +
              T4 = _mm_add_epi64(T4, C1);
         
     | 
| 
      
 678 
     | 
    
         
            +
             
     | 
| 
      
 679 
     | 
    
         
            +
              /* H = H[0]+H[1] */
         
     | 
| 
      
 680 
     | 
    
         
            +
              H0 = _mm_add_epi64(T0, _mm_srli_si128(T0, 8));
         
     | 
| 
      
 681 
     | 
    
         
            +
              H1 = _mm_add_epi64(T1, _mm_srli_si128(T1, 8));
         
     | 
| 
      
 682 
     | 
    
         
            +
              H2 = _mm_add_epi64(T2, _mm_srli_si128(T2, 8));
         
     | 
| 
      
 683 
     | 
    
         
            +
              H3 = _mm_add_epi64(T3, _mm_srli_si128(T3, 8));
         
     | 
| 
      
 684 
     | 
    
         
            +
              H4 = _mm_add_epi64(T4, _mm_srli_si128(T4, 8));
         
     | 
| 
      
 685 
     | 
    
         
            +
             
     | 
| 
      
 686 
     | 
    
         
            +
              t0 = _mm_cvtsi128_si32(H0);
         
     | 
| 
      
 687 
     | 
    
         
            +
              c = (t0 >> 26);
         
     | 
| 
      
 688 
     | 
    
         
            +
              t0 &= 0x3ffffff;
         
     | 
| 
      
 689 
     | 
    
         
            +
              t1 = _mm_cvtsi128_si32(H1) + c;
         
     | 
| 
      
 690 
     | 
    
         
            +
              c = (t1 >> 26);
         
     | 
| 
      
 691 
     | 
    
         
            +
              t1 &= 0x3ffffff;
         
     | 
| 
      
 692 
     | 
    
         
            +
              t2 = _mm_cvtsi128_si32(H2) + c;
         
     | 
| 
      
 693 
     | 
    
         
            +
              c = (t2 >> 26);
         
     | 
| 
      
 694 
     | 
    
         
            +
              t2 &= 0x3ffffff;
         
     | 
| 
      
 695 
     | 
    
         
            +
              t3 = _mm_cvtsi128_si32(H3) + c;
         
     | 
| 
      
 696 
     | 
    
         
            +
              c = (t3 >> 26);
         
     | 
| 
      
 697 
     | 
    
         
            +
              t3 &= 0x3ffffff;
         
     | 
| 
      
 698 
     | 
    
         
            +
              t4 = _mm_cvtsi128_si32(H4) + c;
         
     | 
| 
      
 699 
     | 
    
         
            +
              c = (t4 >> 26);
         
     | 
| 
      
 700 
     | 
    
         
            +
              t4 &= 0x3ffffff;
         
     | 
| 
      
 701 
     | 
    
         
            +
              t0 = t0 + (c * 5);
         
     | 
| 
      
 702 
     | 
    
         
            +
              c = (t0 >> 26);
         
     | 
| 
      
 703 
     | 
    
         
            +
              t0 &= 0x3ffffff;
         
     | 
| 
      
 704 
     | 
    
         
            +
              t1 = t1 + c;
         
     | 
| 
      
 705 
     | 
    
         
            +
             
     | 
| 
      
 706 
     | 
    
         
            +
              st->HH[0] = ((t0) | (t1 << 26)) & 0xfffffffffffull;
         
     | 
| 
      
 707 
     | 
    
         
            +
              st->HH[1] = ((t1 >> 18) | (t2 << 8) | (t3 << 34)) & 0xfffffffffffull;
         
     | 
| 
      
 708 
     | 
    
         
            +
              st->HH[2] = ((t3 >> 10) | (t4 << 16)) & 0x3ffffffffffull;
         
     | 
| 
      
 709 
     | 
    
         
            +
             
     | 
| 
      
 710 
     | 
    
         
            +
              return consumed;
         
     | 
| 
      
 711 
     | 
    
         
            +
            }
         
     | 
| 
      
 712 
     | 
    
         
            +
             
     | 
| 
      
 713 
     | 
    
         
            +
            /* Feed |bytes| bytes starting at |m| into the Poly1305 state |state|.
             *
             * The input is consumed in three stages:
             *   1. Until the state is marked started, input is gathered until a 32-byte
             *      block can be handed to poly1305_first_block(). That only happens when
             *      strictly more input follows those 32 bytes; otherwise the data just
             *      stays in st->buffer and the function returns.
             *   2. Once started, any bytes already sitting in st->buffer are topped up
             *      to 64 and passed to poly1305_blocks().
             *   3. Remaining whole multiples of 64 bytes go to poly1305_blocks()
             *      straight from |m|; whatever is left is stored in st->buffer and
             *      counted in st->leftover for a later call.
             *
             * NOTE(review): presumably the "more than 32 bytes" rule exists so that
             * CRYPTO_poly1305_finish always has trailing data to process after the
             * first block -- confirm against poly1305_combine. */
            void CRYPTO_poly1305_update(poly1305_state *state, const uint8_t *m,
                                        size_t bytes) {
              poly1305_state_internal *st = poly1305_aligned_state(state);

              /* Stage 1: prime the state with its first 32-byte block. */
              if (!st->started) {
                if ((st->leftover != 0) || (bytes <= 32)) {
                  /* Either a partial block is already buffered or the caller has not
                   * supplied more than 32 bytes: accumulate in st->buffer first. */
                  size_t fill = poly1305_min(32 - st->leftover, bytes);

                  poly1305_block_copy(st->buffer + st->leftover, m, fill);
                  m += fill;
                  bytes -= fill;
                  st->leftover += fill;

                  /* Stop unless the buffer holds a full 32 bytes AND more input
                   * remains after it. */
                  if ((bytes == 0) || (st->leftover < 32)) {
                    return;
                  }

                  poly1305_first_block(st, st->buffer);
                  st->leftover = 0;
                } else {
                  /* Nothing buffered and plenty of input: use the caller's bytes
                   * directly. */
                  poly1305_first_block(st, m);
                  m += 32;
                  bytes -= 32;
                }

                st->started = 1;
              }

              /* Stage 2: complete a partially filled 64-byte buffer. */
              if (st->leftover) {
                size_t fill = poly1305_min(64 - st->leftover, bytes);

                poly1305_block_copy(st->buffer + st->leftover, m, fill);
                m += fill;
                bytes -= fill;
                st->leftover += fill;

                if (st->leftover < 64) {
                  return; /* still short of a full 64 bytes; wait for more input */
                }

                poly1305_blocks(st, st->buffer, 64);
                st->leftover = 0;
              }

              /* Stage 3a: bulk-process every whole 64-byte block in place. */
              if (bytes >= 64) {
                size_t whole = bytes & ~(size_t)63; /* round down to a multiple of 64 */

                poly1305_blocks(st, m, whole);
                m += whole;
                bytes -= whole;
              }

              /* Stage 3b: stash the tail (fewer than 64 bytes) for the next call. */
              if (bytes != 0) {
                poly1305_block_copy(st->buffer + st->leftover, m, bytes);
                st->leftover += bytes;
              }
            }
         
     | 
| 
      
 766 
     | 
    
         
            +
             
     | 
| 
      
 767 
     | 
    
         
            +
            void CRYPTO_poly1305_finish(poly1305_state *state, uint8_t mac[16]) {
         
     | 
| 
      
 768 
     | 
    
         
            +
              poly1305_state_internal *st = poly1305_aligned_state(state);
         
     | 
| 
      
 769 
     | 
    
         
            +
              size_t leftover = st->leftover;
         
     | 
| 
      
 770 
     | 
    
         
            +
              uint8_t *m = st->buffer;
         
     | 
| 
      
 771 
     | 
    
         
            +
              uint128_t d[3];
         
     | 
| 
      
 772 
     | 
    
         
            +
              uint64_t h0, h1, h2;
         
     | 
| 
      
 773 
     | 
    
         
            +
              uint64_t t0, t1;
         
     | 
| 
      
 774 
     | 
    
         
            +
              uint64_t g0, g1, g2, c, nc;
         
     | 
| 
      
 775 
     | 
    
         
            +
              uint64_t r0, r1, r2, s1, s2;
         
     | 
| 
      
 776 
     | 
    
         
            +
              poly1305_power *p;
         
     | 
| 
      
 777 
     | 
    
         
            +
             
     | 
| 
      
 778 
     | 
    
         
            +
              if (st->started) {
         
     | 
| 
      
 779 
     | 
    
         
            +
                size_t consumed = poly1305_combine(st, m, leftover);
         
     | 
| 
      
 780 
     | 
    
         
            +
                leftover -= consumed;
         
     | 
| 
      
 781 
     | 
    
         
            +
                m += consumed;
         
     | 
| 
      
 782 
     | 
    
         
            +
              }
         
     | 
| 
      
 783 
     | 
    
         
            +
             
     | 
| 
      
 784 
     | 
    
         
            +
              /* st->HH will either be 0 or have the combined result */
         
     | 
| 
      
 785 
     | 
    
         
            +
              h0 = st->HH[0];
         
     | 
| 
      
 786 
     | 
    
         
            +
              h1 = st->HH[1];
         
     | 
| 
      
 787 
     | 
    
         
            +
              h2 = st->HH[2];
         
     | 
| 
      
 788 
     | 
    
         
            +
             
     | 
| 
      
 789 
     | 
    
         
            +
              p = &st->P[1];
         
     | 
| 
      
 790 
     | 
    
         
            +
              r0 = ((uint64_t)p->R20.d[3] << 32) | (uint64_t)p->R20.d[1];
         
     | 
| 
      
 791 
     | 
    
         
            +
              r1 = ((uint64_t)p->R21.d[3] << 32) | (uint64_t)p->R21.d[1];
         
     | 
| 
      
 792 
     | 
    
         
            +
              r2 = ((uint64_t)p->R22.d[3] << 32) | (uint64_t)p->R22.d[1];
         
     | 
| 
      
 793 
     | 
    
         
            +
              s1 = r1 * (5 << 2);
         
     | 
| 
      
 794 
     | 
    
         
            +
              s2 = r2 * (5 << 2);
         
     | 
| 
      
 795 
     | 
    
         
            +
             
     | 
| 
      
 796 
     | 
    
         
            +
              if (leftover < 16) {
         
     | 
| 
      
 797 
     | 
    
         
            +
                goto poly1305_donna_atmost15bytes;
         
     | 
| 
      
 798 
     | 
    
         
            +
              }
         
     | 
| 
      
 799 
     | 
    
         
            +
             
     | 
| 
      
 800 
     | 
    
         
            +
            poly1305_donna_atleast16bytes:
         
     | 
| 
      
 801 
     | 
    
         
            +
              t0 = U8TO64_LE(m + 0);
         
     | 
| 
      
 802 
     | 
    
         
            +
              t1 = U8TO64_LE(m + 8);
         
     | 
| 
      
 803 
     | 
    
         
            +
              h0 += t0 & 0xfffffffffff;
         
     | 
| 
      
 804 
     | 
    
         
            +
              t0 = shr128_pair(t1, t0, 44);
         
     | 
| 
      
 805 
     | 
    
         
            +
              h1 += t0 & 0xfffffffffff;
         
     | 
| 
      
 806 
     | 
    
         
            +
              h2 += (t1 >> 24) | ((uint64_t)1 << 40);
         
     | 
| 
      
 807 
     | 
    
         
            +
             
     | 
| 
      
 808 
     | 
    
         
            +
            poly1305_donna_mul:
         
     | 
| 
      
 809 
     | 
    
         
            +
              d[0] = add128(add128(mul64x64_128(h0, r0), mul64x64_128(h1, s2)),
         
     | 
| 
      
 810 
     | 
    
         
            +
                            mul64x64_128(h2, s1));
         
     | 
| 
      
 811 
     | 
    
         
            +
              d[1] = add128(add128(mul64x64_128(h0, r1), mul64x64_128(h1, r0)),
         
     | 
| 
      
 812 
     | 
    
         
            +
                            mul64x64_128(h2, s2));
         
     | 
| 
      
 813 
     | 
    
         
            +
              d[2] = add128(add128(mul64x64_128(h0, r2), mul64x64_128(h1, r1)),
         
     | 
| 
      
 814 
     | 
    
         
            +
                            mul64x64_128(h2, r0));
         
     | 
| 
      
 815 
     | 
    
         
            +
              h0 = lo128(d[0]) & 0xfffffffffff;
         
     | 
| 
      
 816 
     | 
    
         
            +
              c = shr128(d[0], 44);
         
     | 
| 
      
 817 
     | 
    
         
            +
              d[1] = add128_64(d[1], c);
         
     | 
| 
      
 818 
     | 
    
         
            +
              h1 = lo128(d[1]) & 0xfffffffffff;
         
     | 
| 
      
 819 
     | 
    
         
            +
              c = shr128(d[1], 44);
         
     | 
| 
      
 820 
     | 
    
         
            +
              d[2] = add128_64(d[2], c);
         
     | 
| 
      
 821 
     | 
    
         
            +
              h2 = lo128(d[2]) & 0x3ffffffffff;
         
     | 
| 
      
 822 
     | 
    
         
            +
              c = shr128(d[2], 42);
         
     | 
| 
      
 823 
     | 
    
         
            +
              h0 += c * 5;
         
     | 
| 
      
 824 
     | 
    
         
            +
             
     | 
| 
      
 825 
     | 
    
         
            +
              m += 16;
         
     | 
| 
      
 826 
     | 
    
         
            +
              leftover -= 16;
         
     | 
| 
      
 827 
     | 
    
         
            +
              if (leftover >= 16) {
         
     | 
| 
      
 828 
     | 
    
         
            +
                goto poly1305_donna_atleast16bytes;
         
     | 
| 
      
 829 
     | 
    
         
            +
              }
         
     | 
| 
      
 830 
     | 
    
         
            +
             
     | 
| 
      
 831 
     | 
    
         
            +
            /* final bytes */
         
     | 
| 
      
 832 
     | 
    
         
            +
            poly1305_donna_atmost15bytes:
         
     | 
| 
      
 833 
     | 
    
         
            +
              if (!leftover) {
         
     | 
| 
      
 834 
     | 
    
         
            +
                goto poly1305_donna_finish;
         
     | 
| 
      
 835 
     | 
    
         
            +
              }
         
     | 
| 
      
 836 
     | 
    
         
            +
             
     | 
| 
      
 837 
     | 
    
         
            +
              m[leftover++] = 1;
         
     | 
| 
      
 838 
     | 
    
         
            +
              poly1305_block_zero(m + leftover, 16 - leftover);
         
     | 
| 
      
 839 
     | 
    
         
            +
              leftover = 16;
         
     | 
| 
      
 840 
     | 
    
         
            +
             
     | 
| 
      
 841 
     | 
    
         
            +
              t0 = U8TO64_LE(m + 0);
         
     | 
| 
      
 842 
     | 
    
         
            +
              t1 = U8TO64_LE(m + 8);
         
     | 
| 
      
 843 
     | 
    
         
            +
              h0 += t0 & 0xfffffffffff;
         
     | 
| 
      
 844 
     | 
    
         
            +
              t0 = shr128_pair(t1, t0, 44);
         
     | 
| 
      
 845 
     | 
    
         
            +
              h1 += t0 & 0xfffffffffff;
         
     | 
| 
      
 846 
     | 
    
         
            +
              h2 += (t1 >> 24);
         
     | 
| 
      
 847 
     | 
    
         
            +
             
     | 
| 
      
 848 
     | 
    
         
            +
              goto poly1305_donna_mul;
         
     | 
| 
      
 849 
     | 
    
         
            +
             
     | 
| 
      
 850 
     | 
    
         
            +
            poly1305_donna_finish:
         
     | 
| 
      
 851 
     | 
    
         
            +
              c = (h0 >> 44);
         
     | 
| 
      
 852 
     | 
    
         
            +
              h0 &= 0xfffffffffff;
         
     | 
| 
      
 853 
     | 
    
         
            +
              h1 += c;
         
     | 
| 
      
 854 
     | 
    
         
            +
              c = (h1 >> 44);
         
     | 
| 
      
 855 
     | 
    
         
            +
              h1 &= 0xfffffffffff;
         
     | 
| 
      
 856 
     | 
    
         
            +
              h2 += c;
         
     | 
| 
      
 857 
     | 
    
         
            +
              c = (h2 >> 42);
         
     | 
| 
      
 858 
     | 
    
         
            +
              h2 &= 0x3ffffffffff;
         
     | 
| 
      
 859 
     | 
    
         
            +
              h0 += c * 5;
         
     | 
| 
      
 860 
     | 
    
         
            +
             
     | 
| 
      
 861 
     | 
    
         
            +
              g0 = h0 + 5;
         
     | 
| 
      
 862 
     | 
    
         
            +
              c = (g0 >> 44);
         
     | 
| 
      
 863 
     | 
    
         
            +
              g0 &= 0xfffffffffff;
         
     | 
| 
      
 864 
     | 
    
         
            +
              g1 = h1 + c;
         
     | 
| 
      
 865 
     | 
    
         
            +
              c = (g1 >> 44);
         
     | 
| 
      
 866 
     | 
    
         
            +
              g1 &= 0xfffffffffff;
         
     | 
| 
      
 867 
     | 
    
         
            +
              g2 = h2 + c - ((uint64_t)1 << 42);
         
     | 
| 
      
 868 
     | 
    
         
            +
             
     | 
| 
      
 869 
     | 
    
         
            +
              c = (g2 >> 63) - 1;
         
     | 
| 
      
 870 
     | 
    
         
            +
              nc = ~c;
         
     | 
| 
      
 871 
     | 
    
         
            +
              h0 = (h0 & nc) | (g0 & c);
         
     | 
| 
      
 872 
     | 
    
         
            +
              h1 = (h1 & nc) | (g1 & c);
         
     | 
| 
      
 873 
     | 
    
         
            +
              h2 = (h2 & nc) | (g2 & c);
         
     | 
| 
      
 874 
     | 
    
         
            +
             
     | 
| 
      
 875 
     | 
    
         
            +
              /* pad */
         
     | 
| 
      
 876 
     | 
    
         
            +
              t0 = ((uint64_t)p->R23.d[3] << 32) | (uint64_t)p->R23.d[1];
         
     | 
| 
      
 877 
     | 
    
         
            +
              t1 = ((uint64_t)p->R24.d[3] << 32) | (uint64_t)p->R24.d[1];
         
     | 
| 
      
 878 
     | 
    
         
            +
              h0 += (t0 & 0xfffffffffff);
         
     | 
| 
      
 879 
     | 
    
         
            +
              c = (h0 >> 44);
         
     | 
| 
      
 880 
     | 
    
         
            +
              h0 &= 0xfffffffffff;
         
     | 
| 
      
 881 
     | 
    
         
            +
              t0 = shr128_pair(t1, t0, 44);
         
     | 
| 
      
 882 
     | 
    
         
            +
              h1 += (t0 & 0xfffffffffff) + c;
         
     | 
| 
      
 883 
     | 
    
         
            +
              c = (h1 >> 44);
         
     | 
| 
      
 884 
     | 
    
         
            +
              h1 &= 0xfffffffffff;
         
     | 
| 
      
 885 
     | 
    
         
            +
              t1 = (t1 >> 24);
         
     | 
| 
      
 886 
     | 
    
         
            +
              h2 += (t1)+c;
         
     | 
| 
      
 887 
     | 
    
         
            +
             
     | 
| 
      
 888 
     | 
    
         
            +
              U64TO8_LE(mac + 0, ((h0) | (h1 << 44)));
         
     | 
| 
      
 889 
     | 
    
         
            +
              U64TO8_LE(mac + 8, ((h1 >> 20) | (h2 << 24)));
         
     | 
| 
      
 890 
     | 
    
         
            +
            }
         
     | 
| 
      
 891 
     | 
    
         
            +
             
     | 
| 
      
 892 
     | 
    
         
            +
            #endif  /* !OPENSSL_WINDOWS && OPENSSL_X86_64 */
         
     |