@sbhjt-gr/react-native-webrtc 124.0.3 → 124.0.4

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (361) hide show
  1. package/.clang-format +11 -11
  2. package/.eslintignore +6 -6
  3. package/.nvmrc +1 -1
  4. package/ISSUE_TEMPLATE.md +40 -40
  5. package/LICENSE +22 -22
  6. package/README.md +103 -103
  7. package/android/build.gradle +37 -37
  8. package/android/consumer-rules.pro +3 -3
  9. package/android/src/main/AndroidManifest.xml +11 -11
  10. package/android/src/main/java/com/oney/WebRTCModule/AbstractVideoCaptureController.java +113 -113
  11. package/android/src/main/java/com/oney/WebRTCModule/CameraCaptureController.java +338 -338
  12. package/android/src/main/java/com/oney/WebRTCModule/CameraEventsHandler.java +49 -49
  13. package/android/src/main/java/com/oney/WebRTCModule/DataChannelWrapper.java +99 -99
  14. package/android/src/main/java/com/oney/WebRTCModule/DataPacketCryptorManager.java +62 -62
  15. package/android/src/main/java/com/oney/WebRTCModule/DisplayUtils.java +16 -16
  16. package/android/src/main/java/com/oney/WebRTCModule/EglUtils.java +66 -66
  17. package/android/src/main/java/com/oney/WebRTCModule/GetUserMediaImpl.java +539 -539
  18. package/android/src/main/java/com/oney/WebRTCModule/LibraryLoader.java +21 -21
  19. package/android/src/main/java/com/oney/WebRTCModule/MediaProjectionNotification.java +70 -70
  20. package/android/src/main/java/com/oney/WebRTCModule/MediaProjectionService.java +82 -82
  21. package/android/src/main/java/com/oney/WebRTCModule/PeerConnectionObserver.java +588 -588
  22. package/android/src/main/java/com/oney/WebRTCModule/RTCCryptoManager.java +493 -493
  23. package/android/src/main/java/com/oney/WebRTCModule/RTCVideoViewManager.java +98 -98
  24. package/android/src/main/java/com/oney/WebRTCModule/ReactBridgeUtil.java +35 -35
  25. package/android/src/main/java/com/oney/WebRTCModule/ScreenCaptureController.java +94 -94
  26. package/android/src/main/java/com/oney/WebRTCModule/SerializeUtils.java +342 -342
  27. package/android/src/main/java/com/oney/WebRTCModule/StringUtils.java +100 -100
  28. package/android/src/main/java/com/oney/WebRTCModule/ThreadUtils.java +41 -41
  29. package/android/src/main/java/com/oney/WebRTCModule/TrackCapturerEventsEmitter.java +34 -34
  30. package/android/src/main/java/com/oney/WebRTCModule/VideoTrackAdapter.java +137 -137
  31. package/android/src/main/java/com/oney/WebRTCModule/WebRTCModule.java +1649 -1643
  32. package/android/src/main/java/com/oney/WebRTCModule/WebRTCModuleOptions.java +33 -33
  33. package/android/src/main/java/com/oney/WebRTCModule/WebRTCModulePackage.java +21 -21
  34. package/android/src/main/java/com/oney/WebRTCModule/WebRTCView.java +583 -583
  35. package/android/src/main/java/com/oney/WebRTCModule/palabra/PalabraClient.java +529 -501
  36. package/android/src/main/java/com/oney/WebRTCModule/palabra/PalabraConfig.java +17 -17
  37. package/android/src/main/java/com/oney/WebRTCModule/palabra/PalabraListener.java +7 -7
  38. package/android/src/main/java/com/oney/WebRTCModule/videoEffects/ProcessorProvider.java +38 -38
  39. package/android/src/main/java/com/oney/WebRTCModule/videoEffects/VideoEffectProcessor.java +59 -59
  40. package/android/src/main/java/com/oney/WebRTCModule/videoEffects/VideoFrameProcessor.java +19 -19
  41. package/android/src/main/java/com/oney/WebRTCModule/videoEffects/VideoFrameProcessorFactoryInterface.java +12 -12
  42. package/android/src/main/java/com/oney/WebRTCModule/webrtcutils/H264AndSoftwareVideoDecoderFactory.java +73 -73
  43. package/android/src/main/java/com/oney/WebRTCModule/webrtcutils/H264AndSoftwareVideoEncoderFactory.java +73 -73
  44. package/android/src/main/java/com/oney/WebRTCModule/webrtcutils/SoftwareVideoDecoderFactoryProxy.java +36 -36
  45. package/android/src/main/java/com/oney/WebRTCModule/webrtcutils/SoftwareVideoEncoderFactoryProxy.java +36 -36
  46. package/android/src/main/java/org/webrtc/Camera1Helper.java +54 -54
  47. package/android/src/main/java/org/webrtc/Camera2Helper.java +52 -52
  48. package/android/src/main/res/values/strings.xml +5 -5
  49. package/android/src/main/res/values/styles.xml +8 -8
  50. package/ios/RCTWebRTC/CaptureController.h +18 -18
  51. package/ios/RCTWebRTC/CaptureController.m +28 -28
  52. package/ios/RCTWebRTC/CapturerEventsDelegate.h +12 -12
  53. package/ios/RCTWebRTC/DataChannelWrapper.h +27 -27
  54. package/ios/RCTWebRTC/DataChannelWrapper.m +42 -42
  55. package/ios/RCTWebRTC/I420Converter.h +22 -22
  56. package/ios/RCTWebRTC/I420Converter.m +164 -164
  57. package/ios/RCTWebRTC/PIPController.h +24 -24
  58. package/ios/RCTWebRTC/PIPController.m +234 -234
  59. package/ios/RCTWebRTC/PalabraAudioSink.h +13 -13
  60. package/ios/RCTWebRTC/PalabraAudioSink.m +18 -18
  61. package/ios/RCTWebRTC/PalabraClient.h +42 -36
  62. package/ios/RCTWebRTC/PalabraClient.m +680 -644
  63. package/ios/RCTWebRTC/RCTConvert+WebRTC.h +16 -16
  64. package/ios/RCTWebRTC/RCTConvert+WebRTC.m +206 -206
  65. package/ios/RCTWebRTC/RTCMediaStreamTrack+React.h +10 -10
  66. package/ios/RCTWebRTC/RTCMediaStreamTrack+React.m +16 -16
  67. package/ios/RCTWebRTC/RTCVideoViewManager.h +29 -29
  68. package/ios/RCTWebRTC/RTCVideoViewManager.m +411 -411
  69. package/ios/RCTWebRTC/SampleBufferVideoCallView.h +12 -12
  70. package/ios/RCTWebRTC/SampleBufferVideoCallView.m +178 -178
  71. package/ios/RCTWebRTC/ScreenCaptureController.h +20 -20
  72. package/ios/RCTWebRTC/ScreenCaptureController.m +82 -82
  73. package/ios/RCTWebRTC/ScreenCapturePickerViewManager.h +7 -7
  74. package/ios/RCTWebRTC/ScreenCapturePickerViewManager.m +59 -59
  75. package/ios/RCTWebRTC/ScreenCapturer.h +19 -19
  76. package/ios/RCTWebRTC/ScreenCapturer.m +263 -263
  77. package/ios/RCTWebRTC/SerializeUtils.h +28 -28
  78. package/ios/RCTWebRTC/SerializeUtils.m +314 -314
  79. package/ios/RCTWebRTC/SocketConnection.h +13 -13
  80. package/ios/RCTWebRTC/SocketConnection.m +137 -137
  81. package/ios/RCTWebRTC/TrackCapturerEventsEmitter.h +14 -14
  82. package/ios/RCTWebRTC/TrackCapturerEventsEmitter.m +36 -36
  83. package/ios/RCTWebRTC/VideoCaptureController.h +21 -21
  84. package/ios/RCTWebRTC/VideoCaptureController.m +328 -328
  85. package/ios/RCTWebRTC/WLVAudioDevice.h +12 -12
  86. package/ios/RCTWebRTC/WLVAudioDevice.m +137 -137
  87. package/ios/RCTWebRTC/WebRTCModule+Palabra.h +4 -4
  88. package/ios/RCTWebRTC/WebRTCModule+Palabra.m +92 -83
  89. package/ios/RCTWebRTC/WebRTCModule+Permissions.m +75 -75
  90. package/ios/RCTWebRTC/WebRTCModule+RTCAudioSession.m +20 -20
  91. package/ios/RCTWebRTC/WebRTCModule+RTCDataChannel.h +14 -14
  92. package/ios/RCTWebRTC/WebRTCModule+RTCDataChannel.m +165 -165
  93. package/ios/RCTWebRTC/WebRTCModule+RTCFrameCryptor.m +611 -611
  94. package/ios/RCTWebRTC/WebRTCModule+RTCMediaStream.h +13 -13
  95. package/ios/RCTWebRTC/WebRTCModule+RTCMediaStream.m +728 -728
  96. package/ios/RCTWebRTC/WebRTCModule+RTCPeerConnection.h +24 -24
  97. package/ios/RCTWebRTC/WebRTCModule+RTCPeerConnection.m +1004 -1004
  98. package/ios/RCTWebRTC/WebRTCModule+Transceivers.m +267 -267
  99. package/ios/RCTWebRTC/WebRTCModule+VideoTrackAdapter.h +12 -12
  100. package/ios/RCTWebRTC/WebRTCModule+VideoTrackAdapter.m +166 -166
  101. package/ios/RCTWebRTC/WebRTCModule.h +58 -58
  102. package/ios/RCTWebRTC/WebRTCModule.m +169 -169
  103. package/ios/RCTWebRTC/WebRTCModuleOptions.h +24 -24
  104. package/ios/RCTWebRTC/WebRTCModuleOptions.m +31 -31
  105. package/ios/RCTWebRTC/videoEffects/ProcessorProvider.h +9 -9
  106. package/ios/RCTWebRTC/videoEffects/ProcessorProvider.m +23 -23
  107. package/ios/RCTWebRTC/videoEffects/VideoEffectProcessor.h +13 -13
  108. package/ios/RCTWebRTC/videoEffects/VideoEffectProcessor.m +23 -23
  109. package/ios/RCTWebRTC/videoEffects/VideoFrameProcessor.h +8 -8
  110. package/ios/RCTWebRTC.xcodeproj/project.pbxproj +404 -404
  111. package/ios/RCTWebRTC.xcworkspace/contents.xcworkspacedata +10 -10
  112. package/lib/commonjs/Constraints.js.map +1 -1
  113. package/lib/commonjs/EventEmitter.js.map +1 -1
  114. package/lib/commonjs/Logger.js.map +1 -1
  115. package/lib/commonjs/MediaDevices.js +17 -17
  116. package/lib/commonjs/MediaDevices.js.map +1 -1
  117. package/lib/commonjs/MediaStream.js +19 -19
  118. package/lib/commonjs/MediaStream.js.map +1 -1
  119. package/lib/commonjs/MediaStreamError.js.map +1 -1
  120. package/lib/commonjs/MediaStreamErrorEvent.js.map +1 -1
  121. package/lib/commonjs/MediaStreamTrack.js +28 -28
  122. package/lib/commonjs/MediaStreamTrack.js.map +1 -1
  123. package/lib/commonjs/MediaStreamTrackEvent.js +6 -6
  124. package/lib/commonjs/MediaStreamTrackEvent.js.map +1 -1
  125. package/lib/commonjs/MessageEvent.js +7 -7
  126. package/lib/commonjs/MessageEvent.js.map +1 -1
  127. package/lib/commonjs/Permissions.js +28 -28
  128. package/lib/commonjs/Permissions.js.map +1 -1
  129. package/lib/commonjs/RTCAudioSession.js +4 -4
  130. package/lib/commonjs/RTCAudioSession.js.map +1 -1
  131. package/lib/commonjs/RTCDataChannel.js +2 -2
  132. package/lib/commonjs/RTCDataChannel.js.map +1 -1
  133. package/lib/commonjs/RTCDataChannelEvent.js +6 -6
  134. package/lib/commonjs/RTCDataChannelEvent.js.map +1 -1
  135. package/lib/commonjs/RTCDataPacketCryptor.js.map +1 -1
  136. package/lib/commonjs/RTCDataPacketCryptorFactory.js.map +1 -1
  137. package/lib/commonjs/RTCErrorEvent.js +3 -3
  138. package/lib/commonjs/RTCErrorEvent.js.map +1 -1
  139. package/lib/commonjs/RTCFrameCryptor.js +8 -8
  140. package/lib/commonjs/RTCFrameCryptor.js.map +1 -1
  141. package/lib/commonjs/RTCFrameCryptorFactory.js.map +1 -1
  142. package/lib/commonjs/RTCIceCandidate.js.map +1 -1
  143. package/lib/commonjs/RTCIceCandidateEvent.js +7 -7
  144. package/lib/commonjs/RTCIceCandidateEvent.js.map +1 -1
  145. package/lib/commonjs/RTCKeyProvider.js.map +1 -1
  146. package/lib/commonjs/RTCPIPView.js +2 -2
  147. package/lib/commonjs/RTCPIPView.js.map +1 -1
  148. package/lib/commonjs/RTCPIPView.web.js.map +1 -1
  149. package/lib/commonjs/RTCPeerConnection.js +36 -36
  150. package/lib/commonjs/RTCPeerConnection.js.map +1 -1
  151. package/lib/commonjs/RTCRtcpParameters.js.map +1 -1
  152. package/lib/commonjs/RTCRtpCapabilities.js +2 -2
  153. package/lib/commonjs/RTCRtpCapabilities.js.map +1 -1
  154. package/lib/commonjs/RTCRtpCodecCapability.js.map +1 -1
  155. package/lib/commonjs/RTCRtpCodecParameters.js.map +1 -1
  156. package/lib/commonjs/RTCRtpEncodingParameters.js.map +1 -1
  157. package/lib/commonjs/RTCRtpHeaderExtension.js.map +1 -1
  158. package/lib/commonjs/RTCRtpParameters.js.map +1 -1
  159. package/lib/commonjs/RTCRtpReceiveParameters.js.map +1 -1
  160. package/lib/commonjs/RTCRtpReceiver.js +7 -7
  161. package/lib/commonjs/RTCRtpReceiver.js.map +1 -1
  162. package/lib/commonjs/RTCRtpSendParameters.js +3 -3
  163. package/lib/commonjs/RTCRtpSendParameters.js.map +1 -1
  164. package/lib/commonjs/RTCRtpSender.js +7 -7
  165. package/lib/commonjs/RTCRtpSender.js.map +1 -1
  166. package/lib/commonjs/RTCRtpTransceiver.js.map +1 -1
  167. package/lib/commonjs/RTCSessionDescription.js.map +1 -1
  168. package/lib/commonjs/RTCTrackEvent.js +6 -6
  169. package/lib/commonjs/RTCTrackEvent.js.map +1 -1
  170. package/lib/commonjs/RTCUtil.js +28 -28
  171. package/lib/commonjs/RTCUtil.js.map +1 -1
  172. package/lib/commonjs/RTCView.js +5 -5
  173. package/lib/commonjs/RTCView.js.map +1 -1
  174. package/lib/commonjs/RTCView.web.js.map +1 -1
  175. package/lib/commonjs/ScreenCapturePickerView.js.map +1 -1
  176. package/lib/commonjs/ScreenCapturePickerView.web.js.map +1 -1
  177. package/lib/commonjs/getDisplayMedia.js.map +1 -1
  178. package/lib/commonjs/getUserMedia.js.map +1 -1
  179. package/lib/commonjs/index.js.map +1 -1
  180. package/lib/commonjs/index.web.js.map +1 -1
  181. package/lib/commonjs/webStream.js.map +1 -1
  182. package/lib/module/Constraints.js.map +1 -1
  183. package/lib/module/EventEmitter.js.map +1 -1
  184. package/lib/module/Logger.js.map +1 -1
  185. package/lib/module/MediaDevices.js +17 -17
  186. package/lib/module/MediaDevices.js.map +1 -1
  187. package/lib/module/MediaStream.js +19 -19
  188. package/lib/module/MediaStream.js.map +1 -1
  189. package/lib/module/MediaStreamError.js.map +1 -1
  190. package/lib/module/MediaStreamErrorEvent.js.map +1 -1
  191. package/lib/module/MediaStreamTrack.js +28 -28
  192. package/lib/module/MediaStreamTrack.js.map +1 -1
  193. package/lib/module/MediaStreamTrackEvent.js +6 -6
  194. package/lib/module/MediaStreamTrackEvent.js.map +1 -1
  195. package/lib/module/MessageEvent.js +7 -7
  196. package/lib/module/MessageEvent.js.map +1 -1
  197. package/lib/module/Permissions.js +28 -28
  198. package/lib/module/Permissions.js.map +1 -1
  199. package/lib/module/RTCAudioSession.js +4 -4
  200. package/lib/module/RTCAudioSession.js.map +1 -1
  201. package/lib/module/RTCDataChannel.js +2 -2
  202. package/lib/module/RTCDataChannel.js.map +1 -1
  203. package/lib/module/RTCDataChannelEvent.js +6 -6
  204. package/lib/module/RTCDataChannelEvent.js.map +1 -1
  205. package/lib/module/RTCDataPacketCryptor.js.map +1 -1
  206. package/lib/module/RTCDataPacketCryptorFactory.js.map +1 -1
  207. package/lib/module/RTCErrorEvent.js +3 -3
  208. package/lib/module/RTCErrorEvent.js.map +1 -1
  209. package/lib/module/RTCFrameCryptor.js +8 -8
  210. package/lib/module/RTCFrameCryptor.js.map +1 -1
  211. package/lib/module/RTCFrameCryptorFactory.js.map +1 -1
  212. package/lib/module/RTCIceCandidate.js.map +1 -1
  213. package/lib/module/RTCIceCandidateEvent.js +7 -7
  214. package/lib/module/RTCIceCandidateEvent.js.map +1 -1
  215. package/lib/module/RTCKeyProvider.js.map +1 -1
  216. package/lib/module/RTCPIPView.js +2 -2
  217. package/lib/module/RTCPIPView.js.map +1 -1
  218. package/lib/module/RTCPIPView.web.js.map +1 -1
  219. package/lib/module/RTCPeerConnection.js +36 -36
  220. package/lib/module/RTCPeerConnection.js.map +1 -1
  221. package/lib/module/RTCRtcpParameters.js.map +1 -1
  222. package/lib/module/RTCRtpCapabilities.js +2 -2
  223. package/lib/module/RTCRtpCapabilities.js.map +1 -1
  224. package/lib/module/RTCRtpCodecCapability.js.map +1 -1
  225. package/lib/module/RTCRtpCodecParameters.js.map +1 -1
  226. package/lib/module/RTCRtpEncodingParameters.js.map +1 -1
  227. package/lib/module/RTCRtpHeaderExtension.js.map +1 -1
  228. package/lib/module/RTCRtpParameters.js.map +1 -1
  229. package/lib/module/RTCRtpReceiveParameters.js.map +1 -1
  230. package/lib/module/RTCRtpReceiver.js +7 -7
  231. package/lib/module/RTCRtpReceiver.js.map +1 -1
  232. package/lib/module/RTCRtpSendParameters.js +3 -3
  233. package/lib/module/RTCRtpSendParameters.js.map +1 -1
  234. package/lib/module/RTCRtpSender.js +7 -7
  235. package/lib/module/RTCRtpSender.js.map +1 -1
  236. package/lib/module/RTCRtpTransceiver.js.map +1 -1
  237. package/lib/module/RTCSessionDescription.js.map +1 -1
  238. package/lib/module/RTCTrackEvent.js +6 -6
  239. package/lib/module/RTCTrackEvent.js.map +1 -1
  240. package/lib/module/RTCUtil.js +28 -28
  241. package/lib/module/RTCUtil.js.map +1 -1
  242. package/lib/module/RTCView.js +5 -5
  243. package/lib/module/RTCView.js.map +1 -1
  244. package/lib/module/RTCView.web.js.map +1 -1
  245. package/lib/module/ScreenCapturePickerView.js.map +1 -1
  246. package/lib/module/ScreenCapturePickerView.web.js.map +1 -1
  247. package/lib/module/getDisplayMedia.js.map +1 -1
  248. package/lib/module/getUserMedia.js.map +1 -1
  249. package/lib/module/index.js.map +1 -1
  250. package/lib/module/index.web.js.map +1 -1
  251. package/lib/module/webStream.js.map +1 -1
  252. package/lib/typescript/Constraints.d.ts +19 -19
  253. package/lib/typescript/EventEmitter.d.ts +6 -6
  254. package/lib/typescript/Logger.d.ts +13 -13
  255. package/lib/typescript/MediaDevices.d.ts +30 -30
  256. package/lib/typescript/MediaStream.d.ts +48 -48
  257. package/lib/typescript/MediaStreamError.d.ts +6 -6
  258. package/lib/typescript/MediaStreamErrorEvent.d.ts +6 -6
  259. package/lib/typescript/MediaStreamTrack.d.ts +101 -101
  260. package/lib/typescript/MediaStreamTrackEvent.d.ts +19 -19
  261. package/lib/typescript/MessageEvent.d.ts +20 -20
  262. package/lib/typescript/Permissions.d.ts +55 -55
  263. package/lib/typescript/RTCAudioSession.d.ts +10 -10
  264. package/lib/typescript/RTCDataChannel.d.ts +43 -43
  265. package/lib/typescript/RTCDataChannelEvent.d.ts +19 -19
  266. package/lib/typescript/RTCDataPacketCryptor.d.ts +12 -12
  267. package/lib/typescript/RTCDataPacketCryptorFactory.d.ts +6 -6
  268. package/lib/typescript/RTCErrorEvent.d.ts +12 -12
  269. package/lib/typescript/RTCFrameCryptor.d.ts +47 -47
  270. package/lib/typescript/RTCFrameCryptorFactory.d.ts +21 -21
  271. package/lib/typescript/RTCIceCandidate.d.ts +17 -17
  272. package/lib/typescript/RTCIceCandidateEvent.d.ts +20 -20
  273. package/lib/typescript/RTCKeyProvider.d.ts +21 -21
  274. package/lib/typescript/RTCPIPView.d.ts +15 -15
  275. package/lib/typescript/RTCPIPView.web.d.ts +13 -13
  276. package/lib/typescript/RTCPeerConnection.d.ts +117 -117
  277. package/lib/typescript/RTCRtcpParameters.d.ts +10 -10
  278. package/lib/typescript/RTCRtpCapabilities.d.ts +9 -9
  279. package/lib/typescript/RTCRtpCodecCapability.d.ts +7 -7
  280. package/lib/typescript/RTCRtpCodecParameters.d.ts +16 -16
  281. package/lib/typescript/RTCRtpEncodingParameters.d.ts +23 -23
  282. package/lib/typescript/RTCRtpHeaderExtension.d.ts +12 -12
  283. package/lib/typescript/RTCRtpParameters.d.ts +19 -19
  284. package/lib/typescript/RTCRtpReceiveParameters.d.ts +4 -4
  285. package/lib/typescript/RTCRtpReceiver.d.ts +21 -21
  286. package/lib/typescript/RTCRtpSendParameters.d.ts +20 -20
  287. package/lib/typescript/RTCRtpSender.d.ts +22 -22
  288. package/lib/typescript/RTCRtpTransceiver.d.ts +31 -31
  289. package/lib/typescript/RTCSessionDescription.d.ts +12 -12
  290. package/lib/typescript/RTCTrackEvent.d.ts +29 -29
  291. package/lib/typescript/RTCUtil.d.ts +37 -37
  292. package/lib/typescript/RTCView.d.ts +117 -117
  293. package/lib/typescript/RTCView.web.d.ts +25 -25
  294. package/lib/typescript/ScreenCapturePickerView.d.ts +2 -2
  295. package/lib/typescript/ScreenCapturePickerView.web.d.ts +1 -1
  296. package/lib/typescript/getDisplayMedia.d.ts +2 -2
  297. package/lib/typescript/getUserMedia.d.ts +7 -7
  298. package/lib/typescript/index.d.ts +22 -22
  299. package/lib/typescript/index.web.d.ts +101 -101
  300. package/lib/typescript/webStream.d.ts +3 -3
  301. package/livekit-react-native-webrtc.podspec +29 -29
  302. package/macos/RCTWebRTC.xcodeproj/project.pbxproj +324 -324
  303. package/macos/RCTWebRTC.xcodeproj/project.xcworkspace/contents.xcworkspacedata +7 -7
  304. package/macos/RCTWebRTC.xcodeproj/project.xcworkspace/xcshareddata/IDEWorkspaceChecks.plist +8 -8
  305. package/metro.config.js +7 -7
  306. package/metro.config.macos.js +14 -14
  307. package/package.json +66 -66
  308. package/react-native.config.js +11 -11
  309. package/src/.eslintrc.cjs +67 -67
  310. package/src/Constraints.ts +20 -20
  311. package/src/EventEmitter.ts +65 -65
  312. package/src/Logger.ts +49 -49
  313. package/src/MediaDevices.ts +53 -53
  314. package/src/MediaStream.ts +161 -161
  315. package/src/MediaStreamError.ts +12 -12
  316. package/src/MediaStreamErrorEvent.ts +11 -11
  317. package/src/MediaStreamTrack.ts +282 -282
  318. package/src/MediaStreamTrackEvent.ts +25 -25
  319. package/src/MessageEvent.ts +26 -26
  320. package/src/Permissions.ts +133 -133
  321. package/src/RTCAudioSession.ts +25 -25
  322. package/src/RTCDataChannel.ts +190 -190
  323. package/src/RTCDataChannelEvent.ts +28 -28
  324. package/src/RTCDataPacketCryptor.ts +90 -90
  325. package/src/RTCDataPacketCryptorFactory.ts +24 -24
  326. package/src/RTCErrorEvent.ts +20 -20
  327. package/src/RTCFrameCryptor.ts +162 -162
  328. package/src/RTCFrameCryptorFactory.ts +101 -101
  329. package/src/RTCIceCandidate.ts +29 -29
  330. package/src/RTCIceCandidateEvent.ts +26 -26
  331. package/src/RTCKeyProvider.ts +117 -117
  332. package/src/RTCPIPView.tsx +46 -46
  333. package/src/RTCPIPView.web.tsx +18 -18
  334. package/src/RTCPeerConnection.ts +935 -935
  335. package/src/RTCRtcpParameters.ts +23 -23
  336. package/src/RTCRtpCapabilities.ts +16 -16
  337. package/src/RTCRtpCodecCapability.ts +12 -12
  338. package/src/RTCRtpCodecParameters.ts +44 -44
  339. package/src/RTCRtpEncodingParameters.ts +90 -90
  340. package/src/RTCRtpHeaderExtension.ts +27 -27
  341. package/src/RTCRtpParameters.ts +37 -37
  342. package/src/RTCRtpReceiveParameters.ts +7 -7
  343. package/src/RTCRtpReceiver.ts +60 -60
  344. package/src/RTCRtpSendParameters.ts +63 -63
  345. package/src/RTCRtpSender.ts +78 -78
  346. package/src/RTCRtpTransceiver.ts +107 -107
  347. package/src/RTCSessionDescription.ts +30 -30
  348. package/src/RTCTrackEvent.ts +42 -42
  349. package/src/RTCUtil.ts +211 -211
  350. package/src/RTCView.ts +122 -122
  351. package/src/RTCView.web.tsx +80 -80
  352. package/src/ScreenCapturePickerView.ts +4 -4
  353. package/src/ScreenCapturePickerView.web.tsx +3 -3
  354. package/src/getDisplayMedia.ts +30 -30
  355. package/src/getUserMedia.ts +136 -136
  356. package/src/index.ts +107 -107
  357. package/src/index.web.ts +191 -191
  358. package/src/webStream.ts +31 -31
  359. package/tools/format.sh +6 -6
  360. package/tools/release.sh +45 -45
  361. package/tsconfig.json +17 -17
@@ -1,501 +1,529 @@
1
- package com.oney.WebRTCModule.palabra;
2
-
3
- import android.content.Context;
4
- import android.media.AudioFormat;
5
- import android.media.AudioManager;
6
- import android.media.AudioTrack;
7
- import android.os.Handler;
8
- import android.os.Looper;
9
- import android.util.Base64;
10
- import android.util.Log;
11
-
12
- import org.json.JSONArray;
13
- import org.json.JSONException;
14
- import org.json.JSONObject;
15
- import org.webrtc.AudioTrackSink;
16
-
17
- import java.io.BufferedReader;
18
- import java.io.ByteArrayOutputStream;
19
- import java.io.IOException;
20
- import java.io.InputStream;
21
- import java.io.InputStreamReader;
22
- import java.io.OutputStream;
23
- import java.net.HttpURLConnection;
24
- import java.net.URL;
25
- import java.nio.ByteBuffer;
26
- import java.nio.ByteOrder;
27
- import java.nio.charset.StandardCharsets;
28
- import java.util.concurrent.ExecutorService;
29
- import java.util.concurrent.Executors;
30
- import java.util.concurrent.TimeUnit;
31
- import java.util.concurrent.atomic.AtomicBoolean;
32
-
33
- import okhttp3.OkHttpClient;
34
- import okhttp3.Request;
35
- import okhttp3.Response;
36
- import okhttp3.WebSocket;
37
- import okhttp3.WebSocketListener;
38
-
39
- public class PalabraClient implements AudioTrackSink {
40
- private static final String TAG = "PalabraClient";
41
- private static final int SAMPLE_RATE_IN = 16000;
42
- private static final int SAMPLE_RATE_OUT = 24000;
43
- private static final int CHANNELS = 1;
44
- private static final int CHUNK_MS = 320;
45
- private static final int CHUNK_SAMPLES = SAMPLE_RATE_IN * CHUNK_MS / 1000;
46
- private static final int CHUNK_BYTES = CHUNK_SAMPLES * 2;
47
-
48
- private final Context context;
49
- private final PalabraConfig config;
50
- private PalabraListener listener;
51
-
52
- private org.webrtc.AudioTrack remoteTrack;
53
- private OkHttpClient httpClient;
54
- private WebSocket webSocket;
55
-
56
- private AudioTrack audioPlayer;
57
- private final ExecutorService executor = Executors.newSingleThreadExecutor();
58
- private final Handler mainHandler = new Handler(Looper.getMainLooper());
59
-
60
- private String sessionId;
61
- private String wsUrl;
62
- private String publisherToken;
63
-
64
- private AtomicBoolean connected = new AtomicBoolean(false);
65
- private AtomicBoolean translating = new AtomicBoolean(false);
66
-
67
- private ByteArrayOutputStream audioBuffer = new ByteArrayOutputStream();
68
- private final Object bufferLock = new Object();
69
-
70
- public PalabraClient(Context context, PalabraConfig config) {
71
- this.context = context;
72
- this.config = config;
73
- this.httpClient = new OkHttpClient.Builder()
74
- .connectTimeout(30, TimeUnit.SECONDS)
75
- .readTimeout(30, TimeUnit.SECONDS)
76
- .writeTimeout(30, TimeUnit.SECONDS)
77
- .build();
78
- setupAudioPlayer();
79
- }
80
-
81
- public void setListener(PalabraListener listener) {
82
- this.listener = listener;
83
- }
84
-
85
- public boolean isConnected() {
86
- return connected.get();
87
- }
88
-
89
- public boolean isTranslating() {
90
- return translating.get();
91
- }
92
-
93
- private void setupAudioPlayer() {
94
- int channelConfig = AudioFormat.CHANNEL_OUT_MONO;
95
- int audioFormat = AudioFormat.ENCODING_PCM_16BIT;
96
- int bufferSize = AudioTrack.getMinBufferSize(SAMPLE_RATE_OUT, channelConfig, audioFormat) * 2;
97
-
98
- audioPlayer = new AudioTrack(
99
- AudioManager.STREAM_VOICE_CALL,
100
- SAMPLE_RATE_OUT,
101
- channelConfig,
102
- audioFormat,
103
- bufferSize,
104
- AudioTrack.MODE_STREAM
105
- );
106
- }
107
-
108
- public void start(org.webrtc.AudioTrack remoteAudioTrack) {
109
- if (translating.get()) {
110
- return;
111
- }
112
-
113
- this.remoteTrack = remoteAudioTrack;
114
- remoteAudioTrack.setVolume(0);
115
-
116
- notifyConnectionState("connecting");
117
-
118
- executor.execute(() -> {
119
- try {
120
- JSONObject session = createSession();
121
- Log.d(TAG, "session_response: " + session.toString());
122
- JSONObject data = session.getJSONObject("data");
123
- sessionId = data.getString("id");
124
- wsUrl = data.getString("ws_url");
125
- publisherToken = data.getString("publisher");
126
- Log.d(TAG, "ws_url: " + wsUrl);
127
-
128
- mainHandler.post(this::connectWebSocket);
129
- } catch (Exception e) {
130
- Log.e(TAG, "session_create_failed", e);
131
- mainHandler.post(() -> {
132
- if (remoteAudioTrack != null) {
133
- remoteAudioTrack.setVolume(1.0);
134
- }
135
- notifyError(500, e.getMessage());
136
- });
137
- }
138
- });
139
- }
140
-
141
- private JSONObject createSession() throws IOException, JSONException {
142
- URL url = new URL(config.apiUrl + "/session-storage/session");
143
- HttpURLConnection conn = (HttpURLConnection) url.openConnection();
144
- conn.setRequestMethod("POST");
145
- conn.setRequestProperty("ClientId", config.clientId);
146
- conn.setRequestProperty("ClientSecret", config.clientSecret);
147
- conn.setRequestProperty("Content-Type", "application/json");
148
- conn.setDoOutput(true);
149
-
150
- JSONObject body = new JSONObject();
151
- JSONObject bodyData = new JSONObject();
152
- bodyData.put("subscriber_count", 0);
153
- bodyData.put("publisher_can_subscribe", true);
154
- body.put("data", bodyData);
155
-
156
- try (OutputStream os = conn.getOutputStream()) {
157
- os.write(body.toString().getBytes(StandardCharsets.UTF_8));
158
- }
159
-
160
- int responseCode = conn.getResponseCode();
161
- if (responseCode < 200 || responseCode >= 300) {
162
- throw new IOException(buildSessionError(conn, responseCode));
163
- }
164
-
165
- String response = readStream(conn.getInputStream());
166
-
167
- return new JSONObject(response);
168
- }
169
-
170
- private String buildSessionError(HttpURLConnection conn, int responseCode) throws IOException {
171
- String fallback = "session_http_error_" + responseCode;
172
- String payload = readStream(conn.getErrorStream());
173
- if (payload.isEmpty()) {
174
- return fallback;
175
- }
176
-
177
- try {
178
- JSONObject json = new JSONObject(payload);
179
- JSONArray errors = json.optJSONArray("errors");
180
- if (errors != null && errors.length() > 0) {
181
- JSONObject first = errors.optJSONObject(0);
182
- if (first != null) {
183
- String detail = first.optString("detail");
184
- if (detail != null && !detail.isEmpty()) {
185
- return fallback + ": " + detail;
186
- }
187
- }
188
- }
189
- } catch (JSONException e) {
190
- Log.d(TAG, "session_error_parse_failed", e);
191
- }
192
-
193
- return fallback;
194
- }
195
-
196
- private String readStream(InputStream stream) throws IOException {
197
- if (stream == null) {
198
- return "";
199
- }
200
-
201
- StringBuilder response = new StringBuilder();
202
- try (BufferedReader br = new BufferedReader(new InputStreamReader(stream, StandardCharsets.UTF_8))) {
203
- String line;
204
- while ((line = br.readLine()) != null) {
205
- response.append(line);
206
- }
207
- }
208
-
209
- return response.toString();
210
- }
211
-
212
- private void connectWebSocket() {
213
- String endpoint = wsUrl + "?token=" + publisherToken;
214
- Log.d(TAG, "connecting_ws: " + endpoint);
215
-
216
- Request request = new Request.Builder()
217
- .url(endpoint)
218
- .build();
219
-
220
- webSocket = httpClient.newWebSocket(request, new WebSocketListener() {
221
- @Override
222
- public void onOpen(WebSocket ws, Response response) {
223
- Log.d(TAG, "ws_open");
224
- connected.set(true);
225
- translating.set(true);
226
-
227
- remoteTrack.addSink(PalabraClient.this);
228
- audioPlayer.play();
229
-
230
- mainHandler.post(() -> notifyConnectionState("connected"));
231
-
232
- mainHandler.postDelayed(() -> sendSetTask(), 500);
233
- }
234
-
235
- @Override
236
- public void onMessage(WebSocket ws, String text) {
237
- handleMessage(text);
238
- }
239
-
240
- @Override
241
- public void onFailure(WebSocket ws, Throwable t, Response response) {
242
- Log.e(TAG, "ws_error", t);
243
- mainHandler.post(() -> {
244
- stop();
245
- notifyError(500, t.getMessage());
246
- });
247
- }
248
-
249
- @Override
250
- public void onClosed(WebSocket ws, int code, String reason) {
251
- Log.d(TAG, "ws_closed: " + code);
252
- mainHandler.post(() -> stop());
253
- }
254
- });
255
- }
256
-
257
- private void sendSetTask() {
258
- if (webSocket == null || !connected.get()) {
259
- return;
260
- }
261
-
262
- try {
263
- JSONObject msg = new JSONObject();
264
- msg.put("message_type", "set_task");
265
-
266
- JSONObject data = new JSONObject();
267
-
268
- JSONObject inputStream = new JSONObject();
269
- inputStream.put("content_type", "audio");
270
- JSONObject source = new JSONObject();
271
- source.put("type", "ws");
272
- source.put("format", "pcm_s16le");
273
- source.put("sample_rate", SAMPLE_RATE_IN);
274
- source.put("channels", CHANNELS);
275
- inputStream.put("source", source);
276
- data.put("input_stream", inputStream);
277
-
278
- JSONObject outputStream = new JSONObject();
279
- outputStream.put("content_type", "audio");
280
- JSONObject target = new JSONObject();
281
- target.put("type", "ws");
282
- target.put("format", "pcm_s16le");
283
- outputStream.put("target", target);
284
- data.put("output_stream", outputStream);
285
-
286
- JSONObject pipeline = new JSONObject();
287
-
288
- JSONObject transcription = new JSONObject();
289
- transcription.put("source_language", config.sourceLang);
290
- pipeline.put("transcription", transcription);
291
-
292
- JSONArray translations = new JSONArray();
293
- JSONObject translation = new JSONObject();
294
- translation.put("target_language", config.targetLang);
295
- JSONObject speechGen = new JSONObject();
296
- speechGen.put("voice_cloning", false);
297
- translation.put("speech_generation", speechGen);
298
- translations.put(translation);
299
- pipeline.put("translations", translations);
300
-
301
- JSONArray allowedTypes = new JSONArray();
302
- allowedTypes.put("partial_transcription");
303
- allowedTypes.put("validated_transcription");
304
- allowedTypes.put("translated_transcription");
305
- pipeline.put("allowed_message_types", allowedTypes);
306
-
307
- data.put("pipeline", pipeline);
308
- msg.put("data", data);
309
-
310
- String payload = msg.toString();
311
- Log.d(TAG, "set_task: " + payload);
312
- webSocket.send(payload);
313
- } catch (JSONException e) {
314
- Log.e(TAG, "set_task_error", e);
315
- }
316
- }
317
-
318
- private void handleMessage(String text) {
319
- try {
320
- JSONObject json = new JSONObject(text);
321
- String type = json.optString("message_type", "");
322
-
323
- if ("output_audio_data".equals(type)) {
324
- JSONObject data = json.getJSONObject("data");
325
- String audioBase64 = data.optString("data", "");
326
- if (!audioBase64.isEmpty()) {
327
- byte[] audioBytes = Base64.decode(audioBase64, Base64.DEFAULT);
328
- if (audioPlayer != null && translating.get()) {
329
- audioPlayer.write(audioBytes, 0, audioBytes.length);
330
- }
331
- }
332
- } else if (type.contains("transcription")) {
333
- JSONObject data = json.getJSONObject("data");
334
- JSONObject transcription = data.optJSONObject("transcription");
335
- if (transcription != null) {
336
- String txt = transcription.optString("text", "");
337
- String lang = transcription.optString("language", "");
338
- boolean isFinal = !"partial_transcription".equals(type);
339
- mainHandler.post(() -> notifyTranscription(txt, lang, isFinal));
340
- }
341
- } else if ("error".equals(type)) {
342
- JSONObject data = json.optJSONObject("data");
343
- String desc = data != null ? data.optString("desc", "unknown") : "unknown";
344
- Log.e(TAG, "palabra_error: " + desc);
345
- mainHandler.post(() -> notifyError(500, desc));
346
- }
347
- } catch (JSONException e) {
348
- Log.e(TAG, "msg_parse_error", e);
349
- }
350
- }
351
-
352
- public void stop() {
353
- if (!translating.getAndSet(false)) {
354
- return;
355
- }
356
-
357
- connected.set(false);
358
-
359
- if (remoteTrack != null) {
360
- try {
361
- remoteTrack.removeSink(this);
362
- remoteTrack.setVolume(1.0);
363
- } catch (Exception e) {
364
- Log.w(TAG, "stop_track_cleanup_error: " + e.getMessage());
365
- }
366
- }
367
-
368
- if (webSocket != null) {
369
- try {
370
- JSONObject endMsg = new JSONObject();
371
- endMsg.put("message_type", "end_task");
372
- endMsg.put("data", new JSONObject().put("force", false));
373
- webSocket.send(endMsg.toString());
374
- } catch (JSONException e) {
375
- Log.e(TAG, "end_task_error", e);
376
- }
377
- try {
378
- webSocket.close(1000, "stop");
379
- } catch (Exception e) {
380
- Log.w(TAG, "websocket_close_error: " + e.getMessage());
381
- }
382
- webSocket = null;
383
- }
384
-
385
- if (audioPlayer != null) {
386
- try {
387
- audioPlayer.stop();
388
- } catch (Exception e) {
389
- Log.w(TAG, "audio_player_stop_error: " + e.getMessage());
390
- }
391
- }
392
-
393
- synchronized (bufferLock) {
394
- audioBuffer.reset();
395
- }
396
-
397
- remoteTrack = null;
398
- notifyConnectionState("disconnected");
399
- }
400
-
401
- @Override
402
- public void onData(ByteBuffer audioData, int bitsPerSample, int sampleRate, int channels, int frames, long timestamp) {
403
- if (!translating.get() || webSocket == null) {
404
- return;
405
- }
406
-
407
- byte[] samples = new byte[audioData.remaining()];
408
- audioData.get(samples);
409
-
410
- byte[] resampled = resample(samples, sampleRate, channels, SAMPLE_RATE_IN, CHANNELS);
411
-
412
- synchronized (bufferLock) {
413
- try {
414
- audioBuffer.write(resampled);
415
-
416
- while (audioBuffer.size() >= CHUNK_BYTES) {
417
- byte[] chunk = new byte[CHUNK_BYTES];
418
- byte[] all = audioBuffer.toByteArray();
419
- System.arraycopy(all, 0, chunk, 0, CHUNK_BYTES);
420
-
421
- audioBuffer.reset();
422
- if (all.length > CHUNK_BYTES) {
423
- audioBuffer.write(all, CHUNK_BYTES, all.length - CHUNK_BYTES);
424
- }
425
-
426
- sendAudioChunk(chunk);
427
- }
428
- } catch (IOException e) {
429
- Log.e(TAG, "buffer_error", e);
430
- }
431
- }
432
- }
433
-
434
- private byte[] resample(byte[] input, int srcRate, int srcChannels, int dstRate, int dstChannels) {
435
- if (srcRate == dstRate && srcChannels == dstChannels) {
436
- return input;
437
- }
438
-
439
- int srcSamples = input.length / (2 * srcChannels);
440
- int dstSamples = (int) ((long) srcSamples * dstRate / srcRate);
441
-
442
- short[] srcData = new short[srcSamples * srcChannels];
443
- ByteBuffer.wrap(input).order(ByteOrder.LITTLE_ENDIAN).asShortBuffer().get(srcData);
444
-
445
- short[] monoSrc = srcData;
446
- if (srcChannels == 2) {
447
- monoSrc = new short[srcSamples];
448
- for (int i = 0; i < srcSamples; i++) {
449
- monoSrc[i] = (short) ((srcData[i * 2] + srcData[i * 2 + 1]) / 2);
450
- }
451
- }
452
-
453
- short[] dstData = new short[dstSamples];
454
- for (int i = 0; i < dstSamples; i++) {
455
- float srcIdx = (float) i * (monoSrc.length - 1) / (dstSamples - 1);
456
- int idx0 = (int) srcIdx;
457
- int idx1 = Math.min(idx0 + 1, monoSrc.length - 1);
458
- float frac = srcIdx - idx0;
459
- dstData[i] = (short) (monoSrc[idx0] * (1 - frac) + monoSrc[idx1] * frac);
460
- }
461
-
462
- byte[] output = new byte[dstSamples * 2];
463
- ByteBuffer.wrap(output).order(ByteOrder.LITTLE_ENDIAN).asShortBuffer().put(dstData);
464
- return output;
465
- }
466
-
467
- private void sendAudioChunk(byte[] chunk) {
468
- if (webSocket == null || !connected.get()) {
469
- return;
470
- }
471
-
472
- try {
473
- JSONObject msg = new JSONObject();
474
- msg.put("message_type", "input_audio_data");
475
- JSONObject data = new JSONObject();
476
- data.put("data", Base64.encodeToString(chunk, Base64.NO_WRAP));
477
- msg.put("data", data);
478
- webSocket.send(msg.toString());
479
- } catch (JSONException e) {
480
- Log.e(TAG, "send_audio_error", e);
481
- }
482
- }
483
-
484
- private void notifyConnectionState(String state) {
485
- if (listener != null) {
486
- listener.onConnectionState(state);
487
- }
488
- }
489
-
490
- private void notifyError(int code, String message) {
491
- if (listener != null) {
492
- listener.onError(code, message);
493
- }
494
- }
495
-
496
- private void notifyTranscription(String text, String lang, boolean isFinal) {
497
- if (listener != null) {
498
- listener.onTranscription(text, lang, isFinal);
499
- }
500
- }
501
- }
1
+ package com.oney.WebRTCModule.palabra;
2
+
3
+ import android.content.Context;
4
+ import android.media.AudioFormat;
5
+ import android.media.AudioManager;
6
+ import android.media.AudioTrack;
7
+ import android.os.Handler;
8
+ import android.os.Looper;
9
+ import android.util.Base64;
10
+ import android.util.Log;
11
+
12
+ import org.json.JSONArray;
13
+ import org.json.JSONException;
14
+ import org.json.JSONObject;
15
+ import org.webrtc.AudioTrackSink;
16
+
17
+ import java.io.BufferedReader;
18
+ import java.io.ByteArrayOutputStream;
19
+ import java.io.IOException;
20
+ import java.io.InputStream;
21
+ import java.io.InputStreamReader;
22
+ import java.io.OutputStream;
23
+ import java.net.HttpURLConnection;
24
+ import java.net.URL;
25
+ import java.nio.ByteBuffer;
26
+ import java.nio.ByteOrder;
27
+ import java.nio.charset.StandardCharsets;
28
+ import java.util.concurrent.ExecutorService;
29
+ import java.util.concurrent.Executors;
30
+ import java.util.concurrent.TimeUnit;
31
+ import java.util.concurrent.atomic.AtomicBoolean;
32
+
33
+ import okhttp3.OkHttpClient;
34
+ import okhttp3.Request;
35
+ import okhttp3.Response;
36
+ import okhttp3.WebSocket;
37
+ import okhttp3.WebSocketListener;
38
+
39
+ public class PalabraClient implements AudioTrackSink {
40
+ private static final String TAG = "PalabraClient";
41
+ private static final int SAMPLE_RATE_IN = 16000;
42
+ private static final int SAMPLE_RATE_OUT = 24000;
43
+ private static final int CHANNELS = 1;
44
+ private static final int CHUNK_MS = 320;
45
+ private static final int CHUNK_SAMPLES = SAMPLE_RATE_IN * CHUNK_MS / 1000;
46
+ private static final int CHUNK_BYTES = CHUNK_SAMPLES * 2;
47
+
48
+ private final Context context;
49
+ private final PalabraConfig config;
50
+ private PalabraListener listener;
51
+
52
+ private org.webrtc.AudioTrack remoteTrack;
53
+ private OkHttpClient httpClient;
54
+ private WebSocket webSocket;
55
+
56
+ private AudioTrack audioPlayer;
57
+ private final ExecutorService executor = Executors.newSingleThreadExecutor();
58
+ private final Handler mainHandler = new Handler(Looper.getMainLooper());
59
+
60
+ private String sessionId;
61
+ private String wsUrl;
62
+ private String publisherToken;
63
+ private String remoteTrackId;
64
+
65
+ private AtomicBoolean connected = new AtomicBoolean(false);
66
+ private AtomicBoolean starting = new AtomicBoolean(false);
67
+ private AtomicBoolean translating = new AtomicBoolean(false);
68
+
69
+ private ByteArrayOutputStream audioBuffer = new ByteArrayOutputStream();
70
+ private final Object bufferLock = new Object();
71
+
72
+ public PalabraClient(Context context, PalabraConfig config) {
73
+ this.context = context;
74
+ this.config = config;
75
+ this.httpClient = new OkHttpClient.Builder()
76
+ .connectTimeout(30, TimeUnit.SECONDS)
77
+ .readTimeout(30, TimeUnit.SECONDS)
78
+ .writeTimeout(30, TimeUnit.SECONDS)
79
+ .build();
80
+ setupAudioPlayer();
81
+ }
82
+
83
+ public void setListener(PalabraListener listener) {
84
+ this.listener = listener;
85
+ }
86
+
87
+ public boolean isConnected() {
88
+ return connected.get();
89
+ }
90
+
91
+ public boolean isStarting() {
92
+ return starting.get();
93
+ }
94
+
95
+ public boolean isRunning() {
96
+ return starting.get() || connected.get() || translating.get();
97
+ }
98
+
99
+ public boolean matchesSession(String trackId, String sourceLang, String targetLang, String apiUrl) {
100
+ return remoteTrackId != null
101
+ && remoteTrackId.equals(trackId)
102
+ && config.sourceLang.equals(sourceLang)
103
+ && config.targetLang.equals(targetLang)
104
+ && config.apiUrl.equals(apiUrl);
105
+ }
106
+
107
+ public boolean isTranslating() {
108
+ return translating.get();
109
+ }
110
+
111
+ private void setupAudioPlayer() {
112
+ int channelConfig = AudioFormat.CHANNEL_OUT_MONO;
113
+ int audioFormat = AudioFormat.ENCODING_PCM_16BIT;
114
+ int bufferSize = AudioTrack.getMinBufferSize(SAMPLE_RATE_OUT, channelConfig, audioFormat) * 2;
115
+
116
+ audioPlayer = new AudioTrack(
117
+ AudioManager.STREAM_VOICE_CALL,
118
+ SAMPLE_RATE_OUT,
119
+ channelConfig,
120
+ audioFormat,
121
+ bufferSize,
122
+ AudioTrack.MODE_STREAM
123
+ );
124
+ }
125
+
126
+ public void start(org.webrtc.AudioTrack remoteAudioTrack) {
127
+ if (starting.get() || translating.get()) {
128
+ Log.d(TAG, "palabra_start_skip_busy");
129
+ return;
130
+ }
131
+
132
+ starting.set(true);
133
+ this.remoteTrack = remoteAudioTrack;
134
+ this.remoteTrackId = remoteAudioTrack.id();
135
+ remoteAudioTrack.setVolume(0);
136
+
137
+ Log.d(TAG, "palabra_start", remoteTrackId);
138
+
139
+ notifyConnectionState("connecting");
140
+
141
+ executor.execute(() -> {
142
+ try {
143
+ JSONObject session = createSession();
144
+ Log.d(TAG, "session_response: " + session.toString());
145
+ JSONObject data = session.getJSONObject("data");
146
+ sessionId = data.getString("id");
147
+ wsUrl = data.getString("ws_url");
148
+ publisherToken = data.getString("publisher");
149
+ Log.d(TAG, "ws_url: " + wsUrl);
150
+
151
+ mainHandler.post(this::connectWebSocket);
152
+ } catch (Exception e) {
153
+ Log.e(TAG, "session_create_failed", e);
154
+ mainHandler.post(() -> {
155
+ starting.set(false);
156
+ if (remoteAudioTrack != null) {
157
+ remoteAudioTrack.setVolume(1.0);
158
+ }
159
+ notifyError(500, e.getMessage());
160
+ });
161
+ }
162
+ });
163
+ }
164
+
165
+ private JSONObject createSession() throws IOException, JSONException {
166
+ URL url = new URL(config.apiUrl + "/session-storage/session");
167
+ HttpURLConnection conn = (HttpURLConnection) url.openConnection();
168
+ conn.setRequestMethod("POST");
169
+ conn.setRequestProperty("ClientId", config.clientId);
170
+ conn.setRequestProperty("ClientSecret", config.clientSecret);
171
+ conn.setRequestProperty("Content-Type", "application/json");
172
+ conn.setDoOutput(true);
173
+
174
+ JSONObject body = new JSONObject();
175
+ JSONObject bodyData = new JSONObject();
176
+ bodyData.put("subscriber_count", 0);
177
+ bodyData.put("publisher_can_subscribe", true);
178
+ body.put("data", bodyData);
179
+
180
+ try (OutputStream os = conn.getOutputStream()) {
181
+ os.write(body.toString().getBytes(StandardCharsets.UTF_8));
182
+ }
183
+
184
+ int responseCode = conn.getResponseCode();
185
+ if (responseCode < 200 || responseCode >= 300) {
186
+ throw new IOException(buildSessionError(conn, responseCode));
187
+ }
188
+
189
+ String response = readStream(conn.getInputStream());
190
+
191
+ return new JSONObject(response);
192
+ }
193
+
194
+ private String buildSessionError(HttpURLConnection conn, int responseCode) throws IOException {
195
+ String fallback = "session_http_error_" + responseCode;
196
+ String payload = readStream(conn.getErrorStream());
197
+ if (payload.isEmpty()) {
198
+ return fallback;
199
+ }
200
+
201
+ try {
202
+ JSONObject json = new JSONObject(payload);
203
+ JSONArray errors = json.optJSONArray("errors");
204
+ if (errors != null && errors.length() > 0) {
205
+ JSONObject first = errors.optJSONObject(0);
206
+ if (first != null) {
207
+ String detail = first.optString("detail");
208
+ if (detail != null && !detail.isEmpty()) {
209
+ return fallback + ": " + detail;
210
+ }
211
+ }
212
+ }
213
+ } catch (JSONException e) {
214
+ Log.d(TAG, "session_error_parse_failed", e);
215
+ }
216
+
217
+ return fallback;
218
+ }
219
+
220
+ private String readStream(InputStream stream) throws IOException {
221
+ if (stream == null) {
222
+ return "";
223
+ }
224
+
225
+ StringBuilder response = new StringBuilder();
226
+ try (BufferedReader br = new BufferedReader(new InputStreamReader(stream, StandardCharsets.UTF_8))) {
227
+ String line;
228
+ while ((line = br.readLine()) != null) {
229
+ response.append(line);
230
+ }
231
+ }
232
+
233
+ return response.toString();
234
+ }
235
+
236
+ private void connectWebSocket() {
237
+ String endpoint = wsUrl + "?token=" + publisherToken;
238
+ Log.d(TAG, "connecting_ws: " + endpoint);
239
+
240
+ Request request = new Request.Builder()
241
+ .url(endpoint)
242
+ .build();
243
+
244
+ webSocket = httpClient.newWebSocket(request, new WebSocketListener() {
245
+ @Override
246
+ public void onOpen(WebSocket ws, Response response) {
247
+ Log.d(TAG, "ws_open");
248
+ starting.set(false);
249
+ connected.set(true);
250
+ translating.set(true);
251
+
252
+ remoteTrack.addSink(PalabraClient.this);
253
+ audioPlayer.play();
254
+
255
+ mainHandler.post(() -> notifyConnectionState("connected"));
256
+
257
+ mainHandler.postDelayed(() -> sendSetTask(), 500);
258
+ }
259
+
260
+ @Override
261
+ public void onMessage(WebSocket ws, String text) {
262
+ handleMessage(text);
263
+ }
264
+
265
+ @Override
266
+ public void onFailure(WebSocket ws, Throwable t, Response response) {
267
+ Log.e(TAG, "ws_error", t);
268
+ mainHandler.post(() -> {
269
+ stop();
270
+ notifyError(500, t.getMessage());
271
+ });
272
+ }
273
+
274
+ @Override
275
+ public void onClosed(WebSocket ws, int code, String reason) {
276
+ Log.d(TAG, "ws_closed: " + code);
277
+ mainHandler.post(() -> stop());
278
+ }
279
+ });
280
+ }
281
+
282
+ private void sendSetTask() {
283
+ if (webSocket == null || !connected.get()) {
284
+ return;
285
+ }
286
+
287
+ try {
288
+ JSONObject msg = new JSONObject();
289
+ msg.put("message_type", "set_task");
290
+
291
+ JSONObject data = new JSONObject();
292
+
293
+ JSONObject inputStream = new JSONObject();
294
+ inputStream.put("content_type", "audio");
295
+ JSONObject source = new JSONObject();
296
+ source.put("type", "ws");
297
+ source.put("format", "pcm_s16le");
298
+ source.put("sample_rate", SAMPLE_RATE_IN);
299
+ source.put("channels", CHANNELS);
300
+ inputStream.put("source", source);
301
+ data.put("input_stream", inputStream);
302
+
303
+ JSONObject outputStream = new JSONObject();
304
+ outputStream.put("content_type", "audio");
305
+ JSONObject target = new JSONObject();
306
+ target.put("type", "ws");
307
+ target.put("format", "pcm_s16le");
308
+ outputStream.put("target", target);
309
+ data.put("output_stream", outputStream);
310
+
311
+ JSONObject pipeline = new JSONObject();
312
+
313
+ JSONObject transcription = new JSONObject();
314
+ transcription.put("source_language", config.sourceLang);
315
+ pipeline.put("transcription", transcription);
316
+
317
+ JSONArray translations = new JSONArray();
318
+ JSONObject translation = new JSONObject();
319
+ translation.put("target_language", config.targetLang);
320
+ JSONObject speechGen = new JSONObject();
321
+ speechGen.put("voice_cloning", false);
322
+ translation.put("speech_generation", speechGen);
323
+ translations.put(translation);
324
+ pipeline.put("translations", translations);
325
+
326
+ JSONArray allowedTypes = new JSONArray();
327
+ allowedTypes.put("partial_transcription");
328
+ allowedTypes.put("validated_transcription");
329
+ allowedTypes.put("translated_transcription");
330
+ pipeline.put("allowed_message_types", allowedTypes);
331
+
332
+ data.put("pipeline", pipeline);
333
+ msg.put("data", data);
334
+
335
+ String payload = msg.toString();
336
+ Log.d(TAG, "set_task: " + payload);
337
+ webSocket.send(payload);
338
+ } catch (JSONException e) {
339
+ Log.e(TAG, "set_task_error", e);
340
+ }
341
+ }
342
+
343
+ private void handleMessage(String text) {
344
+ try {
345
+ JSONObject json = new JSONObject(text);
346
+ String type = json.optString("message_type", "");
347
+
348
+ if ("output_audio_data".equals(type)) {
349
+ JSONObject data = json.getJSONObject("data");
350
+ String audioBase64 = data.optString("data", "");
351
+ if (!audioBase64.isEmpty()) {
352
+ byte[] audioBytes = Base64.decode(audioBase64, Base64.DEFAULT);
353
+ if (audioPlayer != null && translating.get()) {
354
+ audioPlayer.write(audioBytes, 0, audioBytes.length);
355
+ }
356
+ }
357
+ } else if (type.contains("transcription")) {
358
+ JSONObject data = json.getJSONObject("data");
359
+ JSONObject transcription = data.optJSONObject("transcription");
360
+ if (transcription != null) {
361
+ String txt = transcription.optString("text", "");
362
+ String lang = transcription.optString("language", "");
363
+ boolean isFinal = !"partial_transcription".equals(type);
364
+ mainHandler.post(() -> notifyTranscription(txt, lang, isFinal));
365
+ }
366
+ } else if ("error".equals(type)) {
367
+ JSONObject data = json.optJSONObject("data");
368
+ String desc = data != null ? data.optString("desc", "unknown") : "unknown";
369
+ Log.e(TAG, "palabra_error: " + desc);
370
+ mainHandler.post(() -> notifyError(500, desc));
371
+ }
372
+ } catch (JSONException e) {
373
+ Log.e(TAG, "msg_parse_error", e);
374
+ }
375
+ }
376
+
377
+ public void stop() {
378
+ boolean wasStarting = starting.getAndSet(false);
379
+ boolean wasTranslating = translating.getAndSet(false);
380
+ if (!wasStarting && !wasTranslating && !connected.get() && remoteTrack == null && webSocket == null) {
381
+ return;
382
+ }
383
+
384
+ connected.set(false);
385
+
386
+ if (remoteTrack != null) {
387
+ try {
388
+ remoteTrack.removeSink(this);
389
+ remoteTrack.setVolume(1.0);
390
+ } catch (Exception e) {
391
+ Log.w(TAG, "stop_track_cleanup_error: " + e.getMessage());
392
+ }
393
+ }
394
+
395
+ if (webSocket != null) {
396
+ try {
397
+ JSONObject endMsg = new JSONObject();
398
+ endMsg.put("message_type", "end_task");
399
+ endMsg.put("data", new JSONObject().put("force", false));
400
+ webSocket.send(endMsg.toString());
401
+ } catch (JSONException e) {
402
+ Log.e(TAG, "end_task_error", e);
403
+ }
404
+ try {
405
+ webSocket.close(1000, "stop");
406
+ } catch (Exception e) {
407
+ Log.w(TAG, "websocket_close_error: " + e.getMessage());
408
+ }
409
+ webSocket = null;
410
+ }
411
+
412
+ if (audioPlayer != null) {
413
+ try {
414
+ audioPlayer.stop();
415
+ } catch (Exception e) {
416
+ Log.w(TAG, "audio_player_stop_error: " + e.getMessage());
417
+ }
418
+ }
419
+
420
+ synchronized (bufferLock) {
421
+ audioBuffer.reset();
422
+ }
423
+
424
+ remoteTrack = null;
425
+ remoteTrackId = null;
426
+ notifyConnectionState("disconnected");
427
+ }
428
+
429
+ @Override
430
+ public void onData(ByteBuffer audioData, int bitsPerSample, int sampleRate, int channels, int frames, long timestamp) {
431
+ if (!translating.get() || webSocket == null) {
432
+ return;
433
+ }
434
+
435
+ byte[] samples = new byte[audioData.remaining()];
436
+ audioData.get(samples);
437
+
438
+ byte[] resampled = resample(samples, sampleRate, channels, SAMPLE_RATE_IN, CHANNELS);
439
+
440
+ synchronized (bufferLock) {
441
+ try {
442
+ audioBuffer.write(resampled);
443
+
444
+ while (audioBuffer.size() >= CHUNK_BYTES) {
445
+ byte[] chunk = new byte[CHUNK_BYTES];
446
+ byte[] all = audioBuffer.toByteArray();
447
+ System.arraycopy(all, 0, chunk, 0, CHUNK_BYTES);
448
+
449
+ audioBuffer.reset();
450
+ if (all.length > CHUNK_BYTES) {
451
+ audioBuffer.write(all, CHUNK_BYTES, all.length - CHUNK_BYTES);
452
+ }
453
+
454
+ sendAudioChunk(chunk);
455
+ }
456
+ } catch (IOException e) {
457
+ Log.e(TAG, "buffer_error", e);
458
+ }
459
+ }
460
+ }
461
+
462
+ private byte[] resample(byte[] input, int srcRate, int srcChannels, int dstRate, int dstChannels) {
463
+ if (srcRate == dstRate && srcChannels == dstChannels) {
464
+ return input;
465
+ }
466
+
467
+ int srcSamples = input.length / (2 * srcChannels);
468
+ int dstSamples = (int) ((long) srcSamples * dstRate / srcRate);
469
+
470
+ short[] srcData = new short[srcSamples * srcChannels];
471
+ ByteBuffer.wrap(input).order(ByteOrder.LITTLE_ENDIAN).asShortBuffer().get(srcData);
472
+
473
+ short[] monoSrc = srcData;
474
+ if (srcChannels == 2) {
475
+ monoSrc = new short[srcSamples];
476
+ for (int i = 0; i < srcSamples; i++) {
477
+ monoSrc[i] = (short) ((srcData[i * 2] + srcData[i * 2 + 1]) / 2);
478
+ }
479
+ }
480
+
481
+ short[] dstData = new short[dstSamples];
482
+ for (int i = 0; i < dstSamples; i++) {
483
+ float srcIdx = (float) i * (monoSrc.length - 1) / (dstSamples - 1);
484
+ int idx0 = (int) srcIdx;
485
+ int idx1 = Math.min(idx0 + 1, monoSrc.length - 1);
486
+ float frac = srcIdx - idx0;
487
+ dstData[i] = (short) (monoSrc[idx0] * (1 - frac) + monoSrc[idx1] * frac);
488
+ }
489
+
490
+ byte[] output = new byte[dstSamples * 2];
491
+ ByteBuffer.wrap(output).order(ByteOrder.LITTLE_ENDIAN).asShortBuffer().put(dstData);
492
+ return output;
493
+ }
494
+
495
+ private void sendAudioChunk(byte[] chunk) {
496
+ if (webSocket == null || !connected.get()) {
497
+ return;
498
+ }
499
+
500
+ try {
501
+ JSONObject msg = new JSONObject();
502
+ msg.put("message_type", "input_audio_data");
503
+ JSONObject data = new JSONObject();
504
+ data.put("data", Base64.encodeToString(chunk, Base64.NO_WRAP));
505
+ msg.put("data", data);
506
+ webSocket.send(msg.toString());
507
+ } catch (JSONException e) {
508
+ Log.e(TAG, "send_audio_error", e);
509
+ }
510
+ }
511
+
512
+ private void notifyConnectionState(String state) {
513
+ if (listener != null) {
514
+ listener.onConnectionState(state);
515
+ }
516
+ }
517
+
518
+ private void notifyError(int code, String message) {
519
+ if (listener != null) {
520
+ listener.onError(code, message);
521
+ }
522
+ }
523
+
524
+ private void notifyTranscription(String text, String lang, boolean isFinal) {
525
+ if (listener != null) {
526
+ listener.onTranscription(text, lang, isFinal);
527
+ }
528
+ }
529
+ }