@sbhjt-gr/react-native-webrtc 124.0.0 → 124.0.2

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (362) hide show
  1. package/.clang-format +11 -11
  2. package/.eslintignore +6 -6
  3. package/.nvmrc +1 -1
  4. package/ISSUE_TEMPLATE.md +40 -40
  5. package/LICENSE +22 -22
  6. package/README.md +103 -103
  7. package/android/build.gradle +37 -37
  8. package/android/consumer-rules.pro +3 -3
  9. package/android/src/main/AndroidManifest.xml +11 -11
  10. package/android/src/main/java/com/oney/WebRTCModule/AbstractVideoCaptureController.java +113 -113
  11. package/android/src/main/java/com/oney/WebRTCModule/CameraCaptureController.java +338 -338
  12. package/android/src/main/java/com/oney/WebRTCModule/CameraEventsHandler.java +49 -49
  13. package/android/src/main/java/com/oney/WebRTCModule/DataChannelWrapper.java +99 -99
  14. package/android/src/main/java/com/oney/WebRTCModule/DataPacketCryptorManager.java +62 -62
  15. package/android/src/main/java/com/oney/WebRTCModule/DisplayUtils.java +16 -16
  16. package/android/src/main/java/com/oney/WebRTCModule/EglUtils.java +66 -66
  17. package/android/src/main/java/com/oney/WebRTCModule/GetUserMediaImpl.java +539 -539
  18. package/android/src/main/java/com/oney/WebRTCModule/LibraryLoader.java +21 -21
  19. package/android/src/main/java/com/oney/WebRTCModule/MediaProjectionNotification.java +70 -70
  20. package/android/src/main/java/com/oney/WebRTCModule/MediaProjectionService.java +82 -82
  21. package/android/src/main/java/com/oney/WebRTCModule/PeerConnectionObserver.java +588 -588
  22. package/android/src/main/java/com/oney/WebRTCModule/RTCCryptoManager.java +493 -493
  23. package/android/src/main/java/com/oney/WebRTCModule/RTCVideoViewManager.java +98 -98
  24. package/android/src/main/java/com/oney/WebRTCModule/ReactBridgeUtil.java +35 -35
  25. package/android/src/main/java/com/oney/WebRTCModule/ScreenCaptureController.java +94 -94
  26. package/android/src/main/java/com/oney/WebRTCModule/SerializeUtils.java +342 -342
  27. package/android/src/main/java/com/oney/WebRTCModule/StringUtils.java +100 -100
  28. package/android/src/main/java/com/oney/WebRTCModule/ThreadUtils.java +41 -41
  29. package/android/src/main/java/com/oney/WebRTCModule/TrackCapturerEventsEmitter.java +34 -34
  30. package/android/src/main/java/com/oney/WebRTCModule/VideoTrackAdapter.java +137 -137
  31. package/android/src/main/java/com/oney/WebRTCModule/WebRTCModule.java +1643 -1643
  32. package/android/src/main/java/com/oney/WebRTCModule/WebRTCModuleOptions.java +33 -33
  33. package/android/src/main/java/com/oney/WebRTCModule/WebRTCModulePackage.java +21 -21
  34. package/android/src/main/java/com/oney/WebRTCModule/WebRTCView.java +583 -583
  35. package/android/src/main/java/com/oney/WebRTCModule/palabra/PalabraClient.java +464 -464
  36. package/android/src/main/java/com/oney/WebRTCModule/palabra/PalabraConfig.java +17 -17
  37. package/android/src/main/java/com/oney/WebRTCModule/palabra/PalabraListener.java +7 -7
  38. package/android/src/main/java/com/oney/WebRTCModule/videoEffects/ProcessorProvider.java +38 -38
  39. package/android/src/main/java/com/oney/WebRTCModule/videoEffects/VideoEffectProcessor.java +59 -59
  40. package/android/src/main/java/com/oney/WebRTCModule/videoEffects/VideoFrameProcessor.java +19 -19
  41. package/android/src/main/java/com/oney/WebRTCModule/videoEffects/VideoFrameProcessorFactoryInterface.java +12 -12
  42. package/android/src/main/java/com/oney/WebRTCModule/webrtcutils/H264AndSoftwareVideoDecoderFactory.java +73 -73
  43. package/android/src/main/java/com/oney/WebRTCModule/webrtcutils/H264AndSoftwareVideoEncoderFactory.java +73 -73
  44. package/android/src/main/java/com/oney/WebRTCModule/webrtcutils/SoftwareVideoDecoderFactoryProxy.java +36 -36
  45. package/android/src/main/java/com/oney/WebRTCModule/webrtcutils/SoftwareVideoEncoderFactoryProxy.java +36 -36
  46. package/android/src/main/java/org/webrtc/Camera1Helper.java +54 -54
  47. package/android/src/main/java/org/webrtc/Camera2Helper.java +52 -52
  48. package/android/src/main/res/values/strings.xml +5 -5
  49. package/android/src/main/res/values/styles.xml +8 -8
  50. package/ios/RCTWebRTC/CaptureController.h +18 -18
  51. package/ios/RCTWebRTC/CaptureController.m +28 -28
  52. package/ios/RCTWebRTC/CapturerEventsDelegate.h +12 -12
  53. package/ios/RCTWebRTC/DataChannelWrapper.h +27 -27
  54. package/ios/RCTWebRTC/DataChannelWrapper.m +42 -42
  55. package/ios/RCTWebRTC/I420Converter.h +22 -22
  56. package/ios/RCTWebRTC/I420Converter.m +164 -164
  57. package/ios/RCTWebRTC/PIPController.h +24 -24
  58. package/ios/RCTWebRTC/PIPController.m +234 -234
  59. package/ios/RCTWebRTC/PalabraAudioSink.h +13 -13
  60. package/ios/RCTWebRTC/PalabraAudioSink.m +18 -18
  61. package/ios/RCTWebRTC/PalabraClient.h +36 -36
  62. package/ios/RCTWebRTC/PalabraClient.m +584 -584
  63. package/ios/RCTWebRTC/RCTConvert+WebRTC.h +16 -16
  64. package/ios/RCTWebRTC/RCTConvert+WebRTC.m +206 -206
  65. package/ios/RCTWebRTC/RTCMediaStreamTrack+React.h +10 -10
  66. package/ios/RCTWebRTC/RTCMediaStreamTrack+React.m +16 -16
  67. package/ios/RCTWebRTC/RTCVideoViewManager.h +29 -29
  68. package/ios/RCTWebRTC/RTCVideoViewManager.m +411 -411
  69. package/ios/RCTWebRTC/SampleBufferVideoCallView.h +12 -12
  70. package/ios/RCTWebRTC/SampleBufferVideoCallView.m +178 -178
  71. package/ios/RCTWebRTC/ScreenCaptureController.h +20 -20
  72. package/ios/RCTWebRTC/ScreenCaptureController.m +82 -82
  73. package/ios/RCTWebRTC/ScreenCapturePickerViewManager.h +7 -7
  74. package/ios/RCTWebRTC/ScreenCapturePickerViewManager.m +59 -59
  75. package/ios/RCTWebRTC/ScreenCapturer.h +19 -19
  76. package/ios/RCTWebRTC/ScreenCapturer.m +263 -263
  77. package/ios/RCTWebRTC/SerializeUtils.h +28 -28
  78. package/ios/RCTWebRTC/SerializeUtils.m +314 -314
  79. package/ios/RCTWebRTC/SocketConnection.h +13 -13
  80. package/ios/RCTWebRTC/SocketConnection.m +137 -137
  81. package/ios/RCTWebRTC/TrackCapturerEventsEmitter.h +14 -14
  82. package/ios/RCTWebRTC/TrackCapturerEventsEmitter.m +36 -36
  83. package/ios/RCTWebRTC/VideoCaptureController.h +21 -21
  84. package/ios/RCTWebRTC/VideoCaptureController.m +328 -328
  85. package/ios/RCTWebRTC/WLVAudioDevice.h +12 -0
  86. package/ios/RCTWebRTC/WLVAudioDevice.m +137 -0
  87. package/ios/RCTWebRTC/WebRTCModule+Palabra.h +4 -4
  88. package/ios/RCTWebRTC/WebRTCModule+Palabra.m +83 -83
  89. package/ios/RCTWebRTC/WebRTCModule+Permissions.m +75 -75
  90. package/ios/RCTWebRTC/WebRTCModule+RTCAudioSession.m +20 -20
  91. package/ios/RCTWebRTC/WebRTCModule+RTCDataChannel.h +14 -14
  92. package/ios/RCTWebRTC/WebRTCModule+RTCDataChannel.m +165 -165
  93. package/ios/RCTWebRTC/WebRTCModule+RTCFrameCryptor.m +611 -611
  94. package/ios/RCTWebRTC/WebRTCModule+RTCMediaStream.h +13 -13
  95. package/ios/RCTWebRTC/WebRTCModule+RTCMediaStream.m +728 -533
  96. package/ios/RCTWebRTC/WebRTCModule+RTCPeerConnection.h +24 -24
  97. package/ios/RCTWebRTC/WebRTCModule+RTCPeerConnection.m +1004 -1004
  98. package/ios/RCTWebRTC/WebRTCModule+Transceivers.m +267 -267
  99. package/ios/RCTWebRTC/WebRTCModule+VideoTrackAdapter.h +12 -12
  100. package/ios/RCTWebRTC/WebRTCModule+VideoTrackAdapter.m +166 -166
  101. package/ios/RCTWebRTC/WebRTCModule.h +58 -51
  102. package/ios/RCTWebRTC/WebRTCModule.m +169 -151
  103. package/ios/RCTWebRTC/WebRTCModuleOptions.h +24 -24
  104. package/ios/RCTWebRTC/WebRTCModuleOptions.m +31 -31
  105. package/ios/RCTWebRTC/videoEffects/ProcessorProvider.h +9 -9
  106. package/ios/RCTWebRTC/videoEffects/ProcessorProvider.m +23 -23
  107. package/ios/RCTWebRTC/videoEffects/VideoEffectProcessor.h +13 -13
  108. package/ios/RCTWebRTC/videoEffects/VideoEffectProcessor.m +23 -23
  109. package/ios/RCTWebRTC/videoEffects/VideoFrameProcessor.h +8 -8
  110. package/ios/RCTWebRTC.xcodeproj/project.pbxproj +404 -404
  111. package/ios/RCTWebRTC.xcworkspace/contents.xcworkspacedata +10 -10
  112. package/lib/commonjs/Constraints.js.map +1 -1
  113. package/lib/commonjs/EventEmitter.js.map +1 -1
  114. package/lib/commonjs/Logger.js.map +1 -1
  115. package/lib/commonjs/MediaDevices.js +17 -17
  116. package/lib/commonjs/MediaDevices.js.map +1 -1
  117. package/lib/commonjs/MediaStream.js +19 -19
  118. package/lib/commonjs/MediaStream.js.map +1 -1
  119. package/lib/commonjs/MediaStreamError.js.map +1 -1
  120. package/lib/commonjs/MediaStreamErrorEvent.js.map +1 -1
  121. package/lib/commonjs/MediaStreamTrack.js +28 -28
  122. package/lib/commonjs/MediaStreamTrack.js.map +1 -1
  123. package/lib/commonjs/MediaStreamTrackEvent.js +6 -6
  124. package/lib/commonjs/MediaStreamTrackEvent.js.map +1 -1
  125. package/lib/commonjs/MessageEvent.js +7 -7
  126. package/lib/commonjs/MessageEvent.js.map +1 -1
  127. package/lib/commonjs/Permissions.js +28 -28
  128. package/lib/commonjs/Permissions.js.map +1 -1
  129. package/lib/commonjs/RTCAudioSession.js +4 -4
  130. package/lib/commonjs/RTCAudioSession.js.map +1 -1
  131. package/lib/commonjs/RTCDataChannel.js +2 -2
  132. package/lib/commonjs/RTCDataChannel.js.map +1 -1
  133. package/lib/commonjs/RTCDataChannelEvent.js +6 -6
  134. package/lib/commonjs/RTCDataChannelEvent.js.map +1 -1
  135. package/lib/commonjs/RTCDataPacketCryptor.js.map +1 -1
  136. package/lib/commonjs/RTCDataPacketCryptorFactory.js.map +1 -1
  137. package/lib/commonjs/RTCErrorEvent.js +3 -3
  138. package/lib/commonjs/RTCErrorEvent.js.map +1 -1
  139. package/lib/commonjs/RTCFrameCryptor.js +8 -8
  140. package/lib/commonjs/RTCFrameCryptor.js.map +1 -1
  141. package/lib/commonjs/RTCFrameCryptorFactory.js.map +1 -1
  142. package/lib/commonjs/RTCIceCandidate.js.map +1 -1
  143. package/lib/commonjs/RTCIceCandidateEvent.js +7 -7
  144. package/lib/commonjs/RTCIceCandidateEvent.js.map +1 -1
  145. package/lib/commonjs/RTCKeyProvider.js.map +1 -1
  146. package/lib/commonjs/RTCPIPView.js +2 -2
  147. package/lib/commonjs/RTCPIPView.js.map +1 -1
  148. package/lib/commonjs/RTCPIPView.web.js.map +1 -1
  149. package/lib/commonjs/RTCPeerConnection.js +36 -36
  150. package/lib/commonjs/RTCPeerConnection.js.map +1 -1
  151. package/lib/commonjs/RTCRtcpParameters.js.map +1 -1
  152. package/lib/commonjs/RTCRtpCapabilities.js +2 -2
  153. package/lib/commonjs/RTCRtpCapabilities.js.map +1 -1
  154. package/lib/commonjs/RTCRtpCodecCapability.js.map +1 -1
  155. package/lib/commonjs/RTCRtpCodecParameters.js.map +1 -1
  156. package/lib/commonjs/RTCRtpEncodingParameters.js.map +1 -1
  157. package/lib/commonjs/RTCRtpHeaderExtension.js.map +1 -1
  158. package/lib/commonjs/RTCRtpParameters.js.map +1 -1
  159. package/lib/commonjs/RTCRtpReceiveParameters.js.map +1 -1
  160. package/lib/commonjs/RTCRtpReceiver.js +7 -7
  161. package/lib/commonjs/RTCRtpReceiver.js.map +1 -1
  162. package/lib/commonjs/RTCRtpSendParameters.js +3 -3
  163. package/lib/commonjs/RTCRtpSendParameters.js.map +1 -1
  164. package/lib/commonjs/RTCRtpSender.js +7 -7
  165. package/lib/commonjs/RTCRtpSender.js.map +1 -1
  166. package/lib/commonjs/RTCRtpTransceiver.js.map +1 -1
  167. package/lib/commonjs/RTCSessionDescription.js.map +1 -1
  168. package/lib/commonjs/RTCTrackEvent.js +6 -6
  169. package/lib/commonjs/RTCTrackEvent.js.map +1 -1
  170. package/lib/commonjs/RTCUtil.js +28 -28
  171. package/lib/commonjs/RTCUtil.js.map +1 -1
  172. package/lib/commonjs/RTCView.js +5 -5
  173. package/lib/commonjs/RTCView.js.map +1 -1
  174. package/lib/commonjs/RTCView.web.js.map +1 -1
  175. package/lib/commonjs/ScreenCapturePickerView.js.map +1 -1
  176. package/lib/commonjs/ScreenCapturePickerView.web.js.map +1 -1
  177. package/lib/commonjs/getDisplayMedia.js.map +1 -1
  178. package/lib/commonjs/getUserMedia.js.map +1 -1
  179. package/lib/commonjs/index.js.map +1 -1
  180. package/lib/commonjs/index.web.js.map +1 -1
  181. package/lib/commonjs/webStream.js.map +1 -1
  182. package/lib/module/Constraints.js.map +1 -1
  183. package/lib/module/EventEmitter.js.map +1 -1
  184. package/lib/module/Logger.js.map +1 -1
  185. package/lib/module/MediaDevices.js +17 -17
  186. package/lib/module/MediaDevices.js.map +1 -1
  187. package/lib/module/MediaStream.js +19 -19
  188. package/lib/module/MediaStream.js.map +1 -1
  189. package/lib/module/MediaStreamError.js.map +1 -1
  190. package/lib/module/MediaStreamErrorEvent.js.map +1 -1
  191. package/lib/module/MediaStreamTrack.js +28 -28
  192. package/lib/module/MediaStreamTrack.js.map +1 -1
  193. package/lib/module/MediaStreamTrackEvent.js +6 -6
  194. package/lib/module/MediaStreamTrackEvent.js.map +1 -1
  195. package/lib/module/MessageEvent.js +7 -7
  196. package/lib/module/MessageEvent.js.map +1 -1
  197. package/lib/module/Permissions.js +28 -28
  198. package/lib/module/Permissions.js.map +1 -1
  199. package/lib/module/RTCAudioSession.js +4 -4
  200. package/lib/module/RTCAudioSession.js.map +1 -1
  201. package/lib/module/RTCDataChannel.js +2 -2
  202. package/lib/module/RTCDataChannel.js.map +1 -1
  203. package/lib/module/RTCDataChannelEvent.js +6 -6
  204. package/lib/module/RTCDataChannelEvent.js.map +1 -1
  205. package/lib/module/RTCDataPacketCryptor.js.map +1 -1
  206. package/lib/module/RTCDataPacketCryptorFactory.js.map +1 -1
  207. package/lib/module/RTCErrorEvent.js +3 -3
  208. package/lib/module/RTCErrorEvent.js.map +1 -1
  209. package/lib/module/RTCFrameCryptor.js +8 -8
  210. package/lib/module/RTCFrameCryptor.js.map +1 -1
  211. package/lib/module/RTCFrameCryptorFactory.js.map +1 -1
  212. package/lib/module/RTCIceCandidate.js.map +1 -1
  213. package/lib/module/RTCIceCandidateEvent.js +7 -7
  214. package/lib/module/RTCIceCandidateEvent.js.map +1 -1
  215. package/lib/module/RTCKeyProvider.js.map +1 -1
  216. package/lib/module/RTCPIPView.js +2 -2
  217. package/lib/module/RTCPIPView.js.map +1 -1
  218. package/lib/module/RTCPIPView.web.js.map +1 -1
  219. package/lib/module/RTCPeerConnection.js +36 -36
  220. package/lib/module/RTCPeerConnection.js.map +1 -1
  221. package/lib/module/RTCRtcpParameters.js.map +1 -1
  222. package/lib/module/RTCRtpCapabilities.js +2 -2
  223. package/lib/module/RTCRtpCapabilities.js.map +1 -1
  224. package/lib/module/RTCRtpCodecCapability.js.map +1 -1
  225. package/lib/module/RTCRtpCodecParameters.js.map +1 -1
  226. package/lib/module/RTCRtpEncodingParameters.js.map +1 -1
  227. package/lib/module/RTCRtpHeaderExtension.js.map +1 -1
  228. package/lib/module/RTCRtpParameters.js.map +1 -1
  229. package/lib/module/RTCRtpReceiveParameters.js.map +1 -1
  230. package/lib/module/RTCRtpReceiver.js +7 -7
  231. package/lib/module/RTCRtpReceiver.js.map +1 -1
  232. package/lib/module/RTCRtpSendParameters.js +3 -3
  233. package/lib/module/RTCRtpSendParameters.js.map +1 -1
  234. package/lib/module/RTCRtpSender.js +7 -7
  235. package/lib/module/RTCRtpSender.js.map +1 -1
  236. package/lib/module/RTCRtpTransceiver.js.map +1 -1
  237. package/lib/module/RTCSessionDescription.js.map +1 -1
  238. package/lib/module/RTCTrackEvent.js +6 -6
  239. package/lib/module/RTCTrackEvent.js.map +1 -1
  240. package/lib/module/RTCUtil.js +28 -28
  241. package/lib/module/RTCUtil.js.map +1 -1
  242. package/lib/module/RTCView.js +5 -5
  243. package/lib/module/RTCView.js.map +1 -1
  244. package/lib/module/RTCView.web.js.map +1 -1
  245. package/lib/module/ScreenCapturePickerView.js.map +1 -1
  246. package/lib/module/ScreenCapturePickerView.web.js.map +1 -1
  247. package/lib/module/getDisplayMedia.js.map +1 -1
  248. package/lib/module/getUserMedia.js.map +1 -1
  249. package/lib/module/index.js.map +1 -1
  250. package/lib/module/index.web.js.map +1 -1
  251. package/lib/module/webStream.js.map +1 -1
  252. package/lib/typescript/Constraints.d.ts +19 -19
  253. package/lib/typescript/EventEmitter.d.ts +6 -6
  254. package/lib/typescript/Logger.d.ts +13 -13
  255. package/lib/typescript/MediaDevices.d.ts +30 -30
  256. package/lib/typescript/MediaStream.d.ts +48 -48
  257. package/lib/typescript/MediaStreamError.d.ts +6 -6
  258. package/lib/typescript/MediaStreamErrorEvent.d.ts +6 -6
  259. package/lib/typescript/MediaStreamTrack.d.ts +101 -101
  260. package/lib/typescript/MediaStreamTrackEvent.d.ts +19 -19
  261. package/lib/typescript/MessageEvent.d.ts +20 -20
  262. package/lib/typescript/Permissions.d.ts +55 -55
  263. package/lib/typescript/RTCAudioSession.d.ts +10 -10
  264. package/lib/typescript/RTCDataChannel.d.ts +43 -43
  265. package/lib/typescript/RTCDataChannelEvent.d.ts +19 -19
  266. package/lib/typescript/RTCDataPacketCryptor.d.ts +12 -12
  267. package/lib/typescript/RTCDataPacketCryptorFactory.d.ts +6 -6
  268. package/lib/typescript/RTCErrorEvent.d.ts +12 -12
  269. package/lib/typescript/RTCFrameCryptor.d.ts +47 -47
  270. package/lib/typescript/RTCFrameCryptorFactory.d.ts +21 -21
  271. package/lib/typescript/RTCIceCandidate.d.ts +17 -17
  272. package/lib/typescript/RTCIceCandidateEvent.d.ts +20 -20
  273. package/lib/typescript/RTCKeyProvider.d.ts +21 -21
  274. package/lib/typescript/RTCPIPView.d.ts +15 -15
  275. package/lib/typescript/RTCPIPView.web.d.ts +13 -13
  276. package/lib/typescript/RTCPeerConnection.d.ts +117 -117
  277. package/lib/typescript/RTCRtcpParameters.d.ts +10 -10
  278. package/lib/typescript/RTCRtpCapabilities.d.ts +9 -9
  279. package/lib/typescript/RTCRtpCodecCapability.d.ts +7 -7
  280. package/lib/typescript/RTCRtpCodecParameters.d.ts +16 -16
  281. package/lib/typescript/RTCRtpEncodingParameters.d.ts +23 -23
  282. package/lib/typescript/RTCRtpHeaderExtension.d.ts +12 -12
  283. package/lib/typescript/RTCRtpParameters.d.ts +19 -19
  284. package/lib/typescript/RTCRtpReceiveParameters.d.ts +4 -4
  285. package/lib/typescript/RTCRtpReceiver.d.ts +21 -21
  286. package/lib/typescript/RTCRtpSendParameters.d.ts +20 -20
  287. package/lib/typescript/RTCRtpSender.d.ts +22 -22
  288. package/lib/typescript/RTCRtpTransceiver.d.ts +31 -31
  289. package/lib/typescript/RTCSessionDescription.d.ts +12 -12
  290. package/lib/typescript/RTCTrackEvent.d.ts +29 -29
  291. package/lib/typescript/RTCUtil.d.ts +37 -37
  292. package/lib/typescript/RTCView.d.ts +117 -117
  293. package/lib/typescript/RTCView.web.d.ts +25 -25
  294. package/lib/typescript/ScreenCapturePickerView.d.ts +2 -2
  295. package/lib/typescript/ScreenCapturePickerView.web.d.ts +1 -1
  296. package/lib/typescript/getDisplayMedia.d.ts +2 -2
  297. package/lib/typescript/getUserMedia.d.ts +7 -7
  298. package/lib/typescript/index.d.ts +22 -22
  299. package/lib/typescript/index.web.d.ts +101 -101
  300. package/lib/typescript/webStream.d.ts +3 -3
  301. package/livekit-react-native-webrtc.podspec +29 -29
  302. package/macos/RCTWebRTC.xcodeproj/project.pbxproj +324 -324
  303. package/macos/RCTWebRTC.xcodeproj/project.xcworkspace/contents.xcworkspacedata +7 -7
  304. package/macos/RCTWebRTC.xcodeproj/project.xcworkspace/xcshareddata/IDEWorkspaceChecks.plist +8 -8
  305. package/metro.config.js +7 -7
  306. package/metro.config.macos.js +14 -14
  307. package/package.json +66 -66
  308. package/react-native.config.js +11 -11
  309. package/src/.eslintrc.cjs +67 -67
  310. package/src/Constraints.ts +20 -20
  311. package/src/EventEmitter.ts +65 -65
  312. package/src/Logger.ts +49 -49
  313. package/src/MediaDevices.ts +53 -53
  314. package/src/MediaStream.ts +161 -161
  315. package/src/MediaStreamError.ts +12 -12
  316. package/src/MediaStreamErrorEvent.ts +11 -11
  317. package/src/MediaStreamTrack.ts +282 -282
  318. package/src/MediaStreamTrackEvent.ts +25 -25
  319. package/src/MessageEvent.ts +26 -26
  320. package/src/Permissions.ts +133 -133
  321. package/src/RTCAudioSession.ts +25 -25
  322. package/src/RTCDataChannel.ts +190 -190
  323. package/src/RTCDataChannelEvent.ts +28 -28
  324. package/src/RTCDataPacketCryptor.ts +90 -90
  325. package/src/RTCDataPacketCryptorFactory.ts +24 -24
  326. package/src/RTCErrorEvent.ts +20 -20
  327. package/src/RTCFrameCryptor.ts +162 -162
  328. package/src/RTCFrameCryptorFactory.ts +101 -101
  329. package/src/RTCIceCandidate.ts +29 -29
  330. package/src/RTCIceCandidateEvent.ts +26 -26
  331. package/src/RTCKeyProvider.ts +117 -117
  332. package/src/RTCPIPView.tsx +46 -46
  333. package/src/RTCPIPView.web.tsx +18 -18
  334. package/src/RTCPeerConnection.ts +832 -832
  335. package/src/RTCRtcpParameters.ts +23 -23
  336. package/src/RTCRtpCapabilities.ts +16 -16
  337. package/src/RTCRtpCodecCapability.ts +12 -12
  338. package/src/RTCRtpCodecParameters.ts +44 -44
  339. package/src/RTCRtpEncodingParameters.ts +90 -90
  340. package/src/RTCRtpHeaderExtension.ts +27 -27
  341. package/src/RTCRtpParameters.ts +37 -37
  342. package/src/RTCRtpReceiveParameters.ts +7 -7
  343. package/src/RTCRtpReceiver.ts +60 -60
  344. package/src/RTCRtpSendParameters.ts +63 -63
  345. package/src/RTCRtpSender.ts +78 -78
  346. package/src/RTCRtpTransceiver.ts +107 -107
  347. package/src/RTCSessionDescription.ts +30 -30
  348. package/src/RTCTrackEvent.ts +42 -42
  349. package/src/RTCUtil.ts +211 -211
  350. package/src/RTCView.ts +122 -122
  351. package/src/RTCView.web.tsx +80 -80
  352. package/src/ScreenCapturePickerView.ts +4 -4
  353. package/src/ScreenCapturePickerView.web.tsx +3 -3
  354. package/src/getDisplayMedia.ts +30 -30
  355. package/src/getUserMedia.ts +111 -111
  356. package/src/index.ts +107 -107
  357. package/src/index.web.ts +191 -191
  358. package/src/webStream.ts +31 -31
  359. package/tools/format.sh +6 -6
  360. package/tools/release.sh +45 -45
  361. package/tsconfig.json +17 -17
  362. package/.claude/settings.local.json +0 -9
@@ -1,464 +1,464 @@
1
- package com.oney.WebRTCModule.palabra;
2
-
3
- import android.content.Context;
4
- import android.media.AudioFormat;
5
- import android.media.AudioManager;
6
- import android.media.AudioTrack;
7
- import android.os.Handler;
8
- import android.os.Looper;
9
- import android.util.Base64;
10
- import android.util.Log;
11
-
12
- import org.json.JSONArray;
13
- import org.json.JSONException;
14
- import org.json.JSONObject;
15
- import org.webrtc.AudioTrackSink;
16
-
17
- import java.io.BufferedReader;
18
- import java.io.ByteArrayOutputStream;
19
- import java.io.IOException;
20
- import java.io.InputStreamReader;
21
- import java.io.OutputStream;
22
- import java.net.HttpURLConnection;
23
- import java.net.URL;
24
- import java.nio.ByteBuffer;
25
- import java.nio.ByteOrder;
26
- import java.nio.charset.StandardCharsets;
27
- import java.util.concurrent.ExecutorService;
28
- import java.util.concurrent.Executors;
29
- import java.util.concurrent.TimeUnit;
30
- import java.util.concurrent.atomic.AtomicBoolean;
31
-
32
- import okhttp3.OkHttpClient;
33
- import okhttp3.Request;
34
- import okhttp3.Response;
35
- import okhttp3.WebSocket;
36
- import okhttp3.WebSocketListener;
37
-
38
- public class PalabraClient implements AudioTrackSink {
39
- private static final String TAG = "PalabraClient";
40
- private static final int SAMPLE_RATE_IN = 16000;
41
- private static final int SAMPLE_RATE_OUT = 24000;
42
- private static final int CHANNELS = 1;
43
- private static final int CHUNK_MS = 320;
44
- private static final int CHUNK_SAMPLES = SAMPLE_RATE_IN * CHUNK_MS / 1000;
45
- private static final int CHUNK_BYTES = CHUNK_SAMPLES * 2;
46
-
47
- private final Context context;
48
- private final PalabraConfig config;
49
- private PalabraListener listener;
50
-
51
- private org.webrtc.AudioTrack remoteTrack;
52
- private OkHttpClient httpClient;
53
- private WebSocket webSocket;
54
-
55
- private AudioTrack audioPlayer;
56
- private final ExecutorService executor = Executors.newSingleThreadExecutor();
57
- private final Handler mainHandler = new Handler(Looper.getMainLooper());
58
-
59
- private String sessionId;
60
- private String wsUrl;
61
- private String publisherToken;
62
-
63
- private AtomicBoolean connected = new AtomicBoolean(false);
64
- private AtomicBoolean translating = new AtomicBoolean(false);
65
-
66
- private ByteArrayOutputStream audioBuffer = new ByteArrayOutputStream();
67
- private final Object bufferLock = new Object();
68
-
69
- public PalabraClient(Context context, PalabraConfig config) {
70
- this.context = context;
71
- this.config = config;
72
- this.httpClient = new OkHttpClient.Builder()
73
- .connectTimeout(30, TimeUnit.SECONDS)
74
- .readTimeout(30, TimeUnit.SECONDS)
75
- .writeTimeout(30, TimeUnit.SECONDS)
76
- .build();
77
- setupAudioPlayer();
78
- }
79
-
80
- public void setListener(PalabraListener listener) {
81
- this.listener = listener;
82
- }
83
-
84
- public boolean isConnected() {
85
- return connected.get();
86
- }
87
-
88
- public boolean isTranslating() {
89
- return translating.get();
90
- }
91
-
92
- private void setupAudioPlayer() {
93
- int channelConfig = AudioFormat.CHANNEL_OUT_MONO;
94
- int audioFormat = AudioFormat.ENCODING_PCM_16BIT;
95
- int bufferSize = AudioTrack.getMinBufferSize(SAMPLE_RATE_OUT, channelConfig, audioFormat) * 2;
96
-
97
- audioPlayer = new AudioTrack(
98
- AudioManager.STREAM_VOICE_CALL,
99
- SAMPLE_RATE_OUT,
100
- channelConfig,
101
- audioFormat,
102
- bufferSize,
103
- AudioTrack.MODE_STREAM
104
- );
105
- }
106
-
107
- public void start(org.webrtc.AudioTrack remoteAudioTrack) {
108
- if (translating.get()) {
109
- return;
110
- }
111
-
112
- this.remoteTrack = remoteAudioTrack;
113
- remoteAudioTrack.setVolume(0);
114
-
115
- notifyConnectionState("connecting");
116
-
117
- executor.execute(() -> {
118
- try {
119
- JSONObject session = createSession();
120
- Log.d(TAG, "session_response: " + session.toString());
121
- JSONObject data = session.getJSONObject("data");
122
- sessionId = data.getString("id");
123
- wsUrl = data.getString("ws_url");
124
- publisherToken = data.getString("publisher");
125
- Log.d(TAG, "ws_url: " + wsUrl);
126
-
127
- mainHandler.post(this::connectWebSocket);
128
- } catch (Exception e) {
129
- Log.e(TAG, "session_create_failed", e);
130
- mainHandler.post(() -> {
131
- if (remoteAudioTrack != null) {
132
- remoteAudioTrack.setVolume(1.0);
133
- }
134
- notifyError(500, e.getMessage());
135
- });
136
- }
137
- });
138
- }
139
-
140
- private JSONObject createSession() throws IOException, JSONException {
141
- URL url = new URL(config.apiUrl + "/session-storage/session");
142
- HttpURLConnection conn = (HttpURLConnection) url.openConnection();
143
- conn.setRequestMethod("POST");
144
- conn.setRequestProperty("ClientId", config.clientId);
145
- conn.setRequestProperty("ClientSecret", config.clientSecret);
146
- conn.setRequestProperty("Content-Type", "application/json");
147
- conn.setDoOutput(true);
148
-
149
- JSONObject body = new JSONObject();
150
- JSONObject bodyData = new JSONObject();
151
- bodyData.put("subscriber_count", 0);
152
- bodyData.put("publisher_can_subscribe", true);
153
- body.put("data", bodyData);
154
-
155
- try (OutputStream os = conn.getOutputStream()) {
156
- os.write(body.toString().getBytes(StandardCharsets.UTF_8));
157
- }
158
-
159
- int responseCode = conn.getResponseCode();
160
- if (responseCode < 200 || responseCode >= 300) {
161
- throw new IOException("session_http_error_" + responseCode);
162
- }
163
-
164
- StringBuilder response = new StringBuilder();
165
- try (BufferedReader br = new BufferedReader(new InputStreamReader(conn.getInputStream()))) {
166
- String line;
167
- while ((line = br.readLine()) != null) {
168
- response.append(line);
169
- }
170
- }
171
-
172
- return new JSONObject(response.toString());
173
- }
174
-
175
- private void connectWebSocket() {
176
- String endpoint = wsUrl + "?token=" + publisherToken;
177
- Log.d(TAG, "connecting_ws: " + endpoint);
178
-
179
- Request request = new Request.Builder()
180
- .url(endpoint)
181
- .build();
182
-
183
- webSocket = httpClient.newWebSocket(request, new WebSocketListener() {
184
- @Override
185
- public void onOpen(WebSocket ws, Response response) {
186
- Log.d(TAG, "ws_open");
187
- connected.set(true);
188
- translating.set(true);
189
-
190
- remoteTrack.addSink(PalabraClient.this);
191
- audioPlayer.play();
192
-
193
- mainHandler.post(() -> notifyConnectionState("connected"));
194
-
195
- mainHandler.postDelayed(() -> sendSetTask(), 500);
196
- }
197
-
198
- @Override
199
- public void onMessage(WebSocket ws, String text) {
200
- handleMessage(text);
201
- }
202
-
203
- @Override
204
- public void onFailure(WebSocket ws, Throwable t, Response response) {
205
- Log.e(TAG, "ws_error", t);
206
- mainHandler.post(() -> {
207
- stop();
208
- notifyError(500, t.getMessage());
209
- });
210
- }
211
-
212
- @Override
213
- public void onClosed(WebSocket ws, int code, String reason) {
214
- Log.d(TAG, "ws_closed: " + code);
215
- mainHandler.post(() -> stop());
216
- }
217
- });
218
- }
219
-
220
- private void sendSetTask() {
221
- if (webSocket == null || !connected.get()) {
222
- return;
223
- }
224
-
225
- try {
226
- JSONObject msg = new JSONObject();
227
- msg.put("message_type", "set_task");
228
-
229
- JSONObject data = new JSONObject();
230
-
231
- JSONObject inputStream = new JSONObject();
232
- inputStream.put("content_type", "audio");
233
- JSONObject source = new JSONObject();
234
- source.put("type", "ws");
235
- source.put("format", "pcm_s16le");
236
- source.put("sample_rate", SAMPLE_RATE_IN);
237
- source.put("channels", CHANNELS);
238
- inputStream.put("source", source);
239
- data.put("input_stream", inputStream);
240
-
241
- JSONObject outputStream = new JSONObject();
242
- outputStream.put("content_type", "audio");
243
- JSONObject target = new JSONObject();
244
- target.put("type", "ws");
245
- target.put("format", "pcm_s16le");
246
- outputStream.put("target", target);
247
- data.put("output_stream", outputStream);
248
-
249
- JSONObject pipeline = new JSONObject();
250
-
251
- JSONObject transcription = new JSONObject();
252
- transcription.put("source_language", config.sourceLang);
253
- pipeline.put("transcription", transcription);
254
-
255
- JSONArray translations = new JSONArray();
256
- JSONObject translation = new JSONObject();
257
- translation.put("target_language", config.targetLang);
258
- JSONObject speechGen = new JSONObject();
259
- speechGen.put("voice_cloning", false);
260
- translation.put("speech_generation", speechGen);
261
- translations.put(translation);
262
- pipeline.put("translations", translations);
263
-
264
- JSONArray allowedTypes = new JSONArray();
265
- allowedTypes.put("partial_transcription");
266
- allowedTypes.put("validated_transcription");
267
- allowedTypes.put("translated_transcription");
268
- pipeline.put("allowed_message_types", allowedTypes);
269
-
270
- data.put("pipeline", pipeline);
271
- msg.put("data", data);
272
-
273
- String payload = msg.toString();
274
- Log.d(TAG, "set_task: " + payload);
275
- webSocket.send(payload);
276
- } catch (JSONException e) {
277
- Log.e(TAG, "set_task_error", e);
278
- }
279
- }
280
-
281
- private void handleMessage(String text) {
282
- try {
283
- JSONObject json = new JSONObject(text);
284
- String type = json.optString("message_type", "");
285
-
286
- if ("output_audio_data".equals(type)) {
287
- JSONObject data = json.getJSONObject("data");
288
- String audioBase64 = data.optString("data", "");
289
- if (!audioBase64.isEmpty()) {
290
- byte[] audioBytes = Base64.decode(audioBase64, Base64.DEFAULT);
291
- if (audioPlayer != null && translating.get()) {
292
- audioPlayer.write(audioBytes, 0, audioBytes.length);
293
- }
294
- }
295
- } else if (type.contains("transcription")) {
296
- JSONObject data = json.getJSONObject("data");
297
- JSONObject transcription = data.optJSONObject("transcription");
298
- if (transcription != null) {
299
- String txt = transcription.optString("text", "");
300
- String lang = transcription.optString("language", "");
301
- boolean isFinal = !"partial_transcription".equals(type);
302
- mainHandler.post(() -> notifyTranscription(txt, lang, isFinal));
303
- }
304
- } else if ("error".equals(type)) {
305
- JSONObject data = json.optJSONObject("data");
306
- String desc = data != null ? data.optString("desc", "unknown") : "unknown";
307
- Log.e(TAG, "palabra_error: " + desc);
308
- mainHandler.post(() -> notifyError(500, desc));
309
- }
310
- } catch (JSONException e) {
311
- Log.e(TAG, "msg_parse_error", e);
312
- }
313
- }
314
-
315
- public void stop() {
316
- if (!translating.getAndSet(false)) {
317
- return;
318
- }
319
-
320
- connected.set(false);
321
-
322
- if (remoteTrack != null) {
323
- try {
324
- remoteTrack.removeSink(this);
325
- remoteTrack.setVolume(1.0);
326
- } catch (Exception e) {
327
- Log.w(TAG, "stop_track_cleanup_error: " + e.getMessage());
328
- }
329
- }
330
-
331
- if (webSocket != null) {
332
- try {
333
- JSONObject endMsg = new JSONObject();
334
- endMsg.put("message_type", "end_task");
335
- endMsg.put("data", new JSONObject().put("force", false));
336
- webSocket.send(endMsg.toString());
337
- } catch (JSONException e) {
338
- Log.e(TAG, "end_task_error", e);
339
- }
340
- try {
341
- webSocket.close(1000, "stop");
342
- } catch (Exception e) {
343
- Log.w(TAG, "websocket_close_error: " + e.getMessage());
344
- }
345
- webSocket = null;
346
- }
347
-
348
- if (audioPlayer != null) {
349
- try {
350
- audioPlayer.stop();
351
- } catch (Exception e) {
352
- Log.w(TAG, "audio_player_stop_error: " + e.getMessage());
353
- }
354
- }
355
-
356
- synchronized (bufferLock) {
357
- audioBuffer.reset();
358
- }
359
-
360
- remoteTrack = null;
361
- notifyConnectionState("disconnected");
362
- }
363
-
364
- @Override
365
- public void onData(ByteBuffer audioData, int bitsPerSample, int sampleRate, int channels, int frames, long timestamp) {
366
- if (!translating.get() || webSocket == null) {
367
- return;
368
- }
369
-
370
- byte[] samples = new byte[audioData.remaining()];
371
- audioData.get(samples);
372
-
373
- byte[] resampled = resample(samples, sampleRate, channels, SAMPLE_RATE_IN, CHANNELS);
374
-
375
- synchronized (bufferLock) {
376
- try {
377
- audioBuffer.write(resampled);
378
-
379
- while (audioBuffer.size() >= CHUNK_BYTES) {
380
- byte[] chunk = new byte[CHUNK_BYTES];
381
- byte[] all = audioBuffer.toByteArray();
382
- System.arraycopy(all, 0, chunk, 0, CHUNK_BYTES);
383
-
384
- audioBuffer.reset();
385
- if (all.length > CHUNK_BYTES) {
386
- audioBuffer.write(all, CHUNK_BYTES, all.length - CHUNK_BYTES);
387
- }
388
-
389
- sendAudioChunk(chunk);
390
- }
391
- } catch (IOException e) {
392
- Log.e(TAG, "buffer_error", e);
393
- }
394
- }
395
- }
396
-
397
- private byte[] resample(byte[] input, int srcRate, int srcChannels, int dstRate, int dstChannels) {
398
- if (srcRate == dstRate && srcChannels == dstChannels) {
399
- return input;
400
- }
401
-
402
- int srcSamples = input.length / (2 * srcChannels);
403
- int dstSamples = (int) ((long) srcSamples * dstRate / srcRate);
404
-
405
- short[] srcData = new short[srcSamples * srcChannels];
406
- ByteBuffer.wrap(input).order(ByteOrder.LITTLE_ENDIAN).asShortBuffer().get(srcData);
407
-
408
- short[] monoSrc = srcData;
409
- if (srcChannels == 2) {
410
- monoSrc = new short[srcSamples];
411
- for (int i = 0; i < srcSamples; i++) {
412
- monoSrc[i] = (short) ((srcData[i * 2] + srcData[i * 2 + 1]) / 2);
413
- }
414
- }
415
-
416
- short[] dstData = new short[dstSamples];
417
- for (int i = 0; i < dstSamples; i++) {
418
- float srcIdx = (float) i * (monoSrc.length - 1) / (dstSamples - 1);
419
- int idx0 = (int) srcIdx;
420
- int idx1 = Math.min(idx0 + 1, monoSrc.length - 1);
421
- float frac = srcIdx - idx0;
422
- dstData[i] = (short) (monoSrc[idx0] * (1 - frac) + monoSrc[idx1] * frac);
423
- }
424
-
425
- byte[] output = new byte[dstSamples * 2];
426
- ByteBuffer.wrap(output).order(ByteOrder.LITTLE_ENDIAN).asShortBuffer().put(dstData);
427
- return output;
428
- }
429
-
430
- private void sendAudioChunk(byte[] chunk) {
431
- if (webSocket == null || !connected.get()) {
432
- return;
433
- }
434
-
435
- try {
436
- JSONObject msg = new JSONObject();
437
- msg.put("message_type", "input_audio_data");
438
- JSONObject data = new JSONObject();
439
- data.put("data", Base64.encodeToString(chunk, Base64.NO_WRAP));
440
- msg.put("data", data);
441
- webSocket.send(msg.toString());
442
- } catch (JSONException e) {
443
- Log.e(TAG, "send_audio_error", e);
444
- }
445
- }
446
-
447
- private void notifyConnectionState(String state) {
448
- if (listener != null) {
449
- listener.onConnectionState(state);
450
- }
451
- }
452
-
453
- private void notifyError(int code, String message) {
454
- if (listener != null) {
455
- listener.onError(code, message);
456
- }
457
- }
458
-
459
- private void notifyTranscription(String text, String lang, boolean isFinal) {
460
- if (listener != null) {
461
- listener.onTranscription(text, lang, isFinal);
462
- }
463
- }
464
- }
1
+ package com.oney.WebRTCModule.palabra;
2
+
3
+ import android.content.Context;
4
+ import android.media.AudioFormat;
5
+ import android.media.AudioManager;
6
+ import android.media.AudioTrack;
7
+ import android.os.Handler;
8
+ import android.os.Looper;
9
+ import android.util.Base64;
10
+ import android.util.Log;
11
+
12
+ import org.json.JSONArray;
13
+ import org.json.JSONException;
14
+ import org.json.JSONObject;
15
+ import org.webrtc.AudioTrackSink;
16
+
17
+ import java.io.BufferedReader;
18
+ import java.io.ByteArrayOutputStream;
19
+ import java.io.IOException;
20
+ import java.io.InputStreamReader;
21
+ import java.io.OutputStream;
22
+ import java.net.HttpURLConnection;
23
+ import java.net.URL;
24
+ import java.nio.ByteBuffer;
25
+ import java.nio.ByteOrder;
26
+ import java.nio.charset.StandardCharsets;
27
+ import java.util.concurrent.ExecutorService;
28
+ import java.util.concurrent.Executors;
29
+ import java.util.concurrent.TimeUnit;
30
+ import java.util.concurrent.atomic.AtomicBoolean;
31
+
32
+ import okhttp3.OkHttpClient;
33
+ import okhttp3.Request;
34
+ import okhttp3.Response;
35
+ import okhttp3.WebSocket;
36
+ import okhttp3.WebSocketListener;
37
+
38
+ public class PalabraClient implements AudioTrackSink {
39
+ private static final String TAG = "PalabraClient";
40
+ private static final int SAMPLE_RATE_IN = 16000;
41
+ private static final int SAMPLE_RATE_OUT = 24000;
42
+ private static final int CHANNELS = 1;
43
+ private static final int CHUNK_MS = 320;
44
+ private static final int CHUNK_SAMPLES = SAMPLE_RATE_IN * CHUNK_MS / 1000;
45
+ private static final int CHUNK_BYTES = CHUNK_SAMPLES * 2;
46
+
47
+ private final Context context;
48
+ private final PalabraConfig config;
49
+ private PalabraListener listener;
50
+
51
+ private org.webrtc.AudioTrack remoteTrack;
52
+ private OkHttpClient httpClient;
53
+ private WebSocket webSocket;
54
+
55
+ private AudioTrack audioPlayer;
56
+ private final ExecutorService executor = Executors.newSingleThreadExecutor();
57
+ private final Handler mainHandler = new Handler(Looper.getMainLooper());
58
+
59
+ private String sessionId;
60
+ private String wsUrl;
61
+ private String publisherToken;
62
+
63
+ private AtomicBoolean connected = new AtomicBoolean(false);
64
+ private AtomicBoolean translating = new AtomicBoolean(false);
65
+
66
+ private ByteArrayOutputStream audioBuffer = new ByteArrayOutputStream();
67
+ private final Object bufferLock = new Object();
68
+
69
+ public PalabraClient(Context context, PalabraConfig config) {
70
+ this.context = context;
71
+ this.config = config;
72
+ this.httpClient = new OkHttpClient.Builder()
73
+ .connectTimeout(30, TimeUnit.SECONDS)
74
+ .readTimeout(30, TimeUnit.SECONDS)
75
+ .writeTimeout(30, TimeUnit.SECONDS)
76
+ .build();
77
+ setupAudioPlayer();
78
+ }
79
+
80
+ public void setListener(PalabraListener listener) {
81
+ this.listener = listener;
82
+ }
83
+
84
+ public boolean isConnected() {
85
+ return connected.get();
86
+ }
87
+
88
+ public boolean isTranslating() {
89
+ return translating.get();
90
+ }
91
+
92
+ private void setupAudioPlayer() {
93
+ int channelConfig = AudioFormat.CHANNEL_OUT_MONO;
94
+ int audioFormat = AudioFormat.ENCODING_PCM_16BIT;
95
+ int bufferSize = AudioTrack.getMinBufferSize(SAMPLE_RATE_OUT, channelConfig, audioFormat) * 2;
96
+
97
+ audioPlayer = new AudioTrack(
98
+ AudioManager.STREAM_VOICE_CALL,
99
+ SAMPLE_RATE_OUT,
100
+ channelConfig,
101
+ audioFormat,
102
+ bufferSize,
103
+ AudioTrack.MODE_STREAM
104
+ );
105
+ }
106
+
107
+ public void start(org.webrtc.AudioTrack remoteAudioTrack) {
108
+ if (translating.get()) {
109
+ return;
110
+ }
111
+
112
+ this.remoteTrack = remoteAudioTrack;
113
+ remoteAudioTrack.setVolume(0);
114
+
115
+ notifyConnectionState("connecting");
116
+
117
+ executor.execute(() -> {
118
+ try {
119
+ JSONObject session = createSession();
120
+ Log.d(TAG, "session_response: " + session.toString());
121
+ JSONObject data = session.getJSONObject("data");
122
+ sessionId = data.getString("id");
123
+ wsUrl = data.getString("ws_url");
124
+ publisherToken = data.getString("publisher");
125
+ Log.d(TAG, "ws_url: " + wsUrl);
126
+
127
+ mainHandler.post(this::connectWebSocket);
128
+ } catch (Exception e) {
129
+ Log.e(TAG, "session_create_failed", e);
130
+ mainHandler.post(() -> {
131
+ if (remoteAudioTrack != null) {
132
+ remoteAudioTrack.setVolume(1.0);
133
+ }
134
+ notifyError(500, e.getMessage());
135
+ });
136
+ }
137
+ });
138
+ }
139
+
140
+ private JSONObject createSession() throws IOException, JSONException {
141
+ URL url = new URL(config.apiUrl + "/session-storage/session");
142
+ HttpURLConnection conn = (HttpURLConnection) url.openConnection();
143
+ conn.setRequestMethod("POST");
144
+ conn.setRequestProperty("ClientId", config.clientId);
145
+ conn.setRequestProperty("ClientSecret", config.clientSecret);
146
+ conn.setRequestProperty("Content-Type", "application/json");
147
+ conn.setDoOutput(true);
148
+
149
+ JSONObject body = new JSONObject();
150
+ JSONObject bodyData = new JSONObject();
151
+ bodyData.put("subscriber_count", 0);
152
+ bodyData.put("publisher_can_subscribe", true);
153
+ body.put("data", bodyData);
154
+
155
+ try (OutputStream os = conn.getOutputStream()) {
156
+ os.write(body.toString().getBytes(StandardCharsets.UTF_8));
157
+ }
158
+
159
+ int responseCode = conn.getResponseCode();
160
+ if (responseCode < 200 || responseCode >= 300) {
161
+ throw new IOException("session_http_error_" + responseCode);
162
+ }
163
+
164
+ StringBuilder response = new StringBuilder();
165
+ try (BufferedReader br = new BufferedReader(new InputStreamReader(conn.getInputStream()))) {
166
+ String line;
167
+ while ((line = br.readLine()) != null) {
168
+ response.append(line);
169
+ }
170
+ }
171
+
172
+ return new JSONObject(response.toString());
173
+ }
174
+
175
+ private void connectWebSocket() {
176
+ String endpoint = wsUrl + "?token=" + publisherToken;
177
+ Log.d(TAG, "connecting_ws: " + endpoint);
178
+
179
+ Request request = new Request.Builder()
180
+ .url(endpoint)
181
+ .build();
182
+
183
+ webSocket = httpClient.newWebSocket(request, new WebSocketListener() {
184
+ @Override
185
+ public void onOpen(WebSocket ws, Response response) {
186
+ Log.d(TAG, "ws_open");
187
+ connected.set(true);
188
+ translating.set(true);
189
+
190
+ remoteTrack.addSink(PalabraClient.this);
191
+ audioPlayer.play();
192
+
193
+ mainHandler.post(() -> notifyConnectionState("connected"));
194
+
195
+ mainHandler.postDelayed(() -> sendSetTask(), 500);
196
+ }
197
+
198
+ @Override
199
+ public void onMessage(WebSocket ws, String text) {
200
+ handleMessage(text);
201
+ }
202
+
203
+ @Override
204
+ public void onFailure(WebSocket ws, Throwable t, Response response) {
205
+ Log.e(TAG, "ws_error", t);
206
+ mainHandler.post(() -> {
207
+ stop();
208
+ notifyError(500, t.getMessage());
209
+ });
210
+ }
211
+
212
+ @Override
213
+ public void onClosed(WebSocket ws, int code, String reason) {
214
+ Log.d(TAG, "ws_closed: " + code);
215
+ mainHandler.post(() -> stop());
216
+ }
217
+ });
218
+ }
219
+
220
+ private void sendSetTask() {
221
+ if (webSocket == null || !connected.get()) {
222
+ return;
223
+ }
224
+
225
+ try {
226
+ JSONObject msg = new JSONObject();
227
+ msg.put("message_type", "set_task");
228
+
229
+ JSONObject data = new JSONObject();
230
+
231
+ JSONObject inputStream = new JSONObject();
232
+ inputStream.put("content_type", "audio");
233
+ JSONObject source = new JSONObject();
234
+ source.put("type", "ws");
235
+ source.put("format", "pcm_s16le");
236
+ source.put("sample_rate", SAMPLE_RATE_IN);
237
+ source.put("channels", CHANNELS);
238
+ inputStream.put("source", source);
239
+ data.put("input_stream", inputStream);
240
+
241
+ JSONObject outputStream = new JSONObject();
242
+ outputStream.put("content_type", "audio");
243
+ JSONObject target = new JSONObject();
244
+ target.put("type", "ws");
245
+ target.put("format", "pcm_s16le");
246
+ outputStream.put("target", target);
247
+ data.put("output_stream", outputStream);
248
+
249
+ JSONObject pipeline = new JSONObject();
250
+
251
+ JSONObject transcription = new JSONObject();
252
+ transcription.put("source_language", config.sourceLang);
253
+ pipeline.put("transcription", transcription);
254
+
255
+ JSONArray translations = new JSONArray();
256
+ JSONObject translation = new JSONObject();
257
+ translation.put("target_language", config.targetLang);
258
+ JSONObject speechGen = new JSONObject();
259
+ speechGen.put("voice_cloning", false);
260
+ translation.put("speech_generation", speechGen);
261
+ translations.put(translation);
262
+ pipeline.put("translations", translations);
263
+
264
+ JSONArray allowedTypes = new JSONArray();
265
+ allowedTypes.put("partial_transcription");
266
+ allowedTypes.put("validated_transcription");
267
+ allowedTypes.put("translated_transcription");
268
+ pipeline.put("allowed_message_types", allowedTypes);
269
+
270
+ data.put("pipeline", pipeline);
271
+ msg.put("data", data);
272
+
273
+ String payload = msg.toString();
274
+ Log.d(TAG, "set_task: " + payload);
275
+ webSocket.send(payload);
276
+ } catch (JSONException e) {
277
+ Log.e(TAG, "set_task_error", e);
278
+ }
279
+ }
280
+
281
+ private void handleMessage(String text) {
282
+ try {
283
+ JSONObject json = new JSONObject(text);
284
+ String type = json.optString("message_type", "");
285
+
286
+ if ("output_audio_data".equals(type)) {
287
+ JSONObject data = json.getJSONObject("data");
288
+ String audioBase64 = data.optString("data", "");
289
+ if (!audioBase64.isEmpty()) {
290
+ byte[] audioBytes = Base64.decode(audioBase64, Base64.DEFAULT);
291
+ if (audioPlayer != null && translating.get()) {
292
+ audioPlayer.write(audioBytes, 0, audioBytes.length);
293
+ }
294
+ }
295
+ } else if (type.contains("transcription")) {
296
+ JSONObject data = json.getJSONObject("data");
297
+ JSONObject transcription = data.optJSONObject("transcription");
298
+ if (transcription != null) {
299
+ String txt = transcription.optString("text", "");
300
+ String lang = transcription.optString("language", "");
301
+ boolean isFinal = !"partial_transcription".equals(type);
302
+ mainHandler.post(() -> notifyTranscription(txt, lang, isFinal));
303
+ }
304
+ } else if ("error".equals(type)) {
305
+ JSONObject data = json.optJSONObject("data");
306
+ String desc = data != null ? data.optString("desc", "unknown") : "unknown";
307
+ Log.e(TAG, "palabra_error: " + desc);
308
+ mainHandler.post(() -> notifyError(500, desc));
309
+ }
310
+ } catch (JSONException e) {
311
+ Log.e(TAG, "msg_parse_error", e);
312
+ }
313
+ }
314
+
315
+ public void stop() {
316
+ if (!translating.getAndSet(false)) {
317
+ return;
318
+ }
319
+
320
+ connected.set(false);
321
+
322
+ if (remoteTrack != null) {
323
+ try {
324
+ remoteTrack.removeSink(this);
325
+ remoteTrack.setVolume(1.0);
326
+ } catch (Exception e) {
327
+ Log.w(TAG, "stop_track_cleanup_error: " + e.getMessage());
328
+ }
329
+ }
330
+
331
+ if (webSocket != null) {
332
+ try {
333
+ JSONObject endMsg = new JSONObject();
334
+ endMsg.put("message_type", "end_task");
335
+ endMsg.put("data", new JSONObject().put("force", false));
336
+ webSocket.send(endMsg.toString());
337
+ } catch (JSONException e) {
338
+ Log.e(TAG, "end_task_error", e);
339
+ }
340
+ try {
341
+ webSocket.close(1000, "stop");
342
+ } catch (Exception e) {
343
+ Log.w(TAG, "websocket_close_error: " + e.getMessage());
344
+ }
345
+ webSocket = null;
346
+ }
347
+
348
+ if (audioPlayer != null) {
349
+ try {
350
+ audioPlayer.stop();
351
+ } catch (Exception e) {
352
+ Log.w(TAG, "audio_player_stop_error: " + e.getMessage());
353
+ }
354
+ }
355
+
356
+ synchronized (bufferLock) {
357
+ audioBuffer.reset();
358
+ }
359
+
360
+ remoteTrack = null;
361
+ notifyConnectionState("disconnected");
362
+ }
363
+
364
+ @Override
365
+ public void onData(ByteBuffer audioData, int bitsPerSample, int sampleRate, int channels, int frames, long timestamp) {
366
+ if (!translating.get() || webSocket == null) {
367
+ return;
368
+ }
369
+
370
+ byte[] samples = new byte[audioData.remaining()];
371
+ audioData.get(samples);
372
+
373
+ byte[] resampled = resample(samples, sampleRate, channels, SAMPLE_RATE_IN, CHANNELS);
374
+
375
+ synchronized (bufferLock) {
376
+ try {
377
+ audioBuffer.write(resampled);
378
+
379
+ while (audioBuffer.size() >= CHUNK_BYTES) {
380
+ byte[] chunk = new byte[CHUNK_BYTES];
381
+ byte[] all = audioBuffer.toByteArray();
382
+ System.arraycopy(all, 0, chunk, 0, CHUNK_BYTES);
383
+
384
+ audioBuffer.reset();
385
+ if (all.length > CHUNK_BYTES) {
386
+ audioBuffer.write(all, CHUNK_BYTES, all.length - CHUNK_BYTES);
387
+ }
388
+
389
+ sendAudioChunk(chunk);
390
+ }
391
+ } catch (IOException e) {
392
+ Log.e(TAG, "buffer_error", e);
393
+ }
394
+ }
395
+ }
396
+
397
+ private byte[] resample(byte[] input, int srcRate, int srcChannels, int dstRate, int dstChannels) {
398
+ if (srcRate == dstRate && srcChannels == dstChannels) {
399
+ return input;
400
+ }
401
+
402
+ int srcSamples = input.length / (2 * srcChannels);
403
+ int dstSamples = (int) ((long) srcSamples * dstRate / srcRate);
404
+
405
+ short[] srcData = new short[srcSamples * srcChannels];
406
+ ByteBuffer.wrap(input).order(ByteOrder.LITTLE_ENDIAN).asShortBuffer().get(srcData);
407
+
408
+ short[] monoSrc = srcData;
409
+ if (srcChannels == 2) {
410
+ monoSrc = new short[srcSamples];
411
+ for (int i = 0; i < srcSamples; i++) {
412
+ monoSrc[i] = (short) ((srcData[i * 2] + srcData[i * 2 + 1]) / 2);
413
+ }
414
+ }
415
+
416
+ short[] dstData = new short[dstSamples];
417
+ for (int i = 0; i < dstSamples; i++) {
418
+ float srcIdx = (float) i * (monoSrc.length - 1) / (dstSamples - 1);
419
+ int idx0 = (int) srcIdx;
420
+ int idx1 = Math.min(idx0 + 1, monoSrc.length - 1);
421
+ float frac = srcIdx - idx0;
422
+ dstData[i] = (short) (monoSrc[idx0] * (1 - frac) + monoSrc[idx1] * frac);
423
+ }
424
+
425
+ byte[] output = new byte[dstSamples * 2];
426
+ ByteBuffer.wrap(output).order(ByteOrder.LITTLE_ENDIAN).asShortBuffer().put(dstData);
427
+ return output;
428
+ }
429
+
430
+ private void sendAudioChunk(byte[] chunk) {
431
+ if (webSocket == null || !connected.get()) {
432
+ return;
433
+ }
434
+
435
+ try {
436
+ JSONObject msg = new JSONObject();
437
+ msg.put("message_type", "input_audio_data");
438
+ JSONObject data = new JSONObject();
439
+ data.put("data", Base64.encodeToString(chunk, Base64.NO_WRAP));
440
+ msg.put("data", data);
441
+ webSocket.send(msg.toString());
442
+ } catch (JSONException e) {
443
+ Log.e(TAG, "send_audio_error", e);
444
+ }
445
+ }
446
+
447
+ private void notifyConnectionState(String state) {
448
+ if (listener != null) {
449
+ listener.onConnectionState(state);
450
+ }
451
+ }
452
+
453
+ private void notifyError(int code, String message) {
454
+ if (listener != null) {
455
+ listener.onError(code, message);
456
+ }
457
+ }
458
+
459
+ private void notifyTranscription(String text, String lang, boolean isFinal) {
460
+ if (listener != null) {
461
+ listener.onTranscription(text, lang, isFinal);
462
+ }
463
+ }
464
+ }