tencentcloud-sdk-asr 3.0.1161 → 3.0.1184

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (4)
  1. checksums.yaml +4 -4
  2. data/lib/VERSION +1 -1
  3. data/lib/v20190614/models.rb +62 -24
  4. metadata +3 -3
checksums.yaml CHANGED
@@ -1,7 +1,7 @@
1
1
  ---
2
2
  SHA1:
3
- metadata.gz: 3d44e052c1c113ad1b936064dfe2bc51dbb54652
4
- data.tar.gz: 151be8386b0ba31622eefda3c8f95a762528d579
3
+ metadata.gz: 182a61e43aa111f27e93c531075aea02d2fe06d8
4
+ data.tar.gz: 474059e7f927a31724cc8e0f5ae4326f24ddd43d
5
5
  SHA512:
6
- metadata.gz: 5c6b40c1d1d23303c1f41e9a5daf3f67f23be6b31a6ce3ad645c28c066830678fed4b3ca22f7692df016fd2ed730e71863501c8a29a9dfe76fb009f587029b85
7
- data.tar.gz: 5df0f4a26e00a3fec02410a88dba65f35452afe4ff3b6ca9c7575e4a9718194ba595accfc562d1a7e6d45ad43ae0f9790d964f686360a91995feb4549eb3acaf
6
+ metadata.gz: 977cb2d4e3566d45340174af95a0e92cc394c069c7cc72f3da5657c61d87bacabfa7f43bf3c1182ff1f3a3d21b677263d0332817c26d288548248f643fa92cb0
7
+ data.tar.gz: 2cac0703665a4af4c1c47ffe38ac0ad3f1075eb8cdbdcaa6fdbafb5d19964b480e68288635be41409a3da3fa8eba83f6669412dd98be27d1d90a991ca4f02ac3
data/lib/VERSION CHANGED
@@ -1 +1 @@
1
- 3.0.1161
1
+ 3.0.1184
data/lib/v20190614/models.rb CHANGED
@@ -305,8 +305,8 @@ module TencentCloud
305
305
 
306
306
  attr_accessor :ModelName, :TextUrl, :ModelType, :TagInfos
307
307
  extend Gem::Deprecate
308
- deprecate :TagInfos, :none, 2025, 11
309
- deprecate :TagInfos=, :none, 2025, 11
308
+ deprecate :TagInfos, :none, 2025, 12
309
+ deprecate :TagInfos=, :none, 2025, 12
310
310
 
311
311
  def initialize(modelname=nil, texturl=nil, modeltype=nil, taginfos=nil)
312
312
  @ModelName = modelname
@@ -352,13 +352,13 @@ module TencentCloud
352
352
  # **注意:电话通讯场景,请务必使用以下8k引擎**
353
353
  # • 8k_zh:中文电话通讯;
354
354
  # • 8k_en:英文电话通讯;
355
- # • 8k_zh_large:中文电话场景专用大模型引擎【大模型版】。通过显著提升模型参数规模与语言建模能力,实现对电话音频中复杂场景(如口音干扰、背景噪声)的高精度识别,识别准确率较常规版本大幅提升。[点击这里](https://console.cloud.tencent.com/asr/demonstrate) 对比常规版本与普方大模型效果;
355
+ # • 8k_zh_large:中文电话场景专用大模型引擎【大模型版】。当前模型同时支持中文、上海话、四川话、武汉话、贵阳话、昆明话、西安话、郑州话、太原话、兰州话、银川话、西宁话、南京话、合肥话、南昌话、长沙话、苏州话、杭州话、济南话、天津话、石家庄话、黑龙江话、吉林话、辽宁话、闽南语、客家话、粤语、南宁话方言识别,通过显著提升模型参数规模与语言建模能力,实现对电话音频中复杂场景(如口音干扰、背景噪声)的高精度识别,识别准确率较常规版本大幅提升。[点击这里](https://console.cloud.tencent.com/asr/demonstrate) 对比常规版本与普方大模型效果;
356
356
 
357
357
  # 注意:如您有电话通讯场景识别需求,但发现需求语种仅支持16k,可将8k音频传入下方16k引擎,亦能获取识别结果。但**16k引擎并非基于电话通讯数据训练,无法承诺此种调用方式的识别效果,需由您自行验证识别结果是否可用**
358
358
 
359
359
  # 通用场景引擎:
360
360
  # **注意:除电话通讯场景以外的其它识别场景,请务必使用以下16k引擎**
361
- # • **16k_zh_en**:中英粤+7种方言大模型引擎【大模型版】。当前模型同时支持中文、英语、粤语、四川、陕西、河南、上海、湖南、湖北和安徽方言识别,模型参数量极大,语言模型性能增强,针对噪声大、回音大、人声小、人声远等低质量音频的识别准确率极大提升;
361
+ # • **16k_zh_en**:中英粤+9种方言大模型引擎【大模型版】。当前模型同时支持中文、英语、粤语、四川、陕西、河南、上海、湖南、湖北、安徽、闽南和潮汕方言识别,模型参数量极大,语言模型性能增强,针对噪声大、回音大、人声小、人声远等低质量音频的识别准确率极大提升;
362
362
  # • **16k_zh_large:**普方英大模型引擎【大模型版】。当前模型同时支持中文、英文、[多种中文方言](https://cloud.tencent.com/document/product/1093/35682)等语言的识别,模型参数量极大,语言模型性能增强,针对噪声大、回音大、人声小、人声远等低质量音频的识别准确率极大提升,[点击这里](https://console.cloud.tencent.com/asr/demonstrate) 对比中文普通话常规版本与普方英大模型版本的识别效果;
363
363
  # • **16k_multi_lang:**多语种大模型引擎【大模型版】。当前模型同时支持英语、日语、韩语、阿拉伯语、菲律宾语、法语、印地语、印尼语、马来语、葡萄牙语、西班牙语、泰语、土耳其语、越南语、德语的识别,可实现15个语种的自动识别(句子/段落级别);
364
364
  # • **16k_zh:**中文普通话通用引擎,支持中文普通话和少量英语,使用丰富的中文普通话语料训练,覆盖场景广泛,适用于除电话通讯外的所有中文普通话识别场景;
@@ -432,7 +432,8 @@ module TencentCloud
432
432
  # @type CallbackUrl: String
433
433
  # @param SpeakerDiarization: 是否开启说话人分离
434
434
  # 0:不开启;
435
- # 1:开启(仅支持以下引擎:8k_zh/16k_zh/16k_ms/16k_en/16k_id/16k_zh_large/16k_zh_dialect/16k_zh_en,且ChannelNum=1时可用);
435
+ # 1:开启(仅支持以下引擎:8k_zh/8k_zh_large/16k_zh/16k_ms/16k_en/16k_id/16k_zh_large/16k_zh_dialect/16k_zh_en,且ChannelNum=1时可用);
436
+ # 3: 开启角色分离,需配合SpeakerRoles参数使用(增值服务,仅支持16k_zh_en引擎,可支持传入声纹对录音文件内的说话人进行角色认证)
436
437
  # 默认值为 0
437
438
 
438
439
  # 注意:
@@ -537,13 +538,21 @@ module TencentCloud
537
538
  # 注意:
538
539
  # 1. 本功能配置完成后,预计在10分钟后生效
539
540
  # @type ReplaceTextId: String
540
-
541
- attr_accessor :EngineModelType, :ChannelNum, :ResTextFormat, :SourceType, :Data, :DataLen, :Url, :CallbackUrl, :SpeakerDiarization, :SpeakerNumber, :HotwordId, :ReinforceHotword, :CustomizationId, :EmotionRecognition, :EmotionalEnergy, :ConvertNumMode, :FilterDirty, :FilterPunc, :FilterModal, :SentenceMaxLength, :Extra, :HotwordList, :KeyWordLibIdList, :ReplaceTextId
541
+ # @param SpeakerRoles: 开启角色分离能力
542
+ # 配合SpeakerDiarization: 3 使用,ASR增值服务,可传入一组声纹信息进行角色认证,仅支持16k_zh_en引擎。
543
+ # 需传入SpeakerRoleInfo数据组,确定说话人的角色信息,涉及RoleAudioUrl和RoleName两个参数。
544
+ # RoleAudioUrl:需要认证角色的声纹音频地址,建议30s内的纯净人声,最长不能超过45s。
545
+ # RoleName:需要认证角色的名称,若匹配成功,会替换话者分离中的SpeakerID。
546
+ # 示例:
547
+ # "{\"EngineModelType\":\"16k_zh_en\",\"ChannelNum\":1,\"ResTextFormat\":1,\"SourceType\":0,\"Url\":\"需要进行ASR识别的音频链接\",\"SpeakerDiarization\":3,\"SpeakerRoles\":[{\"RoleAudioUrl\":\"需要认证角色的声纹音频地址\",\"RoleName\":\"需要认证角色的名称\"}]}"
548
+ # @type SpeakerRoles: Array
549
+
550
+ attr_accessor :EngineModelType, :ChannelNum, :ResTextFormat, :SourceType, :Data, :DataLen, :Url, :CallbackUrl, :SpeakerDiarization, :SpeakerNumber, :HotwordId, :ReinforceHotword, :CustomizationId, :EmotionRecognition, :EmotionalEnergy, :ConvertNumMode, :FilterDirty, :FilterPunc, :FilterModal, :SentenceMaxLength, :Extra, :HotwordList, :KeyWordLibIdList, :ReplaceTextId, :SpeakerRoles
542
551
  extend Gem::Deprecate
543
- deprecate :ReinforceHotword, :none, 2025, 11
544
- deprecate :ReinforceHotword=, :none, 2025, 11
552
+ deprecate :ReinforceHotword, :none, 2025, 12
553
+ deprecate :ReinforceHotword=, :none, 2025, 12
545
554
 
546
- def initialize(enginemodeltype=nil, channelnum=nil, restextformat=nil, sourcetype=nil, data=nil, datalen=nil, url=nil, callbackurl=nil, speakerdiarization=nil, speakernumber=nil, hotwordid=nil, reinforcehotword=nil, customizationid=nil, emotionrecognition=nil, emotionalenergy=nil, convertnummode=nil, filterdirty=nil, filterpunc=nil, filtermodal=nil, sentencemaxlength=nil, extra=nil, hotwordlist=nil, keywordlibidlist=nil, replacetextid=nil)
555
+ def initialize(enginemodeltype=nil, channelnum=nil, restextformat=nil, sourcetype=nil, data=nil, datalen=nil, url=nil, callbackurl=nil, speakerdiarization=nil, speakernumber=nil, hotwordid=nil, reinforcehotword=nil, customizationid=nil, emotionrecognition=nil, emotionalenergy=nil, convertnummode=nil, filterdirty=nil, filterpunc=nil, filtermodal=nil, sentencemaxlength=nil, extra=nil, hotwordlist=nil, keywordlibidlist=nil, replacetextid=nil, speakerroles=nil)
547
556
  @EngineModelType = enginemodeltype
548
557
  @ChannelNum = channelnum
549
558
  @ResTextFormat = restextformat
@@ -568,6 +577,7 @@ module TencentCloud
568
577
  @HotwordList = hotwordlist
569
578
  @KeyWordLibIdList = keywordlibidlist
570
579
  @ReplaceTextId = replacetextid
580
+ @SpeakerRoles = speakerroles
571
581
  end
572
582
 
573
583
  def deserialize(params)
@@ -595,6 +605,14 @@ module TencentCloud
595
605
  @HotwordList = params['HotwordList']
596
606
  @KeyWordLibIdList = params['KeyWordLibIdList']
597
607
  @ReplaceTextId = params['ReplaceTextId']
608
+ unless params['SpeakerRoles'].nil?
609
+ @SpeakerRoles = []
610
+ params['SpeakerRoles'].each do |i|
611
+ speakerroleinfo_tmp = SpeakerRoleInfo.new
612
+ speakerroleinfo_tmp.deserialize(i)
613
+ @SpeakerRoles << speakerroleinfo_tmp
614
+ end
615
+ end
598
616
  end
599
617
  end
600
618
 
@@ -931,8 +949,8 @@ module TencentCloud
931
949
 
932
950
  attr_accessor :TagInfos, :Offset, :Limit
933
951
  extend Gem::Deprecate
934
- deprecate :TagInfos, :none, 2025, 11
935
- deprecate :TagInfos=, :none, 2025, 11
952
+ deprecate :TagInfos, :none, 2025, 12
953
+ deprecate :TagInfos=, :none, 2025, 12
936
954
 
937
955
  def initialize(taginfos=nil, offset=nil, limit=nil)
938
956
  @TagInfos = taginfos
@@ -1056,8 +1074,8 @@ module TencentCloud
1056
1074
 
1057
1075
  attr_accessor :TagInfos, :Limit, :Offset
1058
1076
  extend Gem::Deprecate
1059
- deprecate :TagInfos, :none, 2025, 11
1060
- deprecate :TagInfos=, :none, 2025, 11
1077
+ deprecate :TagInfos, :none, 2025, 12
1078
+ deprecate :TagInfos=, :none, 2025, 12
1061
1079
 
1062
1080
  def initialize(taginfos=nil, limit=nil, offset=nil)
1063
1081
  @TagInfos = taginfos
@@ -1357,8 +1375,8 @@ module TencentCloud
1357
1375
 
1358
1376
  attr_accessor :ModelName, :DictName, :ModelId, :ModelType, :ServiceType, :ModelState, :AtUpdated, :TagInfos
1359
1377
  extend Gem::Deprecate
1360
- deprecate :TagInfos, :none, 2025, 11
1361
- deprecate :TagInfos=, :none, 2025, 11
1378
+ deprecate :TagInfos, :none, 2025, 12
1379
+ deprecate :TagInfos=, :none, 2025, 12
1362
1380
 
1363
1381
  def initialize(modelname=nil, dictname=nil, modelid=nil, modeltype=nil, servicetype=nil, modelstate=nil, atupdated=nil, taginfos=nil)
1364
1382
  @ModelName = modelname
@@ -1638,14 +1656,14 @@ module TencentCloud
1638
1656
 
1639
1657
  attr_accessor :EngSerViceType, :SourceType, :VoiceFormat, :ProjectId, :SubServiceType, :Url, :UsrAudioKey, :Data, :DataLen, :WordInfo, :FilterDirty, :FilterModal, :FilterPunc, :ConvertNumMode, :HotwordId, :CustomizationId, :ReinforceHotword, :HotwordList, :InputSampleRate
1640
1658
  extend Gem::Deprecate
1641
- deprecate :ProjectId, :none, 2025, 11
1642
- deprecate :ProjectId=, :none, 2025, 11
1643
- deprecate :SubServiceType, :none, 2025, 11
1644
- deprecate :SubServiceType=, :none, 2025, 11
1645
- deprecate :UsrAudioKey, :none, 2025, 11
1646
- deprecate :UsrAudioKey=, :none, 2025, 11
1647
- deprecate :ReinforceHotword, :none, 2025, 11
1648
- deprecate :ReinforceHotword=, :none, 2025, 11
1659
+ deprecate :ProjectId, :none, 2025, 12
1660
+ deprecate :ProjectId=, :none, 2025, 12
1661
+ deprecate :SubServiceType, :none, 2025, 12
1662
+ deprecate :SubServiceType=, :none, 2025, 12
1663
+ deprecate :UsrAudioKey, :none, 2025, 12
1664
+ deprecate :UsrAudioKey=, :none, 2025, 12
1665
+ deprecate :ReinforceHotword, :none, 2025, 12
1666
+ deprecate :ReinforceHotword=, :none, 2025, 12
1649
1667
 
1650
1668
  def initialize(engservicetype=nil, sourcetype=nil, voiceformat=nil, projectid=nil, subservicetype=nil, url=nil, usraudiokey=nil, data=nil, datalen=nil, wordinfo=nil, filterdirty=nil, filtermodal=nil, filterpunc=nil, convertnummode=nil, hotwordid=nil, customizationid=nil, reinforcehotword=nil, hotwordlist=nil, inputsamplerate=nil)
1651
1669
  @EngSerViceType = engservicetype
@@ -1824,6 +1842,26 @@ module TencentCloud
1824
1842
  end
1825
1843
  end
1826
1844
 
1845
+ # 说话人注册角色声纹信息
1846
+ class SpeakerRoleInfo < TencentCloud::Common::AbstractModel
1847
+ # @param RoleAudioUrl: 音频url地址,建议不超过30秒,最大45秒
1848
+ # @type RoleAudioUrl: String
1849
+ # @param RoleName: 不超过30字节
1850
+ # @type RoleName: String
1851
+
1852
+ attr_accessor :RoleAudioUrl, :RoleName
1853
+
1854
+ def initialize(roleaudiourl=nil, rolename=nil)
1855
+ @RoleAudioUrl = roleaudiourl
1856
+ @RoleName = rolename
1857
+ end
1858
+
1859
+ def deserialize(params)
1860
+ @RoleAudioUrl = params['RoleAudioUrl']
1861
+ @RoleName = params['RoleName']
1862
+ end
1863
+ end
1864
+
1827
1865
  # [录音文件识别](https://cloud.tencent.com/document/product/1093/37823#3.-.E8.BE.93.E5.87.BA.E5.8F.82.E6.95.B0)、[实时语音异步识别](https://cloud.tencent.com/document/product/1093/52061#3.-.E8.BE.93.E5.87.BA.E5.8F.82.E6.95.B0)请求的返回数据
1828
1866
  class Task < TencentCloud::Common::AbstractModel
1829
1867
  # @param TaskId: 任务ID,可通过此ID在轮询接口获取识别状态与结果。TaskId数据类型为**uint64**。
metadata CHANGED
@@ -1,14 +1,14 @@
1
1
  --- !ruby/object:Gem::Specification
2
2
  name: tencentcloud-sdk-asr
3
3
  version: !ruby/object:Gem::Version
4
- version: 3.0.1161
4
+ version: 3.0.1184
5
5
  platform: ruby
6
6
  authors:
7
7
  - Tencent Cloud
8
8
  autorequire:
9
9
  bindir: bin
10
10
  cert_chain: []
11
- date: 2025-11-04 00:00:00.000000000 Z
11
+ date: 2025-12-18 00:00:00.000000000 Z
12
12
  dependencies:
13
13
  - !ruby/object:Gem::Dependency
14
14
  name: tencentcloud-sdk-common
@@ -34,8 +34,8 @@ extensions: []
34
34
  extra_rdoc_files: []
35
35
  files:
36
36
  - lib/tencentcloud-sdk-asr.rb
37
- - lib/v20190614/client.rb
38
37
  - lib/v20190614/models.rb
38
+ - lib/v20190614/client.rb
39
39
  - lib/VERSION
40
40
  homepage: https://github.com/TencentCloud/tencentcloud-sdk-ruby
41
41
  licenses: