tencentcloud-sdk-asr 3.0.1161 → 3.0.1184
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- checksums.yaml +4 -4
- data/lib/VERSION +1 -1
- data/lib/v20190614/models.rb +62 -24
- metadata +3 -3
checksums.yaml
CHANGED
|
@@ -1,7 +1,7 @@
|
|
|
1
1
|
---
|
|
2
2
|
SHA1:
|
|
3
|
-
metadata.gz:
|
|
4
|
-
data.tar.gz:
|
|
3
|
+
metadata.gz: 182a61e43aa111f27e93c531075aea02d2fe06d8
|
|
4
|
+
data.tar.gz: 474059e7f927a31724cc8e0f5ae4326f24ddd43d
|
|
5
5
|
SHA512:
|
|
6
|
-
metadata.gz:
|
|
7
|
-
data.tar.gz:
|
|
6
|
+
metadata.gz: 977cb2d4e3566d45340174af95a0e92cc394c069c7cc72f3da5657c61d87bacabfa7f43bf3c1182ff1f3a3d21b677263d0332817c26d288548248f643fa92cb0
|
|
7
|
+
data.tar.gz: 2cac0703665a4af4c1c47ffe38ac0ad3f1075eb8cdbdcaa6fdbafb5d19964b480e68288635be41409a3da3fa8eba83f6669412dd98be27d1d90a991ca4f02ac3
|
data/lib/VERSION
CHANGED
|
@@ -1 +1 @@
|
|
|
1
|
-
3.0.1161
|
|
1
|
+
3.0.1184
|
data/lib/v20190614/models.rb
CHANGED
|
@@ -305,8 +305,8 @@ module TencentCloud
|
|
|
305
305
|
|
|
306
306
|
attr_accessor :ModelName, :TextUrl, :ModelType, :TagInfos
|
|
307
307
|
extend Gem::Deprecate
|
|
308
|
-
deprecate :TagInfos, :none, 2025,
|
|
309
|
-
deprecate :TagInfos=, :none, 2025,
|
|
308
|
+
deprecate :TagInfos, :none, 2025, 12
|
|
309
|
+
deprecate :TagInfos=, :none, 2025, 12
|
|
310
310
|
|
|
311
311
|
def initialize(modelname=nil, texturl=nil, modeltype=nil, taginfos=nil)
|
|
312
312
|
@ModelName = modelname
|
|
@@ -352,13 +352,13 @@ module TencentCloud
|
|
|
352
352
|
# **注意:电话通讯场景,请务必使用以下8k引擎**
|
|
353
353
|
# • 8k_zh:中文电话通讯;
|
|
354
354
|
# • 8k_en:英文电话通讯;
|
|
355
|
-
# • 8k_zh_large
|
|
355
|
+
# • 8k_zh_large:中文电话场景专用大模型引擎【大模型版】。当前模型同时支持中文、上海话、四川话、武汉话、贵阳话、昆明话、西安话、郑州话、太原话、兰州话、银川话、西宁话、南京话、合肥话、南昌话、长沙话、苏州话、杭州话、济南话、天津话、石家庄话、黑龙江话、吉林话、辽宁话、闽南语、客家话、粤语、南宁话方言识别,通过显著提升模型参数规模与语言建模能力,实现对电话音频中复杂场景(如口音干扰、背景噪声)的高精度识别,识别准确率较常规版本大幅提升。[点击这里](https://console.cloud.tencent.com/asr/demonstrate) 对比常规版本与普方大模型效果;
|
|
356
356
|
|
|
357
357
|
# 注意:如您有电话通讯场景识别需求,但发现需求语种仅支持16k,可将8k音频传入下方16k引擎,亦能获取识别结果。但**16k引擎并非基于电话通讯数据训练,无法承诺此种调用方式的识别效果,需由您自行验证识别结果是否可用**
|
|
358
358
|
|
|
359
359
|
# 通用场景引擎:
|
|
360
360
|
# **注意:除电话通讯场景以外的其它识别场景,请务必使用以下16k引擎**
|
|
361
|
-
# • **16k_zh_en**:中英粤+
|
|
361
|
+
# • **16k_zh_en**:中英粤+9种方言大模型引擎【大模型版】。当前模型同时支持中文、英语、粤语、四川、陕西、河南、上海、湖南、湖北、安徽、闽南和潮汕方言识别,模型参数量极大,语言模型性能增强,针对噪声大、回音大、人声小、人声远等低质量音频的识别准确率极大提升;
|
|
362
362
|
# • **16k_zh_large:**普方英大模型引擎【大模型版】。当前模型同时支持中文、英文、[多种中文方言](https://cloud.tencent.com/document/product/1093/35682)等语言的识别,模型参数量极大,语言模型性能增强,针对噪声大、回音大、人声小、人声远等低质量音频的识别准确率极大提升,[点击这里](https://console.cloud.tencent.com/asr/demonstrate) 对比中文普通话常规版本与普方英大模型版本的识别效果;
|
|
363
363
|
# • **16k_multi_lang:**多语种大模型引擎【大模型版】。当前模型同时支持英语、日语、韩语、阿拉伯语、菲律宾语、法语、印地语、印尼语、马来语、葡萄牙语、西班牙语、泰语、土耳其语、越南语、德语的识别,可实现15个语种的自动识别(句子/段落级别);
|
|
364
364
|
# • **16k_zh:**中文普通话通用引擎,支持中文普通话和少量英语,使用丰富的中文普通话语料训练,覆盖场景广泛,适用于除电话通讯外的所有中文普通话识别场景;
|
|
@@ -432,7 +432,8 @@ module TencentCloud
|
|
|
432
432
|
# @type CallbackUrl: String
|
|
433
433
|
# @param SpeakerDiarization: 是否开启说话人分离
|
|
434
434
|
# 0:不开启;
|
|
435
|
-
# 1:开启(仅支持以下引擎:8k_zh/16k_zh/16k_ms/16k_en/16k_id/16k_zh_large/16k_zh_dialect/16k_zh_en,且ChannelNum=1时可用);
|
|
435
|
+
# 1:开启(仅支持以下引擎:8k_zh/8k_zh_large/16k_zh/16k_ms/16k_en/16k_id/16k_zh_large/16k_zh_dialect/16k_zh_en,且ChannelNum=1时可用);
|
|
436
|
+
# 3: 开启角色分离,需配合SpeakerRoles参数使用(增值服务,仅支持16k_zh_en引擎,可支持传入声纹对录音文件内的说话人进行角色认证)
|
|
436
437
|
# 默认值为 0
|
|
437
438
|
|
|
438
439
|
# 注意:
|
|
@@ -537,13 +538,21 @@ module TencentCloud
|
|
|
537
538
|
# 注意:
|
|
538
539
|
# 1. 本功能配置完成后,预计在10分钟后生效
|
|
539
540
|
# @type ReplaceTextId: String
|
|
540
|
-
|
|
541
|
-
|
|
541
|
+
# @param SpeakerRoles: 开启角色分离能力
|
|
542
|
+
# 配合SpeakerDiarization: 3 使用,ASR增值服务,可传入一组声纹信息进行角色认证,仅支持16k_zh_en引擎。
|
|
543
|
+
# 需传入SpeakerRoleInfo数据组,确定说话人的角色信息,涉及RoleAudioUrl和RoleName两个参数。
|
|
544
|
+
# RoleAudioUrl:需要认证角色的声纹音频地址,建议30s内的纯净人声,最长不能超过45s。
|
|
545
|
+
# RoleName:需要认证角色的名称,若匹配成功,会替换话者分离中的SpeakerID。
|
|
546
|
+
# 示例:
|
|
547
|
+
# "{\"EngineModelType\":\"16k_zh_en\",\"ChannelNum\":1,\"ResTextFormat\":1,\"SourceType\":0,\"Url\":\"需要进行ASR识别的音频链接\",\"SpeakerDiarization\":3,\"SpeakerRoles\":[{\"RoleAudioUrl\":\"需要认证角色的声纹音频地址\",\"RoleName\":\"需要认证角色的名称\"}]}"
|
|
548
|
+
# @type SpeakerRoles: Array
|
|
549
|
+
|
|
550
|
+
attr_accessor :EngineModelType, :ChannelNum, :ResTextFormat, :SourceType, :Data, :DataLen, :Url, :CallbackUrl, :SpeakerDiarization, :SpeakerNumber, :HotwordId, :ReinforceHotword, :CustomizationId, :EmotionRecognition, :EmotionalEnergy, :ConvertNumMode, :FilterDirty, :FilterPunc, :FilterModal, :SentenceMaxLength, :Extra, :HotwordList, :KeyWordLibIdList, :ReplaceTextId, :SpeakerRoles
|
|
542
551
|
extend Gem::Deprecate
|
|
543
|
-
deprecate :ReinforceHotword, :none, 2025,
|
|
544
|
-
deprecate :ReinforceHotword=, :none, 2025,
|
|
552
|
+
deprecate :ReinforceHotword, :none, 2025, 12
|
|
553
|
+
deprecate :ReinforceHotword=, :none, 2025, 12
|
|
545
554
|
|
|
546
|
-
def initialize(enginemodeltype=nil, channelnum=nil, restextformat=nil, sourcetype=nil, data=nil, datalen=nil, url=nil, callbackurl=nil, speakerdiarization=nil, speakernumber=nil, hotwordid=nil, reinforcehotword=nil, customizationid=nil, emotionrecognition=nil, emotionalenergy=nil, convertnummode=nil, filterdirty=nil, filterpunc=nil, filtermodal=nil, sentencemaxlength=nil, extra=nil, hotwordlist=nil, keywordlibidlist=nil, replacetextid=nil)
|
|
555
|
+
def initialize(enginemodeltype=nil, channelnum=nil, restextformat=nil, sourcetype=nil, data=nil, datalen=nil, url=nil, callbackurl=nil, speakerdiarization=nil, speakernumber=nil, hotwordid=nil, reinforcehotword=nil, customizationid=nil, emotionrecognition=nil, emotionalenergy=nil, convertnummode=nil, filterdirty=nil, filterpunc=nil, filtermodal=nil, sentencemaxlength=nil, extra=nil, hotwordlist=nil, keywordlibidlist=nil, replacetextid=nil, speakerroles=nil)
|
|
547
556
|
@EngineModelType = enginemodeltype
|
|
548
557
|
@ChannelNum = channelnum
|
|
549
558
|
@ResTextFormat = restextformat
|
|
@@ -568,6 +577,7 @@ module TencentCloud
|
|
|
568
577
|
@HotwordList = hotwordlist
|
|
569
578
|
@KeyWordLibIdList = keywordlibidlist
|
|
570
579
|
@ReplaceTextId = replacetextid
|
|
580
|
+
@SpeakerRoles = speakerroles
|
|
571
581
|
end
|
|
572
582
|
|
|
573
583
|
def deserialize(params)
|
|
@@ -595,6 +605,14 @@ module TencentCloud
|
|
|
595
605
|
@HotwordList = params['HotwordList']
|
|
596
606
|
@KeyWordLibIdList = params['KeyWordLibIdList']
|
|
597
607
|
@ReplaceTextId = params['ReplaceTextId']
|
|
608
|
+
unless params['SpeakerRoles'].nil?
|
|
609
|
+
@SpeakerRoles = []
|
|
610
|
+
params['SpeakerRoles'].each do |i|
|
|
611
|
+
speakerroleinfo_tmp = SpeakerRoleInfo.new
|
|
612
|
+
speakerroleinfo_tmp.deserialize(i)
|
|
613
|
+
@SpeakerRoles << speakerroleinfo_tmp
|
|
614
|
+
end
|
|
615
|
+
end
|
|
598
616
|
end
|
|
599
617
|
end
|
|
600
618
|
|
|
@@ -931,8 +949,8 @@ module TencentCloud
|
|
|
931
949
|
|
|
932
950
|
attr_accessor :TagInfos, :Offset, :Limit
|
|
933
951
|
extend Gem::Deprecate
|
|
934
|
-
deprecate :TagInfos, :none, 2025,
|
|
935
|
-
deprecate :TagInfos=, :none, 2025,
|
|
952
|
+
deprecate :TagInfos, :none, 2025, 12
|
|
953
|
+
deprecate :TagInfos=, :none, 2025, 12
|
|
936
954
|
|
|
937
955
|
def initialize(taginfos=nil, offset=nil, limit=nil)
|
|
938
956
|
@TagInfos = taginfos
|
|
@@ -1056,8 +1074,8 @@ module TencentCloud
|
|
|
1056
1074
|
|
|
1057
1075
|
attr_accessor :TagInfos, :Limit, :Offset
|
|
1058
1076
|
extend Gem::Deprecate
|
|
1059
|
-
deprecate :TagInfos, :none, 2025,
|
|
1060
|
-
deprecate :TagInfos=, :none, 2025,
|
|
1077
|
+
deprecate :TagInfos, :none, 2025, 12
|
|
1078
|
+
deprecate :TagInfos=, :none, 2025, 12
|
|
1061
1079
|
|
|
1062
1080
|
def initialize(taginfos=nil, limit=nil, offset=nil)
|
|
1063
1081
|
@TagInfos = taginfos
|
|
@@ -1357,8 +1375,8 @@ module TencentCloud
|
|
|
1357
1375
|
|
|
1358
1376
|
attr_accessor :ModelName, :DictName, :ModelId, :ModelType, :ServiceType, :ModelState, :AtUpdated, :TagInfos
|
|
1359
1377
|
extend Gem::Deprecate
|
|
1360
|
-
deprecate :TagInfos, :none, 2025,
|
|
1361
|
-
deprecate :TagInfos=, :none, 2025,
|
|
1378
|
+
deprecate :TagInfos, :none, 2025, 12
|
|
1379
|
+
deprecate :TagInfos=, :none, 2025, 12
|
|
1362
1380
|
|
|
1363
1381
|
def initialize(modelname=nil, dictname=nil, modelid=nil, modeltype=nil, servicetype=nil, modelstate=nil, atupdated=nil, taginfos=nil)
|
|
1364
1382
|
@ModelName = modelname
|
|
@@ -1638,14 +1656,14 @@ module TencentCloud
|
|
|
1638
1656
|
|
|
1639
1657
|
attr_accessor :EngSerViceType, :SourceType, :VoiceFormat, :ProjectId, :SubServiceType, :Url, :UsrAudioKey, :Data, :DataLen, :WordInfo, :FilterDirty, :FilterModal, :FilterPunc, :ConvertNumMode, :HotwordId, :CustomizationId, :ReinforceHotword, :HotwordList, :InputSampleRate
|
|
1640
1658
|
extend Gem::Deprecate
|
|
1641
|
-
deprecate :ProjectId, :none, 2025,
|
|
1642
|
-
deprecate :ProjectId=, :none, 2025,
|
|
1643
|
-
deprecate :SubServiceType, :none, 2025,
|
|
1644
|
-
deprecate :SubServiceType=, :none, 2025,
|
|
1645
|
-
deprecate :UsrAudioKey, :none, 2025,
|
|
1646
|
-
deprecate :UsrAudioKey=, :none, 2025,
|
|
1647
|
-
deprecate :ReinforceHotword, :none, 2025,
|
|
1648
|
-
deprecate :ReinforceHotword=, :none, 2025,
|
|
1659
|
+
deprecate :ProjectId, :none, 2025, 12
|
|
1660
|
+
deprecate :ProjectId=, :none, 2025, 12
|
|
1661
|
+
deprecate :SubServiceType, :none, 2025, 12
|
|
1662
|
+
deprecate :SubServiceType=, :none, 2025, 12
|
|
1663
|
+
deprecate :UsrAudioKey, :none, 2025, 12
|
|
1664
|
+
deprecate :UsrAudioKey=, :none, 2025, 12
|
|
1665
|
+
deprecate :ReinforceHotword, :none, 2025, 12
|
|
1666
|
+
deprecate :ReinforceHotword=, :none, 2025, 12
|
|
1649
1667
|
|
|
1650
1668
|
def initialize(engservicetype=nil, sourcetype=nil, voiceformat=nil, projectid=nil, subservicetype=nil, url=nil, usraudiokey=nil, data=nil, datalen=nil, wordinfo=nil, filterdirty=nil, filtermodal=nil, filterpunc=nil, convertnummode=nil, hotwordid=nil, customizationid=nil, reinforcehotword=nil, hotwordlist=nil, inputsamplerate=nil)
|
|
1651
1669
|
@EngSerViceType = engservicetype
|
|
@@ -1824,6 +1842,26 @@ module TencentCloud
|
|
|
1824
1842
|
end
|
|
1825
1843
|
end
|
|
1826
1844
|
|
|
1845
|
+
# 说话人注册角色声纹信息
|
|
1846
|
+
class SpeakerRoleInfo < TencentCloud::Common::AbstractModel
|
|
1847
|
+
# @param RoleAudioUrl: 音频url地址,建议不超过30秒,最大45秒
|
|
1848
|
+
# @type RoleAudioUrl: String
|
|
1849
|
+
# @param RoleName: 不超过30字节
|
|
1850
|
+
# @type RoleName: String
|
|
1851
|
+
|
|
1852
|
+
attr_accessor :RoleAudioUrl, :RoleName
|
|
1853
|
+
|
|
1854
|
+
def initialize(roleaudiourl=nil, rolename=nil)
|
|
1855
|
+
@RoleAudioUrl = roleaudiourl
|
|
1856
|
+
@RoleName = rolename
|
|
1857
|
+
end
|
|
1858
|
+
|
|
1859
|
+
def deserialize(params)
|
|
1860
|
+
@RoleAudioUrl = params['RoleAudioUrl']
|
|
1861
|
+
@RoleName = params['RoleName']
|
|
1862
|
+
end
|
|
1863
|
+
end
|
|
1864
|
+
|
|
1827
1865
|
# [录音文件识别](https://cloud.tencent.com/document/product/1093/37823#3.-.E8.BE.93.E5.87.BA.E5.8F.82.E6.95.B0)、[实时语音异步识别](https://cloud.tencent.com/document/product/1093/52061#3.-.E8.BE.93.E5.87.BA.E5.8F.82.E6.95.B0)请求的返回数据
|
|
1828
1866
|
class Task < TencentCloud::Common::AbstractModel
|
|
1829
1867
|
# @param TaskId: 任务ID,可通过此ID在轮询接口获取识别状态与结果。TaskId数据类型为**uint64**。
|
metadata
CHANGED
|
@@ -1,14 +1,14 @@
|
|
|
1
1
|
--- !ruby/object:Gem::Specification
|
|
2
2
|
name: tencentcloud-sdk-asr
|
|
3
3
|
version: !ruby/object:Gem::Version
|
|
4
|
-
version: 3.0.1161
|
|
4
|
+
version: 3.0.1184
|
|
5
5
|
platform: ruby
|
|
6
6
|
authors:
|
|
7
7
|
- Tencent Cloud
|
|
8
8
|
autorequire:
|
|
9
9
|
bindir: bin
|
|
10
10
|
cert_chain: []
|
|
11
|
-
date: 2025-
|
|
11
|
+
date: 2025-12-18 00:00:00.000000000 Z
|
|
12
12
|
dependencies:
|
|
13
13
|
- !ruby/object:Gem::Dependency
|
|
14
14
|
name: tencentcloud-sdk-common
|
|
@@ -34,8 +34,8 @@ extensions: []
|
|
|
34
34
|
extra_rdoc_files: []
|
|
35
35
|
files:
|
|
36
36
|
- lib/tencentcloud-sdk-asr.rb
|
|
37
|
-
- lib/v20190614/client.rb
|
|
38
37
|
- lib/v20190614/models.rb
|
|
38
|
+
- lib/v20190614/client.rb
|
|
39
39
|
- lib/VERSION
|
|
40
40
|
homepage: https://github.com/TencentCloud/tencentcloud-sdk-ruby
|
|
41
41
|
licenses:
|