[{"@type":"PropertyValue","name":"Formato","value":"16kHz, 16 bit, WAV, mono"},{"@type":"PropertyValue","name":"Categorias de Conteúdo","value":"Entrevistas, discursos, etc."},{"@type":"PropertyValue","name":"Ambiente de Gravação","value":"Baixo ruído"},{"@type":"PropertyValue","name":"País","value":"Índia"},{"@type":"PropertyValue","name":"Código de Região Linguística","value":"ta-IN"},{"@type":"PropertyValue","name":"Língua","value":"Tâmil"},{"@type":"PropertyValue","name":"Características de Anotação","value":"Anotação de conteúdo textual, marca de tempo de frase, identificação do locutor, género, anotação de ruído"},{"@type":"PropertyValue","name":"Taxa de Precisão","value":"Precisão de palavras: 98%"}]
{"id":1390,"datatype":"1","titleimg":"https://pt.nexdata.ai/shujutang/static/image/index/datatang_yuyin_default.webp","type1":"165","type1str":null,"type2":"166","type2str":null,"dataname":"203 horas de dados de voz em tâmil — linguagem oral","datazy":[{"title":"Formato","desc":"Formato","content":"16kHz, 16 bit, WAV, mono"},{"title":"Categorias de Conteúdo","desc":"Categorias de Conteúdo","content":"Entrevistas, discursos, etc."},{"title":"Ambiente de Gravação","desc":"Ambiente de Gravação","content":"Baixo ruído"},{"title":"País","desc":"País","content":"Índia"},{"title":"Código de Região Linguística","desc":"Código de Região Linguística","content":"ta-IN"},{"title":"Língua","desc":"Língua","content":"Tâmil"},{"title":"Características de Anotação","desc":"Características de Anotação","content":"Anotação de conteúdo textual, marca de tempo de frase, identificação do locutor, género, anotação de ruído"},{"title":"Taxa de Precisão","desc":"Taxa de Precisão","content":"Precisão de palavras: 98%"}],"datatag":"Tamil,India","technologydoc":null,"downurl":null,"datainfo":null,"standard":null,"dataylurl":null,"flag":null,"publishtime":null,"createby":null,"createtime":null,"ext1":null,"samplestoreloc":null,"hosturl":null,"datasize":null,"industryPlan":null,"keyInformation":"","samplePresentation":[{"name":"/data/apps/damp/temp/ziptemp/APY240315002_demo1725271202051/APY240315002_demo/000003-1-8.wav","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY240315002_demo1725271202051/APY240315002_demo/000003-1-8.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=foGBcxzZ6YZUzUGekvu5FfUve0I%3D","intro":"தமிழ்நாட்டு வரலாற்றில், இது தான் முதல் முறை ஒரு அரசாங்கம் கடனை வாங்கி வட்டி 
கட்டுது.","size":0,"progress":100,"type":"mp3"},{"name":"/data/apps/damp/temp/ziptemp/APY240315002_demo1725271202051/APY240315002_demo/000003-1-2.wav","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY240315002_demo1725271202051/APY240315002_demo/000003-1-2.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=fNREn52miYKDMbPUp1tVAOHQEdo%3D","intro":"உறுப்பினர் சொல்ற கருத்து, நல்ல கருத்து. ஏற்கனவே எங்களுக்கு ஒரு idea இருஞ்சு. என்ன சொல்ல மறந்துட்டாரு? இதே கருத்தை நான் ரெண்டாயிரத்தி பதினேழில் கூறினேன்.","size":0,"progress":100,"type":"mp3"},{"name":"/data/apps/damp/temp/ziptemp/APY240315002_demo1725271202051/APY240315002_demo/000003-1-10.wav","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY240315002_demo1725271202051/APY240315002_demo/000003-1-10.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=esuHdkwAgKa0FUymtrzUUKG3axM%3D","intro":"ஒரே ஒரு நிமிஷம் பதினஞ்சாவது நிதிக்குழு இந்த அதிமுகவின்","size":0,"progress":100,"type":"mp3"},{"name":"/data/apps/damp/temp/ziptemp/APY240315002_demo1725271202051/APY240315002_demo/000003-1-1.wav","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY240315002_demo1725271202051/APY240315002_demo/000003-1-1.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=zWCa8C6RzIbZKg764Mx0i%2FEbJps%3D","intro":"வீட்டிக்குள்ள பூட்டி வச்சுருந்திங்கன்னா, இது யாருங்க சொத்து? மக்கள் சொத்து இல்லையா? எதற்காக இது செய்யப்பட்டது? 
சட்டமன்றத்துல சொல்றிங்க மாண்புமிகு","size":0,"progress":100,"type":"mp3"},{"name":"/data/apps/damp/temp/ziptemp/APY240315002_demo1725271202051/APY240315002_demo/000003-1-6.wav","url":"https://bj-oss-datatang-03.oss-cn-beijing.aliyuncs.com/filesInfoUpload/data/apps/damp/temp/ziptemp/APY240315002_demo1725271202051/APY240315002_demo/000003-1-6.wav?Expires=4102329599&OSSAccessKeyId=LTAI8NWs2pDolLNH&Signature=tZnJh1ssOZfbfPebKrl8N6BkS%2FA%3D","intro":"யாருக்கு வெற்றி?","size":0,"progress":100,"type":"mp3"}],"officialSummary":"Dados de voz em tâmil — linguagem espontânea, abrangendo discursos, entrevistas e outros domínios. Reproduz contextos reais de interação. O conjunto de dados contém anotações detalhadas e foi gravado por locutors nativos de várias regiões e culturas, garantindo alta precisão. É útil para o desenvolvimento de modelos robustos de reconhecimento de fala. Conformidade total com GDPR, CCPA e PIPL.","dataexampl":null,"datakeyword":["Tâmil"," Índia"],"isDelete":null,"ids":null,"idsList":null,"datasetCode":null,"productStatus":null,"tagTypeEn":"Data Type,Language","tagTypeZh":null,"website":null,"samplePresentationList":null,"datazyList":null,"keyInformationList":null,"dataexamplList":null,"bgimg":null,"datazyScriptList":null,"datakeywordListString":null,"sourceShowPage":"speechRec","dataShowType":"[{\"code\":\"1\",\"language\":\"ZH\"},{\"code\":\"3\",\"language\":\"EN\"},{\"code\":\"0\",\"language\":\"ZH\"},{\"code\":\"2\",\"language\":\"EN,JP,PT,DE\"},{\"code\":\"4\",\"language\":\"JP\"}]","productNameEn":"203 Hours - Tamil Real-world Casual Conversation and Monologue speech dataset","BGimg":"brightSpot_audio","voiceBg":["/shujutang/static/image/comm/audio_bg.webp","/shujutang/static/image/comm/audio_bg2.webp","/shujutang/static/image/comm/audio_bg3.webp","/shujutang/static/image/comm/audio_bg4.webp","/shujutang/static/image/comm/audio_bg5.webp"]}
203 horas de dados de voz em tâmil — linguagem oral
Tâmil
Índia
Dados de voz em tâmil — linguagem espontânea, abrangendo discursos, entrevistas e outros domínios. Reproduz contextos reais de interação. O conjunto de dados contém anotações detalhadas e foi gravado por locutores nativos de várias regiões e culturas, garantindo alta precisão. É útil para o desenvolvimento de modelos robustos de reconhecimento de fala. Conformidade total com GDPR, CCPA e PIPL.
Este é um conjunto de dados pago, destinado a uso comercial, fins de investigação e outras finalidades. Um conjunto de dados licenciado e pronto a usar ajuda a acelerar projetos de IA.
Características
Formato
16kHz, 16 bit, WAV, mono
Categorias de Conteúdo
Entrevistas, discursos, etc.
Ambiente de Gravação
Baixo ruído
País
Índia
Código de Região Linguística
ta-IN
Língua
Tâmil
Características de Anotação
Anotação de conteúdo textual, marca de tempo de frase, identificação do locutor, género, anotação de ruído
Taxa de Precisão
Precisão de palavras: 98%
Amostra
Audio
தமிழ்நாட்டு வரலாற்றில், இது தான் முதல் முறை ஒரு அரசாங்கம் கடனை வாங்கி வட்டி கட்டுது.
Audio
உறுப்பினர் சொல்ற கருத்து, நல்ல கருத்து. ஏற்கனவே எங்களுக்கு ஒரு idea இருஞ்சு. என்ன சொல்ல மறந்துட்டாரு? இதே கருத்தை நான் ரெண்டாயிரத்தி பதினேழில் கூறினேன்.
Audio
ஒரே ஒரு நிமிஷம் பதினஞ்சாவது நிதிக்குழு இந்த அதிமுகவின்
Audio
வீட்டிக்குள்ள பூட்டி வச்சுருந்திங்கன்னா, இது யாருங்க சொத்து? மக்கள் சொத்து இல்லையா? எதற்காக இது செய்யப்பட்டது? சட்டமன்றத்துல சொல்றிங்க மாண்புமிகு