{ "locales": { "ab": { "buckets": { "dev": 9329, "test": 9230, "train": 21331, "validated": 42970, "invalidated": 5419, "other": 15860 }, "duration": 332682156, "reportedSentences": 225, "validatedSentences": 1046780, "unvalidatedSentences": 5, "clips": 64249, "splits": { "accent": {}, "age": { "": 0.2, "twenties": 0.17, "thirties": 0.17, "teens": 0.26, "fourties": 0.08, "fifties": 0.06, "sixties": 0.05, "seventies": 0.01, "eighties": 0.01, "nineties": 0 }, "gender": { "": 0.2, "male_masculine": 0.17, "female_feminine": 0.63, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 64249, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 427, "size": 1976516939, "checksum": "ecc75443c63048b97d1244b89b45b483ce31c151e035345928a0c9158fd16397", "avgDurationSecs": 5.178, "validDurationSecs": 222499.218, "totalHrs": 92.41, "validHrs": 61.8 }, "abb": { "buckets": { "dev": 293, "test": 313, "train": 390, "validated": 7887, "invalidated": 35, "other": 0 }, "duration": 40474692, "reportedSentences": 0, "validatedSentences": 996, "unvalidatedSentences": -1, "clips": 7922, "splits": { "accent": {}, "age": { "": 1, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7922, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 22, "size": 238179520, "checksum": "7ef1fe7863a8ee8a5e36c3bcf68ecfbdc3a704bae91ceeda28191dcd51c49e4b", "avgDurationSecs": 5.109, "validDurationSecs": 40295.872, "totalHrs": 11.24, "validHrs": 11.19 }, "ady": { "buckets": { "dev": 2991, "test": 2989, "train": 3664, "validated": 40812, "invalidated": 1524, "other": 3124 }, "duration": 227644956, "reportedSentences": 633, "validatedSentences": 10309, "unvalidatedSentences": 2725, "clips": 45460, "splits": { "accent": {}, "age": { "": 0.09, "twenties": 0.31, "thirties": 0.19, "teens": 0.09, "fourties": 0.12, "fifties": 0.14, "sixties": 0.05, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.31, "male_masculine": 0.02, "female_feminine": 0.66, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 362, "agriculture_food": 25, "automotive_transport": 0, "finance": 0, "service_retail": 57, "general": 95250, "healthcare": 47, "history_law_government": 0, "language_fundamentals": 463, "media_entertainment": 87, "nature_environment": 7, "news_current_affairs": 94, "technology_robotics": 0 } }, "users": 137, "size": 1301563097, "checksum": "31759be8f8da07a3fd2ff2799457ce783fca6a88c6f4530364d63ec79fc16759", "avgDurationSecs": 5.008, "validDurationSecs": 204369.686, "totalHrs": 63.23, "validHrs": 56.76 }, "af": { "buckets": { "dev": 118, "test": 129, "train": 181, "validated": 428, "invalidated": 201, "other": 348 }, "duration": 5938740, "reportedSentences": 73, "validatedSentences": 4802, "unvalidatedSentences": 16565, "clips": 977, "splits": { "accent": {}, "age": { "": 0.32, "twenties": 0.31, "thirties": 0, "teens": 0.01, "fourties": 0.21, "fifties": 0.15, "sixties": 0, "seventies": 0.01, "eighties": 0, "nineties": 0 }, "gender": { "": 0.46, "male_masculine": 0.32, "female_feminine": 0.22, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 977, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 65, "size": 35967911, "checksum": "9c95833ed6d565d4872fa551d1dd0ca4d4fd75aabc3c6e9a7355e4d799c234c4", "avgDurationSecs": 6.079, "validDurationSecs": 2601.618, "totalHrs": 1.64, "validHrs": 0.72 }, "ajg": { "buckets": { "dev": 560, "test": 774, "train": 1873, "validated": 19155, "invalidated": 212, "other": 31 }, "duration": 46342044, "reportedSentences": 0, "validatedSentences": 3213, "unvalidatedSentences": -1, "clips": 19398, "splits": { "accent": {}, "age": { "": 1, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 19398, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 23, "size": 263833585, "checksum": "75c41be24180fa08cdce591497fbeba663931358c56eebaa1c81b58d5a2d79e2", "avgDurationSecs": 2.389, "validDurationSecs": 45761.514, "totalHrs": 12.87, "validHrs": 12.71 }, "am": { "buckets": { "dev": 248, "test": 263, "train": 534, "validated": 1045, "invalidated": 30, "other": 557 }, "duration": 10279728, "reportedSentences": 11, "validatedSentences": 2208, "unvalidatedSentences": 12, "clips": 1632, "splits": { "accent": {}, "age": { "": 0.23, "twenties": 0.14, "thirties": 0.61, "teens": 0, "fourties": 0.01, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.25, "male_masculine": 0.75, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 1632, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 46, "size": 60581563, "checksum": "f5d8274eb80826338f6f1d6d47fd80d4702207fb31276a2afe0dd815e205fc99", "avgDurationSecs": 6.299, "validDurationSecs": 6582.301, "totalHrs": 2.85, "validHrs": 1.82 }, "an": { "buckets": { "dev": 2872, "test": 2920, "train": 4190, "validated": 13277, "invalidated": 758, "other": 5 }, "duration": 64215432, "reportedSentences": 8, "validatedSentences": 10454, "unvalidatedSentences": 357, "clips": 14040, "splits": { "accent": {}, "age": { "": 0.19, "twenties": 0.02, "thirties": 0.2, "teens": 0, "fourties": 0.32, "fifties": 0.11, "sixties": 0.12, "seventies": 0.04, "eighties": 0, "nineties": 0 }, "gender": { "": 0.71, "male_masculine": 0.15, "female_feminine": 0.15, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 456, "agriculture_food": 0, "automotive_transport": 0, "finance": 2, "service_retail": 2, "general": 13638, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 53, "size": 374347878, "checksum": "780f87179dd488f46fcd9af2737cd2aed3e662cb678d686243f4146c78320573", "avgDurationSecs": 4.574, "validDurationSecs": 60725.662, "totalHrs": 17.83, "validHrs": 16.86 }, "ar": { "buckets": { "dev": 10219, "test": 10498, "train": 28870, "validated": 79354, "invalidated": 15249, "other": 41437 }, "duration": 566224506, "reportedSentences": 2137, "validatedSentences": 59434, "unvalidatedSentences": 1742112, "clips": 136040, "splits": { "accent": {}, "age": { "": 0.55, "twenties": 0.3, "thirties": 0.11, "teens": 0.03, "fourties": 0.01, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.55, "male_masculine": 0.28, "female_feminine": 0.17, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 136040, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 1651, "size": 3484836841, "checksum": "5df32f94259c2cfc45854fb7cf7191e317c5a9b662335fb9cfc9e5c3ec8b4f25", "avgDurationSecs": 4.162, "validDurationSecs": 330286.529, "totalHrs": 157.28, "validHrs": 91.74 }, "as": { "buckets": { "dev": 485, "test": 394, "train": 953, "validated": 1832, "invalidated": 282, "other": 2567 }, "duration": 27604649, "reportedSentences": 249, "validatedSentences": 7171, "unvalidatedSentences": 3344, "clips": 4681, "splits": { "accent": {}, "age": { "": 0.28, "twenties": 0.16, "thirties": 0.02, "teens": 0, "fourties": 0.52, "fifties": 0.02, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.82, "male_masculine": 0.18, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 4670, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 11, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 11 } }, "users": 51, "size": 167861194, "checksum": "799c31374c95f64b4400f9c1989466f727a797bd874d96359580012f1271e4f1", "avgDurationSecs": 5.897, "validDurationSecs": 10803.614, "totalHrs": 7.66, "validHrs": 3 }, "ast": { "buckets": { "dev": 114, "test": 230, "train": 445, "validated": 804, "invalidated": 42, "other": 863 }, "duration": 7513344, "reportedSentences": 0, "validatedSentences": 1642, "unvalidatedSentences": 290, "clips": 1709, "splits": { "accent": {}, "age": { "": 0.25, "twenties": 0.1, "thirties": 0.12, "teens": 0.06, "fourties": 0.27, "fifties": 0.2, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.25, "male_masculine": 0.59, "female_feminine": 0.14, "transgender": 0.02, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 1709, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 31, "size": 42880232, "checksum": "85477bbd78bab637a35e0ed18562dcbd729d85f253a22b75ce5a42124954167b", "avgDurationSecs": 4.396, "validDurationSecs": 3534.657, "totalHrs": 2.08, "validHrs": 0.98 }, "az": { "buckets": { "dev": 93, "test": 121, "train": 197, "validated": 411, "invalidated": 53, "other": 545 }, "duration": 5501016, "reportedSentences": 5, "validatedSentences": 93161, "unvalidatedSentences": 1862, "clips": 1009, "splits": { "accent": {}, "age": { "": 0.2, "twenties": 0.17, "thirties": 0.61, "teens": 0.01, "fourties": 0.01, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.82, "male_masculine": 0.17, "female_feminine": 0.01, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 1009, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 45, "size": 38453820, "checksum": "00f1b0d6ef904e62eafbcc8d92e8e764486ba3d2d3d37a6b321b63555ab26a59", "avgDurationSecs": 5.452, "validDurationSecs": 2240.751, "totalHrs": 1.52, "validHrs": 0.62 }, "ba": { "buckets": { "dev": 14525, "test": 14569, "train": 119138, "validated": 210457, "invalidated": 8011, "other": 50 }, "duration": 967387572, "reportedSentences": 868, "validatedSentences": 153968, "unvalidatedSentences": 5, "clips": 218518, "splits": { "accent": {}, "age": { "": 0.3, "twenties": 0.17, "thirties": 0.17, "teens": 0.04, "fourties": 0.06, "fifties": 0.05, "sixties": 0.19, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.3, "male_masculine": 0.3, "female_feminine": 0.39, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 218518, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 930, "size": 5451322660, "checksum": "fab12b73feb3d921f594f5e0fa3b648d6ff79169c0fbeec35dee302a957adedc", "avgDurationSecs": 4.427, "validDurationSecs": 931701.216, "totalHrs": 268.71, "validHrs": 258.8 }, "bag": { "buckets": { "dev": 261, "test": 324, "train": 421, "validated": 7028, "invalidated": 49, "other": 35 }, "duration": 40652964, "reportedSentences": 1, "validatedSentences": 1006, "unvalidatedSentences": 6, "clips": 7112, "splits": { "accent": {}, "age": { "": 0.84, "twenties": 0, "thirties": 0.02, "teens": 0, "fourties": 0.14, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.84, "male_masculine": 0, "female_feminine": 0.02, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0.14 }, "sentence_domain": { "": 7112, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 14, "size": 228620074, "checksum": "a8f8539aeae94dfe59b4842698eeccbf9f8adec175ef11ae0bac25f3ca925683", "avgDurationSecs": 5.716, "validDurationSecs": 40172.811, "totalHrs": 11.29, "validHrs": 11.15 }, "bas": { "buckets": { "dev": 1324, "test": 1550, "train": 2112, "validated": 11138, "invalidated": 1217, "other": 144 }, "duration": 49084848, "reportedSentences": 8, "validatedSentences": 5226, "unvalidatedSentences": 105, "clips": 12499, "splits": { "accent": {}, "age": { "": 0.39, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0.61, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.99, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 12491, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 8, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 57, "size": 254567498, "checksum": "185c03ca819b5b2e8db5ee3dfa63929c364fe5f952e919dc0b71bf4a126e7d68", "avgDurationSecs": 3.927, "validDurationSecs": 43740.062, "totalHrs": 13.63, "validHrs": 12.15 }, "bax": { "buckets": { "dev": 319, "test": 338, "train": 373, "validated": 7777, "invalidated": 80, "other": 829 }, "duration": 44092836, "reportedSentences": 0, "validatedSentences": 1030, "unvalidatedSentences": -1, "clips": 8686, "splits": { "accent": {}, "age": { "": 1, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 8686, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 13, "size": 251893798, "checksum": "009c91f847a92d1dcd6061fc943a2fce3c94a0006bf340fff2ac6dea08e10a74", "avgDurationSecs": 5.076, "validDurationSecs": 39478.469, "totalHrs": 12.24, "validHrs": 10.96 }, "bba": { "buckets": { "dev": 251, "test": 236, "train": 292, "validated": 6273, "invalidated": 2279, "other": 0 }, "duration": 54094284, "reportedSentences": 94, "validatedSentences": 971, "unvalidatedSentences": -1, "clips": 8552, "splits": { "accent": {}, "age": { "": 1, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 8552, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 14, "size": 297924030, "checksum": "b4c88af1da2257fabbeb487809e14f1048ee453d2392348cd3a88fba780d6779", "avgDurationSecs": 6.325, "validDurationSecs": 39678.84, "totalHrs": 15.02, "validHrs": 11.02 }, "bbj": { "buckets": { "dev": 268, "test": 324, "train": 404, "validated": 7242, "invalidated": 17, "other": 265 }, "duration": 46645812, "reportedSentences": 1, "validatedSentences": 996, "unvalidatedSentences": 1, "clips": 7524, "splits": { "accent": {}, "age": { "": 0.85, "twenties": 0.02, "thirties": 0.13, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.86, "male_masculine": 0, "female_feminine": 0.14, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7524, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 31, "size": 272457246, "checksum": "e95e5c54a75a528e49cd6eb79ddcc6dec8823d382d2d22e3421fc6299ca0b2b5", "avgDurationSecs": 6.2, "validDurationSecs": 44897.524, "totalHrs": 12.95, "validHrs": 12.47 }, "bbl": { "buckets": { "dev": 377, "test": 377, "train": 407, "validated": 4580, "invalidated": 130, "other": 112 }, "duration": 42473448, "reportedSentences": 0, "validatedSentences": 1661, "unvalidatedSentences": 462, "clips": 4822, "splits": { "accent": {}, "age": { "": 0.02, "twenties": 0, "thirties": 0.15, "teens": 0, "fourties": 0, "fifties": 0.04, "sixties": 0.55, "seventies": 0.24, "eighties": 0, "nineties": 0 }, "gender": { "": 0.33, "male_masculine": 0, "female_feminine": 0.67, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 248, "agriculture_food": 20, "automotive_transport": 28, "finance": 0, "service_retail": 0, "general": 4539, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 20, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 22, "size": 252071422, "checksum": "630e474f98551ae6be9c32014ccfcd9e2147773dd2f039f08a57f89754cfa76d", "avgDurationSecs": 8.808, "validDurationSecs": 40341.848, "totalHrs": 11.79, "validHrs": 11.2 }, "bce": { "buckets": { "dev": 320, "test": 322, "train": 336, "validated": 6117, "invalidated": 24, "other": 0 }, "duration": 36181656, "reportedSentences": 0, "validatedSentences": 986, "unvalidatedSentences": -1, "clips": 6141, "splits": { "accent": {}, "age": { "": 1, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 6141, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 14, "size": 146567369, "checksum": "c05a81d13e145b5e30d749a6c51bd9e36731b10b99cc8947e989131f94c0e068", "avgDurationSecs": 5.892, "validDurationSecs": 36040.252, "totalHrs": 10.05, "validHrs": 10.01 }, "bci": { "buckets": { "dev": 267, "test": 290, "train": 319, "validated": 5623, "invalidated": 141, "other": 1414 }, "duration": 53374860, "reportedSentences": 1, "validatedSentences": 876, "unvalidatedSentences": -1, "clips": 7178, "splits": { "accent": {}, "age": { "": 0.86, "twenties": 0.14, "thirties": 0.01, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.93, "male_masculine": 0, "female_feminine": 0.07, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7178, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 16, "size": 309014764, "checksum": "77cca7a20507da7a7fb01355f526b7591406cbb354cbcf22193dc16e6e5f8fcd", "avgDurationSecs": 7.436, "validDurationSecs": 41812.042, "totalHrs": 14.82, "validHrs": 11.61 }, "be": { "buckets": { "dev": 15877, "test": 15880, "train": 347680, "validated": 1362284, "invalidated": 36972, "other": 18514 }, "duration": 6795011700, "reportedSentences": 3200, "validatedSentences": 379548, "unvalidatedSentences": 1931, "clips": 1417770, "splits": { "accent": {}, "age": { "": 0.87, "twenties": 0.03, "thirties": 0.04, "teens": 0.01, "fourties": 0.04, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.87, "male_masculine": 0.06, "female_feminine": 0.07, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 1417681, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 4, "general": 33, "healthcare": 0, "history_law_government": 34, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 4, "news_current_affairs": 7, "technology_robotics": 7 } }, "users": 8596, "size": 38690099984, "checksum": "680f17ef2a63ef2934a2cd2c311e2d5002d32465fcccddb3a111141e95ac6d76", "avgDurationSecs": 4.793, "validDurationSecs": 6529081.387, "totalHrs": 1887.5, "validHrs": 1813.63 }, "beb": { "buckets": { "dev": 324, "test": 331, "train": 350, "validated": 6742, "invalidated": 737, "other": 2 }, "duration": 40845996, "reportedSentences": 0, "validatedSentences": 1005, "unvalidatedSentences": -1, "clips": 7481, "splits": { "accent": {}, "age": { "": 1, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7481, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 33, "size": 235854057, "checksum": "4fbd54e932f2c10d69de7d04340e3a9dd79fa3ed518b78a243685acc0ac2e410", "avgDurationSecs": 5.46, "validDurationSecs": 36811.082, "totalHrs": 11.34, "validHrs": 10.22 }, "bfd": { "buckets": { "dev": 252, "test": 254, "train": 260, "validated": 6454, "invalidated": 53, "other": 673 }, "duration": 40598964, "reportedSentences": 0, "validatedSentences": 766, "unvalidatedSentences": -1, "clips": 7180, "splits": { "accent": {}, "age": { "": 0.99, "twenties": 0, "thirties": 0.01, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.99, "male_masculine": 0, "female_feminine": 0.01, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7180, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 36, "size": 232041727, "checksum": "91ec8fb3b6aa03a9eefe8adffc781d1dd8e2afa97c87d76968392955b9d6ae89", "avgDurationSecs": 5.654, "validDurationSecs": 36493.832, "totalHrs": 11.27, "validHrs": 10.13 }, "bft": { "buckets": { "dev": 1833, "test": 1805, "train": 2211, "validated": 10059, "invalidated": 489, "other": 10 }, "duration": 65071008, "reportedSentences": 37, "validatedSentences": 7968, "unvalidatedSentences": 12, "clips": 10558, "splits": { "accent": {}, "age": { "": 0.27, "twenties": 0.37, "thirties": 0.35, "teens": 0.01, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.78, "male_masculine": 0, "female_feminine": 0.13, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0.1 }, "sentence_domain": { "": 10558, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 154, "size": 377793372, "checksum": "84f039c5154daaa1087d779cc28ca89181526c65080cc95a741dc8f17775453f", "avgDurationSecs": 6.163, "validDurationSecs": 61995.574, "totalHrs": 18.07, "validHrs": 17.22 }, "bg": { "buckets": { "dev": 2949, "test": 3380, "train": 4967, "validated": 11313, "invalidated": 777, "other": 1772 }, "duration": 75850704, "reportedSentences": 191, "validatedSentences": 39572, "unvalidatedSentences": 3, "clips": 13862, "splits": { "accent": {}, "age": { "": 0.37, "twenties": 0.11, "thirties": 0.28, "teens": 0, "fourties": 0.23, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.37, "male_masculine": 0.58, "female_feminine": 0.04, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 13862, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 148, "size": 446977666, "checksum": "6189a89f3fb0b00fc4e915ce6038f84e4cf4ff20879ded0eb32bac2f83e4f302", "avgDurationSecs": 5.472, "validDurationSecs": 61902.973, "totalHrs": 21.06, "validHrs": 17.19 }, "bgp": { "buckets": { "dev": 1105, "test": 2139, "train": 3538, "validated": 7606, "invalidated": 268, "other": 29 }, "duration": 48108024, "reportedSentences": 0, "validatedSentences": 6997, "unvalidatedSentences": -1, "clips": 7903, "splits": { "accent": {}, "age": { "": 0.95, "twenties": 0.05, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.99, "male_masculine": 0, "female_feminine": 0.01, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7903, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 25, "size": 284064238, "checksum": "149863ab8d1b264cbd81116c92708f7dc630f5c65ba4a12319838c4e12858c1b", "avgDurationSecs": 6.087, "validDurationSecs": 46300.092, "totalHrs": 13.36, "validHrs": 12.86 }, "bkh": { "buckets": { "dev": 305, "test": 304, "train": 377, "validated": 5614, "invalidated": 1949, "other": 0 }, "duration": 52500744, "reportedSentences": 2, "validatedSentences": 986, "unvalidatedSentences": 1, "clips": 7563, "splits": { "accent": {}, "age": { "": 1, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7563, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 13, "size": 288996956, "checksum": "a39171ec6092f4b8a502f8a3b5316342d0293192ef64594a838f4b3a7d487072", "avgDurationSecs": 6.942, "validDurationSecs": 38971.199, "totalHrs": 14.58, "validHrs": 10.82 }, "bkm": { "buckets": { "dev": 304, "test": 310, "train": 326, "validated": 7573, "invalidated": 260, "other": 0 }, "duration": 45229536, "reportedSentences": 0, "validatedSentences": 940, "unvalidatedSentences": -1, "clips": 7833, "splits": { "accent": {}, "age": { "": 1, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7833, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 27, "size": 266191823, "checksum": "6bb316a0f85ab143d44817041c8fa6e25ad5e5ff53d745911f4e08cc4b16d889", "avgDurationSecs": 5.774, "validDurationSecs": 43728.236, "totalHrs": 12.56, "validHrs": 12.14 }, "bn": { "buckets": { "dev": 9394, "test": 9394, "train": 21575, "validated": 44655, "invalidated": 7928, "other": 999507 }, "duration": 4598510976, "reportedSentences": 1890, "validatedSentences": 562827, "unvalidatedSentences": 94116, "clips": 1052090, "splits": { "accent": {}, "age": { "": 0.22, "twenties": 0.67, "thirties": 0.03, "teens": 0.07, "fourties": 0.01, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.23, "male_masculine": 0.54, "female_feminine": 0.23, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 1052090, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 23002, "size": 26574204428, "checksum": "3e0f6c6c6484df5f7b2c03af079962671d2d3debb0fcab38351db1d644b01b4e", "avgDurationSecs": 4.371, "validDurationSecs": 195179.602, "totalHrs": 1277.36, "validHrs": 54.21 }, "bnm": { "buckets": { "dev": 282, "test": 331, "train": 412, "validated": 7675, "invalidated": 83, "other": 216 }, "duration": 60507684, "reportedSentences": 2, "validatedSentences": 1025, "unvalidatedSentences": -1, "clips": 7974, "splits": { "accent": {}, "age": { "": 0.65, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0.06, "fifties": 0.12, "sixties": 0.05, "seventies": 0.12, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7974, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 21, "size": 357621762, "checksum": "1877f0433254855359cafe4dcc6ea8f7919d5d98de023929a4cc501b3e3257c4", "avgDurationSecs": 7.588, "validDurationSecs": 58238.836, "totalHrs": 16.8, "validHrs": 16.17 }, "bnn": { "buckets": { "dev": 958, "test": 960, "train": 1040, "validated": 7274, "invalidated": 946, "other": 10 }, "duration": 41889204, "reportedSentences": 3, "validatedSentences": 3167, "unvalidatedSentences": 8, "clips": 8230, "splits": { "accent": {}, "age": { "": 0.6, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0.06, "sixties": 0.34, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.18, "male_masculine": 0.06, "female_feminine": 0.41, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0.35 }, "sentence_domain": { "": 273, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 10108, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 19, "size": 246952751, "checksum": "cb970d52a5f68caad735b54666dc96b8b063526072d6a6c80b96f0cf3002a813", "avgDurationSecs": 5.09, "validDurationSecs": 37023.338, "totalHrs": 11.63, "validHrs": 10.28 }, "br": { "buckets": { "dev": 3397, "test": 3399, "train": 4396, "validated": 33695, "invalidated": 2406, "other": 0 }, "duration": 117428587, "reportedSentences": 304, "validatedSentences": 22656, "unvalidatedSentences": 370, "clips": 36101, "splits": { "accent": {}, "age": { "": 0.26, "twenties": 0.29, "thirties": 0.13, "teens": 0.01, "fourties": 0.06, "fifties": 0.08, "sixties": 0.12, "seventies": 0.06, "eighties": 0, "nineties": 0 }, "gender": { "": 0.35, "male_masculine": 0.59, "female_feminine": 0.06, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 31773, "agriculture_food": 3, "automotive_transport": 2, "finance": 1, "service_retail": 4, "general": 4276, "healthcare": 13, "history_law_government": 11, "language_fundamentals": 0, "media_entertainment": 13, "nature_environment": 8, "news_current_affairs": 0, "technology_robotics": 4 } }, "users": 272, "size": 796308893, "checksum": "4d824b0baf8291a9afbd9daab2ce651d5fb48974b4f33181fe8c0bdf7b57eea7", "avgDurationSecs": 3.253, "validDurationSecs": 109602.4, "totalHrs": 32.61, "validHrs": 30.44 }, "brh": { "buckets": { "dev": 504, "test": 882, "train": 1705, "validated": 5084, "invalidated": 12, "other": 12 }, "duration": 37155096, "reportedSentences": 0, "validatedSentences": 3095, "unvalidatedSentences": -1, "clips": 5108, "splits": { "accent": {}, "age": { "": 0.81, "twenties": 0, "thirties": 0.19, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 5108, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 18, "size": 215870657, "checksum": "a7404392ac28d37861d0d5cf7d444bb1591332c1601d11c6b55d0df8c242e39a", "avgDurationSecs": 7.274, "validDurationSecs": 36980.522, "totalHrs": 10.32, "validHrs": 10.27 }, "bri": { "buckets": { "dev": 203, "test": 298, "train": 699, "validated": 8838, "invalidated": 234, "other": 122 }, "duration": 39939480, "reportedSentences": 12, "validatedSentences": 1200, "unvalidatedSentences": -1, "clips": 9194, "splits": { "accent": {}, "age": { "": 0.86, "twenties": 0.01, "thirties": 0.13, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.87, "male_masculine": 0, "female_feminine": 0.13, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 9194, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 15, "size": 197673444, "checksum": "385b9cae7f3fa2d70cfc54c00d191f28c435392d8309c33a666695146798903c", "avgDurationSecs": 4.344, "validDurationSecs": 38392.987, "totalHrs": 11.09, "validHrs": 10.66 }, "bsh": { "buckets": { "dev": 515, "test": 693, "train": 1420, "validated": 6765, "invalidated": 60, "other": 37 }, "duration": 37426032, "reportedSentences": 2, "validatedSentences": 2646, "unvalidatedSentences": 40, "clips": 6862, "splits": { "accent": {}, "age": { "": 0.15, "twenties": 0.57, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0.28, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 6862, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 14, "size": 220715976, "checksum": "4111396cbb8b05515503fe3846ab5732d1209a8325d951e58e2212fedc8e0839", "avgDurationSecs": 5.454, "validDurationSecs": 36896.984, "totalHrs": 10.39, "validHrs": 10.24 }, "bsk": { "buckets": { "dev": 348, "test": 733, "train": 1187, "validated": 8615, "invalidated": 686, "other": 1 }, "duration": 39648312, "reportedSentences": 2, "validatedSentences": 2447, "unvalidatedSentences": 22, "clips": 9302, "splits": { "accent": {}, "age": { "": 0.3, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0.46, "fifties": 0.24, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 9248, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 54, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 27, "size": 229263635, "checksum": "468289bf74d387ddf1f708a23ef08b5f6d25a56bdabd7cf637e02d547df9301a", "avgDurationSecs": 4.262, "validDurationSecs": 36720.083, "totalHrs": 11.01, "validHrs": 10.2 }, "btv": { "buckets": { "dev": 226, "test": 329, "train": 452, "validated": 9109, "invalidated": 127, "other": 47 }, "duration": 37660860, "reportedSentences": 263, "validatedSentences": 1053, "unvalidatedSentences": 9, "clips": 9283, "splits": { "accent": {}, "age": { "": 0.47, "twenties": 0.32, "thirties": 0, "teens": 0, "fourties": 0.21, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.89, "male_masculine": 0.11, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 9274, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 8, "healthcare": 1, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 16, "size": 215819786, "checksum": "8e3da90b7112ef6be21aadd8ef9b34b5339e0d96dda50179864bdbdaebade716", "avgDurationSecs": 4.057, "validDurationSecs": 36954.947, "totalHrs": 10.46, "validHrs": 10.26 }, "bum": { "buckets": { "dev": 269, "test": 285, "train": 347, "validated": 7751, "invalidated": 177, "other": 29 }, "duration": 37052424, "reportedSentences": 0, "validatedSentences": 901, "unvalidatedSentences": -1, "clips": 7957, "splits": { "accent": {}, "age": { "": 1, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7957, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 22, "size": 210559404, "checksum": "ea1e4b8532b0b153d715335f212bafabc80166cc4c4a92f0d7d2fc75380605f9", "avgDurationSecs": 4.657, "validDurationSecs": 36093.168, "totalHrs": 10.29, "validHrs": 10.02 }, "byv": { "buckets": { "dev": 327, "test": 327, "train": 336, "validated": 7719, "invalidated": 0, "other": 0 }, "duration": 47684376, "reportedSentences": 0, "validatedSentences": 990, "unvalidatedSentences": 1027, "clips": 7719, "splits": { "accent": {}, "age": { "": 0.81, "twenties": 0.06, "thirties": 0.12, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.94, "male_masculine": 0, "female_feminine": 0.06, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7719, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 96, "size": 276978955, "checksum": "669c0a2460b4badcf56f48d8b9008f342ba6f5967d0574b09b830c6e6ba705bb", "avgDurationSecs": 6.178, "validDurationSecs": 47684.376, "totalHrs": 13.24, "validHrs": 13.24 }, "ca": { "buckets": { "dev": 16416, "test": 16416, "train": 1215000, "validated": 2297291, "invalidated": 141235, "other": 238250 }, "duration": 13920572682, "reportedSentences": 9581, "validatedSentences": 1304058, "unvalidatedSentences": 3656, "clips": 2676776, "splits": { "accent": {}, "age": { "": 0.27, "twenties": 0.04, "thirties": 0.05, "teens": 0.01, "fourties": 0.12, "fifties": 0.19, "sixties": 0.29, "seventies": 0.04, "eighties": 0, "nineties": 0 }, "gender": { "": 0.27, "male_masculine": 0.52, "female_feminine": 0.21, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0, "intersex": 0 }, "sentence_domain": { "": 2675630, "agriculture_food": 59, "automotive_transport": 31, "finance": 4, "service_retail": 63, "general": 657, "healthcare": 36, "history_law_government": 65, "language_fundamentals": 34, "media_entertainment": 37, "nature_environment": 135, "news_current_affairs": 36, "technology_robotics": 27 } }, "users": 36868, "size": 83674470758, "checksum": "74b7ee289aaf2a199661b45a7b99447e7cc0dc527c1276e5448cd20b6dacc100", "avgDurationSecs": 5.2, "validDurationSecs": 11947061.068, "totalHrs": 3866.82, "validHrs": 3318.62 }, "cjk": { "buckets": { "dev": 377, "test": 377, "train": 387, "validated": 7333, "invalidated": 1195, "other": 0 }, "duration": 50697864, "reportedSentences": 0, "validatedSentences": 1141, "unvalidatedSentences": 1, "clips": 8528, "splits": { "accent": {}, "age": { "": 0.11, "twenties": 0.12, "thirties": 0.26, "teens": 0, "fourties": 0.49, "fifties": 0.02, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.62, "male_masculine": 0.03, "female_feminine": 0.35, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 8528, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 45, "size": 279634470, "checksum": "0da6fc97db29d26c393769cd2299305ede7e6a9e9ca5e827f95f04731665e69f", "avgDurationSecs": 5.945, "validDurationSecs": 43593.743, "totalHrs": 14.08, "validHrs": 12.1 }, "ckb": { "buckets": { "dev": 5348, "test": 5348, "train": 7883, "validated": 119869, "invalidated": 9278, "other": 39520 }, "duration": 690661692, "reportedSentences": 2531, "validatedSentences": 19230, "unvalidatedSentences": 15255, "clips": 168667, "splits": { "accent": {}, "age": { "": 0.32, "twenties": 0.43, "thirties": 0.1, "teens": 0.02, "fourties": 0.02, "fifties": 0.01, "sixties": 0.1, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.32, "male_masculine": 0.63, "female_feminine": 0.05, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 168421, "agriculture_food": 0, "automotive_transport": 10, "finance": 0, "service_retail": 0, "general": 121, "healthcare": 0, "history_law_government": 10, "language_fundamentals": 10, "media_entertainment": 95, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 1976, "size": 3817557893, "checksum": "19fc00e7df6b164a6f77c7eca7c22530b52f032b9d00a12e99ee46ccb403553e", "avgDurationSecs": 4.095, "validDurationSecs": 490842.467, "totalHrs": 191.85, "validHrs": 136.34 }, "cnh": { "buckets": { "dev": 763, "test": 765, "train": 818, "validated": 2463, "invalidated": 437, "other": 3287 }, "duration": 21751656, "reportedSentences": 9, "validatedSentences": 5218, "unvalidatedSentences": -1, "clips": 6187, "splits": { "accent": {}, "age": { "": 0.48, "twenties": 0.4, "thirties": 0.07, "teens": 0.01, "fourties": 0.01, "fifties": 0.02, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.48, "male_masculine": 0.3, "female_feminine": 0.21, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 6187, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 300, "size": 168181204, "checksum": "cb04539ec3670594b854f4010f0dbb8ce0464ed8bf0bcbbc726f22fd58bd91fc", "avgDurationSecs": 3.516, "validDurationSecs": 8659.177, "totalHrs": 6.04, "validHrs": 2.4 }, "cpy": { "buckets": { "dev": 188, "test": 294, "train": 518, "validated": 8162, "invalidated": 26, "other": 84 }, "duration": 36567612, "reportedSentences": 0, "validatedSentences": 1000, "unvalidatedSentences": 15, "clips": 8272, "splits": { "accent": {}, "age": { "": 0.01, "twenties": 0.12, "thirties": 0.12, "teens": 0.24, "fourties": 0.39, "fifties": 0, "sixties": 0.12, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.77, "male_masculine": 0, "female_feminine": 0.23, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 8272, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 15, "size": 210662597, "checksum": "912429d002017db6e89bef944953a49cd8468c538e1d71f5071a401933549cf9", "avgDurationSecs": 4.421, "validDurationSecs": 36081.341, "totalHrs": 10.15, "validHrs": 10.02 }, "cs": { "buckets": { "dev": 9458, "test": 9437, "train": 21951, "validated": 65000, "invalidated": 2610, "other": 149239 }, "duration": 967201527, "reportedSentences": 973, "validatedSentences": 451217, "unvalidatedSentences": 141, "clips": 216849, "splits": { "accent": {}, "age": { "": 0.24, "twenties": 0.19, "thirties": 0.47, "teens": 0.02, "fourties": 0.07, "fifties": 0.01, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.25, "male_masculine": 0.53, "female_feminine": 0.22, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 216826, "agriculture_food": 0, "automotive_transport": 1, "finance": 0, "service_retail": 0, "general": 15, "healthcare": 0, "history_law_government": 1, "language_fundamentals": 0, "media_entertainment": 4, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 8 } }, "users": 1129, "size": 5950686352, "checksum": "3ef013a0c17afa5e873694e292c928dfe20a26f83b6eae5ed89a2710c58f6181", "avgDurationSecs": 4.46, "validDurationSecs": 289916.482, "totalHrs": 268.66, "validHrs": 80.53 }, "cut": { "buckets": { "dev": 290, "test": 325, "train": 378, "validated": 5481, "invalidated": 5, "other": 130 }, "duration": 37239084, "reportedSentences": 0, "validatedSentences": 994, "unvalidatedSentences": 1, "clips": 5616, "splits": { "accent": {}, "age": { "": 0.25, "twenties": 0, "thirties": 0.42, "teens": 0, "fourties": 0.17, "fifties": 0.16, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.32, "male_masculine": 0, "female_feminine": 0.68, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 5616, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 15, "size": 219697025, "checksum": "95481d4df662f9640074f60ebab50808f0c651abaf574b3ca694a647735ce0f0", "avgDurationSecs": 6.631, "validDurationSecs": 36343.914, "totalHrs": 10.34, "validHrs": 10.09 }, "cux": { "buckets": { "dev": 647, "test": 494, "train": 1107, "validated": 9016, "invalidated": 325, "other": 9 }, "duration": 38339748, "reportedSentences": 1, "validatedSentences": 2251, "unvalidatedSentences": 18, "clips": 9350, "splits": { "accent": {}, "age": { "": 0, "twenties": 0.36, "thirties": 0.23, "teens": 0.41, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.35, "male_masculine": 0, "female_feminine": 0.65, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 9350, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 11, "size": 174502178, "checksum": "8a0023face6efa3ba1ed8b536d8a107b6586ccae6e1561a71f18c16ce6acfc9a", "avgDurationSecs": 4.101, "validDurationSecs": 36970.178, "totalHrs": 10.64, "validHrs": 10.26 }, "cv": { "buckets": { "dev": 1242, "test": 1288, "train": 1456, "validated": 17497, "invalidated": 2215, "other": 744 }, "duration": 103130544, "reportedSentences": 144, "validatedSentences": 4382, "unvalidatedSentences": 4, "clips": 20456, "splits": { "accent": {}, "age": { "": 0.24, "twenties": 0.5, "thirties": 0.01, "teens": 0.18, "fourties": 0.06, "fifties": 0.01, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.22, "male_masculine": 0.51, "female_feminine": 0.27, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 20455, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 1 } }, "users": 122, "size": 697770986, "checksum": "4ffa14e3b8d428118c32e8a26c5b940d246eaececc85eecb572b5ca8dc5b7819", "avgDurationSecs": 5.042, "validDurationSecs": 88212.511, "totalHrs": 28.64, "validHrs": 24.5 }, "cy": { "buckets": { "dev": 5414, "test": 5414, "train": 8026, "validated": 90859, "invalidated": 4471, "other": 20672 }, "duration": 570264093, "reportedSentences": 176, "validatedSentences": 118044, "unvalidatedSentences": 15, "clips": 116002, "splits": { "accent": {}, "age": { "": 0.43, "twenties": 0.13, "thirties": 0.09, "teens": 0.02, "fourties": 0.16, "fifties": 0.09, "sixties": 0.07, "seventies": 0.01, "eighties": 0, "nineties": 0 }, "gender": { "": 0.43, "male_masculine": 0.33, "female_feminine": 0.25, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 116001, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 1, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 1931, "size": 4158425297, "checksum": "c73af06c90775d7b9108c569ce6f41a4111a76897e6962e83ca64a1e99f82c8a", "avgDurationSecs": 4.916, "validDurationSecs": 446661.482, "totalHrs": 158.4, "validHrs": 124.07 }, "da": { "buckets": { "dev": 2629, "test": 2758, "train": 3602, "validated": 11341, "invalidated": 441, "other": 2308 }, "duration": 57211740, "reportedSentences": 685, "validatedSentences": 20807, "unvalidatedSentences": 274, "clips": 14090, "splits": { "accent": {}, "age": { "": 0.4, "twenties": 0.16, "thirties": 0.22, "teens": 0.01, "fourties": 0.16, "fifties": 0.04, "sixties": 0.01, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.46, "male_masculine": 0.48, "female_feminine": 0.06, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 14063, "agriculture_food": 1, "automotive_transport": 3, "finance": 0, "service_retail": 1, "general": 16, "healthcare": 1, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 9, "nature_environment": 2, "news_current_affairs": 0, "technology_robotics": 1 } }, "users": 296, "size": 331777774, "checksum": "3d60b07b341b736ae70ed8fc0c685663ae7304bd2840ade7d705f6bdada74d9b", "avgDurationSecs": 4.06, "validDurationSecs": 46049.563, "totalHrs": 15.89, "validHrs": 12.79 }, "dag": { "buckets": { "dev": 396, "test": 415, "train": 446, "validated": 8114, "invalidated": 114, "other": 13046 }, "duration": 91434492, "reportedSentences": 0, "validatedSentences": 5220, "unvalidatedSentences": 15347, "clips": 21274, "splits": { "accent": {}, "age": { "": 0.36, "twenties": 0.39, "thirties": 0.24, "teens": 0, "fourties": 0.01, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.78, "male_masculine": 0.02, "female_feminine": 0.18, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0.02 }, "sentence_domain": { "": 21261, "agriculture_food": 3, "automotive_transport": 3, "finance": 6, "service_retail": 0, "general": 7, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 57, "size": 508358002, "checksum": "6cd20551fbfb1352fea5f535c502f8d85c37ad70adeef52c7981cd8816c30a95", "avgDurationSecs": 4.298, "validDurationSecs": 34873.53, "totalHrs": 25.39, "validHrs": 9.68 }, "dar": { "buckets": { "dev": 611, "test": 689, "train": 859, "validated": 3113, "invalidated": 31, "other": 2013 }, "duration": 27594144, "reportedSentences": 4, "validatedSentences": 2819, "unvalidatedSentences": 472, "clips": 5157, "splits": { "accent": {}, "age": { "": 0.18, "twenties": 0.36, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0.45, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.7, "male_masculine": 0, "female_feminine": 0.3, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 2, "agriculture_food": 18, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 3214, "healthcare": 59, "history_law_government": 121, "language_fundamentals": 166, "media_entertainment": 1125, "nature_environment": 0, "news_current_affairs": 456, "technology_robotics": 0 } }, "users": 13, "size": 160770318, "checksum": "4b6fadcda297c53d5ff319d2ee29f02698e9959cc46eb96128fd973bfe378b6f", "avgDurationSecs": 5.351, "validDurationSecs": 16657.082, "totalHrs": 7.66, "validHrs": 4.62 }, "dav": { "buckets": { "dev": 1276, "test": 1004, "train": 2098, "validated": 8264, "invalidated": 663, "other": 40703 }, "duration": 201431016, "reportedSentences": 11, "validatedSentences": 11773, "unvalidatedSentences": 20119, "clips": 49630, "splits": { "accent": {}, "age": { "": 0.04, "twenties": 0.61, "thirties": 0.1, "teens": 0, "fourties": 0.01, "fifties": 0.01, "sixties": 0.23, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.73, "male_masculine": 0, "female_feminine": 0.27, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 971, "agriculture_food": 499, "automotive_transport": 100, "finance": 304, "service_retail": 1218, "general": 45323, "healthcare": 967, "history_law_government": 334, "language_fundamentals": 150, "media_entertainment": 68, "nature_environment": 873, "news_current_affairs": 86, "technology_robotics": 75 } }, "users": 24, "size": 1084119611, "checksum": "88631830c7aa16e1e62508169dc6434f58d957828bac8a12b93f375eab805328", "avgDurationSecs": 4.059, "validDurationSecs": 33540.72, "totalHrs": 55.95, "validHrs": 9.31 }, "de": { "buckets": { "dev": 16203, "test": 16203, "train": 616461, "validated": 944924, "invalidated": 57712, "other": 11538 }, "duration": 5339754341, "reportedSentences": 11379, "validatedSentences": 2057983, "unvalidatedSentences": 1537, "clips": 1014174, "splits": { "accent": {}, "age": { "": 0.33, "twenties": 0.17, "thirties": 0.16, "teens": 0.03, "fourties": 0.17, "fifties": 0.11, "sixties": 0.02, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.34, "male_masculine": 0.58, "female_feminine": 0.08, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 1013973, "agriculture_food": 0, "automotive_transport": 6, "finance": 0, "service_retail": 12, "general": 142, "healthcare": 16, "history_law_government": 14, "language_fundamentals": 3, "media_entertainment": 1, "nature_environment": 12, "news_current_affairs": 4, "technology_robotics": 9 } }, "users": 20413, "size": 37071377685, "checksum": "7b0b97f32ed8404b02c75251a99e3ea19317888fd3a51567275b971cb36c1f21", "avgDurationSecs": 5.265, "validDurationSecs": 4975144.335, "totalHrs": 1483.26, "validHrs": 1381.98 }, "dmk": { "buckets": { "dev": 0, "test": 938, "train": 3200, "validated": 10648, "invalidated": 123, "other": 21 }, "duration": 38273472, "reportedSentences": 732, "validatedSentences": 4139, "unvalidatedSentences": 194, "clips": 10792, "splits": { "accent": {}, "age": { "": 0.04, "twenties": 0.01, "thirties": 0.15, "teens": 0, "fourties": 0.81, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.95, "male_masculine": 0, "female_feminine": 0.05, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 10790, "agriculture_food": 2, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 2, "healthcare": 2, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 10, "size": 223080239, "checksum": "12bd601e002918086e4f6381da0c00820170a3fb111674c55fd3ae91257b35aa", "avgDurationSecs": 3.546, "validDurationSecs": 37762.781, "totalHrs": 10.63, "validHrs": 10.48 }, "dml": { "buckets": { "dev": 1101, "test": 626, "train": 3190, "validated": 6115, "invalidated": 73, "other": 299 }, "duration": 39238596, "reportedSentences": 0, "validatedSentences": 5670, "unvalidatedSentences": 676, "clips": 6487, "splits": { "accent": {}, "age": { "": 0.08, "twenties": 0.09, "thirties": 0, "teens": 0, "fourties": 0.79, "fifties": 0.03, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 6473, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 7, "healthcare": 0, "history_law_government": 3, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 4, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 5, "size": 232053163, "checksum": "217262aaf8bc8133edd0088e2813d7b91e1a3b1970351356d877f76859b4d900", "avgDurationSecs": 6.049, "validDurationSecs": 36988.441, "totalHrs": 10.89, "validHrs": 10.27 }, "dru": { "buckets": { "dev": 933, "test": 957, "train": 1074, "validated": 6576, "invalidated": 116, "other": 1 }, "duration": 37990332, "reportedSentences": 2, "validatedSentences": 3867, "unvalidatedSentences": 477, "clips": 6693, "splits": { "accent": {}, "age": { "": 0.88, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0.12, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0, "male_masculine": 0, "female_feminine": 0.12, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0.87 }, "sentence_domain": { "": 71, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 10031, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 1759, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 20, "size": 223976380, "checksum": "0a27a4418f5afc38f8960d83bd89deeb77d8a6f9a557158e525cac1edeaf33ff", "avgDurationSecs": 5.676, "validDurationSecs": 37326.225, "totalHrs": 10.55, "validHrs": 10.36 }, "dsb": { "buckets": { "dev": 0, "test": 0, "train": 0, "validated": 0, "invalidated": 0, "other": 5 }, "duration": 40284, "reportedSentences": 0, "validatedSentences": 796, "unvalidatedSentences": -1, "clips": 5, "splits": { "accent": {}, "age": { "": 1, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 0, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 2, "healthcare": 0, "history_law_government": 2, "language_fundamentals": 0, "media_entertainment": 2, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 1, "size": 293762, "checksum": "88c5e7f1c3a52573d7248bbf464b63cea37bec7a2690c7e2724a9007cbbe38a6", "avgDurationSecs": 8.057, "validDurationSecs": 0, "totalHrs": 0.01, "validHrs": 0 }, "dua": { "buckets": { "dev": 326, "test": 311, "train": 366, "validated": 7018, "invalidated": 1102, "other": 4 }, "duration": 55392156, "reportedSentences": 1, "validatedSentences": 1003, "unvalidatedSentences": 1, "clips": 8124, "splits": { "accent": {}, "age": { "": 0.77, "twenties": 0.11, "thirties": 0.1, "teens": 0, "fourties": 0.02, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.89, "male_masculine": 0, "female_feminine": 0.11, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 8124, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 13, "size": 312378845, "checksum": "7510e1763517426565510abe5376ba0b5ea3eabdf1efbba198fe198416da2ac6", "avgDurationSecs": 6.818, "validDurationSecs": 47851.077, "totalHrs": 15.38, "validHrs": 13.29 }, "dv": { "buckets": { "dev": 2243, "test": 2228, "train": 2648, "validated": 26571, "invalidated": 1661, "other": 15071 }, "duration": 221700519, "reportedSentences": 59, "validatedSentences": 7174, "unvalidatedSentences": 9, "clips": 43303, "splits": { "accent": {}, "age": { "": 0.24, "twenties": 0.11, "thirties": 0.39, "teens": 0.01, "fourties": 0.23, "fifties": 0.03, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.24, "male_masculine": 0.24, "female_feminine": 0.52, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 43302, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 1, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 391, "size": 1409830097, "checksum": "4bc4c02d7baee9139efa04f9b7b06c7d2fb7bdfca62a3ea071c4df678e67822f", "avgDurationSecs": 5.12, "validDurationSecs": 136036.868, "totalHrs": 61.58, "validHrs": 37.78 }, "dyu": { "buckets": { "dev": 50, "test": 63, "train": 90, "validated": 211, "invalidated": 15, "other": 69 }, "duration": 1861236, "reportedSentences": 0, "validatedSentences": 5028, "unvalidatedSentences": 41, "clips": 295, "splits": { "accent": {}, "age": { "": 0.31, "twenties": 0.66, "thirties": 0, "teens": 0.02, "fourties": 0.02, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.31, "male_masculine": 0.39, "female_feminine": 0.3, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 295, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 35, "size": 10792930, "checksum": "5c73eef972e528e84cc618c3ba889e8f40656fa5d1aa2daba186fef1d7359c72", "avgDurationSecs": 6.309, "validDurationSecs": 1331.257, "totalHrs": 0.51, "validHrs": 0.36 }, "ebr": { "buckets": { "dev": 0, "test": 228, "train": 644, "validated": 1544, "invalidated": 1, "other": 506 }, "duration": 11458872, "reportedSentences": 5, "validatedSentences": 872, "unvalidatedSentences": 3, "clips": 2051, "splits": { "accent": {}, "age": { "": 0.03, "twenties": 0.23, "thirties": 0.32, "teens": 0, "fourties": 0.42, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.68, "male_masculine": 0, "female_feminine": 0.32, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 2051, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 6, "size": 64924896, "checksum": "4d3c3313b8e1c20da0216c410510ed86d5c21c5ddaf97f959f464cd07e98d5e6", "avgDurationSecs": 5.587, "validDurationSecs": 8626.279, "totalHrs": 3.18, "validHrs": 2.39 }, "eko": { "buckets": { "dev": 353, "test": 414, "train": 519, "validated": 3950, "invalidated": 113, "other": 12 }, "duration": 37988928, "reportedSentences": 0, "validatedSentences": 1288, "unvalidatedSentences": 16, "clips": 4075, "splits": { "accent": {}, "age": { "": 0.08, "twenties": 0.31, "thirties": 0.55, "teens": 0, "fourties": 0.05, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.48, "male_masculine": 0, "female_feminine": 0.52, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 1794, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 2257, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 24, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 7, "size": 221521094, "checksum": "a565d2a7e72ea4b0ed67ddc43e2adacf991c5b3f785f92bb7c7d1d5df7d01033", "avgDurationSecs": 9.322, "validDurationSecs": 36823.623, "totalHrs": 10.55, "validHrs": 10.22 }, "el": { "buckets": { "dev": 1711, "test": 1717, "train": 1921, "validated": 17020, "invalidated": 877, "other": 10324 }, "duration": 117179854, "reportedSentences": 72, "validatedSentences": 7018, "unvalidatedSentences": 4340, "clips": 28221, "splits": { "accent": {}, "age": { "": 0.31, "twenties": 0.12, "thirties": 0.36, "teens": 0.01, "fourties": 0.17, "fifties": 0.03, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.34, "male_masculine": 0.63, "female_feminine": 0.03, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 28221, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 448, "size": 777849676, "checksum": "61e377fda91bf4f7a0a45b735d0bede5d140573600a4e9356b381ba1dc5ee297", "avgDurationSecs": 4.152, "validDurationSecs": 70670.817, "totalHrs": 32.54, "validHrs": 19.63 }, "en": { "buckets": { "dev": 16403, "test": 16403, "train": 1147819, "validated": 1869726, "invalidated": 309878, "other": 389504 }, "duration": 13605229315, "reportedSentences": 9830, "validatedSentences": 1681441, "unvalidatedSentences": 37247, "clips": 2569108, "splits": { "accent": {}, "age": { "": 0.36, "twenties": 0.25, "thirties": 0.14, "teens": 0.06, "fourties": 0.09, "fifties": 0.05, "sixties": 0.04, "seventies": 0.01, "eighties": 0, "nineties": 0 }, "gender": { "": 0.39, "male_masculine": 0.43, "female_feminine": 0.18, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0, "intersex": 0 }, "sentence_domain": { "": 2567905, "agriculture_food": 161, "automotive_transport": 8, "finance": 44, "service_retail": 29, "general": 644, "healthcare": 25, "history_law_government": 120, "language_fundamentals": 10, "media_entertainment": 115, "nature_environment": 55, "news_current_affairs": 13, "technology_robotics": 98 } }, "users": 99289, "size": 94210106373, "checksum": "a477e793f831662c00fd526453abde3c3e4791b8eda19e1a723457751f8f3c61", "avgDurationSecs": 5.296, "validDurationSecs": 9901510.947, "totalHrs": 3779.23, "validHrs": 2750.41 }, "eo": { "buckets": { "dev": 14916, "test": 14900, "train": 144451, "validated": 852619, "invalidated": 127521, "other": 164426 }, "duration": 6951494923, "reportedSentences": 2404, "validatedSentences": 181129, "unvalidatedSentences": 21895, "clips": 1144566, "splits": { "accent": {}, "age": { "": 0.2, "twenties": 0.56, "thirties": 0.12, "teens": 0.05, "fourties": 0.04, "fifties": 0.02, "sixties": 0, "seventies": 0, "eighties": 0.01, "nineties": 0 }, "gender": { "": 0.2, "male_masculine": 0.69, "female_feminine": 0.11, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 1144561, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 5, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 1878, "size": 41544000333, "checksum": "b35aa988b502d8c7da49f5f34525a5b7d55948e4c6c1cd62a6cd0cd6ffb3902c", "avgDurationSecs": 6.073, "validDurationSecs": 5178361.623, "totalHrs": 1930.97, "validHrs": 1438.43 }, "es": { "buckets": { "dev": 15900, "test": 15900, "train": 357397, "validated": 436590, "invalidated": 95033, "other": 1144151 }, "duration": 8177052330, "reportedSentences": 2666, "validatedSentences": 1082337, "unvalidatedSentences": 4887, "clips": 1675774, "splits": { "accent": {}, "age": { "": 0.13, "twenties": 0.53, "thirties": 0.09, "teens": 0.08, "fourties": 0.03, "fifties": 0.04, "sixties": 0.1, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.13, "male_masculine": 0.55, "female_feminine": 0.31, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 1675639, "agriculture_food": 1, "automotive_transport": 4, "finance": 5, "service_retail": 3, "general": 43, "healthcare": 4, "history_law_government": 33, "language_fundamentals": 8, "media_entertainment": 8, "nature_environment": 11, "news_current_affairs": 18, "technology_robotics": 22 } }, "users": 26838, "size": 51528103656, "checksum": "2c2943fbc5c96d5c00bd98f6fe41f358a057ae451fd4c324bff98a1b41e4f0d8", "avgDurationSecs": 4.88, "validDurationSecs": 2130370.37, "totalHrs": 2271.4, "validHrs": 591.76 }, "esu": { "buckets": { "dev": 0, "test": 501, "train": 6125, "validated": 7219, "invalidated": 0, "other": 5 }, "duration": 27453780, "reportedSentences": 17, "validatedSentences": 6929, "unvalidatedSentences": 5, "clips": 7224, "splits": { "accent": {}, "age": { "": 0, "twenties": 0, "thirties": 1, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7224, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 4, "size": 142932823, "checksum": "3a7954a7aadc0752923b1ba0c4429ac08bd491ffdb2b8bc3eda1f067fb2eb276", "avgDurationSecs": 3.8, "validDurationSecs": 27434.778, "totalHrs": 7.62, "validHrs": 7.62 }, "et": { "buckets": { "dev": 2887, "test": 2887, "train": 3496, "validated": 27656, "invalidated": 7962, "other": 126 }, "duration": 240245642, "reportedSentences": 571, "validatedSentences": 11090, "unvalidatedSentences": 1876, "clips": 35744, "splits": { "accent": {}, "age": { "": 0.18, "twenties": 0.7, "thirties": 0.08, "teens": 0, "fourties": 0.03, "fifties": 0.01, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.24, "male_masculine": 0.49, "female_feminine": 0.26, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 34751, "agriculture_food": 61, "automotive_transport": 46, "finance": 42, "service_retail": 14, "general": 620, "healthcare": 36, "history_law_government": 40, "language_fundamentals": 17, "media_entertainment": 46, "nature_environment": 111, "news_current_affairs": 23, "technology_robotics": 46 } }, "users": 1067, "size": 1599629830, "checksum": "42e83ac54800354de55915a618b1499f87aab5228ba1e76a1e8bef80151fed21", "avgDurationSecs": 6.721, "validDurationSecs": 185883.882, "totalHrs": 66.73, "validHrs": 51.63 }, "eto": { "buckets": { "dev": 300, "test": 307, "train": 359, "validated": 10552, "invalidated": 346, "other": 204 }, "duration": 38369448, "reportedSentences": 0, "validatedSentences": 966, "unvalidatedSentences": -1, "clips": 11102, "splits": { "accent": {}, "age": { "": 0.99, "twenties": 0, "thirties": 0.01, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 11102, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 26, "size": 217054142, "checksum": "a5b737b4a4f050cc83ff2219a52ad54ebb9e47a0dda86172a12086928c2e5d5d", "avgDurationSecs": 3.456, "validDurationSecs": 36468.602, "totalHrs": 10.65, "validHrs": 10.13 }, "eu": { "buckets": { "dev": 14804, "test": 14804, "train": 134190, "validated": 311983, "invalidated": 50883, "other": 102015 }, "duration": 2559683811, "reportedSentences": 1279, "validatedSentences": 1018163, "unvalidatedSentences": 12680, "clips": 464881, "splits": { "accent": {}, "age": { "": 0.45, "twenties": 0.17, "thirties": 0.06, "teens": 0.02, "fourties": 0.16, "fifties": 0.11, "sixties": 0.04, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.47, "male_masculine": 0.25, "female_feminine": 0.29, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0, "intersex": 0 }, "sentence_domain": { "": 443641, "agriculture_food": 7, "automotive_transport": 6, "finance": 4, "service_retail": 7, "general": 21307, "healthcare": 22, "history_law_government": 0, "language_fundamentals": 2, "media_entertainment": 6, "nature_environment": 6, "news_current_affairs": 0, "technology_robotics": 23 } }, "users": 11045, "size": 15692713908, "checksum": "594a7b558c3d9c11899e8f13f07e28783ea7085fc39f3dbe6613c6a8b7715874", "avgDurationSecs": 5.506, "validDurationSecs": 1717811.299, "totalHrs": 711.02, "validHrs": 477.16 }, "ewo": { "buckets": { "dev": 288, "test": 288, "train": 307, "validated": 7571, "invalidated": 461, "other": 102 }, "duration": 71308908, "reportedSentences": 0, "validatedSentences": 883, "unvalidatedSentences": -1, "clips": 8134, "splits": { "accent": {}, "age": { "": 0.94, "twenties": 0.01, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0.05, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.99, "male_masculine": 0, "female_feminine": 0.01, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 8134, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 31, "size": 410898056, "checksum": "cdad8bdbf48360d44a20754b4e4ba8aa7ae002f009fe5a8f466a61b7bdea08c4", "avgDurationSecs": 8.767, "validDurationSecs": 66373.216, "totalHrs": 19.8, "validHrs": 18.43 }, "fa": { "buckets": { "dev": 10712, "test": 10712, "train": 30066, "validated": 340117, "invalidated": 15412, "other": 34605 }, "duration": 1543007888, "reportedSentences": 2810, "validatedSentences": 57763, "unvalidatedSentences": 283344, "clips": 390134, "splits": { "accent": {}, "age": { "": 0.25, "twenties": 0.33, "thirties": 0.35, "teens": 0.03, "fourties": 0.02, "fifties": 0.01, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.23, "male_masculine": 0.7, "female_feminine": 0.06, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 390103, "agriculture_food": 0, "automotive_transport": 3, "finance": 0, "service_retail": 0, "general": 27, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 1, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 4639, "size": 11134521257, "checksum": "543fe1231d5c72b76919906b452f77fdb2f15c8fd60779fe2254030dc44ce656", "avgDurationSecs": 3.955, "validDurationSecs": 1345187.074, "totalHrs": 428.61, "validHrs": 373.66 }, "fan": { "buckets": { "dev": 327, "test": 328, "train": 349, "validated": 7706, "invalidated": 82, "other": 346 }, "duration": 42145596, "reportedSentences": 0, "validatedSentences": 1005, "unvalidatedSentences": -1, "clips": 8134, "splits": { "accent": {}, "age": { "": 0.89, "twenties": 0, "thirties": 0, "teens": 0.01, "fourties": 0.1, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 8134, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 43, "size": 247401451, "checksum": "65d9feb954bc8209ec5dd994ae7488f94e6ec8f732c0e6cd7a4ecee136edc7ff", "avgDurationSecs": 5.181, "validDurationSecs": 39927.952, "totalHrs": 11.7, "validHrs": 11.09 }, "fi": { "buckets": { "dev": 1812, "test": 1796, "train": 2069, "validated": 12196, "invalidated": 426, "other": 5248 }, "duration": 82683723, "reportedSentences": 78, "validatedSentences": 5865, "unvalidatedSentences": 49163, "clips": 17870, "splits": { "accent": {}, "age": { "": 0.33, "twenties": 0.16, "thirties": 0.17, "teens": 0.01, "fourties": 0.3, "fifties": 0.03, "sixties": 0.01, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.34, "male_masculine": 0.36, "female_feminine": 0.3, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 17870, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 248, "size": 493606591, "checksum": "77756bdc318c2daabdc0abde96cd47db55bd0b29029e0044c6cdf97de763df5d", "avgDurationSecs": 4.627, "validDurationSecs": 56430.369, "totalHrs": 22.96, "validHrs": 15.67 }, "fmp": { "buckets": { "dev": 326, "test": 327, "train": 351, "validated": 5206, "invalidated": 293, "other": 105 }, "duration": 44521524, "reportedSentences": 5, "validatedSentences": 1004, "unvalidatedSentences": -1, "clips": 5604, "splits": { "accent": {}, "age": { "": 0.74, "twenties": 0.2, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0.06, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 5604, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 32, "size": 255854248, "checksum": "75f0d4b381a4adda3ccea5c8ff326454202b0f61cbc62ac92873aec398ab20c3", "avgDurationSecs": 7.945, "validDurationSecs": 41359.574, "totalHrs": 12.36, "validHrs": 11.48 }, "fr": { "buckets": { "dev": 16196, "test": 16196, "train": 605822, "validated": 775562, "invalidated": 67557, "other": 13071 }, "duration": 4311619534, "reportedSentences": 7619, "validatedSentences": 1649084, "unvalidatedSentences": 43764, "clips": 856190, "splits": { "accent": {}, "age": { "": 0.38, "twenties": 0.17, "thirties": 0.15, "teens": 0.03, "fourties": 0.14, "fifties": 0.09, "sixties": 0.03, "seventies": 0.01, "eighties": 0, "nineties": 0 }, "gender": { "": 0.33, "male_masculine": 0.57, "female_feminine": 0.11, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 856083, "agriculture_food": 0, "automotive_transport": 1, "finance": 1, "service_retail": 0, "general": 70, "healthcare": 5, "history_law_government": 19, "language_fundamentals": 7, "media_entertainment": 16, "nature_environment": 8, "news_current_affairs": 2, "technology_robotics": 18 } }, "users": 20926, "size": 30119183507, "checksum": "ab1903e88eb7eab4c27804f34937e1d2f880cc1cb2a4bdebb06f77325042a2ee", "avgDurationSecs": 5.036, "validDurationSecs": 3905591.363, "totalHrs": 1197.67, "validHrs": 1084.88 }, "fub": { "buckets": { "dev": 277, "test": 345, "train": 445, "validated": 7686, "invalidated": 30, "other": 154 }, "duration": 48138012, "reportedSentences": 0, "validatedSentences": 1067, "unvalidatedSentences": -1, "clips": 7870, "splits": { "accent": {}, "age": { "": 0.98, "twenties": 0.01, "thirties": 0, "teens": 0.01, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.99, "male_masculine": 0, "female_feminine": 0.01, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7870, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 18, "size": 263109466, "checksum": "44fb5c99b7dc56bb390cffc93e94c9d92f4b7bb0e3164dcc07a1fbbe89737103", "avgDurationSecs": 6.117, "validDurationSecs": 47012.549, "totalHrs": 13.37, "validHrs": 13.05 }, "fue": { "buckets": { "dev": 0, "test": 88, "train": 900, "validated": 7146, "invalidated": 11, "other": 108 }, "duration": 38734056, "reportedSentences": 0, "validatedSentences": 988, "unvalidatedSentences": -1, "clips": 7265, "splits": { "accent": {}, "age": { "": 0.86, "twenties": 0, "thirties": 0.14, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7265, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 10, "size": 221067092, "checksum": "860c7d976b474b04331c7daade001693e9c1761ba19636b265771a91a36cfbf5", "avgDurationSecs": 5.332, "validDurationSecs": 38099.596, "totalHrs": 10.75, "validHrs": 10.58 }, "fy-NL": { "buckets": { "dev": 3173, "test": 3173, "train": 3927, "validated": 52227, "invalidated": 4054, "other": 103297 }, "duration": 774347499, "reportedSentences": 553, "validatedSentences": 10902, "unvalidatedSentences": 15, "clips": 159578, "splits": { "accent": {}, "age": { "": 0.56, "twenties": 0.04, "thirties": 0.1, "teens": 0, "fourties": 0.07, "fifties": 0.1, "sixties": 0.12, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.57, "male_masculine": 0.13, "female_feminine": 0.3, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 157895, "agriculture_food": 1216, "automotive_transport": 0, "finance": 207, "service_retail": 0, "general": 467, "healthcare": 0, "history_law_government": 1148, "language_fundamentals": 288, "media_entertainment": 1433, "nature_environment": 3, "news_current_affairs": 223, "technology_robotics": 25 } }, "users": 2095, "size": 4641549420, "checksum": "73a493e91ec5f4915064327c9e80463d3f2cfe138e563e9f8939c0f2db8a8784", "avgDurationSecs": 4.852, "validDurationSecs": 253429.964, "totalHrs": 215.09, "validHrs": 70.39 }, "ga-IE": { "buckets": { "dev": 849, "test": 851, "train": 899, "validated": 13303, "invalidated": 1300, "other": 647 }, "duration": 58143231, "reportedSentences": 42, "validatedSentences": 4883, "unvalidatedSentences": 1470, "clips": 15250, "splits": { "accent": {}, "age": { "": 0.3, "twenties": 0.35, "thirties": 0.24, "teens": 0.01, "fourties": 0.05, "fifties": 0.04, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.33, "male_masculine": 0.34, "female_feminine": 0.33, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 14992, "agriculture_food": 4, "automotive_transport": 5, "finance": 1, "service_retail": 5, "general": 289, "healthcare": 2, "history_law_government": 8, "language_fundamentals": 0, "media_entertainment": 6, "nature_environment": 4, "news_current_affairs": 4, "technology_robotics": 3 } }, "users": 269, "size": 374564231, "checksum": "c168b4ac1d65c39d3ab6929fc367b4d538be48bc00a5b11a673d2f2c3cdebbb0", "avgDurationSecs": 3.813, "validDurationSecs": 50719.961, "totalHrs": 16.15, "validHrs": 14.08 }, "gej": { "buckets": { "dev": 949, "test": 950, "train": 1289, "validated": 16413, "invalidated": 334, "other": 27 }, "duration": 41018184, "reportedSentences": 0, "validatedSentences": 3188, "unvalidatedSentences": -1, "clips": 16774, "splits": { "accent": {}, "age": { "": 1, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 16774, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 20, "size": 225917577, "checksum": "1f7870efd16f99741bcd905e464244ce381d3ce0eeaa6e7f490e0c67580d6515", "avgDurationSecs": 2.445, "validDurationSecs": 40135.415, "totalHrs": 11.39, "validHrs": 11.14 }, "ggg": { "buckets": { "dev": 0, "test": 318, "train": 1687, "validated": 6684, "invalidated": 3, "other": 4393 }, "duration": 44190504, "reportedSentences": 0, "validatedSentences": 2005, "unvalidatedSentences": -1, "clips": 11080, "splits": { "accent": {}, "age": { "": 0.3, "twenties": 0.19, "thirties": 0.33, "teens": 0, "fourties": 0.18, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 11080, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 24, "size": 258835300, "checksum": "bc9718ed0f4bea207db1bd5d310fb95b21a43120398ab6d78cf2b6800da7a769", "avgDurationSecs": 3.988, "validDurationSecs": 26657.882, "totalHrs": 12.27, "validHrs": 7.4 }, "gid": { "buckets": { "dev": 286, "test": 302, "train": 329, "validated": 5111, "invalidated": 208, "other": 0 }, "duration": 37833048, "reportedSentences": 0, "validatedSentences": 917, "unvalidatedSentences": -1, "clips": 5319, "splits": { "accent": {}, "age": { "": 0.99, "twenties": 0, "thirties": 0.01, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 5319, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 16, "size": 216320607, "checksum": "4462a0507beddd3b261cc280cf31eab8ad4f2923c78c0f14d155f25c3eed3186", "avgDurationSecs": 7.113, "validDurationSecs": 36353.583, "totalHrs": 10.5, "validHrs": 10.09 }, "gig": { "buckets": { "dev": 0, "test": 135, "train": 1869, "validated": 12130, "invalidated": 6, "other": 23 }, "duration": 36376452, "reportedSentences": 0, "validatedSentences": 2005, "unvalidatedSentences": -1, "clips": 12159, "splits": { "accent": {}, "age": { "": 0, "twenties": 0.67, "thirties": 0.16, "teens": 0, "fourties": 0, "fifties": 0.16, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 12159, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 20, "size": 212046431, "checksum": "e1e3433e86c377a60c22f15c4c9829d681e462b17ecef43d8ad274b69f27851d", "avgDurationSecs": 2.992, "validDurationSecs": 36289.692, "totalHrs": 10.1, "validHrs": 10.08 }, "giz": { "buckets": { "dev": 308, "test": 277, "train": 406, "validated": 6494, "invalidated": 149, "other": 5 }, "duration": 37043316, "reportedSentences": 14, "validatedSentences": 991, "unvalidatedSentences": -1, "clips": 6648, "splits": { "accent": {}, "age": { "": 0.89, "twenties": 0.03, "thirties": 0.07, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 6648, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 32, "size": 216330762, "checksum": "614987927289d3380aa526d5aa2643d891d914399155067d0a357e272de313ee", "avgDurationSecs": 5.572, "validDurationSecs": 36185.213, "totalHrs": 10.28, "validHrs": 10.05 }, "gjk": { "buckets": { "dev": 570, "test": 623, "train": 808, "validated": 8548, "invalidated": 168, "other": 10 }, "duration": 39656844, "reportedSentences": 0, "validatedSentences": 2004, "unvalidatedSentences": -1, "clips": 8726, "splits": { "accent": {}, "age": { "": 0.02, "twenties": 0.12, "thirties": 0.59, "teens": 0.04, "fourties": 0.23, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.74, "male_masculine": 0, "female_feminine": 0.26, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 8726, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 23, "size": 230571438, "checksum": "e992d46d525e358225180418fa277c0f0f517ab5f8687d9974e522c4cfd3ab59", "avgDurationSecs": 4.545, "validDurationSecs": 38847.892, "totalHrs": 11.01, "validHrs": 10.79 }, "gju": { "buckets": { "dev": 0, "test": 626, "train": 3204, "validated": 11076, "invalidated": 155, "other": 510 }, "duration": 38540952, "reportedSentences": 0, "validatedSentences": 3852, "unvalidatedSentences": 2, "clips": 11741, "splits": { "accent": {}, "age": { "": 0.22, "twenties": 0, "thirties": 0.01, "teens": 0, "fourties": 0.77, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 11738, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 3, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 6, "size": 220134491, "checksum": "073b80d594a9faf861e0ca4d07abf885d01a933845f5fdd4df4065714f8304e1", "avgDurationSecs": 3.283, "validDurationSecs": 36358.026, "totalHrs": 10.7, "validHrs": 10.09 }, "gl": { "buckets": { "dev": 14970, "test": 14969, "train": 149131, "validated": 183801, "invalidated": 25176, "other": 60920 }, "duration": 1350675288, "reportedSentences": 872, "validatedSentences": 1001730, "unvalidatedSentences": 3827, "clips": 269897, "splits": { "accent": {}, "age": { "": 0.54, "twenties": 0.16, "thirties": 0.07, "teens": 0.02, "fourties": 0.09, "fifties": 0.1, "sixties": 0.01, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.64, "male_masculine": 0.13, "female_feminine": 0.22, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0.01 }, "sentence_domain": { "": 269452, "agriculture_food": 33, "automotive_transport": 4, "finance": 40, "service_retail": 17, "general": 264, "healthcare": 3, "history_law_government": 52, "language_fundamentals": 19, "media_entertainment": 41, "nature_environment": 15, "news_current_affairs": 14, "technology_robotics": 5 } }, "users": 6397, "size": 7840048937, "checksum": "e33bf85d88497fa1ed5595210c9a251326c1b84df1f59f2de31ac655518c3093", "avgDurationSecs": 5.004, "validDurationSecs": 919815.591, "totalHrs": 375.18, "validHrs": 255.5 }, "gn": { "buckets": { "dev": 661, "test": 1105, "train": 1720, "validated": 4029, "invalidated": 220, "other": 21610 }, "duration": 119240820, "reportedSentences": 52, "validatedSentences": 5894, "unvalidatedSentences": 301, "clips": 25859, "splits": { "accent": {}, "age": { "": 0.19, "twenties": 0.54, "thirties": 0.17, "teens": 0.02, "fourties": 0.08, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.2, "male_masculine": 0.33, "female_feminine": 0.46, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 25859, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 313, "size": 683967749, "checksum": "c97bc800ba00c3736e80658c681027d90edde530882544768fc9e4a4276e4249", "avgDurationSecs": 4.611, "validDurationSecs": 18578.494, "totalHrs": 33.12, "validHrs": 5.16 }, "gsw": { "buckets": { "dev": 17, "test": 18, "train": 24, "validated": 228, "invalidated": 36, "other": 437 }, "duration": 4008276, "reportedSentences": 2, "validatedSentences": 64, "unvalidatedSentences": 19, "clips": 701, "splits": { "accent": {}, "age": { "": 0.17, "twenties": 0.01, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0.2, "sixties": 0.52, "seventies": 0.1, "eighties": 0.01, "nineties": 0 }, "gender": { "": 0.51, "male_masculine": 0, "female_feminine": 0.49, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 0, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 5, "general": 27, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 674, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 24, "size": 22386915, "checksum": "1a5f38f432bf02d93bcb7d100c8cb82784229d404e92e985e42a0c81e49769c4", "avgDurationSecs": 5.718, "validDurationSecs": 1303.69, "totalHrs": 1.11, "validHrs": 0.36 }, "gv": { "buckets": { "dev": 1166, "test": 525, "train": 2420, "validated": 6302, "invalidated": 151, "other": 137 }, "duration": 38105820, "reportedSentences": 267, "validatedSentences": 4219, "unvalidatedSentences": 21, "clips": 6590, "splits": { "accent": {}, "age": { "": 0, "twenties": 0.54, "thirties": 0.04, "teens": 0, "fourties": 0.39, "fifties": 0.02, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.46, "male_masculine": 0.5, "female_feminine": 0.04, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 6590, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 9, "size": 224868436, "checksum": "a0e4c22483d334c9b745f0cf56dad8e4395a65a67b52c73a3a63ca5f0bb4e5b8", "avgDurationSecs": 5.782, "validDurationSecs": 36440.497, "totalHrs": 10.58, "validHrs": 10.12 }, "gwc": { "buckets": { "dev": 776, "test": 918, "train": 3268, "validated": 7421, "invalidated": 683, "other": 1699 }, "duration": 57059136, "reportedSentences": 1, "validatedSentences": 5574, "unvalidatedSentences": -1, "clips": 9803, "splits": { "accent": {}, "age": { "": 0.03, "twenties": 0.34, "thirties": 0, "teens": 0, "fourties": 0.48, "fifties": 0.14, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 9803, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 22, "size": 335348506, "checksum": "efd083b343f3f52d11b21a749e837b2d39afc35abf3f125ba59dfba024a1f14a", "avgDurationSecs": 5.821, "validDurationSecs": 43194.517, "totalHrs": 15.84, "validHrs": 11.99 }, "gwt": { "buckets": { "dev": 0, "test": 220, "train": 3136, "validated": 7681, "invalidated": 57, "other": 0 }, "duration": 44273880, "reportedSentences": 0, "validatedSentences": 3719, "unvalidatedSentences": 2087, "clips": 7738, "splits": { "accent": {}, "age": { "": 0.16, "twenties": 0, "thirties": 0.4, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0.43, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7738, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 5, "size": 261938785, "checksum": "fea63dc5528a2639f0d20c17fab85fd64e20a98c6cf7ce92cd0dcd56c269dbd8", "avgDurationSecs": 5.722, "validDurationSecs": 43947.748, "totalHrs": 12.29, "validHrs": 12.2 }, "gya": { "buckets": { "dev": 346, "test": 346, "train": 362, "validated": 6914, "invalidated": 491, "other": 0 }, "duration": 38369700, "reportedSentences": 1, "validatedSentences": 1054, "unvalidatedSentences": -1, "clips": 7405, "splits": { "accent": {}, "age": { "": 0.86, "twenties": 0, "thirties": 0.14, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7405, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 31, "size": 221180027, "checksum": "8676f1ddb77395ec0d4900e61dce291a8f3f28ed7b9909d3c37ad75022b751ce", "avgDurationSecs": 5.182, "validDurationSecs": 35825.538, "totalHrs": 10.65, "validHrs": 9.95 }, "ha": { "buckets": { "dev": 634, "test": 783, "train": 1901, "validated": 3496, "invalidated": 175, "other": 6776 }, "duration": 45455724, "reportedSentences": 34, "validatedSentences": 5450, "unvalidatedSentences": 240, "clips": 10447, "splits": { "accent": {}, "age": { "": 0.19, "twenties": 0.13, "thirties": 0.65, "teens": 0, "fourties": 0, "fifties": 0.02, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.19, "male_masculine": 0.57, "female_feminine": 0.24, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 10447, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 60, "size": 266037995, "checksum": "21b27ecfa4ed161da6007d1900acbdea2216a6553a33aa53431733dc2e9d07ff", "avgDurationSecs": 4.351, "validDurationSecs": 15211.373, "totalHrs": 12.62, "validHrs": 4.22 }, "haz": { "buckets": { "dev": 86, "test": 446, "train": 823, "validated": 8319, "invalidated": 0, "other": 1 }, "duration": 37900836, "reportedSentences": 29, "validatedSentences": 1361, "unvalidatedSentences": -1, "clips": 8320, "splits": { "accent": {}, "age": { "": 0.35, "twenties": 0.32, "thirties": 0.33, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 8320, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 8, "size": 183552507, "checksum": "b5944f1622600c6474930fb651ba6cedb8ef1efd32948fe49d7a6b2710e8226b", "avgDurationSecs": 4.555, "validDurationSecs": 37896.281, "totalHrs": 10.52, "validHrs": 10.52 }, "he": { "buckets": { "dev": 394, "test": 910, "train": 1870, "validated": 4059, "invalidated": 346, "other": 1086 }, "duration": 25219404, "reportedSentences": 43, "validatedSentences": 4188, "unvalidatedSentences": 6836, "clips": 5491, "splits": { "accent": {}, "age": { "": 0.07, "twenties": 0.72, "thirties": 0.16, "teens": 0, "fourties": 0.02, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0.04, "nineties": 0 }, "gender": { "": 0.07, "male_masculine": 0.91, "female_feminine": 0.02, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 5490, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 1, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 55, "size": 146911811, "checksum": "2a91a9c2d958efb9182c7077b343d5f049c99eb8cd9bc011487569e0455e922c", "avgDurationSecs": 4.593, "validDurationSecs": 18642.426, "totalHrs": 7, "validHrs": 5.17 }, "hem": { "buckets": { "dev": 337, "test": 337, "train": 345, "validated": 5974, "invalidated": 470, "other": 0 }, "duration": 38994660, "reportedSentences": 2, "validatedSentences": 1020, "unvalidatedSentences": 2, "clips": 6444, "splits": { "accent": {}, "age": { "": 0.12, "twenties": 0.47, "thirties": 0.27, "teens": 0, "fourties": 0.13, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.77, "male_masculine": 0.03, "female_feminine": 0.2, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 6444, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 41, "size": 211316608, "checksum": "04ea4c4c436e486e1023f492b172baa9839cf466e971f904289cef967fbc8eb9", "avgDurationSecs": 6.051, "validDurationSecs": 36150.543, "totalHrs": 10.83, "validHrs": 10.04 }, "hi": { "buckets": { "dev": 2702, "test": 3360, "train": 4876, "validated": 11017, "invalidated": 911, "other": 6553 }, "duration": 92714028, "reportedSentences": 146, "validatedSentences": 32204, "unvalidatedSentences": 9965, "clips": 18481, "splits": { "accent": {}, "age": { "": 0.29, "twenties": 0.28, "thirties": 0.33, "teens": 0.01, "fourties": 0.07, "fifties": 0.01, "sixties": 0.01, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.45, "male_masculine": 0.51, "female_feminine": 0.03, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 18481, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 471, "size": 549742692, "checksum": "2cfba22d28fec767bc8b786da9e22966cc9a703676854d47723c7c0c482518d7", "avgDurationSecs": 5.017, "validDurationSecs": 55269.22, "totalHrs": 25.75, "validHrs": 15.35 }, "hno": { "buckets": { "dev": 765, "test": 708, "train": 863, "validated": 9120, "invalidated": 282, "other": 5 }, "duration": 37708020, "reportedSentences": 21, "validatedSentences": 2349, "unvalidatedSentences": -1, "clips": 9407, "splits": { "accent": {}, "age": { "": 0.09, "twenties": 0.66, "thirties": 0.23, "teens": 0.02, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.52, "male_masculine": 0, "female_feminine": 0.48, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 6162, "agriculture_food": 5816, "automotive_transport": 0, "finance": 3245, "service_retail": 0, "general": 2574, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 5816, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 36, "size": 216280482, "checksum": "999869fa27bf0aaa04c4ba1a44702e1f5c2105bf7644f1d3e912205b7de54861", "avgDurationSecs": 4.009, "validDurationSecs": 36557.579, "totalHrs": 10.47, "validHrs": 10.15 }, "hsb": { "buckets": { "dev": 270, "test": 405, "train": 811, "validated": 1486, "invalidated": 248, "other": 323 }, "duration": 13102884, "reportedSentences": 130, "validatedSentences": 7182, "unvalidatedSentences": 26, "clips": 2057, "splits": { "accent": {}, "age": { "": 0.21, "twenties": 0.1, "thirties": 0.09, "teens": 0.07, "fourties": 0.46, "fifties": 0.03, "sixties": 0.02, "seventies": 0.03, "eighties": 0, "nineties": 0 }, "gender": { "": 0.25, "male_masculine": 0.73, "female_feminine": 0.02, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 2057, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 32, "size": 97504584, "checksum": "c11d0d6356bf0c886d1103e02627a66533de4069678e7b52950a1cb176e9199f", "avgDurationSecs": 6.37, "validDurationSecs": 9465.671, "totalHrs": 3.63, "validHrs": 2.62 }, "ht": { "buckets": { "dev": 6, "test": 5, "train": 13, "validated": 27, "invalidated": 1, "other": 2 }, "duration": 166968, "reportedSentences": 0, "validatedSentences": 76, "unvalidatedSentences": 1629, "clips": 30, "splits": { "accent": {}, "age": { "": 0.67, "twenties": 0, "thirties": 0.33, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 30, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 3, "size": 1091474, "checksum": "0d10797fa8f3be5168535495be6b34ba4ee583800305d4f7430ee223ebb97f37", "avgDurationSecs": 5.566, "validDurationSecs": 150.271, "totalHrs": 0.04, "validHrs": 0.04 }, "hu": { "buckets": { "dev": 12027, "test": 12066, "train": 44352, "validated": 68975, "invalidated": 3473, "other": 45019 }, "duration": 650828773, "reportedSentences": 554, "validatedSentences": 326397, "unvalidatedSentences": 226, "clips": 117467, "splits": { "accent": {}, "age": { "": 0.28, "twenties": 0.11, "thirties": 0.13, "teens": 0.02, "fourties": 0.11, "fifties": 0.32, "sixties": 0.01, "seventies": 0.01, "eighties": 0, "nineties": 0 }, "gender": { "": 0.3, "male_masculine": 0.23, "female_feminine": 0.46, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 117394, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 64, "healthcare": 0, "history_law_government": 19, "language_fundamentals": 0, "media_entertainment": 2, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 9 } }, "users": 1675, "size": 3828056509, "checksum": "3efa8e3df2c1e27dbbddc7fc84ed4b4765d7a8b88d57080b45bf90fcf62e36ea", "avgDurationSecs": 5.541, "validDurationSecs": 382157.667, "totalHrs": 180.78, "validHrs": 106.15 }, "hux": { "buckets": { "dev": 25, "test": 326, "train": 637, "validated": 9285, "invalidated": 1322, "other": 1 }, "duration": 41113224, "reportedSentences": 0, "validatedSentences": 995, "unvalidatedSentences": -1, "clips": 10608, "splits": { "accent": {}, "age": { "": 0, "twenties": 0.19, "thirties": 0.09, "teens": 0, "fourties": 0.26, "fifties": 0.37, "sixties": 0.09, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.37, "male_masculine": 0, "female_feminine": 0.63, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 10608, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 13, "size": 240800853, "checksum": "0cdadf2e8fa73680e4b4afcffef020366a8c6cac4707bf41fdea230f2ae1d35b", "avgDurationSecs": 3.876, "validDurationSecs": 35985.698, "totalHrs": 11.42, "validHrs": 9.99 }, "hy-AM": { "buckets": { "dev": 5874, "test": 5841, "train": 9314, "validated": 21244, "invalidated": 1221, "other": 15123 }, "duration": 202675896, "reportedSentences": 183, "validatedSentences": 237419, "unvalidatedSentences": 1338, "clips": 37588, "splits": { "accent": {}, "age": { "": 0.14, "twenties": 0.63, "thirties": 0.08, "teens": 0.11, "fourties": 0.04, "fifties": 0.01, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.2, "male_masculine": 0.25, "female_feminine": 0.55, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 37586, "agriculture_food": 0, "automotive_transport": 0, "finance": 1, "service_retail": 0, "general": 1, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 441, "size": 1192289812, "checksum": "3469b9deae30a757883b45812c7ed35b69c79187ece74fae9cf2cac3e7fa2010", "avgDurationSecs": 5.392, "validDurationSecs": 114548.439, "totalHrs": 56.29, "validHrs": 31.81 }, "ia": { "buckets": { "dev": 1869, "test": 1865, "train": 4903, "validated": 12077, "invalidated": 352, "other": 2341 }, "duration": 62070024, "reportedSentences": 279, "validatedSentences": 9069, "unvalidatedSentences": 134, "clips": 14770, "splits": { "accent": {}, "age": { "": 0.38, "twenties": 0.05, "thirties": 0.02, "teens": 0, "fourties": 0.29, "fifties": 0.03, "sixties": 0, "seventies": 0.22, "eighties": 0, "nineties": 0 }, "gender": { "": 0.38, "male_masculine": 0.61, "female_feminine": 0.01, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 14770, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 72, "size": 420459353, "checksum": "01fe681194c6779401319a9a312889e9d53d27f4f284fbb239286a5227b30951", "avgDurationSecs": 4.202, "validDurationSecs": 50752.856, "totalHrs": 17.24, "validHrs": 14.09 }, "ibb": { "buckets": { "dev": 319, "test": 307, "train": 372, "validated": 3106, "invalidated": 118, "other": 4238 }, "duration": 96213852, "reportedSentences": 0, "validatedSentences": 1031, "unvalidatedSentences": -1, "clips": 7462, "splits": { "accent": {}, "age": { "": 0.99, "twenties": 0, "thirties": 0.01, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.97, "male_masculine": 0, "female_feminine": 0.03, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7462, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 19, "size": 561149314, "checksum": "d14ec0f9ac2a6f5cbc9455a2d7130ebc0d0935030aa354c89ef2295c65b255e9", "avgDurationSecs": 12.894, "validDurationSecs": 40048.274, "totalHrs": 26.72, "validHrs": 11.12 }, "id": { "buckets": { "dev": 3469, "test": 3691, "train": 4973, "validated": 30256, "invalidated": 2795, "other": 26500 }, "duration": 238450224, "reportedSentences": 363, "validatedSentences": 13318, "unvalidatedSentences": 11864, "clips": 59551, "splits": { "accent": {}, "age": { "": 0.26, "twenties": 0.41, "thirties": 0.1, "teens": 0.22, "fourties": 0.02, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.3, "male_masculine": 0.44, "female_feminine": 0.26, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0, "intersex": 0 }, "sentence_domain": { "": 59551, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 653, "size": 1498957544, "checksum": "abaa6f144cfd71d2144303b2019b4156672e39b10b8e4b0a9555471abd373e3e", "avgDurationSecs": 4.004, "validDurationSecs": 121149.099, "totalHrs": 66.23, "validHrs": 33.65 }, "ig": { "buckets": { "dev": 87, "test": 89, "train": 92, "validated": 269, "invalidated": 138, "other": 8295 }, "duration": 47624184, "reportedSentences": 16, "validatedSentences": 15225, "unvalidatedSentences": 3122, "clips": 8702, "splits": { "accent": {}, "age": { "": 0.39, "twenties": 0.33, "thirties": 0.17, "teens": 0.07, "fourties": 0.01, "fifties": 0, "sixties": 0.02, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.47, "male_masculine": 0.09, "female_feminine": 0.44, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 8700, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 1, "language_fundamentals": 1, "media_entertainment": 1, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 159, "size": 279448506, "checksum": "cb99fab21b97ef36c43052b60adba30d81daba5ba44a0d15bd027af70249457c", "avgDurationSecs": 5.473, "validDurationSecs": 1472.179, "totalHrs": 13.22, "validHrs": 0.4 }, "ipk": { "buckets": { "dev": 0, "test": 160, "train": 3104, "validated": 3264, "invalidated": 0, "other": 0 }, "duration": 25908516, "reportedSentences": 0, "validatedSentences": 4386, "unvalidatedSentences": 27, "clips": 3264, "splits": { "accent": {}, "age": { "": 0.05, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0.95, "nineties": 0 }, "gender": { "": 0.05, "male_masculine": 0, "female_feminine": 0.95, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 3264, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 2, "size": 153440333, "checksum": "de70e5900a5aa4d1a8debeaa2ab8b81f41f2c0b496442b0b62eefa6ac1db3c40", "avgDurationSecs": 7.938, "validDurationSecs": 25908.516, "totalHrs": 7.19, "validHrs": 7.19 }, "is": { "buckets": { "dev": 0, "test": 35, "train": 73, "validated": 108, "invalidated": 15, "other": 291 }, "duration": 2660040, "reportedSentences": 1, "validatedSentences": 5083, "unvalidatedSentences": 113, "clips": 414, "splits": { "accent": {}, "age": { "": 0.37, "twenties": 0, "thirties": 0.61, "teens": 0, "fourties": 0.01, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.96, "male_masculine": 0.04, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 414, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 8, "size": 16009584, "checksum": "3e207b41d6eabafe87aae769e8a92e04eae4629727c2da45a1a4b29d1f71ff54", "avgDurationSecs": 6.425, "validDurationSecs": 693.923, "totalHrs": 0.73, "validHrs": 0.19 }, "it": { "buckets": { "dev": 15181, "test": 15181, "train": 173207, "validated": 240195, "invalidated": 20772, "other": 19030 }, "duration": 1520567196, "reportedSentences": 5983, "validatedSentences": 925062, "unvalidatedSentences": 971, "clips": 279997, "splits": { "accent": {}, "age": { "": 0.27, "twenties": 0.2, "thirties": 0.16, "teens": 0.01, "fourties": 0.12, "fifties": 0.14, "sixties": 0.1, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.28, "male_masculine": 0.62, "female_feminine": 0.1, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 279981, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 1, "general": 11, "healthcare": 1, "history_law_government": 5, "language_fundamentals": 3, "media_entertainment": 1, "nature_environment": 3, "news_current_affairs": 1, "technology_robotics": 1 } }, "users": 7319, "size": 10333034887, "checksum": "1371f22127b7ff142c10084ef36278631dd50c39564254729e568d9a19782ec5", "avgDurationSecs": 5.431, "validDurationSecs": 1304416.253, "totalHrs": 422.37, "validHrs": 362.33 }, "ja": { "buckets": { "dev": 9019, "test": 9019, "train": 19694, "validated": 280477, "invalidated": 52382, "other": 225140 }, "duration": 2546437569, "reportedSentences": 793, "validatedSentences": 42286, "unvalidatedSentences": 8231, "clips": 557999, "splits": { "accent": {}, "age": { "": 0.17, "twenties": 0.55, "thirties": 0.07, "teens": 0.08, "fourties": 0.08, "fifties": 0.04, "sixties": 0.01, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.33, "male_masculine": 0.28, "female_feminine": 0.39, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0.01, "intersex": 0 }, "sentence_domain": { "": 510070, "agriculture_food": 8157, "automotive_transport": 1910, "finance": 2005, "service_retail": 400, "general": 21766, "healthcare": 2268, "history_law_government": 4518, "language_fundamentals": 3554, "media_entertainment": 4770, "nature_environment": 2540, "news_current_affairs": 971, "technology_robotics": 643 } }, "users": 7498, "size": 14977274557, "checksum": "85c714c97705123d0abbc0bd4715ceefcd1388b9ce6428bc0aa1cfd635754dd1", "avgDurationSecs": 4.564, "validDurationSecs": 1279961.38, "totalHrs": 707.34, "validHrs": 355.54 }, "jgo": { "buckets": { "dev": 336, "test": 336, "train": 362, "validated": 6080, "invalidated": 89, "other": 20 }, "duration": 41432724, "reportedSentences": 0, "validatedSentences": 1035, "unvalidatedSentences": 2, "clips": 6189, "splits": { "accent": {}, "age": { "": 0.44, "twenties": 0.11, "thirties": 0.15, "teens": 0, "fourties": 0.3, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.67, "male_masculine": 0, "female_feminine": 0.33, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 6188, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 1, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 1, "nature_environment": 1, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 16, "size": 227442147, "checksum": "af72614e0dc3c4cc3680a734f56267036c6bcd96142f7be1badbb4257a49627f", "avgDurationSecs": 6.695, "validDurationSecs": 40703.015, "totalHrs": 11.5, "validHrs": 11.3 }, "jqr": { "buckets": { "dev": 323, "test": 273, "train": 403, "validated": 6060, "invalidated": 116, "other": 79 }, "duration": 36995796, "reportedSentences": 0, "validatedSentences": 999, "unvalidatedSentences": -1, "clips": 6255, "splits": { "accent": {}, "age": { "": 0.23, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0.6, "fifties": 0.16, "sixties": 0.01, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.48, "male_masculine": 0, "female_feminine": 0.52, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 6255, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 12, "size": 215086389, "checksum": "196799a74d3b72510f615fd7ae28df31eb8d189ada4ed46e0e9bc768abd25b12", "avgDurationSecs": 5.915, "validDurationSecs": 35842.45, "totalHrs": 10.27, "validHrs": 9.95 }, "ka": { "buckets": { "dev": 13047, "test": 13116, "train": 63056, "validated": 117702, "invalidated": 6766, "other": 103078 }, "duration": 1184559984, "reportedSentences": 1101, "validatedSentences": 132626, "unvalidatedSentences": 1891, "clips": 227546, "splits": { "accent": {}, "age": { "": 0.23, "twenties": 0.22, "thirties": 0.33, "teens": 0.11, "fourties": 0.07, "fifties": 0.04, "sixties": 0.02, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.29, "male_masculine": 0.17, "female_feminine": 0.54, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 226990, "agriculture_food": 9, "automotive_transport": 10, "finance": 4, "service_retail": 9, "general": 256, "healthcare": 10, "history_law_government": 202, "language_fundamentals": 32, "media_entertainment": 23, "nature_environment": 17, "news_current_affairs": 10, "technology_robotics": 3 } }, "users": 2759, "size": 6926976886, "checksum": "c5af491be4210fdda49378bfe330bced7a26c0d4250a15826947b93610146a4c", "avgDurationSecs": 5.206, "validDurationSecs": 612733.598, "totalHrs": 329.04, "validHrs": 170.2 }, "kab": { "buckets": { "dev": 15003, "test": 15003, "train": 152504, "validated": 614748, "invalidated": 20076, "other": 112425 }, "duration": 2497072912, "reportedSentences": 9747, "validatedSentences": 182804, "unvalidatedSentences": 205837, "clips": 747249, "splits": { "accent": {}, "age": { "": 0.28, "twenties": 0.12, "thirties": 0.29, "teens": 0, "fourties": 0.09, "fifties": 0.18, "sixties": 0.02, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.26, "male_masculine": 0.53, "female_feminine": 0.2, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 747249, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 1599, "size": 18644707031, "checksum": "e1103bdf8cc84a32f499e8d9a17d0b19f21ec2a7a9cb3d245678db2a9bc55149", "avgDurationSecs": 3.342, "validDurationSecs": 2054295.929, "totalHrs": 693.63, "validHrs": 570.63 }, "kbd": { "buckets": { "dev": 6954, "test": 6958, "train": 11996, "validated": 102361, "invalidated": 2499, "other": 7602 }, "duration": 701074224, "reportedSentences": 3359, "validatedSentences": 27620, "unvalidatedSentences": 2376, "clips": 112462, "splits": { "accent": {}, "age": { "": 0.15, "twenties": 0.19, "thirties": 0.28, "teens": 0.03, "fourties": 0.11, "fifties": 0.24, "sixties": 0.01, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.51, "male_masculine": 0, "female_feminine": 0.48, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 2728, "agriculture_food": 4, "automotive_transport": 5, "finance": 0, "service_retail": 0, "general": 121798, "healthcare": 64, "history_law_government": 245, "language_fundamentals": 16, "media_entertainment": 7, "nature_environment": 131, "news_current_affairs": 5, "technology_robotics": 0 } }, "users": 289, "size": 3912180592, "checksum": "9b163af0d093d3f5ca9b9b951e7070edb9b3390121392625ee8f58166ad31fe7", "avgDurationSecs": 6.234, "validDurationSecs": 638105.837, "totalHrs": 194.74, "validHrs": 177.25 }, "kdh": { "buckets": { "dev": 356, "test": 363, "train": 498, "validated": 13513, "invalidated": 279, "other": 496 }, "duration": 38163852, "reportedSentences": 0, "validatedSentences": 1219, "unvalidatedSentences": -1, "clips": 14288, "splits": { "accent": {}, "age": { "": 0.98, "twenties": 0, "thirties": 0.02, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 14288, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 20, "size": 201028275, "checksum": "5ea464a0bdbe326b2387f543219a0041c01542d14c73fc43f3aef755098aff3c", "avgDurationSecs": 2.671, "validDurationSecs": 36093.794, "totalHrs": 10.6, "validHrs": 10.02 }, "khw": { "buckets": { "dev": 1607, "test": 1535, "train": 2642, "validated": 8500, "invalidated": 261, "other": 1138 }, "duration": 72903024, "reportedSentences": 4, "validatedSentences": 7051, "unvalidatedSentences": 200, "clips": 9899, "splits": { "accent": {}, "age": { "": 0.07, "twenties": 0.11, "thirties": 0.26, "teens": 0, "fourties": 0.55, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 9542, "agriculture_food": 18, "automotive_transport": 53, "finance": 2, "service_retail": 0, "general": 253, "healthcare": 4, "history_law_government": 9, "language_fundamentals": 30, "media_entertainment": 4, "nature_environment": 9, "news_current_affairs": 4, "technology_robotics": 1 } }, "users": 50, "size": 429795765, "checksum": "70e00b56fb6b888e406d195247bad0983a437a5002f7d43d8eade7189d4b27cc", "avgDurationSecs": 7.365, "validDurationSecs": 62599.829, "totalHrs": 20.25, "validHrs": 17.38 }, "kk": { "buckets": { "dev": 551, "test": 573, "train": 616, "validated": 1748, "invalidated": 259, "other": 743 }, "duration": 13561848, "reportedSentences": 42, "validatedSentences": 6210, "unvalidatedSentences": 260, "clips": 2750, "splits": { "accent": {}, "age": { "": 0.55, "twenties": 0.23, "thirties": 0.05, "teens": 0.06, "fourties": 0.07, "fifties": 0.05, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.57, "male_masculine": 0.31, "female_feminine": 0.12, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 2750, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 193, "size": 77693598, "checksum": "cdc3e608667382d61aaf3b729170d701c87aab9dfe830eb4d63209e0169e4afd", "avgDurationSecs": 4.932, "validDurationSecs": 8620.404, "totalHrs": 3.76, "validHrs": 2.39 }, "kln": { "buckets": { "dev": 6412, "test": 6076, "train": 11065, "validated": 32315, "invalidated": 537, "other": 37348 }, "duration": 330293556, "reportedSentences": 0, "validatedSentences": 29900, "unvalidatedSentences": 61, "clips": 70200, "splits": { "accent": {}, "age": { "": 0.02, "twenties": 0.59, "thirties": 0.05, "teens": 0.05, "fourties": 0.29, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.27, "male_masculine": 0.03, "female_feminine": 0.7, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 4, "agriculture_food": 5, "automotive_transport": 16, "finance": 32, "service_retail": 626, "general": 68952, "healthcare": 54, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 2, "nature_environment": 23, "news_current_affairs": 2, "technology_robotics": 484 } }, "users": 41, "size": 1800892624, "checksum": "f60908bb36e29ad4f747b8875c2c85ba4e2935a197e27cd43c2dca1b71d266c9", "avgDurationSecs": 4.705, "validDurationSecs": 152043.252, "totalHrs": 91.74, "validHrs": 42.23 }, "kls": { "buckets": { "dev": 1258, "test": 1233, "train": 1415, "validated": 9774, "invalidated": 163, "other": 11 }, "duration": 37741320, "reportedSentences": 2, "validatedSentences": 3912, "unvalidatedSentences": 4, "clips": 9948, "splits": { "accent": {}, "age": { "": 0.64, "twenties": 0.06, "thirties": 0, "teens": 0, "fourties": 0.3, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 9948, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 23, "size": 215514534, "checksum": "0294f5272cd1f2757c79e4b71f25c659663f19d87840532241b86527250b7649", "avgDurationSecs": 3.794, "validDurationSecs": 37081.188, "totalHrs": 10.48, "validHrs": 10.3 }, "kmr": { "buckets": { "dev": 4125, "test": 4133, "train": 5509, "validated": 64397, "invalidated": 2616, "other": 24285 }, "duration": 378044424, "reportedSentences": 1078, "validatedSentences": 17001, "unvalidatedSentences": 1116, "clips": 91298, "splits": { "accent": {}, "age": { "": 0.48, "twenties": 0.35, "thirties": 0.09, "teens": 0.01, "fourties": 0.03, "fifties": 0.04, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.49, "male_masculine": 0.42, "female_feminine": 0.09, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 91284, "agriculture_food": 2, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 8, "healthcare": 0, "history_law_government": 2, "language_fundamentals": 2, "media_entertainment": 2, "nature_environment": 4, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 682, "size": 2009041404, "checksum": "de85490aed2ac9bd1059fe2f8e69c73aa1bc9f1121dca90a36052582da48a0e5", "avgDurationSecs": 4.141, "validDurationSecs": 266653.451, "totalHrs": 105.01, "validHrs": 74.07 }, "ko": { "buckets": { "dev": 504, "test": 523, "train": 658, "validated": 1686, "invalidated": 477, "other": 4857 }, "duration": 36998208, "reportedSentences": 29, "validatedSentences": 7401, "unvalidatedSentences": 2622, "clips": 7020, "splits": { "accent": {}, "age": { "": 0.18, "twenties": 0.53, "thirties": 0.2, "teens": 0.03, "fourties": 0.04, "fifties": 0.03, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.4, "male_masculine": 0.32, "female_feminine": 0.28, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7015, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 1, "general": 1, "healthcare": 0, "history_law_government": 1, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 2 } }, "users": 194, "size": 216225690, "checksum": "82ecf582beb0ea54ea81c75ef42a17ca1bc74ba4231764cadab87849e1c67f07", "avgDurationSecs": 5.27, "validDurationSecs": 8885.894, "totalHrs": 10.27, "validHrs": 2.46 }, "ksf": { "buckets": { "dev": 308, "test": 320, "train": 376, "validated": 7414, "invalidated": 305, "other": 222 }, "duration": 73970280, "reportedSentences": 0, "validatedSentences": 1004, "unvalidatedSentences": -1, "clips": 7941, "splits": { "accent": {}, "age": { "": 0.88, "twenties": 0.07, "thirties": 0.05, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.95, "male_masculine": 0, "female_feminine": 0.05, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7941, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 24, "size": 407838646, "checksum": "e5c2f4171648dd9e8a66e8023d5a9e56ea61fc49864fff82ca9516776d9f99d9", "avgDurationSecs": 9.315, "validDurationSecs": 69061.284, "totalHrs": 20.54, "validHrs": 19.18 }, "kvx": { "buckets": { "dev": 654, "test": 450, "train": 913, "validated": 7464, "invalidated": 36, "other": 57 }, "duration": 40217904, "reportedSentences": 2, "validatedSentences": 2025, "unvalidatedSentences": -1, "clips": 7557, "splits": { "accent": {}, "age": { "": 0.04, "twenties": 0.2, "thirties": 0.27, "teens": 0.28, "fourties": 0.21, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.79, "male_masculine": 0, "female_feminine": 0.21, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7557, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 22, "size": 230134556, "checksum": "9a96384afff97ae5082f1a0c87f9cf0b53a8330138262b0568d668872fc53679", "avgDurationSecs": 5.322, "validDurationSecs": 39722.964, "totalHrs": 11.17, "validHrs": 11.03 }, "kw": { "buckets": { "dev": 0, "test": 2401, "train": 6223, "validated": 10806, "invalidated": 402, "other": 60 }, "duration": 46633392, "reportedSentences": 43, "validatedSentences": 9609, "unvalidatedSentences": -1, "clips": 11268, "splits": { "accent": {}, "age": { "": 0.12, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0.34, "fifties": 0.47, "sixties": 0.02, "seventies": 0.05, "eighties": 0, "nineties": 0 }, "gender": { "": 0.66, "male_masculine": 0, "female_feminine": 0.34, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 0, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 12725, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 10, "size": 273350876, "checksum": "5aa9cc98cbcf49c06eb88af972ef563e727f06c8a975f0b49d93c63607e6ad6d", "avgDurationSecs": 4.139, "validDurationSecs": 44721.373, "totalHrs": 12.95, "validHrs": 12.42 }, "kxp": { "buckets": { "dev": 0, "test": 197, "train": 1881, "validated": 11644, "invalidated": 95, "other": 20 }, "duration": 40016700, "reportedSentences": 0, "validatedSentences": 2079, "unvalidatedSentences": -1, "clips": 11759, "splits": { "accent": {}, "age": { "": 0.01, "twenties": 0.28, "thirties": 0.53, "teens": 0.01, "fourties": 0.18, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 11759, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 22, "size": 231110501, "checksum": "4f8988ad38bc6c0ef5dc05b8cb0b30e25ce8da6c306d3a2534718bcbeb516a7f", "avgDurationSecs": 3.403, "validDurationSecs": 39625.347, "totalHrs": 11.11, "validHrs": 11 }, "ky": { "buckets": { "dev": 1614, "test": 1615, "train": 1790, "validated": 30706, "invalidated": 5680, "other": 1460 }, "duration": 172310520, "reportedSentences": 39, "validatedSentences": 5045, "unvalidatedSentences": 242, "clips": 37846, "splits": { "accent": {}, "age": { "": 0.07, "twenties": 0.65, "thirties": 0.09, "teens": 0.17, "fourties": 0.01, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.12, "male_masculine": 0.54, "female_feminine": 0.34, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 37846, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 298, "size": 1108204541, "checksum": "a0f04ffe114d62699d006bf112c35d79ce7689d7b1b6683ca2fb0df7ac25e970", "avgDurationSecs": 4.553, "validDurationSecs": 139802.537, "totalHrs": 47.86, "validHrs": 38.83 }, "lg": { "buckets": { "dev": 13354, "test": 13390, "train": 71089, "validated": 271885, "invalidated": 39183, "other": 37695 }, "duration": 2017262871, "reportedSentences": 6485, "validatedSentences": 191409, "unvalidatedSentences": 179, "clips": 348763, "splits": { "accent": {}, "age": { "": 0.26, "twenties": 0.38, "thirties": 0.22, "teens": 0.01, "fourties": 0.07, "fifties": 0.05, "sixties": 0.02, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.26, "male_masculine": 0.36, "female_feminine": 0.39, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 348763, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 665, "size": 11842344489, "checksum": "f60e779e1a0852718866540cd6cd09b5fd7b05cd5db2839b01708eb5c865ce7b", "avgDurationSecs": 5.784, "validDurationSecs": 1572596.622, "totalHrs": 560.35, "validHrs": 436.83 }, "lij": { "buckets": { "dev": 943, "test": 1358, "train": 2304, "validated": 4686, "invalidated": 585, "other": 0 }, "duration": 20676960, "reportedSentences": 378, "validatedSentences": 6079, "unvalidatedSentences": 50, "clips": 5271, "splits": { "accent": {}, "age": { "": 0.19, "twenties": 0.07, "thirties": 0.45, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0.17, "seventies": 0.11, "eighties": 0, "nineties": 0 }, "gender": { "": 0.27, "male_masculine": 0.45, "female_feminine": 0.28, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 4890, "agriculture_food": 14, "automotive_transport": 1, "finance": 0, "service_retail": 0, "general": 366, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 1, "nature_environment": 0, "news_current_affairs": 1, "technology_robotics": 0 } }, "users": 39, "size": 115145015, "checksum": "7c9213de879b7214f580c6421b855b5f731b7b757e96bc80160c78a9ec42ce67", "avgDurationSecs": 3.923, "validDurationSecs": 18382.135, "totalHrs": 5.74, "validHrs": 5.1 }, "lo": { "buckets": { "dev": 28, "test": 28, "train": 106, "validated": 162, "invalidated": 11, "other": 50 }, "duration": 1456560, "reportedSentences": 0, "validatedSentences": 5145, "unvalidatedSentences": 5925, "clips": 223, "splits": { "accent": {}, "age": { "": 0.11, "twenties": 0.33, "thirties": 0.56, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.11, "male_masculine": 0.89, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 223, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 16, "size": 9346586, "checksum": "a09fcebc44a72c0cca612a5394902a5c5dac06e190da915df06b3a0bf2cc9fa0", "avgDurationSecs": 6.532, "validDurationSecs": 1058.129, "totalHrs": 0.4, "validHrs": 0.29 }, "lrk": { "buckets": { "dev": 0, "test": 347, "train": 1654, "validated": 11462, "invalidated": 206, "other": 123 }, "duration": 42216012, "reportedSentences": 0, "validatedSentences": 2006, "unvalidatedSentences": -1, "clips": 11791, "splits": { "accent": {}, "age": { "": 0, "twenties": 0.28, "thirties": 0.01, "teens": 0.34, "fourties": 0.19, "fifties": 0.01, "sixties": 0.17, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.83, "male_masculine": 0, "female_feminine": 0.17, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 11791, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 20, "size": 246865264, "checksum": "bdb71407d5327ccbf5ab12239dca33c77dd6d6a12d85a366494f89367fda0ca3", "avgDurationSecs": 3.58, "validDurationSecs": 41038.074, "totalHrs": 11.72, "validHrs": 11.39 }, "lss": { "buckets": { "dev": 474, "test": 645, "train": 903, "validated": 10326, "invalidated": 34, "other": 94 }, "duration": 36300708, "reportedSentences": 0, "validatedSentences": 2029, "unvalidatedSentences": -1, "clips": 10454, "splits": { "accent": {}, "age": { "": 0.04, "twenties": 0.45, "thirties": 0.33, "teens": 0, "fourties": 0.19, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.7, "male_masculine": 0, "female_feminine": 0.19, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0.11 }, "sentence_domain": { "": 10454, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 15, "size": 183610168, "checksum": "f9aba4d8963a6aa930762bb41dc1a12b8278860044600ed9e136b2c9a156209e", "avgDurationSecs": 3.472, "validDurationSecs": 35856.238, "totalHrs": 10.08, "validHrs": 9.96 }, "lt": { "buckets": { "dev": 5111, "test": 5517, "train": 9061, "validated": 19891, "invalidated": 910, "other": 4040 }, "duration": 127317788, "reportedSentences": 192, "validatedSentences": 129304, "unvalidatedSentences": 4814, "clips": 24841, "splits": { "accent": {}, "age": { "": 0.16, "twenties": 0.26, "thirties": 0.23, "teens": 0.03, "fourties": 0.29, "fifties": 0.03, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.42, "male_masculine": 0.41, "female_feminine": 0.16, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 24841, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 328, "size": 777846668, "checksum": "6b14a22ba834499d6918a05b6f3af067f34f2d88a95890ad07569715aaae4947", "avgDurationSecs": 5.125, "validDurationSecs": 101947.511, "totalHrs": 35.36, "validHrs": 28.31 }, "ltg": { "buckets": { "dev": 3490, "test": 3639, "train": 4937, "validated": 22653, "invalidated": 1867, "other": 629 }, "duration": 120455748, "reportedSentences": 79, "validatedSentences": 15079, "unvalidatedSentences": 2269, "clips": 25149, "splits": { "accent": {}, "age": { "": 0.34, "twenties": 0.09, "thirties": 0.23, "teens": 0, "fourties": 0.32, "fifties": 0.01, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.34, "male_masculine": 0.05, "female_feminine": 0.61, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 19190, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 6297, "healthcare": 1, "history_law_government": 709, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 382, "size": 694917582, "checksum": "be380d8e082f5bf47659b57b62c5bd34b426633464aa22f91a2a30c30c707eee", "avgDurationSecs": 4.79, "validDurationSecs": 108500.698, "totalHrs": 33.45, "validHrs": 30.13 }, "lua": { "buckets": { "dev": 291, "test": 291, "train": 298, "validated": 4801, "invalidated": 894, "other": 0 }, "duration": 46917972, "reportedSentences": 0, "validatedSentences": 880, "unvalidatedSentences": -1, "clips": 5695, "splits": { "accent": {}, "age": { "": 0.13, "twenties": 0.67, "thirties": 0.19, "teens": 0, "fourties": 0.01, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.68, "male_masculine": 0, "female_feminine": 0.32, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 5695, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 46, "size": 272331674, "checksum": "4f209c15a0ad7c21fcbb0840985b9439e98c6a074a74bfbcf774b992c2265c33", "avgDurationSecs": 8.238, "validDurationSecs": 39552.798, "totalHrs": 13.03, "validHrs": 10.98 }, "luo": { "buckets": { "dev": 3060, "test": 3001, "train": 4498, "validated": 20343, "invalidated": 792, "other": 61603 }, "duration": 430613136, "reportedSentences": 8, "validatedSentences": 14691, "unvalidatedSentences": 13870, "clips": 82738, "splits": { "accent": {}, "age": { "": 0.36, "twenties": 0.33, "thirties": 0.28, "teens": 0, "fourties": 0, "fifties": 0.02, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.6, "male_masculine": 0, "female_feminine": 0.4, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 11, "agriculture_food": 1135, "automotive_transport": 341, "finance": 967, "service_retail": 2748, "general": 69488, "healthcare": 2237, "history_law_government": 865, "language_fundamentals": 555, "media_entertainment": 806, "nature_environment": 634, "news_current_affairs": 2710, "technology_robotics": 241 } }, "users": 47, "size": 2392815146, "checksum": "88eb400a20c69e9f2be64afc31058da8cc5aa947759c50b1692551562b1b8c71", "avgDurationSecs": 5.205, "validDurationSecs": 105875.934, "totalHrs": 119.61, "validHrs": 29.4 }, "lv": { "buckets": { "dev": 7781, "test": 7781, "train": 14619, "validated": 197952, "invalidated": 11580, "other": 21328 }, "duration": 1110350141, "reportedSentences": 3144, "validatedSentences": 34599, "unvalidatedSentences": 64990, "clips": 230860, "splits": { "accent": {}, "age": { "": 0.44, "twenties": 0.06, "thirties": 0.28, "teens": 0.01, "fourties": 0.09, "fifties": 0.08, "sixties": 0.02, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.45, "male_masculine": 0.25, "female_feminine": 0.3, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 229992, "agriculture_food": 8, "automotive_transport": 3, "finance": 5, "service_retail": 16, "general": 722, "healthcare": 36, "history_law_government": 8, "language_fundamentals": 9, "media_entertainment": 16, "nature_environment": 44, "news_current_affairs": 5, "technology_robotics": 13 } }, "users": 6530, "size": 6221788585, "checksum": "4c3f8684153e45f57f249cec4c7509723d0a0d54791aec22f65faf13f0e3f2bb", "avgDurationSecs": 4.81, "validDurationSecs": 952074.985, "totalHrs": 308.43, "validHrs": 264.46 }, "lzz": { "buckets": { "dev": 815, "test": 772, "train": 972, "validated": 5779, "invalidated": 418, "other": 927 }, "duration": 27077688, "reportedSentences": 16, "validatedSentences": 4412, "unvalidatedSentences": 1203, "clips": 7124, "splits": { "accent": {}, "age": { "": 0.11, "twenties": 0.17, "thirties": 0.07, "teens": 0, "fourties": 0.25, "fifties": 0.09, "sixties": 0.3, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.58, "male_masculine": 0, "female_feminine": 0.42, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 33, "agriculture_food": 3, "automotive_transport": 8, "finance": 1, "service_retail": 0, "general": 7558, "healthcare": 6, "history_law_government": 2, "language_fundamentals": 3, "media_entertainment": 0, "nature_environment": 48, "news_current_affairs": 3, "technology_robotics": 0 } }, "users": 57, "size": 143891652, "checksum": "deac6c71e8f65378eb69fb49ada05679946bd726bc91517cfd089d6ecb137fb7", "avgDurationSecs": 3.801, "validDurationSecs": 21965.463, "totalHrs": 7.52, "validHrs": 6.1 }, "mau": { "buckets": { "dev": 252, "test": 312, "train": 555, "validated": 6040, "invalidated": 13, "other": 216 }, "duration": 38969352, "reportedSentences": 0, "validatedSentences": 1119, "unvalidatedSentences": -1, "clips": 6269, "splits": { "accent": {}, "age": { "": 0, "twenties": 0.21, "thirties": 0.43, "teens": 0, "fourties": 0.36, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.65, "male_masculine": 0, "female_feminine": 0.35, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 6269, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 7, "size": 207459818, "checksum": "9fad9bf14acb1702c1dad989373134a59527bc856cb646c14fab5ba68d8f5da5", "avgDurationSecs": 6.216, "validDurationSecs": 37545.842, "totalHrs": 10.82, "validHrs": 10.42 }, "mbo": { "buckets": { "dev": 321, "test": 263, "train": 410, "validated": 7106, "invalidated": 75, "other": 701 }, "duration": 43456968, "reportedSentences": 4, "validatedSentences": 998, "unvalidatedSentences": 4, "clips": 7882, "splits": { "accent": {}, "age": { "": 1, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7882, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 13, "size": 254177118, "checksum": "a2dc5f7ffa82e73d1adddffc372eaac7352ad5b11da6c51ac53bc85dfd9ef728", "avgDurationSecs": 5.513, "validDurationSecs": 39178.535, "totalHrs": 12.07, "validHrs": 10.88 }, "mcf": { "buckets": { "dev": 0, "test": 320, "train": 677, "validated": 13884, "invalidated": 28, "other": 78 }, "duration": 37156428, "reportedSentences": 0, "validatedSentences": 997, "unvalidatedSentences": -1, "clips": 13990, "splits": { "accent": {}, "age": { "": 0.05, "twenties": 0.28, "thirties": 0.34, "teens": 0.25, "fourties": 0.07, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.74, "male_masculine": 0, "female_feminine": 0.26, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 13990, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 21, "size": 183268786, "checksum": "2555d944cbce5510565439960845916a40b02de78d389ec58b271b98df975aec", "avgDurationSecs": 2.656, "validDurationSecs": 36874.9, "totalHrs": 10.32, "validHrs": 10.24 }, "mcn": { "buckets": { "dev": 316, "test": 316, "train": 325, "validated": 8621, "invalidated": 32, "other": 607 }, "duration": 39026016, "reportedSentences": 4, "validatedSentences": 959, "unvalidatedSentences": -1, "clips": 9260, "splits": { "accent": {}, "age": { "": 1, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 9260, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 35, "size": 228253357, "checksum": "98814c19f4f6e35d188f95d96196847bd9e10d15283ce6de237f7d7945605deb", "avgDurationSecs": 4.214, "validDurationSecs": 36332.968, "totalHrs": 10.84, "validHrs": 10.09 }, "mcx": { "buckets": { "dev": 111, "test": 249, "train": 543, "validated": 5491, "invalidated": 67, "other": 2 }, "duration": 36755964, "reportedSentences": 0, "validatedSentences": 903, "unvalidatedSentences": -1, "clips": 5560, "splits": { "accent": {}, "age": { "": 0.99, "twenties": 0, "thirties": 0.01, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 5560, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 10, "size": 217211497, "checksum": "6876d86e0d40bbabe5bc77b2f459d86ff19363646185be82b5d8d667db1fb66b", "avgDurationSecs": 6.611, "validDurationSecs": 36299.82, "totalHrs": 10.2, "validHrs": 10.08 }, "mdd": { "buckets": { "dev": 0, "test": 46, "train": 877, "validated": 5542, "invalidated": 31, "other": 0 }, "duration": 36437112, "reportedSentences": 0, "validatedSentences": 923, "unvalidatedSentences": -1, "clips": 5573, "splits": { "accent": {}, "age": { "": 1, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 5573, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 7, "size": 208708874, "checksum": "143398b834b4d612570753e124c3b8fef58d8343f6c4d05b463c6c5b14667bd8", "avgDurationSecs": 6.538, "validDurationSecs": 36234.429, "totalHrs": 10.12, "validHrs": 10.06 }, "mdf": { "buckets": { "dev": 54, "test": 107, "train": 175, "validated": 336, "invalidated": 9, "other": 0 }, "duration": 1811340, "reportedSentences": 15, "validatedSentences": 6039, "unvalidatedSentences": 4, "clips": 345, "splits": { "accent": {}, "age": { "": 0.58, "twenties": 0.02, "thirties": 0, "teens": 0, "fourties": 0.34, "fifties": 0, "sixties": 0.06, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.58, "male_masculine": 0.08, "female_feminine": 0.34, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 345, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 11, "size": 11056956, "checksum": "705c18c73d1217495c84bcdd6df8953d6d6fe0244665b8f807c4af7c416525ef", "avgDurationSecs": 5.25, "validDurationSecs": 1764.088, "totalHrs": 0.5, "validHrs": 0.49 }, "mgg": { "buckets": { "dev": 296, "test": 212, "train": 483, "validated": 4863, "invalidated": 290, "other": 0 }, "duration": 39065004, "reportedSentences": 0, "validatedSentences": 991, "unvalidatedSentences": -1, "clips": 5153, "splits": { "accent": {}, "age": { "": 0.99, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0.01, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.99, "male_masculine": 0, "female_feminine": 0.01, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 5153, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 8, "size": 231037660, "checksum": "017f84fba3b42e99cbcf1939b7f5264644b54749cc1b1b96d32afc7ba51b9fa6", "avgDurationSecs": 7.581, "validDurationSecs": 36866.508, "totalHrs": 10.85, "validHrs": 10.24 }, "mhk": { "buckets": { "dev": 305, "test": 202, "train": 493, "validated": 6597, "invalidated": 52, "other": 46 }, "duration": 41164560, "reportedSentences": 0, "validatedSentences": 1000, "unvalidatedSentences": -1, "clips": 6695, "splits": { "accent": {}, "age": { "": 0.93, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0.07, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 6695, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 9, "size": 230628274, "checksum": "5b79a388485e539bcb27d890f5b85a1177b4549eda7a11064624f596f4a53c03", "avgDurationSecs": 6.149, "validDurationSecs": 40562.002, "totalHrs": 11.43, "validHrs": 11.26 }, "mhr": { "buckets": { "dev": 14663, "test": 15152, "train": 186565, "validated": 218744, "invalidated": 16027, "other": 5 }, "duration": 1085410764, "reportedSentences": 102, "validatedSentences": 328269, "unvalidatedSentences": 3, "clips": 234776, "splits": { "accent": {}, "age": { "": 0.12, "twenties": 0.33, "thirties": 0.21, "teens": 0.14, "fourties": 0.12, "fifties": 0.04, "sixties": 0.03, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.12, "male_masculine": 0.19, "female_feminine": 0.69, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 234776, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 500, "size": 6124380934, "checksum": "21c80f3897057743d21e15f591d413f4348aa398905c066efeb00a4ae1861a6b", "avgDurationSecs": 4.623, "validDurationSecs": 1011292.007, "totalHrs": 301.5, "validHrs": 280.91 }, "mk": { "buckets": { "dev": 1736, "test": 1800, "train": 2111, "validated": 17439, "invalidated": 989, "other": 22573 }, "duration": 197182728, "reportedSentences": 161, "validatedSentences": 6046, "unvalidatedSentences": 648, "clips": 41001, "splits": { "accent": {}, "age": { "": 0.11, "twenties": 0.36, "thirties": 0.27, "teens": 0.03, "fourties": 0.2, "fifties": 0.02, "sixties": 0.03, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.33, "male_masculine": 0.28, "female_feminine": 0.39, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 40735, "agriculture_food": 14, "automotive_transport": 0, "finance": 7, "service_retail": 0, "general": 211, "healthcare": 27, "history_law_government": 7, "language_fundamentals": 0, "media_entertainment": 7, "nature_environment": 21, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 466, "size": 1082253769, "checksum": "053b8c57582d47d876ac6ea4632704a6f0749279c2257ba46b864e42cfead76c", "avgDurationSecs": 4.809, "validDurationSecs": 83867.945, "totalHrs": 54.77, "validHrs": 23.29 }, "mki": { "buckets": { "dev": 0, "test": 23, "train": 2008, "validated": 11181, "invalidated": 134, "other": 12 }, "duration": 36287784, "reportedSentences": 0, "validatedSentences": 2055, "unvalidatedSentences": -1, "clips": 11327, "splits": { "accent": {}, "age": { "": 0, "twenties": 0.28, "thirties": 0.72, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.82, "male_masculine": 0, "female_feminine": 0.18, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 11327, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 12, "size": 196588067, "checksum": "a9c2835deea7cad075681efd6f30fe65cb3139779ee119ba80bcdfb14c89de51", "avgDurationSecs": 3.204, "validDurationSecs": 35820.051, "totalHrs": 10.07, "validHrs": 9.95 }, "ml": { "buckets": { "dev": 934, "test": 882, "train": 1232, "validated": 3466, "invalidated": 121, "other": 6043 }, "duration": 40854852, "reportedSentences": 243, "validatedSentences": 5487, "unvalidatedSentences": 4728, "clips": 9630, "splits": { "accent": {}, "age": { "": 0.22, "twenties": 0.59, "thirties": 0.08, "teens": 0, "fourties": 0.11, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.34, "male_masculine": 0.47, "female_feminine": 0.19, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 9630, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 154, "size": 230927465, "checksum": "09bad714c75c67807062977871629e6aed94df29c196c3edd6e9230b28fb20a2", "avgDurationSecs": 4.242, "validDurationSecs": 14704.353, "totalHrs": 11.34, "validHrs": 4.08 }, "mn": { "buckets": { "dev": 1934, "test": 1934, "train": 2190, "validated": 33704, "invalidated": 3239, "other": 59365 }, "duration": 506019608, "reportedSentences": 46, "validatedSentences": 6098, "unvalidatedSentences": 16, "clips": 96308, "splits": { "accent": {}, "age": { "": 0.04, "twenties": 0.92, "thirties": 0.03, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0.01 }, "gender": { "": 0.46, "male_masculine": 0.14, "female_feminine": 0.4, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 96251, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 33, "healthcare": 2, "history_law_government": 2, "language_fundamentals": 2, "media_entertainment": 2, "nature_environment": 2, "news_current_affairs": 16, "technology_robotics": 0 } }, "users": 606, "size": 3078079672, "checksum": "384488bb777f7478ec8ad9467e402a8864b04a38aee2d8da728c887e24cd51a5", "avgDurationSecs": 5.254, "validDurationSecs": 177086.897, "totalHrs": 140.56, "validHrs": 49.19 }, "mr": { "buckets": { "dev": 1766, "test": 1796, "train": 2189, "validated": 10995, "invalidated": 2292, "other": 2804 }, "duration": 99768888, "reportedSentences": 59, "validatedSentences": 6717, "unvalidatedSentences": 12102, "clips": 16091, "splits": { "accent": {}, "age": { "": 0.06, "twenties": 0.28, "thirties": 0.13, "teens": 0.53, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.06, "male_masculine": 0.19, "female_feminine": 0.75, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 16091, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 105, "size": 586525379, "checksum": "3e4cdbb5d87e20a12bb888459baba7a8f41b2e635c2884da6cfad34c8a165b9b", "avgDurationSecs": 6.2, "validDurationSecs": 68172.203, "totalHrs": 27.71, "validHrs": 18.93 }, "mrj": { "buckets": { "dev": 7314, "test": 7164, "train": 14325, "validated": 28973, "invalidated": 1261, "other": 1459 }, "duration": 132879852, "reportedSentences": 50, "validatedSentences": 54143, "unvalidatedSentences": 4, "clips": 31693, "splits": { "accent": {}, "age": { "": 0.1, "twenties": 0.35, "thirties": 0.22, "teens": 0.06, "fourties": 0.12, "fifties": 0.11, "sixties": 0.04, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.13, "male_masculine": 0.25, "female_feminine": 0.62, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 31693, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 60, "size": 747239471, "checksum": "a01e3933ee8dcc0b3c211c7867e29f775164505ffd7b00bd0242dd29509819c3", "avgDurationSecs": 4.193, "validDurationSecs": 121475.656, "totalHrs": 36.91, "validHrs": 33.74 }, "ms": { "buckets": { "dev": 6, "test": 5, "train": 11, "validated": 27, "invalidated": 1, "other": 2064 }, "duration": 12876444, "reportedSentences": 0, "validatedSentences": 257, "unvalidatedSentences": 9, "clips": 2092, "splits": { "accent": {}, "age": { "": 1, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 2057, "agriculture_food": 0, "automotive_transport": 6, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 29, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 9 } }, "users": 27, "size": 76000823, "checksum": "20ff7d48d859b7bf3f2b51fed187c349efde41d9f03bc99049791df447ecebf4", "avgDurationSecs": 6.155, "validDurationSecs": 166.187, "totalHrs": 3.57, "validHrs": 0.04 }, "mse": { "buckets": { "dev": 327, "test": 284, "train": 391, "validated": 4338, "invalidated": 310, "other": 18 }, "duration": 38836476, "reportedSentences": 0, "validatedSentences": 1002, "unvalidatedSentences": -1, "clips": 4666, "splits": { "accent": {}, "age": { "": 0.79, "twenties": 0.21, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 4666, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 18, "size": 218219565, "checksum": "77b8d72d1483f1a82384abbde1971c2e7ddc5cf816e2230358b2010706185f9e", "avgDurationSecs": 8.323, "validDurationSecs": 36106.437, "totalHrs": 10.78, "validHrs": 10.02 }, "mt": { "buckets": { "dev": 1625, "test": 1660, "train": 1910, "validated": 6595, "invalidated": 326, "other": 6286 }, "duration": 62787780, "reportedSentences": 10, "validatedSentences": 5273, "unvalidatedSentences": 11773, "clips": 13207, "splits": { "accent": {}, "age": { "": 0.27, "twenties": 0.19, "thirties": 0.09, "teens": 0.03, "fourties": 0.17, "fifties": 0.25, "sixties": 0.01, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.28, "male_masculine": 0.25, "female_feminine": 0.47, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 13207, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 222, "size": 466475288, "checksum": "f6be17867ef174e2235020c7fb7f997fb8530dfbbde9d84a23bb3816ee0a0d85", "avgDurationSecs": 4.754, "validDurationSecs": 31353.48, "totalHrs": 17.44, "validHrs": 8.7 }, "mua": { "buckets": { "dev": 286, "test": 281, "train": 428, "validated": 8677, "invalidated": 33, "other": 27 }, "duration": 38936952, "reportedSentences": 5, "validatedSentences": 995, "unvalidatedSentences": -1, "clips": 8737, "splits": { "accent": {}, "age": { "": 1, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 8737, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 17, "size": 217979209, "checksum": "1f30809c317d59d91a3c7060140e5500e212a30d240aef8ebfcb802ef1a679e5", "avgDurationSecs": 4.457, "validDurationSecs": 38669.558, "totalHrs": 10.81, "validHrs": 10.74 }, "mug": { "buckets": { "dev": 297, "test": 297, "train": 404, "validated": 2687, "invalidated": 263, "other": 0 }, "duration": 45123948, "reportedSentences": 0, "validatedSentences": 1002, "unvalidatedSentences": -1, "clips": 2950, "splits": { "accent": {}, "age": { "": 0.99, "twenties": 0, "thirties": 0.01, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 2950, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 17, "size": 266758088, "checksum": "61707c1c6eb4ad4d852e43a142e108600c37feb3d1ba3c565e07c8fb1473bd30", "avgDurationSecs": 15.296, "validDurationSecs": 41101.033, "totalHrs": 12.53, "validHrs": 11.41 }, "mve": { "buckets": { "dev": 555, "test": 146, "train": 1296, "validated": 7648, "invalidated": 47, "other": 11 }, "duration": 38372904, "reportedSentences": 0, "validatedSentences": 2003, "unvalidatedSentences": -1, "clips": 7706, "splits": { "accent": {}, "age": { "": 0, "twenties": 0.26, "thirties": 0.33, "teens": 0, "fourties": 0.39, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7706, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 20, "size": 225592528, "checksum": "0935f7b6789e38c6e935bff6a15922f7875d44a208f789b7e02dc6545e52bc6e", "avgDurationSecs": 4.98, "validDurationSecs": 38084.086, "totalHrs": 10.65, "validHrs": 10.57 }, "mvy": { "buckets": { "dev": 1946, "test": 2076, "train": 2558, "validated": 16600, "invalidated": 590, "other": 1285 }, "duration": 90013968, "reportedSentences": 90, "validatedSentences": 6634, "unvalidatedSentences": 222, "clips": 18475, "splits": { "accent": {}, "age": { "": 0.04, "twenties": 0.39, "thirties": 0.47, "teens": 0, "fourties": 0.06, "fifties": 0.03, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 18245, "agriculture_food": 33, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 108, "healthcare": 0, "history_law_government": 78, "language_fundamentals": 0, "media_entertainment": 11, "nature_environment": 7, "news_current_affairs": 0, "technology_robotics": 9 } }, "users": 56, "size": 476972904, "checksum": "298600a827aec8372df257483745fe3093c54509d1ae657995f5e382dad8b7cb", "avgDurationSecs": 4.872, "validDurationSecs": 80878.586, "totalHrs": 25, "validHrs": 22.46 }, "mxu": { "buckets": { "dev": 309, "test": 317, "train": 333, "validated": 7749, "invalidated": 67, "other": 2 }, "duration": 50839092, "reportedSentences": 0, "validatedSentences": 959, "unvalidatedSentences": -1, "clips": 7818, "splits": { "accent": {}, "age": { "": 0.56, "twenties": 0.32, "thirties": 0.12, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7818, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 22, "size": 298287692, "checksum": "bc7d32fbc9d4c35e91d2797ce5eb7a8b4d26ee805b4f3f4b67eec6f28ed8f3d0", "avgDurationSecs": 6.503, "validDurationSecs": 50390.397, "totalHrs": 14.12, "validHrs": 13.99 }, "myv": { "buckets": { "dev": 239, "test": 482, "train": 1241, "validated": 1972, "invalidated": 23, "other": 15 }, "duration": 11624940, "reportedSentences": 31, "validatedSentences": 5066, "unvalidatedSentences": 7, "clips": 2010, "splits": { "accent": {}, "age": { "": 0.39, "twenties": 0.09, "thirties": 0.24, "teens": 0.01, "fourties": 0.02, "fifties": 0, "sixties": 0.26, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.39, "male_masculine": 0.54, "female_feminine": 0.07, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 2010, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 13, "size": 68321817, "checksum": "13aadf802fc4548ef59760746fbc04c9a1c9e9705db95169602e338745bb6064", "avgDurationSecs": 5.784, "validDurationSecs": 11405.165, "totalHrs": 3.22, "validHrs": 3.16 }, "nan-tw": { "buckets": { "dev": 5923, "test": 6383, "train": 11559, "validated": 29405, "invalidated": 576, "other": 2265 }, "duration": 85243932, "reportedSentences": 226, "validatedSentences": 26907, "unvalidatedSentences": 370, "clips": 32246, "splits": { "accent": {}, "age": { "": 0.13, "twenties": 0.51, "thirties": 0.15, "teens": 0.01, "fourties": 0.17, "fifties": 0.01, "sixties": 0.02, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.27, "male_masculine": 0.62, "female_feminine": 0.11, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 31563, "agriculture_food": 4, "automotive_transport": 0, "finance": 0, "service_retail": 2, "general": 622, "healthcare": 1, "history_law_government": 0, "language_fundamentals": 55, "media_entertainment": 0, "nature_environment": 55, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 297, "size": 485404206, "checksum": "fe5cd5420acf6d284ff9cd006c475844ef8f68874863d7c09c2cb6d75fd8d513", "avgDurationSecs": 2.644, "validDurationSecs": 77733.605, "totalHrs": 23.67, "validHrs": 21.59 }, "nb-NO": { "buckets": { "dev": 415, "test": 312, "train": 1273, "validated": 2001, "invalidated": 96, "other": 140 }, "duration": 9378972, "reportedSentences": 1, "validatedSentences": 4394, "unvalidatedSentences": 3674, "clips": 2237, "splits": { "accent": {}, "age": { "": 0.18, "twenties": 0, "thirties": 0.62, "teens": 0, "fourties": 0.19, "fifties": 0.02, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.4, "male_masculine": 0.6, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 1426, "agriculture_food": 3, "automotive_transport": 0, "finance": 4, "service_retail": 37, "general": 717, "healthcare": 0, "history_law_government": 21, "language_fundamentals": 13, "media_entertainment": 17, "nature_environment": 37, "news_current_affairs": 32, "technology_robotics": 0 } }, "users": 67, "size": 54581626, "checksum": "7e02d3de626e49f7fec04ffb61e7215a2c4c16c2c4c943abfa5864ed994cce44", "avgDurationSecs": 4.193, "validDurationSecs": 8389.505, "totalHrs": 2.6, "validHrs": 2.33 }, "ncx": { "buckets": { "dev": 339, "test": 345, "train": 360, "validated": 8641, "invalidated": 62, "other": 806 }, "duration": 42381792, "reportedSentences": 2, "validatedSentences": 1518, "unvalidatedSentences": 5, "clips": 9509, "splits": { "accent": {}, "age": { "": 0.04, "twenties": 0.15, "thirties": 0.63, "teens": 0, "fourties": 0.17, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.61, "male_masculine": 0.01, "female_feminine": 0.38, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 2832, "agriculture_food": 0, "automotive_transport": 0, "finance": 212, "service_retail": 0, "general": 0, "healthcare": 212, "history_law_government": 0, "language_fundamentals": 2047, "media_entertainment": 4700, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 41, "size": 243130501, "checksum": "0e68bdaab632f8183451a1a44ad9790ecab34678fbe9ad22c9ffee0fb3ca76bf", "avgDurationSecs": 4.457, "validDurationSecs": 38513.1, "totalHrs": 11.77, "validHrs": 10.69 }, "ne-NP": { "buckets": { "dev": 314, "test": 289, "train": 355, "validated": 1179, "invalidated": 100, "other": 415 }, "duration": 6964560, "reportedSentences": 5, "validatedSentences": 1316, "unvalidatedSentences": 30, "clips": 1694, "splits": { "accent": {}, "age": { "": 0.31, "twenties": 0.57, "thirties": 0.12, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.38, "male_masculine": 0.61, "female_feminine": 0.01, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 1693, "agriculture_food": 1, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 61, "size": 40868769, "checksum": "d7860601d5d1fdcd2993e90efeac9730ca0f40e46be9516f52f0e17403b213d5", "avgDurationSecs": 4.111, "validDurationSecs": 4847.235, "totalHrs": 1.93, "validHrs": 1.34 }, "nhi": { "buckets": { "dev": 10, "test": 6, "train": 24, "validated": 40, "invalidated": 0, "other": 387 }, "duration": 2169576, "reportedSentences": 0, "validatedSentences": 758, "unvalidatedSentences": 11, "clips": 427, "splits": { "accent": {}, "age": { "": 0.19, "twenties": 0.73, "thirties": 0.08, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.19, "male_masculine": 0.08, "female_feminine": 0.73, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 427, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 6, "size": 12735162, "checksum": "244897ae41792379b265414bbaf44bffbccca8e24dd0487c8646862137dafd94", "avgDurationSecs": 5.081, "validDurationSecs": 203.239, "totalHrs": 0.6, "validHrs": 0.05 }, "nl": { "buckets": { "dev": 12225, "test": 12225, "train": 46082, "validated": 103597, "invalidated": 6133, "other": 5700 }, "duration": 504525061, "reportedSentences": 406, "validatedSentences": 260817, "unvalidatedSentences": 10596, "clips": 115430, "splits": { "accent": {}, "age": { "": 0.36, "twenties": 0.18, "thirties": 0.12, "teens": 0.02, "fourties": 0.18, "fifties": 0.11, "sixties": 0.02, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.38, "male_masculine": 0.52, "female_feminine": 0.1, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 114703, "agriculture_food": 16, "automotive_transport": 21, "finance": 7, "service_retail": 0, "general": 368, "healthcare": 56, "history_law_government": 55, "language_fundamentals": 175, "media_entertainment": 2, "nature_environment": 55, "news_current_affairs": 3, "technology_robotics": 5 } }, "users": 1865, "size": 3373398122, "checksum": "21eb500aa204e5084516690f5d271e1502c1b3c5f15580ace2e114f75eb6dbf2", "avgDurationSecs": 4.371, "validDurationSecs": 452805.014, "totalHrs": 140.14, "validHrs": 125.77 }, "nla": { "buckets": { "dev": 172, "test": 220, "train": 592, "validated": 4635, "invalidated": 176, "other": 5 }, "duration": 37346544, "reportedSentences": 0, "validatedSentences": 984, "unvalidatedSentences": -1, "clips": 4816, "splits": { "accent": {}, "age": { "": 1, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 4816, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 15, "size": 212123306, "checksum": "63ada318ffc0fbf732daed24b8fdd805fa05d7face5c1c5c1b8d66a18bc4e831", "avgDurationSecs": 7.755, "validDurationSecs": 35942.947, "totalHrs": 10.37, "validHrs": 9.98 }, "nlv": { "buckets": { "dev": 248, "test": 291, "train": 467, "validated": 6656, "invalidated": 128, "other": 60 }, "duration": 42922260, "reportedSentences": 1, "validatedSentences": 1006, "unvalidatedSentences": -1, "clips": 6844, "splits": { "accent": {}, "age": { "": 0.01, "twenties": 0.13, "thirties": 0.85, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.91, "male_masculine": 0, "female_feminine": 0.09, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 5103, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 698, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 824, "media_entertainment": 944, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 16, "size": 249248700, "checksum": "1d501ae8bc18eaec8ce2835947f36f0c6a9d3323057b7415ce2fa00e00ae0791", "avgDurationSecs": 6.272, "validDurationSecs": 41743.215, "totalHrs": 11.92, "validHrs": 11.59 }, "nmg": { "buckets": { "dev": 272, "test": 270, "train": 483, "validated": 5865, "invalidated": 89, "other": 5 }, "duration": 38142936, "reportedSentences": 1, "validatedSentences": 1025, "unvalidatedSentences": -1, "clips": 5959, "splits": { "accent": {}, "age": { "": 0.86, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0.14, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 5959, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 11, "size": 217274870, "checksum": "42a73b308a7cc5bdbd0f62c73c9ad6c159ff34a87ae4a37ba67a38e5fd0dd41e", "avgDurationSecs": 6.401, "validDurationSecs": 37541.252, "totalHrs": 10.59, "validHrs": 10.42 }, "nmz": { "buckets": { "dev": 795, "test": 795, "train": 846, "validated": 13698, "invalidated": 109, "other": 313 }, "duration": 41779332, "reportedSentences": 2, "validatedSentences": 2446, "unvalidatedSentences": 1, "clips": 14120, "splits": { "accent": {}, "age": { "": 0.92, "twenties": 0, "thirties": 0.08, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.99, "male_masculine": 0, "female_feminine": 0.01, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 14120, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 35, "size": 215687900, "checksum": "46566952dd93ab8bb6cd9563df118dc892b434554ecaec441218bddfc7830e0c", "avgDurationSecs": 2.959, "validDurationSecs": 40530.686, "totalHrs": 11.6, "validHrs": 11.25 }, "nn-NO": { "buckets": { "dev": 322, "test": 392, "train": 588, "validated": 1307, "invalidated": 61, "other": 11 }, "duration": 6050232, "reportedSentences": 23, "validatedSentences": 5318, "unvalidatedSentences": 6, "clips": 1379, "splits": { "accent": {}, "age": { "": 0.26, "twenties": 0.28, "thirties": 0.4, "teens": 0.02, "fourties": 0.03, "fifties": 0.01, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.29, "male_masculine": 0.58, "female_feminine": 0.13, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 1379, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 40, "size": 35178699, "checksum": "7d63636ad50966fbed2f6d092060a4a0e95735df571726f2faed08c336b1ca8a", "avgDurationSecs": 4.387, "validDurationSecs": 5734.339, "totalHrs": 1.68, "validHrs": 1.59 }, "nnh": { "buckets": { "dev": 186, "test": 288, "train": 412, "validated": 7631, "invalidated": 156, "other": 1 }, "duration": 82297008, "reportedSentences": 0, "validatedSentences": 886, "unvalidatedSentences": -1, "clips": 7788, "splits": { "accent": {}, "age": { "": 0.89, "twenties": 0, "thirties": 0.11, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.89, "male_masculine": 0, "female_feminine": 0.11, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7788, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 17, "size": 486872826, "checksum": "babd44c2f72627c3a056b231c56db4202e847d9634009ed258b84f1d097bc1ba", "avgDurationSecs": 10.567, "validDurationSecs": 80637.965, "totalHrs": 22.86, "validHrs": 22.39 }, "nr": { "buckets": { "dev": 0, "test": 0, "train": 0, "validated": 0, "invalidated": 0, "other": 7 }, "duration": 60696, "reportedSentences": 0, "validatedSentences": 319, "unvalidatedSentences": 7468, "clips": 7, "splits": { "accent": {}, "age": { "": 0.29, "twenties": 0, "thirties": 0.71, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 2, "size": 881984, "checksum": "56bf8efe6e787631d2167e53ea0f75d5d8d23574400c1ded2dee82f52a1c513c", "avgDurationSecs": 8.671, "validDurationSecs": 0, "totalHrs": 0.01, "validHrs": 0 }, "nso": { "buckets": { "dev": 0, "test": 0, "train": 2, "validated": 2, "invalidated": 0, "other": 18 }, "duration": 92592, "reportedSentences": 0, "validatedSentences": 2244, "unvalidatedSentences": 14227, "clips": 20, "splits": { "accent": {}, "age": { "": 1, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 20, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 1, "size": 1552765, "checksum": "73e9b4a6e2b9eab02599ace56ee43a4dbe7acaeb4bf184f546d5462a60e73d65", "avgDurationSecs": 4.63, "validDurationSecs": 9.259, "totalHrs": 0.02, "validHrs": 0 }, "nyu": { "buckets": { "dev": 0, "test": 248, "train": 1023, "validated": 3639, "invalidated": 76, "other": 1 }, "duration": 38390760, "reportedSentences": 0, "validatedSentences": 1271, "unvalidatedSentences": -1, "clips": 3716, "splits": { "accent": {}, "age": { "": 0.32, "twenties": 0.33, "thirties": 0.34, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.67, "male_masculine": 0, "female_feminine": 0.33, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 2624, "agriculture_food": 4, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 1082, "healthcare": 2, "history_law_government": 2, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 4, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 5, "size": 219323882, "checksum": "3bb330e84c386c143ac89e39312aadbc3742b2e53b4f8411f22d18b535b73df2", "avgDurationSecs": 10.331, "validDurationSecs": 37595.257, "totalHrs": 10.66, "validHrs": 10.44 }, "oc": { "buckets": { "dev": 272, "test": 274, "train": 304, "validated": 1977, "invalidated": 203, "other": 7705 }, "duration": 48154680, "reportedSentences": 13, "validatedSentences": 4934, "unvalidatedSentences": 14, "clips": 9885, "splits": { "accent": {}, "age": { "": 0.5, "twenties": 0.02, "thirties": 0.04, "teens": 0.01, "fourties": 0.17, "fifties": 0.16, "sixties": 0.11, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.52, "male_masculine": 0.08, "female_feminine": 0.4, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 9885, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 149, "size": 274106967, "checksum": "e0331248b393bf9364ece8f85c0ecc71d33de74652847bcb4c143cdcccb186a2", "avgDurationSecs": 4.871, "validDurationSecs": 9630.936, "totalHrs": 13.37, "validHrs": 2.67 }, "odk": { "buckets": { "dev": 467, "test": 627, "train": 941, "validated": 6341, "invalidated": 46, "other": 0 }, "duration": 40676832, "reportedSentences": 0, "validatedSentences": 2047, "unvalidatedSentences": -1, "clips": 6387, "splits": { "accent": {}, "age": { "": 0.31, "twenties": 0.2, "thirties": 0.18, "teens": 0.15, "fourties": 0.08, "fifties": 0.08, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.7, "male_masculine": 0.14, "female_feminine": 0.16, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 6387, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 20, "size": 236342138, "checksum": "be42f35dacc8897e6d6adac8e837baa719bb06bbfe31c9fe43193174451b8ea6", "avgDurationSecs": 6.369, "validDurationSecs": 40383.872, "totalHrs": 11.29, "validHrs": 11.21 }, "or": { "buckets": { "dev": 640, "test": 479, "train": 2151, "validated": 4085, "invalidated": 437, "other": 19622 }, "duration": 134612700, "reportedSentences": 100, "validatedSentences": 6197, "unvalidatedSentences": 87, "clips": 24144, "splits": { "accent": {}, "age": { "": 0.06, "twenties": 0.65, "thirties": 0.27, "teens": 0, "fourties": 0.01, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.42, "male_masculine": 0.34, "female_feminine": 0.03, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0.21 }, "sentence_domain": { "": 24137, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 7, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 163, "size": 832546925, "checksum": "0f23ae006a91ba4ef4a980488409c233cb8af7d9bbf397d69368182b569674b1", "avgDurationSecs": 5.575, "validDurationSecs": 22775.55, "totalHrs": 37.39, "validHrs": 6.32 }, "oru": { "buckets": { "dev": 0, "test": 1210, "train": 6079, "validated": 8490, "invalidated": 86, "other": 160 }, "duration": 65019456, "reportedSentences": 0, "validatedSentences": 7355, "unvalidatedSentences": 902, "clips": 8736, "splits": { "accent": {}, "age": { "": 0.23, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0.77, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.23, "male_masculine": 0.4, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0.37 }, "sentence_domain": { "": 8630, "agriculture_food": 106, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 106, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 106, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 13, "size": 385828863, "checksum": "b2c9859c26e48cd41a5a54439c6d570676e2399015b6fd591646093d4e05617f", "avgDurationSecs": 7.443, "validDurationSecs": 63188.551, "totalHrs": 18.06, "validHrs": 17.55 }, "os": { "buckets": { "dev": 251, "test": 219, "train": 414, "validated": 915, "invalidated": 35, "other": 6 }, "duration": 5280084, "reportedSentences": 5, "validatedSentences": 1888, "unvalidatedSentences": 34, "clips": 956, "splits": { "accent": {}, "age": { "": 0.23, "twenties": 0.09, "thirties": 0.46, "teens": 0.02, "fourties": 0.2, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.78, "male_masculine": 0.22, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 955, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 1, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 37, "size": 30907997, "checksum": "ab156c9fbdce44f05645cbfeb8814d7169bbd6ac5f7f67c6620eace2ec4231ba", "avgDurationSecs": 5.523, "validDurationSecs": 5053.637, "totalHrs": 1.46, "validHrs": 1.4 }, "pa-IN": { "buckets": { "dev": 489, "test": 524, "train": 808, "validated": 1821, "invalidated": 104, "other": 1357 }, "duration": 16778510, "reportedSentences": 251, "validatedSentences": 14825, "unvalidatedSentences": 22, "clips": 3282, "splits": { "accent": {}, "age": { "": 0.28, "twenties": 0.21, "thirties": 0.39, "teens": 0, "fourties": 0.07, "fifties": 0.04, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.36, "male_masculine": 0.63, "female_feminine": 0.01, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 3281, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 1, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 75, "size": 116221215, "checksum": "51e1408f6a42373d70e5c58619df034be28766a7204b2734d55d4c82240ce543", "avgDurationSecs": 5.112, "validDurationSecs": 9309.466, "totalHrs": 4.66, "validHrs": 2.58 }, "pcm": { "buckets": { "dev": 326, "test": 326, "train": 335, "validated": 7754, "invalidated": 64, "other": 1146 }, "duration": 54050724, "reportedSentences": 0, "validatedSentences": 987, "unvalidatedSentences": -1, "clips": 8964, "splits": { "accent": {}, "age": { "": 0.73, "twenties": 0, "thirties": 0.11, "teens": 0, "fourties": 0.16, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.85, "male_masculine": 0, "female_feminine": 0.15, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 8964, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 59, "size": 308334350, "checksum": "68d6dea59c9ee3f8eb160acc202796feefb2a580413055b740e562a2a11d85fc", "avgDurationSecs": 6.03, "validDurationSecs": 46754.72, "totalHrs": 15.01, "validHrs": 12.98 }, "phl": { "buckets": { "dev": 1408, "test": 1377, "train": 1947, "validated": 15556, "invalidated": 83, "other": 5519 }, "duration": 105392160, "reportedSentences": 0, "validatedSentences": 4745, "unvalidatedSentences": 1184, "clips": 21158, "splits": { "accent": {}, "age": { "": 0.06, "twenties": 0.48, "thirties": 0.23, "teens": 0.06, "fourties": 0.18, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 21120, "agriculture_food": 0, "automotive_transport": 4, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 10, "history_law_government": 24, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 20, "size": 619742106, "checksum": "4aaf371feffca8920d87fccab54c5b30110428b624fbf5aa6df513b488798f3d", "avgDurationSecs": 4.981, "validDurationSecs": 77487.496, "totalHrs": 29.27, "validHrs": 21.52 }, "phr": { "buckets": { "dev": 673, "test": 656, "train": 743, "validated": 12695, "invalidated": 139, "other": 10 }, "duration": 52106364, "reportedSentences": 1, "validatedSentences": 2077, "unvalidatedSentences": -1, "clips": 12844, "splits": { "accent": {}, "age": { "": 0.29, "twenties": 0.52, "thirties": 0.17, "teens": 0, "fourties": 0.02, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.7, "male_masculine": 0, "female_feminine": 0.3, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 12844, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 63, "size": 296556266, "checksum": "f9105e948fa3db9fd4b6cb7bd31d7f11851197874fef8268e0b64f6571e7f16d", "avgDurationSecs": 4.057, "validDurationSecs": 51501.891, "totalHrs": 14.47, "validHrs": 14.3 }, "pl": { "buckets": { "dev": 9975, "test": 9975, "train": 24903, "validated": 138335, "invalidated": 6952, "other": 2689 }, "duration": 676710182, "reportedSentences": 604, "validatedSentences": 230081, "unvalidatedSentences": 11038, "clips": 147976, "splits": { "accent": {}, "age": { "": 0.24, "twenties": 0.27, "thirties": 0.35, "teens": 0.02, "fourties": 0.11, "fifties": 0.01, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0.01 }, "gender": { "": 0.28, "male_masculine": 0.58, "female_feminine": 0.14, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 147959, "agriculture_food": 0, "automotive_transport": 0, "finance": 12, "service_retail": 0, "general": 3, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 2, "technology_robotics": 3 } }, "users": 3455, "size": 4784731518, "checksum": "1070367840751023da2a7b99c964ddfb1bd00df77f42b9c9e546341c1520cf04", "avgDurationSecs": 4.573, "validDurationSecs": 632620.851, "totalHrs": 187.97, "validHrs": 175.72 }, "plk": { "buckets": { "dev": 1237, "test": 662, "train": 2517, "validated": 9015, "invalidated": 960, "other": 1960 }, "duration": 59980824, "reportedSentences": 0, "validatedSentences": 4657, "unvalidatedSentences": -1, "clips": 11935, "splits": { "accent": {}, "age": { "": 0.14, "twenties": 0, "thirties": 0.16, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0.71, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 11935, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 10, "size": 345834596, "checksum": "54b9322f0140b9d249ea831a54d67c1a5287b7c32df06944c06cf830c8f3e7d4", "avgDurationSecs": 5.026, "validDurationSecs": 45306.002, "totalHrs": 16.66, "validHrs": 12.58 }, "prq": { "buckets": { "dev": 282, "test": 287, "train": 417, "validated": 7422, "invalidated": 68, "other": 179 }, "duration": 37282968, "reportedSentences": 0, "validatedSentences": 986, "unvalidatedSentences": -1, "clips": 7669, "splits": { "accent": {}, "age": { "": 0, "twenties": 0.17, "thirties": 0.26, "teens": 0, "fourties": 0.57, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.16, "male_masculine": 0, "female_feminine": 0.84, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7669, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 13, "size": 202924151, "checksum": "ad6dcb53dbe2e7b600d7748b77db0238ebda964a1bdf225bdb95986ce3b79a1b", "avgDurationSecs": 4.862, "validDurationSecs": 36082.173, "totalHrs": 10.35, "validHrs": 10.02 }, "ps": { "buckets": { "dev": 13791, "test": 13791, "train": 80525, "validated": 848687, "invalidated": 51866, "other": 1507246 }, "duration": 9967341528, "reportedSentences": 4230, "validatedSentences": 246535, "unvalidatedSentences": 15712, "clips": 2407799, "splits": { "accent": {}, "age": { "": 132867, "twenties": 1433630, "thirties": 472795, "teens": 191562, "fourties": 90848, "fifties": 83885, "sixties": 2123, "seventies": 89, "eighties": 0, "nineties": 0 }, "gender": { "": 1010482, "male_masculine": 6244, "female_feminine": 1390861, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 212 }, "sentence_domain": { "": 2053505, "agriculture_food": 24125, "automotive_transport": 3647, "finance": 6460, "service_retail": 14974, "general": 278899, "healthcare": 11001, "history_law_government": 69867, "language_fundamentals": 16045, "media_entertainment": 13696, "nature_environment": 79412, "news_current_affairs": 4381, "technology_robotics": 14030 } }, "users": 6654, "size": 53663559573, "checksum": "c2dc2c2b16e6ddfe831bd3c92c24761767fac439be809d26c0c7bbb55b3e18b4", "avgDurationSecs": 4.14, "validDurationSecs": 3513230.622, "totalHrs": 2768.7, "validHrs": 975.89 }, "pt": { "buckets": { "dev": 9659, "test": 9662, "train": 23046, "validated": 160548, "invalidated": 7825, "other": 27822 }, "duration": 821649031, "reportedSentences": 2853, "validatedSentences": 43602, "unvalidatedSentences": 96, "clips": 196195, "splits": { "accent": {}, "age": { "": 0.24, "twenties": 0.36, "thirties": 0.18, "teens": 0.02, "fourties": 0.13, "fifties": 0.03, "sixties": 0.04, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.27, "male_masculine": 0.68, "female_feminine": 0.06, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 194404, "agriculture_food": 147, "automotive_transport": 37, "finance": 27, "service_retail": 24, "general": 1357, "healthcare": 191, "history_law_government": 66, "language_fundamentals": 17, "media_entertainment": 76, "nature_environment": 49, "news_current_affairs": 4, "technology_robotics": 181 } }, "users": 3804, "size": 5148282839, "checksum": "f326e333e79da755db71a0c66986c87729ad4a9d5b1630758e5fcc09dfa2d5af", "avgDurationSecs": 4.188, "validDurationSecs": 672362.235, "totalHrs": 228.23, "validHrs": 186.76 }, "pua": { "buckets": { "dev": 495, "test": 547, "train": 1153, "validated": 7536, "invalidated": 199, "other": 445 }, "duration": 40235256, "reportedSentences": 1, "validatedSentences": 2201, "unvalidatedSentences": -1, "clips": 8180, "splits": { "accent": {}, "age": { "": 0.14, "twenties": 0.55, "thirties": 0.31, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.72, "male_masculine": 0, "female_feminine": 0.28, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 8180, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 9, "size": 228610574, "checksum": "de0c8d62ccc4b94c825efc9dbb360145a74d33b1ae7cef91ba064562a9d0c685", "avgDurationSecs": 4.919, "validDurationSecs": 37067.59, "totalHrs": 11.17, "validHrs": 10.29 }, "pwn": { "buckets": { "dev": 722, "test": 724, "train": 761, "validated": 10800, "invalidated": 138, "other": 0 }, "duration": 53298360, "reportedSentences": 0, "validatedSentences": 2207, "unvalidatedSentences": 241, "clips": 10938, "splits": { "accent": {}, "age": { "": 0.29, "twenties": 0.05, "thirties": 0.43, "teens": 0, "fourties": 0, "fifties": 0.22, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.49, "male_masculine": 0.04, "female_feminine": 0.23, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0.24 }, "sentence_domain": { "": 0, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 13132, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 27, "size": 294314757, "checksum": "eefcdc85a1ef010bd40d4f03afa4ab837c54348584ecbd9fc389377d564154fb", "avgDurationSecs": 4.873, "validDurationSecs": 52625.918, "totalHrs": 14.8, "validHrs": 14.61 }, "qup": { "buckets": { "dev": 288, "test": 254, "train": 449, "validated": 7202, "invalidated": 2, "other": 2465 }, "duration": 57452508, "reportedSentences": 4, "validatedSentences": 991, "unvalidatedSentences": -1, "clips": 9669, "splits": { "accent": {}, "age": { "": 0.08, "twenties": 0.11, "thirties": 0.72, "teens": 0, "fourties": 0, "fifties": 0.1, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.79, "male_masculine": 0, "female_feminine": 0.21, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 9669, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 15, "size": 330081092, "checksum": "46e1197dc29db5ba3a884162c74dce7d54cfc3a893e5a06dd548443bac96cd22", "avgDurationSecs": 5.942, "validDurationSecs": 42793.77, "totalHrs": 15.95, "validHrs": 11.88 }, "qur": { "buckets": { "dev": 0, "test": 32, "train": 977, "validated": 10408, "invalidated": 27, "other": 41 }, "duration": 36351540, "reportedSentences": 0, "validatedSentences": 1010, "unvalidatedSentences": -1, "clips": 10476, "splits": { "accent": {}, "age": { "": 0, "twenties": 0.76, "thirties": 0.24, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.19, "male_masculine": 0, "female_feminine": 0.81, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 10476, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 12, "size": 194563538, "checksum": "f10ccb583f4878442eb4a5e8360e9646c427bbc9086d7e05b5fda7926fc999ad", "avgDurationSecs": 3.47, "validDurationSecs": 36115.581, "totalHrs": 10.09, "validHrs": 10.03 }, "qus": { "buckets": { "dev": 314, "test": 330, "train": 354, "validated": 10323, "invalidated": 93, "other": 433 }, "duration": 41653512, "reportedSentences": 0, "validatedSentences": 998, "unvalidatedSentences": -1, "clips": 10849, "splits": { "accent": {}, "age": { "": 0.2, "twenties": 0.36, "thirties": 0.32, "teens": 0, "fourties": 0.03, "fifties": 0.09, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.54, "male_masculine": 0, "female_feminine": 0.46, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 10849, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 24, "size": 222384268, "checksum": "237121fcf9e890d51858bed67c6c5b586f1a2c6e46c171a3378a1bb18f6baf42", "avgDurationSecs": 3.839, "validDurationSecs": 39633.994, "totalHrs": 11.57, "validHrs": 11 }, "qux": { "buckets": { "dev": 280, "test": 299, "train": 399, "validated": 6156, "invalidated": 25, "other": 2008 }, "duration": 48318408, "reportedSentences": 0, "validatedSentences": 978, "unvalidatedSentences": -1, "clips": 8189, "splits": { "accent": {}, "age": { "": 0.02, "twenties": 0.24, "thirties": 0.39, "teens": 0, "fourties": 0, "fifties": 0.24, "sixties": 0.12, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.37, "male_masculine": 0, "female_feminine": 0.63, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 8189, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 15, "size": 270613847, "checksum": "ca676f40d62b0b50d21aebda5a610c10147ebf9a5d773490d23df80ddacff2ce", "avgDurationSecs": 5.9, "validDurationSecs": 36322.887, "totalHrs": 13.42, "validHrs": 10.08 }, "quy": { "buckets": { "dev": 0, "test": 10, "train": 27, "validated": 38, "invalidated": 7, "other": 1255 }, "duration": 11227752, "reportedSentences": 0, "validatedSentences": 759, "unvalidatedSentences": 282, "clips": 1300, "splits": { "accent": {}, "age": { "": 0.02, "twenties": 0.71, "thirties": 0, "teens": 0, "fourties": 0.02, "fifties": 0, "sixties": 0.25, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.82, "male_masculine": 0, "female_feminine": 0.18, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 1300, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 8, "size": 65531078, "checksum": "14cb3d8261136c2ace09b7d83a7fc1dcfd0da22dea239b40af1e9dc175bc7c7a", "avgDurationSecs": 8.637, "validDurationSecs": 328.196, "totalHrs": 3.11, "validHrs": 0.09 }, "qva": { "buckets": { "dev": 200, "test": 326, "train": 473, "validated": 8222, "invalidated": 21, "other": 23 }, "duration": 36399420, "reportedSentences": 0, "validatedSentences": 1000, "unvalidatedSentences": -1, "clips": 8266, "splits": { "accent": {}, "age": { "": 0.11, "twenties": 0.1, "thirties": 0.54, "teens": 0, "fourties": 0, "fifties": 0.12, "sixties": 0.12, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.12, "male_masculine": 0, "female_feminine": 0.88, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 8266, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 13, "size": 199010373, "checksum": "1ecd84244857b93d4dda453a25651a68ee58ef415180043cce8b9949069a4b00", "avgDurationSecs": 4.404, "validDurationSecs": 36205.666, "totalHrs": 10.11, "validHrs": 10.05 }, "qvi": { "buckets": { "dev": 364, "test": 379, "train": 405, "validated": 9266, "invalidated": 237, "other": 693 }, "duration": 45140940, "reportedSentences": 0, "validatedSentences": 1149, "unvalidatedSentences": -1, "clips": 10196, "splits": { "accent": {}, "age": { "": 0, "twenties": 0.26, "thirties": 0.64, "teens": 0.1, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.28, "male_masculine": 0, "female_feminine": 0.72, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 10196, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 15, "size": 262118236, "checksum": "34799bc58736d1665788583381e2e2547bc03b4b9df9a49a7c587dfec0356765", "avgDurationSecs": 4.427, "validDurationSecs": 41023.534, "totalHrs": 12.53, "validHrs": 11.39 }, "qvj": { "buckets": { "dev": 349, "test": 348, "train": 362, "validated": 6552, "invalidated": 8, "other": 186 }, "duration": 40215924, "reportedSentences": 0, "validatedSentences": 1059, "unvalidatedSentences": -1, "clips": 6746, "splits": { "accent": {}, "age": { "": 0, "twenties": 0.58, "thirties": 0.02, "teens": 0, "fourties": 0.39, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.2, "male_masculine": 0, "female_feminine": 0.8, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 6746, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 16, "size": 232485499, "checksum": "bfe433ba3421daf0a5804f8f518e655ea5fa2b85a09953d70512f13aaffbc329", "avgDurationSecs": 5.961, "validDurationSecs": 39059.403, "totalHrs": 11.17, "validHrs": 10.84 }, "qvl": { "buckets": { "dev": 222, "test": 321, "train": 457, "validated": 9082, "invalidated": 5, "other": 13 }, "duration": 36219708, "reportedSentences": 0, "validatedSentences": 1000, "unvalidatedSentences": -1, "clips": 9100, "splits": { "accent": {}, "age": { "": 0, "twenties": 0.83, "thirties": 0.11, "teens": 0.06, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.39, "male_masculine": 0, "female_feminine": 0.61, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 9100, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 19, "size": 201087771, "checksum": "f4559bce00466942b0a8e55590927112e8cf351bc45d8419a1c571dc0e6e84a4", "avgDurationSecs": 3.98, "validDurationSecs": 36148.065, "totalHrs": 10.06, "validHrs": 10.04 }, "qwa": { "buckets": { "dev": 106, "test": 308, "train": 586, "validated": 7217, "invalidated": 1, "other": 1147 }, "duration": 41537916, "reportedSentences": 0, "validatedSentences": 1000, "unvalidatedSentences": -1, "clips": 8365, "splits": { "accent": {}, "age": { "": 0, "twenties": 0.12, "thirties": 0.32, "teens": 0, "fourties": 0.2, "fifties": 0.36, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.6, "male_masculine": 0, "female_feminine": 0.4, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 8365, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 13, "size": 220832456, "checksum": "88a62630ce0768c38b6a0f7470a3232266794c6ae5cf84ba7fa9d6b2221e34f6", "avgDurationSecs": 4.966, "validDurationSecs": 35837.315, "totalHrs": 11.53, "validHrs": 9.95 }, "qws": { "buckets": { "dev": 0, "test": 61, "train": 937, "validated": 8879, "invalidated": 2, "other": 96 }, "duration": 37376136, "reportedSentences": 0, "validatedSentences": 998, "unvalidatedSentences": -1, "clips": 8977, "splits": { "accent": {}, "age": { "": 0.22, "twenties": 0.55, "thirties": 0.11, "teens": 0, "fourties": 0.11, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.44, "male_masculine": 0, "female_feminine": 0.56, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 8977, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 12, "size": 211202213, "checksum": "266632544eb4aa83b13d013c0c97c020365f5e7e4d239ba8263f5414ace24090", "avgDurationSecs": 4.164, "validDurationSecs": 36968.109, "totalHrs": 10.38, "validHrs": 10.26 }, "qxa": { "buckets": { "dev": 233, "test": 315, "train": 451, "validated": 8353, "invalidated": 8, "other": 359 }, "duration": 37918800, "reportedSentences": 0, "validatedSentences": 999, "unvalidatedSentences": -1, "clips": 8720, "splits": { "accent": {}, "age": { "": 0.02, "twenties": 0.67, "thirties": 0.2, "teens": 0, "fourties": 0.11, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.45, "male_masculine": 0, "female_feminine": 0.55, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 8720, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 18, "size": 208033129, "checksum": "8b23b4d8ef2a7cddd582e412e7a8ba13c90058c890a6c34f2c7d314ffc322cbc", "avgDurationSecs": 4.348, "validDurationSecs": 36322.906, "totalHrs": 10.53, "validHrs": 10.08 }, "qxp": { "buckets": { "dev": 0, "test": 561, "train": 1503, "validated": 7679, "invalidated": 213, "other": 1141 }, "duration": 41874264, "reportedSentences": 53, "validatedSentences": 2065, "unvalidatedSentences": -1, "clips": 9033, "splits": { "accent": {}, "age": { "": 0.01, "twenties": 0.76, "thirties": 0.23, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.46, "male_masculine": 0, "female_feminine": 0.54, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 0, "agriculture_food": 8998, "automotive_transport": 0, "finance": 43, "service_retail": 0, "general": 7043, "healthcare": 7055, "history_law_government": 485, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 3488, "news_current_affairs": 58, "technology_robotics": 0 } }, "users": 14, "size": 241523276, "checksum": "31afe9f6c1aa3241a72436d14c9e0a5f4571b110f6d8ccd8a1d01052cfee99ab", "avgDurationSecs": 4.636, "validDurationSecs": 35597.528, "totalHrs": 11.63, "validHrs": 9.88 }, "qxt": { "buckets": { "dev": 60, "test": 321, "train": 616, "validated": 8647, "invalidated": 12, "other": 2469 }, "duration": 47738988, "reportedSentences": 0, "validatedSentences": 998, "unvalidatedSentences": -1, "clips": 11128, "splits": { "accent": {}, "age": { "": 0, "twenties": 0.19, "thirties": 0.18, "teens": 0, "fourties": 0.54, "fifties": 0.09, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.27, "male_masculine": 0, "female_feminine": 0.73, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 11128, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 16, "size": 273938595, "checksum": "27dcfd0f8307753b66bfb50406b1b17885482fb9d03211d6654ac60c750613cf", "avgDurationSecs": 4.29, "validDurationSecs": 37095.527, "totalHrs": 13.26, "validHrs": 10.3 }, "qxu": { "buckets": { "dev": 0, "test": 325, "train": 673, "validated": 8712, "invalidated": 298, "other": 1899 }, "duration": 47439360, "reportedSentences": 0, "validatedSentences": 998, "unvalidatedSentences": -1, "clips": 10909, "splits": { "accent": {}, "age": { "": 0, "twenties": 0.47, "thirties": 0.34, "teens": 0.09, "fourties": 0.09, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.46, "male_masculine": 0, "female_feminine": 0.54, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 10909, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 16, "size": 272676268, "checksum": "057cbb265953728900cfab48882a24391502e5bff4f9c33580d0238cef5d5959", "avgDurationSecs": 4.349, "validDurationSecs": 37885.389, "totalHrs": 13.17, "validHrs": 10.52 }, "qxw": { "buckets": { "dev": 167, "test": 227, "train": 608, "validated": 8021, "invalidated": 82, "other": 1150 }, "duration": 48633444, "reportedSentences": 0, "validatedSentences": 1002, "unvalidatedSentences": -1, "clips": 9253, "splits": { "accent": {}, "age": { "": 0.02, "twenties": 0.54, "thirties": 0.11, "teens": 0, "fourties": 0.22, "fifties": 0, "sixties": 0, "seventies": 0.11, "eighties": 0, "nineties": 0 }, "gender": { "": 0.46, "male_masculine": 0, "female_feminine": 0.54, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 9253, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 14, "size": 275514194, "checksum": "e2105521891aad5524d884b3768e5e584819e1df9035f3bb096de930ff64849b", "avgDurationSecs": 5.256, "validDurationSecs": 42158.095, "totalHrs": 13.5, "validHrs": 11.71 }, "rm-sursilv": { "buckets": { "dev": 1369, "test": 1419, "train": 1604, "validated": 4411, "invalidated": 687, "other": 2406 }, "duration": 40806869, "reportedSentences": 17, "validatedSentences": 8780, "unvalidatedSentences": 7455, "clips": 7504, "splits": { "accent": {}, "age": { "": 0.61, "twenties": 0.09, "thirties": 0.07, "teens": 0.05, "fourties": 0.18, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.65, "male_masculine": 0.17, "female_feminine": 0.18, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7504, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 91, "size": 306286617, "checksum": "fe04ea27af47298e1ec01b64d7e36f5f87c496d4b707909a6066f0a671ca3426", "avgDurationSecs": 5.438, "validDurationSecs": 23987.087, "totalHrs": 11.33, "validHrs": 6.66 }, "rm-vallader": { "buckets": { "dev": 500, "test": 463, "train": 557, "validated": 1527, "invalidated": 394, "other": 740 }, "duration": 15519074, "reportedSentences": 38, "validatedSentences": 5913, "unvalidatedSentences": 1172, "clips": 2661, "splits": { "accent": {}, "age": { "": 0.37, "twenties": 0.14, "thirties": 0.06, "teens": 0, "fourties": 0.41, "fifties": 0, "sixties": 0.03, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.37, "male_masculine": 0.44, "female_feminine": 0.19, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 2661, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 55, "size": 118485233, "checksum": "8b1c3bcd86f0dddd121218222fd4d9e8b88a9f38181f601671effc328db77b67", "avgDurationSecs": 5.832, "validDurationSecs": 8905.534, "totalHrs": 4.31, "validHrs": 2.47 }, "ro": { "buckets": { "dev": 3927, "test": 3912, "train": 5192, "validated": 19569, "invalidated": 1093, "other": 22919 }, "duration": 176104975, "reportedSentences": 487, "validatedSentences": 13753, "unvalidatedSentences": 89202, "clips": 43581, "splits": { "accent": {}, "age": { "": 0.15, "twenties": 0.59, "thirties": 0.13, "teens": 0.02, "fourties": 0.09, "fifties": 0.02, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.17, "male_masculine": 0.7, "female_feminine": 0.13, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 43581, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 459, "size": 1096596634, "checksum": "485f929bb94328403e43bfd9e930e7815b5fc7b1cdf776b3cdac27ba5c425a3c", "avgDurationSecs": 4.041, "validDurationSecs": 79075.704, "totalHrs": 48.91, "validHrs": 21.96 }, "rof": { "buckets": { "dev": 461, "test": 461, "train": 477, "validated": 9557, "invalidated": 835, "other": 0 }, "duration": 41952420, "reportedSentences": 0, "validatedSentences": 1399, "unvalidatedSentences": -1, "clips": 10392, "splits": { "accent": {}, "age": { "": 0, "twenties": 0.35, "thirties": 0.41, "teens": 0, "fourties": 0.23, "fifties": 0.02, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.37, "male_masculine": 0, "female_feminine": 0.63, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 10392, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 24, "size": 239899208, "checksum": "42454b644bd2374c5ec0424f0b255391090b9cd7ae157a14377cd352cdea3644", "avgDurationSecs": 4.037, "validDurationSecs": 38581.532, "totalHrs": 11.65, "validHrs": 10.71 }, "ru": { "buckets": { "dev": 10260, "test": 10261, "train": 26772, "validated": 173750, "invalidated": 10594, "other": 16982 }, "duration": 1044851472, "reportedSentences": 577, "validatedSentences": 47849, "unvalidatedSentences": 230, "clips": 201326, "splits": { "accent": {}, "age": { "": 0.24, "twenties": 0.33, "thirties": 0.18, "teens": 0.09, "fourties": 0.13, "fifties": 0.03, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.26, "male_masculine": 0.59, "female_feminine": 0.15, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 201199, "agriculture_food": 4, "automotive_transport": 4, "finance": 8, "service_retail": 12, "general": 41, "healthcare": 6, "history_law_government": 44, "language_fundamentals": 4, "media_entertainment": 18, "nature_environment": 5, "news_current_affairs": 3, "technology_robotics": 16 } }, "users": 3636, "size": 7008716262, "checksum": "9a2ed32a0574f74f505cd7740a599f0b9edc9f52ba1e7d6624b66f258db4c0ea", "avgDurationSecs": 5.19, "validDurationSecs": 901736.205, "totalHrs": 290.23, "validHrs": 250.48 }, "rup": { "buckets": { "dev": 5, "test": 8, "train": 16, "validated": 29, "invalidated": 17, "other": 16 }, "duration": 370260, "reportedSentences": 0, "validatedSentences": 3507, "unvalidatedSentences": -1, "clips": 62, "splits": { "accent": {}, "age": { "": 0.32, "twenties": 0.02, "thirties": 0.26, "teens": 0.24, "fourties": 0, "fifties": 0.16, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.58, "male_masculine": 0, "female_feminine": 0.42, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 62, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 9, "size": 2309540, "checksum": "31b2483416f226ff7dc6b52ce3a70c781e6627cab96e5f7090c0331a4316fd8c", "avgDurationSecs": 5.972, "validDurationSecs": 173.186, "totalHrs": 0.1, "validHrs": 0.04 }, "rw": { "buckets": { "dev": 15987, "test": 16213, "train": 1003033, "validated": 1439127, "invalidated": 227838, "other": 47253 }, "duration": 8583672569, "reportedSentences": 634, "validatedSentences": 1404857, "unvalidatedSentences": 8, "clips": 1714218, "splits": { "accent": {}, "age": { "": 0.05, "twenties": 0.61, "thirties": 0.12, "teens": 0.2, "fourties": 0.02, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.1, "male_masculine": 0.57, "female_feminine": 0.33, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 1714218, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 1179, "size": 61200840427, "checksum": "b61528d19c78687020b28328c916f0a517ff57fbb17749e30ce6f5f43bdee834", "avgDurationSecs": 5.007, "validDurationSecs": 7206198.368, "totalHrs": 2384.35, "validHrs": 2001.72 }, "sah": { "buckets": { "dev": 1746, "test": 1808, "train": 2313, "validated": 9282, "invalidated": 477, "other": 3341 }, "duration": 82989732, "reportedSentences": 26, "validatedSentences": 6076, "unvalidatedSentences": 385, "clips": 13100, "splits": { "accent": {}, "age": { "": 0.31, "twenties": 0.23, "thirties": 0.15, "teens": 0.03, "fourties": 0.1, "fifties": 0.18, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.32, "male_masculine": 0.24, "female_feminine": 0.44, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 13100, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 247, "size": 527460914, "checksum": "96e747ace1cbfd7d97775f8ecd454ea53683a6c521ccdbee2bfe8952714cfd0b", "avgDurationSecs": 6.335, "validDurationSecs": 58802.343, "totalHrs": 23.05, "validHrs": 16.33 }, "sat": { "buckets": { "dev": 68, "test": 127, "train": 333, "validated": 528, "invalidated": 18, "other": 303 }, "duration": 3801708, "reportedSentences": 7, "validatedSentences": 5421, "unvalidatedSentences": 540, "clips": 849, "splits": { "accent": {}, "age": { "": 0.42, "twenties": 0.42, "thirties": 0.12, "teens": 0.01, "fourties": 0.01, "fifties": 0.01, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.4, "male_masculine": 0.59, "female_feminine": 0.01, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 849, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 13, "size": 21352261, "checksum": "016b9d7b4488b688147e480956d81ff41584cb61e31b14904130fca4505e95cf", "avgDurationSecs": 4.478, "validDurationSecs": 2364.313, "totalHrs": 1.05, "validHrs": 0.65 }, "sbn": { "buckets": { "dev": 0, "test": 247, "train": 1754, "validated": 10957, "invalidated": 12, "other": 18 }, "duration": 38755044, "reportedSentences": 0, "validatedSentences": 2001, "unvalidatedSentences": -1, "clips": 10987, "splits": { "accent": {}, "age": { "": 0, "twenties": 0.55, "thirties": 0, "teens": 0.19, "fourties": 0.26, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 10987, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 21, "size": 226528570, "checksum": "5184a7f673b0020c469e718b17213d18f6e40f363334a3c27fe823436debce0f", "avgDurationSecs": 3.527, "validDurationSecs": 38649.223, "totalHrs": 10.76, "validHrs": 10.73 }, "sc": { "buckets": { "dev": 551, "test": 637, "train": 926, "validated": 2288, "invalidated": 120, "other": 407 }, "duration": 13224744, "reportedSentences": 36, "validatedSentences": 5473, "unvalidatedSentences": 361, "clips": 2815, "splits": { "accent": {}, "age": { "": 0.45, "twenties": 0.09, "thirties": 0.28, "teens": 0, "fourties": 0.01, "fifties": 0.15, "sixties": 0.01, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.55, "male_masculine": 0.12, "female_feminine": 0.33, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 2800, "agriculture_food": 2, "automotive_transport": 1, "finance": 1, "service_retail": 0, "general": 9, "healthcare": 2, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 1, "nature_environment": 1, "news_current_affairs": 3, "technology_robotics": 0 } }, "users": 41, "size": 76855546, "checksum": "1c16219cc05fc6e18c1d77709ab43c8b0e37723332c573ce12ddfe772d848e79", "avgDurationSecs": 4.698, "validDurationSecs": 10748.922, "totalHrs": 3.67, "validHrs": 2.98 }, "scl": { "buckets": { "dev": 862, "test": 984, "train": 1407, "validated": 8876, "invalidated": 146, "other": 3 }, "duration": 37147104, "reportedSentences": 0, "validatedSentences": 3300, "unvalidatedSentences": 4, "clips": 9025, "splits": { "accent": {}, "age": { "": 0.16, "twenties": 0.02, "thirties": 0.82, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.98, "male_masculine": 0, "female_feminine": 0.02, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 9021, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 4, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 40, "size": 217100806, "checksum": "bab306d96c7d7d0ac7eaf676270e92194df0f33da5c23bcf35835e73f6364531", "avgDurationSecs": 4.116, "validDurationSecs": 36533.817, "totalHrs": 10.31, "validHrs": 10.14 }, "sd": { "buckets": { "dev": 0, "test": 42, "train": 277, "validated": 319, "invalidated": 197, "other": 34384 }, "duration": 143157636, "reportedSentences": 6, "validatedSentences": 13348, "unvalidatedSentences": 71, "clips": 34900, "splits": { "accent": {}, "age": { "": 0.02, "twenties": 0, "thirties": 0.11, "teens": 0, "fourties": 0.87, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.89, "male_masculine": 0.11, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 34808, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 89, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 3, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 26, "size": 755876846, "checksum": "b65a12ef79e5458d9432027cbfa5472b070bb1325bc177343b3f761aac8fda94", "avgDurationSecs": 4.102, "validDurationSecs": 1308.518, "totalHrs": 39.76, "validHrs": 0.36 }, "sei": { "buckets": { "dev": 435, "test": 452, "train": 728, "validated": 8006, "invalidated": 254, "other": 0 }, "duration": 37573452, "reportedSentences": 0, "validatedSentences": 1615, "unvalidatedSentences": -1, "clips": 8260, "splits": { "accent": {}, "age": { "": 0.01, "twenties": 0.23, "thirties": 0.27, "teens": 0, "fourties": 0.49, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.18, "male_masculine": 0, "female_feminine": 0.81, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0.01 }, "sentence_domain": { "": 8260, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 16, "size": 218623843, "checksum": "7f56cbcb9f0c95d371b2cb863488d914d11bc03f01eae8ef2c45dd77056d4cf9", "avgDurationSecs": 4.549, "validDurationSecs": 36418.046, "totalHrs": 10.43, "validHrs": 10.11 }, "sk": { "buckets": { "dev": 5090, "test": 5239, "train": 7846, "validated": 44126, "invalidated": 1219, "other": 1373 }, "duration": 200036880, "reportedSentences": 347, "validatedSentences": 20639, "unvalidatedSentences": 2347, "clips": 46718, "splits": { "accent": {}, "age": { "": 0.23, "twenties": 0.07, "thirties": 0.18, "teens": 0.05, "fourties": 0.12, "fifties": 0.36, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.62, "male_masculine": 0.35, "female_feminine": 0.04, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 33942, "agriculture_food": 3, "automotive_transport": 263, "finance": 2, "service_retail": 0, "general": 12454, "healthcare": 4, "history_law_government": 7803, "language_fundamentals": 101, "media_entertainment": 405, "nature_environment": 260, "news_current_affairs": 278, "technology_robotics": 895 } }, "users": 269, "size": 1154587658, "checksum": "9228980a35d828225c66215ac342840b633d62927afd27de46b2678eacd361b9", "avgDurationSecs": 4.282, "validDurationSecs": 188938.468, "totalHrs": 55.56, "validHrs": 52.48 }, "skr": { "buckets": { "dev": 1144, "test": 1037, "train": 1557, "validated": 3750, "invalidated": 467, "other": 1620 }, "duration": 24307020, "reportedSentences": 17, "validatedSentences": 6011, "unvalidatedSentences": 93, "clips": 5837, "splits": { "accent": {}, "age": { "": 0.35, "twenties": 0.24, "thirties": 0.01, "teens": 0.02, "fourties": 0, "fifties": 0.37, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.37, "male_masculine": 0.63, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 5837, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 60, "size": 139959301, "checksum": "f8cb9841fc74b8f954a189d24492bbecdb5a26610c0db700bd8abe3898373576", "avgDurationSecs": 4.164, "validDurationSecs": 15616.126, "totalHrs": 6.75, "validHrs": 4.33 }, "sl": { "buckets": { "dev": 1337, "test": 1340, "train": 1463, "validated": 15650, "invalidated": 511, "other": 3364 }, "duration": 78119074, "reportedSentences": 55, "validatedSentences": 4209, "unvalidatedSentences": 29, "clips": 19525, "splits": { "accent": {}, "age": { "": 0.37, "twenties": 0.31, "thirties": 0.03, "teens": 0.05, "fourties": 0.15, "fifties": 0.05, "sixties": 0.04, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.39, "male_masculine": 0.52, "female_feminine": 0.1, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 19523, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 1, "healthcare": 0, "history_law_government": 1, "language_fundamentals": 0, "media_entertainment": 1, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 1002, "size": 511824211, "checksum": "044c8a2e25f1c3f08c203c9f57caa1cad227ba31ec46cdf615af7631e6253d6f", "avgDurationSecs": 4.001, "validDurationSecs": 62615.289, "totalHrs": 21.69, "validHrs": 17.39 }, "sq": { "buckets": { "dev": 1795, "test": 1874, "train": 2658, "validated": 6337, "invalidated": 180, "other": 21 }, "duration": 33475068, "reportedSentences": 144, "validatedSentences": 50009, "unvalidatedSentences": 2635, "clips": 6538, "splits": { "accent": {}, "age": { "": 0.24, "twenties": 0.09, "thirties": 0.16, "teens": 0, "fourties": 0.18, "fifties": 0.34, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.39, "male_masculine": 0.47, "female_feminine": 0.14, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 1576, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 1801, "healthcare": 0, "history_law_government": 3136, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 25, "technology_robotics": 0 } }, "users": 150, "size": 199485140, "checksum": "d1598491e686237a7e9c8b688bfd1d1203e3c08f71395e623fa030bf2810b256", "avgDurationSecs": 5.12, "validDurationSecs": 32445.932, "totalHrs": 9.29, "validHrs": 9.01 }, "sr": { "buckets": { "dev": 1816, "test": 1915, "train": 2522, "validated": 8300, "invalidated": 425, "other": 5029 }, "duration": 44748936, "reportedSentences": 185, "validatedSentences": 8066, "unvalidatedSentences": 661, "clips": 13754, "splits": { "accent": {}, "age": { "": 0.14, "twenties": 0.25, "thirties": 0.12, "teens": 0, "fourties": 0.1, "fifties": 0.13, "sixties": 0.26, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.54, "male_masculine": 0.31, "female_feminine": 0.15, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 13705, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 13, "healthcare": 0, "history_law_government": 1, "language_fundamentals": 3, "media_entertainment": 0, "nature_environment": 2, "news_current_affairs": 0, "technology_robotics": 31 } }, "users": 183, "size": 250988892, "checksum": "6243b57a8ce83b37f2d2d2fc17f66289d37b0eb80d296a117c0ebc143521a3e8", "avgDurationSecs": 3.254, "validDurationSecs": 27004.229, "totalHrs": 12.43, "validHrs": 7.5 }, "ss": { "buckets": { "dev": 0, "test": 0, "train": 0, "validated": 0, "invalidated": 0, "other": 111 }, "duration": 825840, "reportedSentences": 0, "validatedSentences": 1614, "unvalidatedSentences": 6796, "clips": 111, "splits": { "accent": {}, "age": { "": 0.45, "twenties": 0.55, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 111, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 2, "size": 5075058, "checksum": "205e5a5d055ccd73e332c5d27ebcda25b074496a7019065d1f4d59375d0dcd42", "avgDurationSecs": 7.44, "validDurationSecs": 0, "totalHrs": 0.22, "validHrs": 0 }, "ssi": { "buckets": { "dev": 0, "test": 161, "train": 1845, "validated": 10188, "invalidated": 12, "other": 0 }, "duration": 37951740, "reportedSentences": 0, "validatedSentences": 2007, "unvalidatedSentences": -1, "clips": 10200, "splits": { "accent": {}, "age": { "": 0, "twenties": 0.6, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0.39, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.99, "male_masculine": 0, "female_feminine": 0.01, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 10200, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 21, "size": 221549575, "checksum": "a2085ac91e1eb686756187de472a1b4305f9b448ed6cc80a2e928017eaf6ae60", "avgDurationSecs": 3.721, "validDurationSecs": 37907.091, "totalHrs": 10.54, "validHrs": 10.52 }, "st": { "buckets": { "dev": 0, "test": 0, "train": 1, "validated": 1, "invalidated": 0, "other": 208 }, "duration": 673668, "reportedSentences": 0, "validatedSentences": 2339, "unvalidatedSentences": 14837, "clips": 209, "splits": { "accent": {}, "age": { "": 0, "twenties": 0.29, "thirties": 0.71, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.29, "male_masculine": 0.71, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 209, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 2, "size": 4961419, "checksum": "0410f551552a71c2d4889273236202907ec723bb99fda4331c0ea44c4a640750", "avgDurationSecs": 3.223, "validDurationSecs": 3.223, "totalHrs": 0.18, "validHrs": 0 }, "sv-SE": { "buckets": { "dev": 5455, "test": 5489, "train": 8232, "validated": 42543, "invalidated": 1598, "other": 6046 }, "duration": 201935247, "reportedSentences": 597, "validatedSentences": 26257, "unvalidatedSentences": 7125, "clips": 50187, "splits": { "accent": {}, "age": { "": 0.19, "twenties": 0.12, "thirties": 0.25, "teens": 0.03, "fourties": 0.37, "fifties": 0.03, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.21, "male_masculine": 0.47, "female_feminine": 0.32, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 50184, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 2, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 1, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 885, "size": 1275732190, "checksum": "cd66ab8d6cba060cac10a005b5f0369a5ac9371cd5d13cec7c24958e576c0610", "avgDurationSecs": 4.024, "validDurationSecs": 171178.417, "totalHrs": 56.09, "validHrs": 47.54 }, "sva": { "buckets": { "dev": 467, "test": 503, "train": 567, "validated": 9567, "invalidated": 1376, "other": 16 }, "duration": 64961820, "reportedSentences": 9, "validatedSentences": 1538, "unvalidatedSentences": 11, "clips": 10959, "splits": { "accent": {}, "age": { "": 0.07, "twenties": 0.1, "thirties": 0.2, "teens": 0, "fourties": 0.24, "fifties": 0.21, "sixties": 0.13, "seventies": 0.04, "eighties": 0, "nineties": 0 }, "gender": { "": 0.2, "male_masculine": 0, "female_feminine": 0.8, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 10593, "agriculture_food": 108, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 96, "healthcare": 162, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 55, "size": 369385417, "checksum": "f524918b5aaa9974d92b794a59471d9a43966c7c9dd9fbce460434ad523ba998", "avgDurationSecs": 5.928, "validDurationSecs": 56710.442, "totalHrs": 18.04, "validHrs": 15.75 }, "sw": { "buckets": { "dev": 12269, "test": 12269, "train": 46704, "validated": 268255, "invalidated": 80837, "other": 379914 }, "duration": 3934927116, "reportedSentences": 1902, "validatedSentences": 134725, "unvalidatedSentences": 5758, "clips": 729006, "splits": { "accent": {}, "age": { "": 0.3, "twenties": 0.5, "thirties": 0.11, "teens": 0.01, "fourties": 0.03, "fifties": 0.04, "sixties": 0.01, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.29, "male_masculine": 0.34, "female_feminine": 0.37, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 729006, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 1497, "size": 22967482338, "checksum": "709aa10aadbc920e36e51bb238185dde5400f26e24f212f5d50a637a67d8e4e6", "avgDurationSecs": 5.398, "validDurationSecs": 1447949.5, "totalHrs": 1093.03, "validHrs": 402.2 }, "szy": { "buckets": { "dev": 257, "test": 264, "train": 280, "validated": 9158, "invalidated": 485, "other": 0 }, "duration": 52040448, "reportedSentences": 0, "validatedSentences": 801, "unvalidatedSentences": 2, "clips": 9643, "splits": { "accent": {}, "age": { "": 0.49, "twenties": 0.13, "thirties": 0.08, "teens": 0, "fourties": 0, "fifties": 0.11, "sixties": 0.1, "seventies": 0.08, "eighties": 0, "nineties": 0 }, "gender": { "": 0.26, "male_masculine": 0, "female_feminine": 0.35, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0.39 }, "sentence_domain": { "": 27, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 9825, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 9, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 26, "size": 294380934, "checksum": "212dcc3f01dc91273007f706ff98ff6677d25dd9e7914071efb75cd50e612169", "avgDurationSecs": 5.397, "validDurationSecs": 49423.045, "totalHrs": 14.45, "validHrs": 13.72 }, "ta": { "buckets": { "dev": 12163, "test": 12230, "train": 46411, "validated": 136580, "invalidated": 5745, "other": 105244 }, "duration": 1534227252, "reportedSentences": 3438, "validatedSentences": 118260, "unvalidatedSentences": 577, "clips": 247569, "splits": { "accent": {}, "age": { "": 0.66, "twenties": 0.11, "thirties": 0.12, "teens": 0.04, "fourties": 0.03, "fifties": 0.02, "sixties": 0, "seventies": 0.02, "eighties": 0, "nineties": 0 }, "gender": { "": 0.66, "male_masculine": 0.19, "female_feminine": 0.15, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 247569, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 975, "size": 9196249656, "checksum": "f62fbf8c6b44ba63c2ee58da74ce12d08147851b844a00218915b4817750a4af", "avgDurationSecs": 6.197, "validDurationSecs": 846409.518, "totalHrs": 426.17, "validHrs": 235.11 }, "tar": { "buckets": { "dev": 406, "test": 404, "train": 430, "validated": 7889, "invalidated": 23, "other": 10 }, "duration": 36039168, "reportedSentences": 32, "validatedSentences": 1258, "unvalidatedSentences": -1, "clips": 7922, "splits": { "accent": {}, "age": { "": 0, "twenties": 0.11, "thirties": 0.47, "teens": 0, "fourties": 0.38, "fifties": 0.04, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.34, "male_masculine": 0, "female_feminine": 0.66, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7922, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 17, "size": 211005134, "checksum": "d126a9e6662bfb16bbe9b26aa09652d0dd2b730f03f693fad37e3621051b6df3", "avgDurationSecs": 4.549, "validDurationSecs": 35889.043, "totalHrs": 10.01, "validHrs": 9.96 }, "tay": { "buckets": { "dev": 452, "test": 851, "train": 1299, "validated": 7446, "invalidated": 411, "other": 0 }, "duration": 44092728, "reportedSentences": 0, "validatedSentences": 3790, "unvalidatedSentences": 77, "clips": 7857, "splits": { "accent": {}, "age": { "": 0.33, "twenties": 0.22, "thirties": 0, "teens": 0, "fourties": 0.13, "fifties": 0.18, "sixties": 0.15, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.22, "male_masculine": 0, "female_feminine": 0.46, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0.33 }, "sentence_domain": { "": 291, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 9021, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 18, "size": 260194128, "checksum": "fc18314c67752531deee56c5fa549687c5588003e6bd2df6bcec3743312d3a2f", "avgDurationSecs": 5.612, "validDurationSecs": 41786.236, "totalHrs": 12.24, "validHrs": 11.6 }, "te": { "buckets": { "dev": 66, "test": 69, "train": 74, "validated": 363, "invalidated": 59, "other": 2031 }, "duration": 10282608, "reportedSentences": 15, "validatedSentences": 336, "unvalidatedSentences": 19289, "clips": 2453, "splits": { "accent": {}, "age": { "": 0.13, "twenties": 0.69, "thirties": 0.02, "teens": 0.07, "fourties": 0.01, "fifties": 0, "sixties": 0.07, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.19, "male_masculine": 0.64, "female_feminine": 0.17, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 2453, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 61, "size": 61298335, "checksum": "18b9c95fd488185388c56952a3ebf3ff449d9586183c767a5d189e6ce5dd3bd0", "avgDurationSecs": 4.192, "validDurationSecs": 1521.642, "totalHrs": 2.85, "validHrs": 0.42 }, "tg": { "buckets": { "dev": 123, "test": 119, "train": 252, "validated": 494, "invalidated": 42, "other": 76 }, "duration": 3037968, "reportedSentences": 18, "validatedSentences": 3991, "unvalidatedSentences": 6780, "clips": 612, "splits": { "accent": {}, "age": { "": 0.02, "twenties": 0.98, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.83, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0.17 }, "sentence_domain": { "": 39, "agriculture_food": 7, "automotive_transport": 11, "finance": 15, "service_retail": 16, "general": 108, "healthcare": 12, "history_law_government": 29, "language_fundamentals": 299, "media_entertainment": 143, "nature_environment": 5, "news_current_affairs": 52, "technology_robotics": 9 } }, "users": 7, "size": 18178867, "checksum": "8cdb1433f285efc9ac413ec879034588bc2fcc8d2835cb57d047cd5c8c9dec3a", "avgDurationSecs": 4.964, "validDurationSecs": 2452.216, "totalHrs": 0.84, "validHrs": 0.68 }, "th": { "buckets": { "dev": 11059, "test": 11059, "train": 32971, "validated": 148714, "invalidated": 9358, "other": 208329 }, "duration": 1536467772, "reportedSentences": 4318, "validatedSentences": 64491, "unvalidatedSentences": 121701, "clips": 366401, "splits": { "accent": {}, "age": { "": 0.4, "twenties": 0.24, "thirties": 0.07, "teens": 0.04, "fourties": 0.04, "fifties": 0.2, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.41, "male_masculine": 0.42, "female_feminine": 0.17, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 366401, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 7982, "size": 8964895041, "checksum": "f3ff5f97625cb56ecdfafe5d0a37bfb70646aca7f50eab1074bcffceeddacb3a", "avgDurationSecs": 4.193, "validDurationSecs": 623618.026, "totalHrs": 426.79, "validHrs": 173.22 }, "ti": { "buckets": { "dev": 21, "test": 17, "train": 32, "validated": 70, "invalidated": 6, "other": 375 }, "duration": 2342484, "reportedSentences": 3, "validatedSentences": 4570, "unvalidatedSentences": 111, "clips": 451, "splits": { "accent": {}, "age": { "": 0.18, "twenties": 0.31, "thirties": 0.03, "teens": 0, "fourties": 0.49, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.96, "male_masculine": 0.04, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 451, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 16, "size": 14067846, "checksum": "115e0cd6ba7886a2eb1d5b9306d9123af5a7165a6587089da1fde95f4ea0a021", "avgDurationSecs": 5.194, "validDurationSecs": 363.578, "totalHrs": 0.65, "validHrs": 0.1 }, "tig": { "buckets": { "dev": 1615, "test": 1609, "train": 1990, "validated": 6433, "invalidated": 245, "other": 92 }, "duration": 42956856, "reportedSentences": 39, "validatedSentences": 5417, "unvalidatedSentences": 90, "clips": 6770, "splits": { "accent": {}, "age": { "": 0.7, "twenties": 0.21, "thirties": 0.1, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.99, "male_masculine": 0.01, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 6757, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 6, "healthcare": 0, "history_law_government": 6, "language_fundamentals": 1, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 151, "size": 230415362, "checksum": "5d68f963754089ec2085a170fbb1d2530a46884259c85043fb283e041d260889", "avgDurationSecs": 6.345, "validDurationSecs": 40818.531, "totalHrs": 11.93, "validHrs": 11.33 }, "tk": { "buckets": { "dev": 522, "test": 516, "train": 734, "validated": 1999, "invalidated": 135, "other": 2813 }, "duration": 27210240, "reportedSentences": 27, "validatedSentences": 2494, "unvalidatedSentences": 238, "clips": 4947, "splits": { "accent": {}, "age": { "": 0.36, "twenties": 0.53, "thirties": 0.08, "teens": 0, "fourties": 0.02, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.42, "male_masculine": 0.41, "female_feminine": 0.17, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 4947, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 141, "size": 152311909, "checksum": "3a6b65006014e9e6e2a8060f0c338c5e60ac38b39c1013522d7d3038ba09e342", "avgDurationSecs": 5.5, "validDurationSecs": 10995.203, "totalHrs": 7.55, "validHrs": 3.05 }, "tli": { "buckets": { "dev": 0, "test": 524, "train": 2316, "validated": 2840, "invalidated": 0, "other": 0 }, "duration": 36638964, "reportedSentences": 0, "validatedSentences": 7863, "unvalidatedSentences": 10, "clips": 2840, "splits": { "accent": {}, "age": { "": 0.82, "twenties": 0, "thirties": 0.18, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 2840, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 3, "size": 217513417, "checksum": "60deb24a69131763cccdff92492c2ede732407b944dfb6b32c9c9eabf68cd7b8", "avgDurationSecs": 12.901, "validDurationSecs": 36638.964, "totalHrs": 10.17, "validHrs": 10.17 }, "tn": { "buckets": { "dev": 311, "test": 369, "train": 1079, "validated": 3506, "invalidated": 11, "other": 532 }, "duration": 17693028, "reportedSentences": 1, "validatedSentences": 1765, "unvalidatedSentences": 15342, "clips": 4049, "splits": { "accent": {}, "age": { "": 0.03, "twenties": 0.02, "thirties": 0.51, "teens": 0, "fourties": 0, "fifties": 0.43, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.48, "male_masculine": 0, "female_feminine": 0.48, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0.04 }, "sentence_domain": { "": 4049, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 17, "size": 89812531, "checksum": "5eab9c278d45f0002d82343e0b2e138ec6c98a1e0ec44d48c1469903be956f51", "avgDurationSecs": 4.37, "validDurationSecs": 15320.266, "totalHrs": 4.91, "validHrs": 4.25 }, "tok": { "buckets": { "dev": 2250, "test": 2251, "train": 2635, "validated": 12954, "invalidated": 399, "other": 5973 }, "duration": 83304972, "reportedSentences": 165, "validatedSentences": 7502, "unvalidatedSentences": 2257, "clips": 19326, "splits": { "accent": {}, "age": { "": 0.31, "twenties": 0.19, "thirties": 0.06, "teens": 0.21, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0.23, "nineties": 0 }, "gender": { "": 0.4, "male_masculine": 0.52, "female_feminine": 0.05, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0.02 }, "sentence_domain": { "": 19324, "agriculture_food": 0, "automotive_transport": 0, "finance": 2, "service_retail": 0, "general": 2, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 171, "size": 487505279, "checksum": "193da8657cab1eacfe7fb5cc78a7392f95c99ec86d026df0551afc866ecad17c", "avgDurationSecs": 4.311, "validDurationSecs": 55838.384, "totalHrs": 23.14, "validHrs": 15.51 }, "tr": { "buckets": { "dev": 11756, "test": 11803, "train": 40650, "validated": 120610, "invalidated": 4942, "other": 317 }, "duration": 483090831, "reportedSentences": 484, "validatedSentences": 410403, "unvalidatedSentences": 3475, "clips": 125869, "splits": { "accent": {}, "age": { "": 0.25, "twenties": 0.23, "thirties": 0.09, "teens": 0.02, "fourties": 0.03, "fifties": 0.07, "sixties": 0.2, "seventies": 0.03, "eighties": 0.1, "nineties": 0 }, "gender": { "": 0.26, "male_masculine": 0.42, "female_feminine": 0.32, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 125854, "agriculture_food": 0, "automotive_transport": 1, "finance": 0, "service_retail": 0, "general": 1, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 12, "media_entertainment": 1, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 1795, "size": 2947404719, "checksum": "e37186670c9d71c6bb4904f349f3d640aa1288ca3a458aa884ab56ce83bf486a", "avgDurationSecs": 3.838, "validDurationSecs": 462906.555, "totalHrs": 134.19, "validHrs": 128.58 }, "trv": { "buckets": { "dev": 558, "test": 529, "train": 885, "validated": 6386, "invalidated": 104, "other": 0 }, "duration": 36415152, "reportedSentences": 1, "validatedSentences": 1974, "unvalidatedSentences": 2, "clips": 6490, "splits": { "accent": {}, "age": { "": 0.93, "twenties": 0.07, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.68, "male_masculine": 0.07, "female_feminine": 0.13, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0.12 }, "sentence_domain": { "": 465, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 6276, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 10, "size": 214885747, "checksum": "5620ad2d3d39f3dfbb26bcd3ea9ac5a07c402f1138c5dff7224a6e9ebf770886", "avgDurationSecs": 5.611, "validDurationSecs": 35831.612, "totalHrs": 10.11, "validHrs": 9.95 }, "trw": { "buckets": { "dev": 2083, "test": 1956, "train": 2859, "validated": 11054, "invalidated": 1372, "other": 14 }, "duration": 67715892, "reportedSentences": 578, "validatedSentences": 7770, "unvalidatedSentences": 27, "clips": 12440, "splits": { "accent": {}, "age": { "": 0.05, "twenties": 0.34, "thirties": 0.11, "teens": 0.04, "fourties": 0.36, "fifties": 0.09, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 12245, "agriculture_food": 57, "automotive_transport": 2, "finance": 2, "service_retail": 57, "general": 55, "healthcare": 49, "history_law_government": 49, "language_fundamentals": 17, "media_entertainment": 1, "nature_environment": 63, "news_current_affairs": 67, "technology_robotics": 0 } }, "users": 27, "size": 397034706, "checksum": "06ea0c07f054817a3141d1b0e0d95da505b85062fde465f202bef6fc80e79eaf", "avgDurationSecs": 5.443, "validDurationSecs": 60171.34, "totalHrs": 18.8, "validHrs": 16.71 }, "ts": { "buckets": { "dev": 0, "test": 0, "train": 0, "validated": 0, "invalidated": 1, "other": 0 }, "duration": 8928, "reportedSentences": 0, "validatedSentences": 352, "unvalidatedSentences": 16012, "clips": 1, "splits": { "accent": {}, "age": { "": 1, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 1, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 1, "size": 1040823, "checksum": "3abc4849fb791ef192ec46d21cc07b8cfb15791e2ffa3a0425a174e5193deaa0", "avgDurationSecs": 8.928, "validDurationSecs": 0, "totalHrs": 0, "validHrs": 0 }, "tt": { "buckets": { "dev": 4402, "test": 5062, "train": 8522, "validated": 30199, "invalidated": 539, "other": 262 }, "duration": 118759526, "reportedSentences": 6, "validatedSentences": 18051, "unvalidatedSentences": 32, "clips": 31000, "splits": { "accent": {}, "age": { "": 0.21, "twenties": 0.05, "thirties": 0.71, "teens": 0.01, "fourties": 0, "fifties": 0.01, "sixties": 0.01, "seventies": 0.01, "eighties": 0, "nineties": 0 }, "gender": { "": 0.21, "male_masculine": 0.76, "female_feminine": 0.03, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 30988, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 12, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 288, "size": 865339305, "checksum": "dfa2a8760b49bb5120b78a9514f1055d6c358d5594c6f1c55ca15e37564438f6", "avgDurationSecs": 3.831, "validDurationSecs": 115690.933, "totalHrs": 32.98, "validHrs": 32.13 }, "tui": { "buckets": { "dev": 602, "test": 644, "train": 722, "validated": 7570, "invalidated": 129, "other": 904 }, "duration": 42402492, "reportedSentences": 6, "validatedSentences": 1971, "unvalidatedSentences": 5, "clips": 8603, "splits": { "accent": {}, "age": { "": 0.23, "twenties": 0.21, "thirties": 0.51, "teens": 0, "fourties": 0.04, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.93, "male_masculine": 0.01, "female_feminine": 0.06, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 8603, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 50, "size": 248346597, "checksum": "904887b509115378a44bc51046b1638985aeec56f1fd80cda980e84393bffb94", "avgDurationSecs": 4.929, "validDurationSecs": 37311.039, "totalHrs": 11.77, "validHrs": 10.36 }, "tvu": { "buckets": { "dev": 495, "test": 438, "train": 725, "validated": 5247, "invalidated": 122, "other": 65 }, "duration": 38085048, "reportedSentences": 24, "validatedSentences": 1943, "unvalidatedSentences": 347, "clips": 5434, "splits": { "accent": {}, "age": { "": 0.8, "twenties": 0, "thirties": 0.2, "teens": 0, "fourties": 0.01, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.81, "male_masculine": 0, "female_feminine": 0.19, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 5434, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 13, "size": 204873124, "checksum": "2dcd5291c53124cc7d603d5cce483bd9dc8d286831ee284f0b0d25f03148c635", "avgDurationSecs": 7.009, "validDurationSecs": 36774.429, "totalHrs": 10.57, "validHrs": 10.21 }, "tw": { "buckets": { "dev": 0, "test": 27, "train": 213, "validated": 240, "invalidated": 5, "other": 96 }, "duration": 1495440, "reportedSentences": 3, "validatedSentences": 49159, "unvalidatedSentences": 22, "clips": 341, "splits": { "accent": {}, "age": { "": 0.27, "twenties": 0.09, "thirties": 0.65, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.35, "male_masculine": 0.65, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 341, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 19, "size": 11552065, "checksum": "90fe28ee202d593067b5a04a0b25c991f892089f1448f2ae4a707f74e1e54e96", "avgDurationSecs": 4.385, "validDurationSecs": 1052.509, "totalHrs": 0.41, "validHrs": 0.29 }, "udl": { "buckets": { "dev": 285, "test": 329, "train": 396, "validated": 6400, "invalidated": 112, "other": 32 }, "duration": 38688012, "reportedSentences": 1, "validatedSentences": 1011, "unvalidatedSentences": -1, "clips": 6544, "splits": { "accent": {}, "age": { "": 0.85, "twenties": 0.15, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 6544, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 20, "size": 227536919, "checksum": "64b6b0594df78415759d30d41bd45cebc484383ffbe453b0e36f0c41f2fc27c0", "avgDurationSecs": 5.912, "validDurationSecs": 37836.687, "totalHrs": 10.74, "validHrs": 10.51 }, "ug": { "buckets": { "dev": 14656, "test": 14656, "train": 122911, "validated": 269390, "invalidated": 21500, "other": 14191 }, "duration": 1820354616, "reportedSentences": 1539, "validatedSentences": 231426, "unvalidatedSentences": 11032, "clips": 305081, "splits": { "accent": {}, "age": { "": 0.21, "twenties": 0.34, "thirties": 0.27, "teens": 0.06, "fourties": 0.1, "fifties": 0.01, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.53, "male_masculine": 0.26, "female_feminine": 0.2, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0.01, "intersex": 0 }, "sentence_domain": { "": 302526, "agriculture_food": 2, "automotive_transport": 2, "finance": 1, "service_retail": 1, "general": 2522, "healthcare": 27, "history_law_government": 3, "language_fundamentals": 10, "media_entertainment": 15, "nature_environment": 1, "news_current_affairs": 0, "technology_robotics": 10 } }, "users": 1836, "size": 10384973335, "checksum": "7b709a2dc3e624791eebc0f4202e8b59bd5a50b3cd051c1d65e0b697b54f98d6", "avgDurationSecs": 5.967, "validDurationSecs": 1607393.872, "totalHrs": 505.65, "validHrs": 446.49 }, "uk": { "buckets": { "dev": 10297, "test": 10295, "train": 27058, "validated": 77993, "invalidated": 3340, "other": 8811 }, "duration": 418806240, "reportedSentences": 660, "validatedSentences": 212668, "unvalidatedSentences": 1625, "clips": 90144, "splits": { "accent": {}, "age": { "": 0.23, "twenties": 0.33, "thirties": 0.25, "teens": 0.09, "fourties": 0.09, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.24, "male_masculine": 0.58, "female_feminine": 0.17, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 90144, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 1164, "size": 2748721118, "checksum": "5fe1c9be7116d14cf6928f326b25f4910875fcc770500e1315137c9ac52931e5", "avgDurationSecs": 4.646, "validDurationSecs": 362353.069, "totalHrs": 116.33, "validHrs": 100.65 }, "ur": { "buckets": { "dev": 5089, "test": 5091, "train": 7339, "validated": 68229, "invalidated": 11008, "other": 173662 }, "duration": 1087276644, "reportedSentences": 411, "validatedSentences": 21705, "unvalidatedSentences": 48258, "clips": 252899, "splits": { "accent": {}, "age": { "": 0.06, "twenties": 0.92, "thirties": 0, "teens": 0, "fourties": 0.01, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.23, "male_masculine": 0.52, "female_feminine": 0.25, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 252792, "agriculture_food": 12, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 48, "healthcare": 47, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 498, "size": 6347527720, "checksum": "391a79277ca6855ef6da612366584cf47a8dfb5b4eeed1f5902f496413faee64", "avgDurationSecs": 4.299, "validDurationSecs": 293333.695, "totalHrs": 302.02, "validHrs": 81.48 }, "ush": { "buckets": { "dev": 195, "test": 357, "train": 586, "validated": 3861, "invalidated": 82, "other": 18 }, "duration": 24351012, "reportedSentences": 0, "validatedSentences": 1170, "unvalidatedSentences": -1, "clips": 3961, "splits": { "accent": {}, "age": { "": 0.15, "twenties": 0.23, "thirties": 0.01, "teens": 0.02, "fourties": 0.6, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 3958, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 3, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 23, "size": 135793370, "checksum": "f41fd2137282ea84e7fc35a6775016b710a2d9a37110128993660817f50dad77", "avgDurationSecs": 6.148, "validDurationSecs": 23736.243, "totalHrs": 6.76, "validHrs": 6.59 }, "uz": { "buckets": { "dev": 12264, "test": 12388, "train": 48762, "validated": 87181, "invalidated": 14141, "other": 128515 }, "duration": 955631808, "reportedSentences": 1833, "validatedSentences": 148734, "unvalidatedSentences": 137880, "clips": 229837, "splits": { "accent": {}, "age": { "": 0.41, "twenties": 0.4, "thirties": 0.01, "teens": 0.18, "fourties": 0.01, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.41, "male_masculine": 0.44, "female_feminine": 0.15, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 229837, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 2281, "size": 5363124452, "checksum": "71593db33b13a634292eb7e2a3b471373c5ce2682a163994140460e32933d9be", "avgDurationSecs": 4.158, "validDurationSecs": 362487.052, "totalHrs": 265.45, "validHrs": 100.69 }, "var": { "buckets": { "dev": 546, "test": 611, "train": 752, "validated": 6851, "invalidated": 291, "other": 864 }, "duration": 42487380, "reportedSentences": 246, "validatedSentences": 1977, "unvalidatedSentences": -1, "clips": 8006, "splits": { "accent": {}, "age": { "": 0, "twenties": 0.29, "thirties": 0.57, "teens": 0.14, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.06, "male_masculine": 0, "female_feminine": 0.94, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 8006, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 12, "size": 247635388, "checksum": "ba7c24ada264068bafc39298c431215a1f52d8b01d516b7d8d211bcd190d8409", "avgDurationSecs": 5.307, "validDurationSecs": 36357.862, "totalHrs": 11.8, "validHrs": 10.09 }, "ve": { "buckets": { "dev": 0, "test": 0, "train": 0, "validated": 0, "invalidated": 0, "other": 20 }, "duration": 113076, "reportedSentences": 0, "validatedSentences": 1735, "unvalidatedSentences": 7843, "clips": 20, "splits": { "accent": {}, "age": { "": 0.25, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0.75, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.25, "male_masculine": 0, "female_feminine": 0.75, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 20, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 2, "size": 1206489, "checksum": "f8a215f053ce4f46dd6e73e56aa7dd2339d5c13770903ed6a0c3a035672937ef", "avgDurationSecs": 5.654, "validDurationSecs": 0, "totalHrs": 0.03, "validHrs": 0 }, "vi": { "buckets": { "dev": 1094, "test": 1383, "train": 2009, "validated": 6036, "invalidated": 457, "other": 12721 }, "duration": 76849892, "reportedSentences": 201, "validatedSentences": 8159, "unvalidatedSentences": 5398, "clips": 19214, "splits": { "accent": {}, "age": { "": 0.25, "twenties": 0.2, "thirties": 0.05, "teens": 0.2, "fourties": 0.02, "fifties": 0, "sixties": 0.26, "seventies": 0.02, "eighties": 0, "nineties": 0 }, "gender": { "": 0.3, "male_masculine": 0.49, "female_feminine": 0.21, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 18475, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 739, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 370, "size": 447769009, "checksum": "93520f4e269fda549cd22d716085a76b5096554d43836d70c7798e218ac9b208", "avgDurationSecs": 4, "validDurationSecs": 24142.081, "totalHrs": 21.34, "validHrs": 6.7 }, "vot": { "buckets": { "dev": 0, "test": 7, "train": 96, "validated": 103, "invalidated": 324, "other": 0 }, "duration": 1029972, "reportedSentences": 0, "validatedSentences": 5437, "unvalidatedSentences": 1, "clips": 427, "splits": { "accent": {}, "age": { "": 0.25, "twenties": 0.74, "thirties": 0, "teens": 0.01, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.25, "male_masculine": 0.75, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 427, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 6, "size": 8186608, "checksum": "cd4765febc933489d5ffd3c43c4bd0815a0e1f42aa1141824645fd2434bf8eeb", "avgDurationSecs": 2.412, "validDurationSecs": 248.448, "totalHrs": 0.28, "validHrs": 0.06 }, "wbl": { "buckets": { "dev": 1110, "test": 1128, "train": 2542, "validated": 6464, "invalidated": 89, "other": 1639 }, "duration": 55320552, "reportedSentences": 1, "validatedSentences": 5493, "unvalidatedSentences": 114, "clips": 8192, "splits": { "accent": {}, "age": { "": 0.21, "twenties": 0, "thirties": 0.01, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0.12, "seventies": 0.65, "eighties": 0, "nineties": 0 }, "gender": { "": 0.88, "male_masculine": 0.12, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 8189, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 3, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 14, "size": 320971415, "checksum": "4b3d8ccd1a9477f1e2c037386cdacd855e3186fe48a19242eac174d8bfc5c05b", "avgDurationSecs": 6.753, "validDurationSecs": 43651.373, "totalHrs": 15.36, "validHrs": 12.12 }, "wes": { "buckets": { "dev": 324, "test": 323, "train": 351, "validated": 9003, "invalidated": 51, "other": 363 }, "duration": 38779632, "reportedSentences": 0, "validatedSentences": 999, "unvalidatedSentences": -1, "clips": 9417, "splits": { "accent": {}, "age": { "": 0.94, "twenties": 0.01, "thirties": 0, "teens": 0, "fourties": 0.06, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.94, "male_masculine": 0, "female_feminine": 0.06, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 9417, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 18, "size": 209712696, "checksum": "8955146c6bd3521a103b24e1c4542c937bfdac93dab69c21037d993d0d6bf83e", "avgDurationSecs": 4.118, "validDurationSecs": 37074.761, "totalHrs": 10.77, "validHrs": 10.29 }, "xh": { "buckets": { "dev": 0, "test": 2, "train": 7, "validated": 9, "invalidated": 2, "other": 19 }, "duration": 179712, "reportedSentences": 0, "validatedSentences": 1476, "unvalidatedSentences": 14922, "clips": 30, "splits": { "accent": {}, "age": { "": 1, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 30, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 4, "size": 2197868, "checksum": "084813607f5d5a858df95a199a9930074f238efc2891d7f0c28a80dbc91f30b7", "avgDurationSecs": 5.99, "validDurationSecs": 53.914, "totalHrs": 0.04, "validHrs": 0.01 }, "xhe": { "buckets": { "dev": 0, "test": 1443, "train": 3542, "validated": 11429, "invalidated": 160, "other": 14 }, "duration": 37269792, "reportedSentences": 1, "validatedSentences": 5040, "unvalidatedSentences": 2, "clips": 11603, "splits": { "accent": {}, "age": { "": 0.15, "twenties": 0.85, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 11603, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 11, "size": 217956696, "checksum": "801266f1540c987cfa379241f4c76a1da6f558f14ded2becd2f9ea405bdf6565", "avgDurationSecs": 3.212, "validDurationSecs": 36710.89, "totalHrs": 10.35, "validHrs": 10.19 }, "xka": { "buckets": { "dev": 0, "test": 399, "train": 1571, "validated": 11163, "invalidated": 66, "other": 583 }, "duration": 38274120, "reportedSentences": 4, "validatedSentences": 1980, "unvalidatedSentences": 46, "clips": 11853, "splits": { "accent": {}, "age": { "": 0.01, "twenties": 0.74, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0.25, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 11827, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 26, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 9, "size": 203456160, "checksum": "9b23e454211b544e89586a5b5ba1bdbf3bf8f9e79593e48e7e63fec6bfbc0442", "avgDurationSecs": 3.229, "validDurationSecs": 36046.064, "totalHrs": 10.63, "validHrs": 10.01 }, "xmf": { "buckets": { "dev": 327, "test": 327, "train": 334, "validated": 6753, "invalidated": 587, "other": 31 }, "duration": 45608148, "reportedSentences": 20, "validatedSentences": 1004, "unvalidatedSentences": 35, "clips": 7371, "splits": { "accent": {}, "age": { "": 0.23, "twenties": 0.32, "thirties": 0.3, "teens": 0.02, "fourties": 0.13, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.45, "male_masculine": 0.05, "female_feminine": 0.49, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7333, "agriculture_food": 9, "automotive_transport": 19, "finance": 0, "service_retail": 0, "general": 19, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 87, "size": 267430804, "checksum": "95f40af15d55c3cf065fae9257bb2e076a4517e9af57f10e84e9657d6c45df33", "avgDurationSecs": 6.188, "validDurationSecs": 41784.266, "totalHrs": 12.66, "validHrs": 11.6 }, "yaq": { "buckets": { "dev": 131, "test": 800, "train": 1897, "validated": 6925, "invalidated": 1, "other": 845 }, "duration": 41273208, "reportedSentences": 0, "validatedSentences": 2838, "unvalidatedSentences": -1, "clips": 7771, "splits": { "accent": {}, "age": { "": 0, "twenties": 0.36, "thirties": 0.27, "teens": 0, "fourties": 0.36, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.36, "male_masculine": 0, "female_feminine": 0.64, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 7771, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 5, "size": 243158559, "checksum": "579c5858fe2779f7659bf56c6772b8d95bdafe8995ec69e2846fc1f485df2ca1", "avgDurationSecs": 5.311, "validDurationSecs": 36779.947, "totalHrs": 11.46, "validHrs": 10.21 }, "yav": { "buckets": { "dev": 274, "test": 316, "train": 423, "validated": 4679, "invalidated": 413, "other": 506 }, "duration": 47985372, "reportedSentences": 0, "validatedSentences": 1013, "unvalidatedSentences": -1, "clips": 5598, "splits": { "accent": {}, "age": { "": 0.89, "twenties": 0, "thirties": 0, "teens": 0, "fourties": 0.11, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.89, "male_masculine": 0, "female_feminine": 0.11, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 5598, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 10, "size": 279281015, "checksum": "7a07ce50e5b8a9d33b5d4780d29f851d56199f22ba69c315281de787d82d2343", "avgDurationSecs": 8.572, "validDurationSecs": 40107.816, "totalHrs": 13.32, "validHrs": 11.14 }, "ydg": { "buckets": { "dev": 0, "test": 321, "train": 1474, "validated": 10556, "invalidated": 10, "other": 636 }, "duration": 40096152, "reportedSentences": 0, "validatedSentences": 1882, "unvalidatedSentences": 109, "clips": 11202, "splits": { "accent": {}, "age": { "": 0.88, "twenties": 0, "thirties": 0.12, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 11202, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 15, "size": 233778099, "checksum": "733fdddd0a1f594c3606862c30560225c4e33ac33664ce0ebd468b45e4383766", "avgDurationSecs": 3.579, "validDurationSecs": 37783.876, "totalHrs": 11.13, "validHrs": 10.49 }, "yi": { "buckets": { "dev": 440, "test": 456, "train": 488, "validated": 1826, "invalidated": 86, "other": 87 }, "duration": 7946640, "reportedSentences": 17, "validatedSentences": 1550, "unvalidatedSentences": 84, "clips": 1999, "splits": { "accent": {}, "age": { "": 0.77, "twenties": 0.06, "thirties": 0.06, "teens": 0.11, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 1, "male_masculine": 0, "female_feminine": 0, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 1981, "agriculture_food": 0, "automotive_transport": 0, "finance": 2, "service_retail": 0, "general": 13, "healthcare": 0, "history_law_government": 1, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 3, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 124, "size": 44764597, "checksum": "4674aa3e92e5b8e5620004b5c473d8cd4245aa973a642abf781899e88179b458", "avgDurationSecs": 3.975, "validDurationSecs": 7258.912, "totalHrs": 2.2, "validHrs": 2.01 }, "yo": { "buckets": { "dev": 915, "test": 1122, "train": 1412, "validated": 3451, "invalidated": 261, "other": 1140 }, "duration": 29313072, "reportedSentences": 21, "validatedSentences": 5419, "unvalidatedSentences": 17, "clips": 4852, "splits": { "accent": {}, "age": { "": 0.29, "twenties": 0.61, "thirties": 0.03, "teens": 0.04, "fourties": 0, "fifties": 0.02, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.33, "male_masculine": 0.3, "female_feminine": 0.37, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 4852, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 132, "size": 170839274, "checksum": "6afad07dac589bd86a1794c2d918c6d3da232590bc79c4d19085abbf836cf368", "avgDurationSecs": 6.041, "validDurationSecs": 20849.013, "totalHrs": 8.14, "validHrs": 5.79 }, "yue": { "buckets": { "dev": 5130, "test": 5130, "train": 7420, "validated": 191396, "invalidated": 8103, "other": 79741 }, "duration": 1107782964, "reportedSentences": 2257, "validatedSentences": 18556, "unvalidatedSentences": 10171, "clips": 279240, "splits": { "accent": {}, "age": { "": 0.19, "twenties": 0.29, "thirties": 0.47, "teens": 0.01, "fourties": 0.04, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.2, "male_masculine": 0.17, "female_feminine": 0.62, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 276394, "agriculture_food": 18, "automotive_transport": 51, "finance": 128, "service_retail": 606, "general": 1678, "healthcare": 417, "history_law_government": 67, "language_fundamentals": 0, "media_entertainment": 192, "nature_environment": 188, "news_current_affairs": 114, "technology_robotics": 95 } }, "users": 1174, "size": 6420496257, "checksum": "755100899533b01d42d1ca5d4a607afa72c519fab5fae7b0750de62d82db1893", "avgDurationSecs": 3.967, "validDurationSecs": 759293.898, "totalHrs": 307.71, "validHrs": 210.91 }, "zgh": { "buckets": { "dev": 302, "test": 233, "train": 871, "validated": 1406, "invalidated": 91, "other": 672 }, "duration": 7560684, "reportedSentences": 6, "validatedSentences": 2738, "unvalidatedSentences": 355, "clips": 2169, "splits": { "accent": {}, "age": { "": 0.1, "twenties": 0.38, "thirties": 0.52, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.15, "male_masculine": 0.82, "female_feminine": 0.03, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 2126, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 34, "healthcare": 3, "history_law_government": 0, "language_fundamentals": 5, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 1 } }, "users": 38, "size": 41386121, "checksum": "679955e7c53e8c0ce7b890df2f5a7e914bd0abeea91edeb8ca1199ee790aeaca", "avgDurationSecs": 3.486, "validDurationSecs": 4901.024, "totalHrs": 2.1, "validHrs": 1.36 }, "zh-CN": { "buckets": { "dev": 10647, "test": 10647, "train": 29560, "validated": 189406, "invalidated": 59164, "other": 602833 }, "duration": 3865791552, "reportedSentences": 1145, "validatedSentences": 59126, "unvalidatedSentences": 909, "clips": 851403, "splits": { "accent": {}, "age": { "": 0.92, "twenties": 0.05, "thirties": 0.01, "teens": 0.01, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.93, "male_masculine": 0.06, "female_feminine": 0.01, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 848200, "agriculture_food": 51, "automotive_transport": 71, "finance": 101, "service_retail": 58, "general": 829, "healthcare": 132, "history_law_government": 369, "language_fundamentals": 86, "media_entertainment": 1591, "nature_environment": 53, "news_current_affairs": 178, "technology_robotics": 236 } }, "users": 7525, "size": 22886754844, "checksum": "858c5ab1dc55d7a8e9802e5fa896683f17be84ca25edbeb79b9abd25a99b2a91", "avgDurationSecs": 4.54, "validDurationSecs": 859997.104, "totalHrs": 1073.83, "validHrs": 238.88 }, "zh-HK": { "buckets": { "dev": 5604, "test": 5604, "train": 8450, "validated": 94010, "invalidated": 4632, "other": 25129 }, "duration": 513685212, "reportedSentences": 824, "validatedSentences": 20146, "unvalidatedSentences": 29, "clips": 123771, "splits": { "accent": {}, "age": { "": 0.38, "twenties": 0.33, "thirties": 0.11, "teens": 0.02, "fourties": 0.12, "fifties": 0.03, "sixties": 0.01, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.37, "male_masculine": 0.4, "female_feminine": 0.22, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 122401, "agriculture_food": 0, "automotive_transport": 29, "finance": 44, "service_retail": 295, "general": 925, "healthcare": 90, "history_law_government": 72, "language_fundamentals": 85, "media_entertainment": 53, "nature_environment": 54, "news_current_affairs": 24, "technology_robotics": 45 } }, "users": 3108, "size": 3653748292, "checksum": "213c03ce1bd553168a1f964b5be8a5cab3dc626a68fb1a569fa4ee955ed812c0", "avgDurationSecs": 4.15, "validDurationSecs": 390168.511, "totalHrs": 142.69, "validHrs": 108.38 }, "zh-TW": { "buckets": { "dev": 5107, "test": 5107, "train": 7369, "validated": 84883, "invalidated": 4905, "other": 50436 }, "duration": 471662698, "reportedSentences": 179, "validatedSentences": 20751, "unvalidatedSentences": 849, "clips": 140224, "splits": { "accent": {}, "age": { "": 0.27, "twenties": 0.3, "thirties": 0.19, "teens": 0.06, "fourties": 0.09, "fifties": 0.09, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.29, "male_masculine": 0.49, "female_feminine": 0.22, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 138740, "agriculture_food": 12, "automotive_transport": 274, "finance": 1, "service_retail": 150, "general": 1103, "healthcare": 22, "history_law_government": 167, "language_fundamentals": 8, "media_entertainment": 167, "nature_environment": 12, "news_current_affairs": 43, "technology_robotics": 543 } }, "users": 2304, "size": 3146644633, "checksum": "478f55259cf02eed454ef9bba979e879d008c7b98c4aaa4d57c16f8371ff6af3", "avgDurationSecs": 3.364, "validDurationSecs": 285515.638, "totalHrs": 131.01, "validHrs": 79.3 }, "zoc": { "buckets": { "dev": 483, "test": 474, "train": 524, "validated": 8886, "invalidated": 2, "other": 60 }, "duration": 36533628, "reportedSentences": 0, "validatedSentences": 1481, "unvalidatedSentences": 7, "clips": 8948, "splits": { "accent": {}, "age": { "": 0.09, "twenties": 0.38, "thirties": 0.22, "teens": 0, "fourties": 0.31, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.56, "male_masculine": 0, "female_feminine": 0.44, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 8948, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 12, "size": 213960228, "checksum": "54186fba91b69e7c71ba70046387d4d385eea9e7e2ab21eeeac8157684de13e3", "avgDurationSecs": 4.083, "validDurationSecs": 36280.489, "totalHrs": 10.14, "validHrs": 10.07 }, "zu": { "buckets": { "dev": 0, "test": 1, "train": 15, "validated": 16, "invalidated": 12, "other": 175 }, "duration": 1123272, "reportedSentences": 4, "validatedSentences": 1320, "unvalidatedSentences": 19379, "clips": 203, "splits": { "accent": {}, "age": { "": 0.49, "twenties": 0.51, "thirties": 0, "teens": 0, "fourties": 0, "fifties": 0, "sixties": 0, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.49, "male_masculine": 0, "female_feminine": 0.17, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0.34 }, "sentence_domain": { "": 203, "agriculture_food": 0, "automotive_transport": 0, "finance": 0, "service_retail": 0, "general": 0, "healthcare": 0, "history_law_government": 0, "language_fundamentals": 0, "media_entertainment": 0, "nature_environment": 0, "news_current_affairs": 0, "technology_robotics": 0 } }, "users": 8, "size": 7938516, "checksum": "dff28383d0ba714cb7e49d597f2c21579e5e14c0aa8e06534b57a77a08ed690e", "avgDurationSecs": 5.533, "validDurationSecs": 88.534, "totalHrs": 0.31, "validHrs": 0.02 }, "zza": { "buckets": { "dev": 463, "test": 424, "train": 790, "validated": 1677, "invalidated": 245, "other": 298 }, "duration": 9090864, "reportedSentences": 2338, "validatedSentences": 5655, "unvalidatedSentences": 974, "clips": 2220, "splits": { "accent": {}, "age": { "": 0.22, "twenties": 0, "thirties": 0.65, "teens": 0, "fourties": 0, "fifties": 0.01, "sixties": 0.12, "seventies": 0, "eighties": 0, "nineties": 0 }, "gender": { "": 0.7, "male_masculine": 0.28, "female_feminine": 0.02, "transgender": 0, "non-binary": 0, "do_not_wish_to_say": 0 }, "sentence_domain": { "": 1481, "agriculture_food": 3, "automotive_transport": 1, "finance": 1, "service_retail": 9, "general": 675, "healthcare": 16, "history_law_government": 0, "language_fundamentals": 27, "media_entertainment": 2, "nature_environment": 4, "news_current_affairs": 0, "technology_robotics": 2 } }, "users": 20, "size": 53259616, "checksum": "d4d2407866c14b3fdab77c42fde3557e4f20c45e2a53c0323f7bc5380950263b", "avgDurationSecs": 4.095, "validDurationSecs": 6867.288, "totalHrs": 2.52, "validHrs": 1.9 } }, "totalDuration": 140161062895, "totalValidDurationSecs": 93193530, "totalHrs": 38932, "totalValidHrs": 25886 }