From 7799fc7a9f16972e0d9e7a164f8d5084714c1609 Mon Sep 17 00:00:00 2001 From: Aidan Pine Date: Fri, 22 Nov 2024 10:27:30 -0800 Subject: [PATCH] add sts --- add_new_language.py | 2 +- locales/all.json | 3 +- locales/contributable.json | 3 +- locales/native-names.json | 1 + locales/translated.json | 1 + web/locales/aaa/messages.ftl | 1 + web/locales/aab/messages.ftl | 1 + web/locales/aac/messages.ftl | 1 + web/locales/aae/messages.ftl | 1 + web/locales/aam/messages.ftl | 1 + web/locales/aan/messages.ftl | 1 + web/locales/crk/messages.ftl | 1 + web/locales/crl/messages.ftl | 1 + web/locales/en/messages.ftl | 1 + web/locales/git/messages.ftl | 1 + web/locales/mok/messages.ftl | 1 + web/locales/moo/messages.ftl | 1 + web/locales/ore/messages.ftl | 1 + web/locales/orm/messages.ftl | 1 + web/locales/str/messages.ftl | 1 + web/locales/sts/cross-locale.ftl | 18 + web/locales/sts/messages.ftl | 1441 ++++++++++++++++++++++++++++++ 22 files changed, 1481 insertions(+), 3 deletions(-) create mode 100644 web/locales/sts/cross-locale.ftl create mode 100644 web/locales/sts/messages.ftl diff --git a/add_new_language.py b/add_new_language.py index 1004a4499..627219a82 100644 --- a/add_new_language.py +++ b/add_new_language.py @@ -2,7 +2,7 @@ def main(): # insert your ISO code and dropdown description - lang_info = {"ISO":"aam", "description":"Kanien'kéha Medium Speed"} + lang_info = {"ISO":"sts", "description":"SENĆOŦEN Special Words and Paragraphs"} # Visit https://github.com/EveryVoiceTTS/common-voice and make sure you are on branch dev/ilt; # Add str to locales/all.json in order to get that new language to show up in the UI's top-right dropdown box; diff --git a/locales/all.json b/locales/all.json index 565ab54f1..579953174 100644 --- a/locales/all.json +++ b/locales/all.json @@ -11,5 +11,6 @@ "moo", "ore", "orm", - "str" + "str", + "sts" ] \ No newline at end of file diff --git a/locales/contributable.json b/locales/contributable.json index 565ab54f1..579953174 100644 --- a/locales/contributable.json +++ b/locales/contributable.json @@ -11,5 +11,6 @@ "moo", "ore", "orm", - "str" + "str", + "sts" ] \ No newline at end of file diff --git a/locales/native-names.json b/locales/native-names.json index d415e4cca..a1b5d65bc 100644 --- a/locales/native-names.json +++ b/locales/native-names.json @@ -126,6 +126,7 @@ "sq": "Shqip", "sr": "Српски", "str": "SENĆOŦEN", + "sts": "SENĆOŦEN Special Words and Paragraphs", "sv-SE": "Svenska", "sw": "Kiswahili", "syr": "ܣܘܼܪܝܝܐ", diff --git a/locales/translated.json b/locales/translated.json index 348247d16..7178c6922 100644 --- a/locales/translated.json +++ b/locales/translated.json @@ -106,6 +106,7 @@ "sq", "sr", "str", + "sts", "sv-SE", "sw", "ta", diff --git a/web/locales/aaa/messages.ftl b/web/locales/aaa/messages.ftl index 31cb44a2e..059809030 100644 --- a/web/locales/aaa/messages.ftl +++ b/web/locales/aaa/messages.ftl @@ -17,6 +17,7 @@ not-available-abbreviation = N/A # Don't rename the following section, its contents are auto-inserted based on the name (see scripts/pontoon-languages-to-ftl.js) # [Languages] ## Languages +sts = SENĆOŦEN Special Words and Paragraphs aam = Kanien'kéha Medium Speed orm = Ohsweken Medium Speed crl = nêhiyawêwin short diff --git a/web/locales/aab/messages.ftl b/web/locales/aab/messages.ftl index 31cb44a2e..059809030 100644 --- a/web/locales/aab/messages.ftl +++ b/web/locales/aab/messages.ftl @@ -17,6 +17,7 @@ not-available-abbreviation = N/A # Don't rename the following section, its contents are auto-inserted based on the name (see scripts/pontoon-languages-to-ftl.js) # [Languages] ## Languages +sts = SENĆOŦEN Special Words and Paragraphs aam = Kanien'kéha Medium Speed orm = Ohsweken Medium Speed crl = nêhiyawêwin short diff --git a/web/locales/aac/messages.ftl b/web/locales/aac/messages.ftl index 31cb44a2e..059809030 100644 --- a/web/locales/aac/messages.ftl +++ b/web/locales/aac/messages.ftl @@ -17,6 +17,7 @@ not-available-abbreviation = N/A # Don't rename the following section, its contents are auto-inserted based on the name (see scripts/pontoon-languages-to-ftl.js) # [Languages] ## Languages +sts = SENĆOŦEN Special Words and Paragraphs aam = Kanien'kéha Medium Speed orm = Ohsweken Medium Speed crl = nêhiyawêwin short diff --git a/web/locales/aae/messages.ftl b/web/locales/aae/messages.ftl index 31cb44a2e..059809030 100644 --- a/web/locales/aae/messages.ftl +++ b/web/locales/aae/messages.ftl @@ -17,6 +17,7 @@ not-available-abbreviation = N/A # Don't rename the following section, its contents are auto-inserted based on the name (see scripts/pontoon-languages-to-ftl.js) # [Languages] ## Languages +sts = SENĆOŦEN Special Words and Paragraphs aam = Kanien'kéha Medium Speed orm = Ohsweken Medium Speed crl = nêhiyawêwin short diff --git a/web/locales/aam/messages.ftl b/web/locales/aam/messages.ftl index 31cb44a2e..059809030 100644 --- a/web/locales/aam/messages.ftl +++ b/web/locales/aam/messages.ftl @@ -17,6 +17,7 @@ not-available-abbreviation = N/A # Don't rename the following section, its contents are auto-inserted based on the name (see scripts/pontoon-languages-to-ftl.js) # [Languages] ## Languages +sts = SENĆOŦEN Special Words and Paragraphs aam = Kanien'kéha Medium Speed orm = Ohsweken Medium Speed crl = nêhiyawêwin short diff --git a/web/locales/aan/messages.ftl b/web/locales/aan/messages.ftl index 31cb44a2e..059809030 100644 --- a/web/locales/aan/messages.ftl +++ b/web/locales/aan/messages.ftl @@ -17,6 +17,7 @@ not-available-abbreviation = N/A # Don't rename the following section, its contents are auto-inserted based on the name (see scripts/pontoon-languages-to-ftl.js) # [Languages] ## Languages +sts = SENĆOŦEN Special Words and Paragraphs aam = Kanien'kéha Medium Speed orm = Ohsweken Medium Speed crl = nêhiyawêwin short diff --git a/web/locales/crk/messages.ftl b/web/locales/crk/messages.ftl index a231d5aba..f02d11a20 100644 --- a/web/locales/crk/messages.ftl +++ b/web/locales/crk/messages.ftl @@ -17,6 +17,7 @@ not-available-abbreviation = N/A # Don't rename the following section, its contents are auto-inserted based on the name (see scripts/pontoon-languages-to-ftl.js) # [Languages] ## Languages +sts = SENĆOŦEN Special Words and Paragraphs aam = Kanien'kéha Medium Speed orm = Ohsweken Medium Speed crl = nêhiyawêwin short diff --git a/web/locales/crl/messages.ftl b/web/locales/crl/messages.ftl index 31cb44a2e..059809030 100644 --- a/web/locales/crl/messages.ftl +++ b/web/locales/crl/messages.ftl @@ -17,6 +17,7 @@ not-available-abbreviation = N/A # Don't rename the following section, its contents are auto-inserted based on the name (see scripts/pontoon-languages-to-ftl.js) # [Languages] ## Languages +sts = SENĆOŦEN Special Words and Paragraphs aam = Kanien'kéha Medium Speed orm = Ohsweken Medium Speed crl = nêhiyawêwin short diff --git a/web/locales/en/messages.ftl b/web/locales/en/messages.ftl index 31cb44a2e..059809030 100644 --- a/web/locales/en/messages.ftl +++ b/web/locales/en/messages.ftl @@ -17,6 +17,7 @@ not-available-abbreviation = N/A # Don't rename the following section, its contents are auto-inserted based on the name (see scripts/pontoon-languages-to-ftl.js) # [Languages] ## Languages +sts = SENĆOŦEN Special Words and Paragraphs aam = Kanien'kéha Medium Speed orm = Ohsweken Medium Speed crl = nêhiyawêwin short diff --git a/web/locales/git/messages.ftl b/web/locales/git/messages.ftl index 31cb44a2e..059809030 100644 --- a/web/locales/git/messages.ftl +++ b/web/locales/git/messages.ftl @@ -17,6 +17,7 @@ not-available-abbreviation = N/A # Don't rename the following section, its contents are auto-inserted based on the name (see scripts/pontoon-languages-to-ftl.js) # [Languages] ## Languages +sts = SENĆOŦEN Special Words and Paragraphs aam = Kanien'kéha Medium Speed orm = Ohsweken Medium Speed crl = nêhiyawêwin short diff --git a/web/locales/mok/messages.ftl b/web/locales/mok/messages.ftl index 31cb44a2e..059809030 100644 --- a/web/locales/mok/messages.ftl +++ b/web/locales/mok/messages.ftl @@ -17,6 +17,7 @@ not-available-abbreviation = N/A # Don't rename the following section, its contents are auto-inserted based on the name (see scripts/pontoon-languages-to-ftl.js) # [Languages] ## Languages +sts = SENĆOŦEN Special Words and Paragraphs aam = Kanien'kéha Medium Speed orm = Ohsweken Medium Speed crl = nêhiyawêwin short diff --git a/web/locales/moo/messages.ftl b/web/locales/moo/messages.ftl index 31cb44a2e..059809030 100644 --- a/web/locales/moo/messages.ftl +++ b/web/locales/moo/messages.ftl @@ -17,6 +17,7 @@ not-available-abbreviation = N/A # Don't rename the following section, its contents are auto-inserted based on the name (see scripts/pontoon-languages-to-ftl.js) # [Languages] ## Languages +sts = SENĆOŦEN Special Words and Paragraphs aam = Kanien'kéha Medium Speed orm = Ohsweken Medium Speed crl = nêhiyawêwin short diff --git a/web/locales/ore/messages.ftl b/web/locales/ore/messages.ftl index b372cc0f3..678c75d10 100644 --- a/web/locales/ore/messages.ftl +++ b/web/locales/ore/messages.ftl @@ -17,6 +17,7 @@ not-available-abbreviation = N/A # Don't rename the following section, its contents are auto-inserted based on the name (see scripts/pontoon-languages-to-ftl.js) # [Languages] ## Languages +sts = SENĆOŦEN Special Words and Paragraphs aam = Kanien'kéha Medium Speed orm = Ohsweken Medium Speed crl = nêhiyawêwin short diff --git a/web/locales/orm/messages.ftl b/web/locales/orm/messages.ftl index 31cb44a2e..059809030 100644 --- a/web/locales/orm/messages.ftl +++ b/web/locales/orm/messages.ftl @@ -17,6 +17,7 @@ not-available-abbreviation = N/A # Don't rename the following section, its contents are auto-inserted based on the name (see scripts/pontoon-languages-to-ftl.js) # [Languages] ## Languages +sts = SENĆOŦEN Special Words and Paragraphs aam = Kanien'kéha Medium Speed orm = Ohsweken Medium Speed crl = nêhiyawêwin short diff --git a/web/locales/str/messages.ftl b/web/locales/str/messages.ftl index 31cb44a2e..059809030 100644 --- a/web/locales/str/messages.ftl +++ b/web/locales/str/messages.ftl @@ -17,6 +17,7 @@ not-available-abbreviation = N/A # Don't rename the following section, its contents are auto-inserted based on the name (see scripts/pontoon-languages-to-ftl.js) # [Languages] ## Languages +sts = SENĆOŦEN Special Words and Paragraphs aam = Kanien'kéha Medium Speed orm = Ohsweken Medium Speed crl = nêhiyawêwin short diff --git a/web/locales/sts/cross-locale.ftl b/web/locales/sts/cross-locale.ftl new file mode 100644 index 000000000..486515e2b --- /dev/null +++ b/web/locales/sts/cross-locale.ftl @@ -0,0 +1,18 @@ +## Languages +contribute = Contribute +get-involved-button = Get Involved +get-involved-title = Contribute to { $lang } +get-involved-text = + Thank you for your interest in contributing to { $lang }. We work hard to get every language ready for launch and keep + the teams updated via email. If you want to contribute, please provide your email below. + +get-involved-form-title = Sign up for { $lang } updates: +get-involved-email = + .label = Email +get-involved-opt-in = Yes, send me emails. I'd like to stay informed about the progress of this language on Common Voice. +get-involved-submit = Submit +get-involved-stayintouch = We at Mozilla are building a community around voice technology. We would like to stay in touch with updates, new data sources and to hear more about how you're using this data. +get-involved-privacy-info = We promise to handle your information with care. Read more in our Privacy Notice. +get-involved-success-title = You've successfully signed up for contributing to { $language }. Thank you. +get-involved-success-text = We will be in touch with more information as it becomes available. +get-involved-return-to-languages = Return to Languages diff --git a/web/locales/sts/messages.ftl b/web/locales/sts/messages.ftl new file mode 100644 index 000000000..059809030 --- /dev/null +++ b/web/locales/sts/messages.ftl @@ -0,0 +1,1441 @@ +## General +yes-receive-emails = Yes, send me emails. I’d like to stay informed about the Common Voice Project. +stayintouch = We at Mozilla are building a community around voice technology. We would like to stay in touch with updates, new data sources and to hear more about how you're using this data. +privacy-info = We promise to handle your information with care. Read more in our Privacy Notice. +return-to-cv = Return to Common Voice +email-input = + .label = Email +submit-form-action = Submit +loading = Loading… +email-opt-in-info = I'd like to receive emails such as goal reminders, my progress updates and newsletters about Common Voice. +email-opt-in-info-title = Join the Common Voice mailing list +email-opt-in-info-sub-with-challenge = Receive emails such as challenge and goal reminders, progress updates, and newsletters about Common Voice. +email-opt-in-privacy-v2 = By opting in to receive emails you state that you are okay with Mozilla handling this info as explained in Mozilla’s Privacy Policy. +indicates-required = * Indicates required field +not-available-abbreviation = N/A + +# Don't rename the following section, its contents are auto-inserted based on the name (see scripts/pontoon-languages-to-ftl.js) +# [Languages] +## Languages +sts = SENĆOŦEN Special Words and Paragraphs +aam = Kanien'kéha Medium Speed +orm = Ohsweken Medium Speed +crl = nêhiyawêwin short +ore = Ohswekèn:’a Natural & Careful Speech Set +aaa = SENĆOŦEN Origin Stories +aab = Kanyen'kéha (Ohswekèn:'a) moo-Latest +aac = Kanien’kéha (Kahnawa’kéha) test set +aae = Kanien’kéha Edu/Careful Speech Set +aan = Kanien’kéha Natural Speech Set +ab = Abkhaz +ace = Acehnese +ady = Adyghe +af = Afrikaans +am = Amharic +an = Aragonese +ar = Arabic +arn = Mapudungun +as = Assamese +ast = Asturian +az = Azerbaijani +ba = Bashkir +bas = Basaa +be = Belarusian +bg = Bulgarian +bn = Bengali +br = Breton +bs = Bosnian +bxr = Buryat +ca = Catalan +cak = Kaqchikel +ckb = Central Kurdish +cnh = Hakha Chin +crk = NÊHIYAWÊWIN +co = Corsican +cs = Czech +cv = Chuvash +cy = Welsh +da = Danish +de = German +dsb = Sorbian, Lower +dv = Dhivehi +el = Greek +en = English +eo = Esperanto +es = Spanish +et = Estonian +eu = Basque +fa = Persian +ff = Fulah +fi = Finnish +fo = Faroese +fr = French +fy-NL = Frisian +ga-IE = Irish +git = Gitksan +gl = Galician +gn = Guarani +gom = Goan Konkani +ha = Hausa +he = Hebrew +hi = Hindi +hr = Croatian +hsb = Sorbian, Upper +ht = Haitian +hu = Hungarian +hy-AM = Armenian +hyw = Armenian Western +ia = Interlingua +id = Indonesian +ie = Interlingue +ig = Igbo +is = Icelandic +it = Italian +izh = Izhorian +ja = Japanese +ka = Georgian +kaa = Karakalpak +kab = Kabyle +kbd = Kabardian +ki = Kikuyu +kk = Kazakh +km = Khmer +kmr = Kurmanji Kurdish +knn = Konkani (Devanagari) +ko = Korean +kpv = Komi-Zyrian +kw = Cornish +ky = Kyrgyz +lg = Luganda +lij = Ligurian +lt = Lithuanian +lv = Latvian +mai = Maithili +mdf = Moksha +mg = Malagasy +mhr = Meadow Mari +mk = Macedonian +ml = Malayalam +mn = Mongolian +mni = Meetei Lon +mok = Kanien’kéha (Kahnawa’kéha) +moo = Kanyen'kéha (Ohswekèn:'a) +mos = Mossi +mr = Marathi +mrj = Hill Mari +ms = Malay +mt = Maltese +my = Burmese +myv = Erzya +nan-tw = Taiwanese (Minnan) +nb-NO = Norwegian Bokmål +ne-NP = Nepali +nia = Nias +nl = Dutch +nn-NO = Norwegian Nynorsk +nyn = Runyankole +oc = Occitan +or = Odia +pa-IN = Punjabi +pap-AW = Papiamento (Aruba) +pl = Polish +ps = Pashto +pt = Portuguese +quc = K'iche' +quy = Quechua Chanka +rm-sursilv = Romansh Sursilvan +rm-vallader = Romansh Vallader +ro = Romanian +ru = Russian +rw = Kinyarwanda +sah = Sakha +sat = Santali (Ol Chiki) +sc = Sardinian +scn = Sicilian +shi = Shilha +si = Sinhala +sk = Slovak +sl = Slovenian +so = Somali +sq = Albanian +sr = Serbian +str = SENĆOŦEN +sv-SE = Swedish +sw = Swahili +syr = Syriac +ta = Tamil +te = Telugu +tg = Tajik +th = Thai +ti = Tigrinya +tig = Tigre +tk = Turkmen +tl = Tagalog +tr = Turkish +tt = Tatar +tw = Twi +ty = Tahitian +uby = Ubykh +udm = Udmurt +ug = Uyghur +uk = Ukrainian +ur = Urdu +uz = Uzbek +vec = Venetian +vi = Vietnamese +vot = Votic +yi = Yiddish +yo = Yoruba +yue = Cantonese +zh-CN = Chinese (China) +zh-HK = Chinese (Hong Kong) +zh-TW = Chinese (Taiwan) +# [/] + +## Layout +speak = Speak +speak-now = Speak now +datasets = Datasets +languages = Languages +about = About +profile = Profile +help = Help +contact = Contact +privacy = Privacy +terms = Terms +cookies = Cookies +faq = FAQ +content-license-text = Content available under a Creative Commons license +share-title = Help us find others to donate their voice! +share-text = Help teach machines how real people speak, donate your voice at { $link } +link-copied = Link Copied +back-top = Back to Top +logout = Log Out + +## Home Page +home-title = Common Voice is Mozilla's initiative to help teach machines how real people speak. +default-tagline = Speech Generation for Indigenous Language Education project +home-cta = Speak up, contribute here! +wall-of-text-start = + Voice is natural, voice is human. That’s why we’re fascinated with creating usable voice + technology for our machines. But to create voice systems, a large amount of voice + data is required. +wall-of-text-more-mobile = + While there is no replacement for a speaker of an Indigenous language, there are possible applications for speech synthesis (text-to-speech) to supplement existing text-based tools like verb conjugators, dictionaries and phrasebooks. The National Research Council has partnered with the Onkwawenna Kentyohkwa Kanyen’kéha immersion school, W̱SÁNEĆ School Board, University nuhelot’įne thaiyots’į nistameyimâkanak Blue Quills, and the University of Edinburgh to research and develop state-of-the-art speech synthesis (text-to-speech) systems and techniques for Indigenous languages in Canada, with a focus on how to integrate text-to-speech technology into the classroom. +wall-of-text-more-desktop = + While there is no replacement for a speaker of an Indigenous language, there are possible applications for speech synthesis (text-to-speech) to supplement existing text-based tools like verb conjugators, dictionaries and phrasebooks. The National Research Council has partnered with the Onkwawenna Kentyohkwa Kanyen’kéha immersion school, W̱SÁNEĆ School Board, University nuhelot’įne thaiyots’į nistameyimâkanak Blue Quills, and the University of Edinburgh to research and develop state-of-the-art speech synthesis (text-to-speech) systems and techniques for Indigenous languages in Canada, with a focus on how to integrate text-to-speech technology into the classroom. +wall-of-text-first = + There are approximately 70 Indigenous languages spoken in Canada from 10 distinct language families. As a consequence of the residential school system and other policies of cultural suppression, the majority of these languages now have fewer than 500 fluent speakers remaining, most of them elderly. +wall-of-text-second = + Despite this, Indigenous people have resisted colonial policies and continued speaking their languages, with interest by students and parents in Indigenous language education continuing to grow. Teachers are often overwhelmed by the number of students, and the trend towards online education means many students who have not previously had access to language classes now do. Supporting these growing cohorts of students comes with unique challenges in languages with few fluent first-language speakers. Teachers are particularly concerned with providing their students with opportunities to hear the language outside of class. +show-wall-of-text = Read More +help-us-title = Help us validate sentences! +help-us-explain = Press play, listen & tell us: did they accurately speak the sentence below? +no-clips-to-validate = Looks like there aren't any clips to listen to in this language. Help us fill the queue by recording some now. +vote-yes = Yes +vote-no = No +toggle-play-tooltip = Press { shortcut-play-toggle } to toggle play mode +speak-subtitle = Donate your voice +speak-paragraph = Recording voice clips is an integral part of building a dataset; some would say it's the fun part too. +speak-goal-text = Clips recorded +listen-subtitle = Help us validate voices +listen-paragraph = Validating recorded clips is equally important to the Common Voice mission. Take a listen and help us create quality voice data. +listen-goal-text = Clips validated +hours-recorded = Hours Recorded +hours-validated = Hours Validated +voices-online = Voices Online Now +todays-progress = Today's Progress +help-reach-goal = Help us get to { $goal } +read-terms-q = Have you read our Terms? +ready-to-record = Ready to donate your voice? +all-locales = All +today = Today +x-weeks-short = + { $count -> + [one] Week + *[other] { $count }wk + } +x-months-short = + { $count -> + *[other] { $count }mo + } +x-years-short = + { $count -> + *[other] { $count }y + } +help-make-dataset = Help build a high quality dataset for your language. +sign-up-account = Sign up for an account +email-subscription-title = sign up for email updates +email-subscription-title-new = Sign up for Common Voice newsletters, goal reminders and progress updates + +## Account Benefits +benefits = Benefits +rich-data = Make your submitted data as rich as possible by providing some anonymous demographic data. We de-identify all demographic data before making it public. +improve-audio = Profile information improves the audio data used in training speech recognition accuracy. +keep-track = Keep track of your progress and metrics across multiple languages. +compare-progress = See how your progress compares to other contributors all over the world. +view-goals = View your progress against personal and project goals. +join-newsletter = Optionally join on our email list for updates and new information about the project. + +## What's public +whats-public = What's Public? +email-not-public = We will not make your data public. +recordings-and-locale-public = The recordings are to be used in the Speech Generation for Indigenous Language Education (SGILE) project only. +username-optin-public = Only SGILE members will have access to this website. Please do not share it, or any of the data in it, with anyone outside of the project. +demographic-deidentified-clarity-2 = If you want to add more sentences, please contact Sam at NRC +username-email-not-demographic = If you have any concerns, please contact the Aidan at NRC + + +## Speak & Listen Shortcuts +# Must be one letter that appears in the translated { skip } string. +shortcut-skip = s + +## Listen Shortcuts +# Must be one letter that appears in the translated play-string inside of { shortcut-play-toggle-label }. +# Must be different from { shortcut-skip }, { shortcut-vote-yes } and { shortcut-vote-no } +shortcut-play-toggle = p +shortcut-play-toggle-label = Play/Stop +# Must be one letter that appears in the { vote-yes } string. +# Must be different from { shortcut-skip }, { shortcut-vote-no } and { shortcut-play-toggle } +shortcut-vote-yes = y +# Must be one letter that appears in the { vote-no } string. +# Must be different from { shortcut-skip }, { shortcut-vote-yes } and { shortcut-play-toggle } +shortcut-vote-no = n + +## Speak Shortcuts +# Must be one letter that appears in the translated record-string inside of { shortcut-record-toggle-label }. +# Must be different from { shortcut-skip }, { shortcut-vote-yes } and { shortcut-vote-no } +shortcut-record-toggle = r +shortcut-record-toggle-label = Record/Stop + +shortcut-rerecord-toggle = [1-5] +shortcut-rerecord-toggle-label = Re-record clip + +shortcut-discard-ongoing-recording = ESC +shortcut-discard-ongoing-recording-label = Discard ongoing recording + +shortcut-submit = Return +shortcut-submit-label = Submit clips + +request-language-text = Don't see your language on Common Voice yet? +request-language-text-learn = Learn how to request it here! +request-language-button = Request a Language + +## ProjectStatus +status-title = Overall project status: see how far we’ve come! +status-contribute = Contribute Your Voice +status-hours = + { $hours -> + [one] One validated hour so far! + *[other] { $hours } validated hours so far! + } +# Variables: +# $goal - number of hours representing the next goal +status-goal = Next Goals: { $goal } +english = English + +## ProfileForm +profile-form-username = + .label = User Name +profile-form-native-language = + .label = Native Language +profile-form-additional-language = + .label = Additional Language +profile-form-language = + .label = Language +profile-form-accent = + .label = Accent +profile-form-custom-accent-help-text = + .label = How would you describe your accent? +profile-form-custom-accent-placeholder-2 = Start typing to describe your accent +profile-form-age = + .label = Age +profile-form-gender-2 = + .label = Gender +leaderboard-visibility = + .label = Leaderboard Visibility +hidden = Hidden +visible = Visible +native-language = + .label = Native Language +profile-form-add-accent = Add new custom accent "{ $inputValue }" + + +profile-form-submit-save = Save +profile-form-submit-saved = Saved + +male = Male +female = Female +# Gender +other = Other +why-profile-title = Why a profile? +why-profile-text = + By providing some information about yourself, the audio data you submit to Common Voice will be more useful to Speech + Recognition engines that use this data to improve their accuracy. + +dashboard = Dashboard +build-profile = Build Profile +avatar = Avatar +goals = Goals +settings = Settings +edit-profile = Edit Profile +profile-create-success = Success, profile created! +profile-close = Close +profile-explanation = Keep track of your progress with a profile and help our voice data be more accurate. +thanks-for-account = Thanks for confirming your account, now let's build your profile. +why-demographic = Why does this matter? +why-demographic-explanation-2 = Anonymized user data like age, gender, and accent helps improve the audio data used to train the accuracy of speech recognition engines. Your username and email will never be associated with your submitted data, and you can choose whether to make your username public or anonymous. lorem ipsum +accept-privacy = I'm okay with you handling this info as you explain in Mozilla's Privacy Policy +accept-privacy-title = Privacy Policy +login-identity = Login Identity +login-signup = Log In / Sign Up +edit = Edit +email-subscriptions = Email Subscriptions +download-profile = Download My Data +contribution-experience = Contribution Experience +skip-submission-feedback = Skip Submission Feedback +skip-submission-description = During contribution submission feedback will be skipped after clicking 'Submit'. Contribution will continue directly with the next set of 5 recordings or validations. +skip-submission-note = Note: You will still need to select between Speak or Listen to change contribution type. +off = Off +on = On +help-accent = Need some help with accent? +help-accent-explanation = Your accent is the way you pronounce words. It can be shaped by where you have lived, which other languages you speak and lots of other factors. You can share any information you feel is relevant here. + +## Profile - Email +browse-file-title = Upload an image file +browse-file = Drag and drop or Browse +connect-gravatar = Connect with Gravatar +gravatar_not_found = No gravatar found for your email +file_too_large = The selected file is too large +avatar-uploaded = Avatar uploaded +max-file-size = { $kb }kb max + +## Profile - Email +manage-subscriptions = Manage Subscriptions +manage-email-subscriptions = Manage Email Subscriptions +email-already-used = Email is already used for a different account +add-language = Add Language +change-email-setings = Change your email via Settings under Login Identity + +## FAQ +faq-title = Frequently Asked Questions + +faq-what-cv-q = What is Common Voice? +faq-what-cv-a = + Voice recognition technology is revolutionizing the way we interact with machines, but the currently available systems are expensive and proprietary. Common Voice is part of Mozilla’s initiative to make voice recognition technologies better and more accessible for everyone. Common Voice is a massive global database of donated voices that lets anyone quickly and easily train voice-enabled apps in potentially every language. lorem ipsum not sure what we want to keep here. +faq-what-cv-a-2 = + Voice recognition technology is revolutionizing the way we interact with machines, but the currently available systems are expensive and proprietary. Mozilla Common Voice is an initiative to make voice recognition technologies better and more accessible for everyone. Common Voice is a massive global database of donated voices that lets anyone quickly and easily train voice-enabled apps in potentially every language. lorem ipsum + + We're not only collecting voice samples in widely spoken languages but also in those with a smaller population of speakers. Publishing a diverse dataset of voices will empower developers, entrepreneurs, and communities to address this gap themselves. lorem ipsum + +faq-why-important-q = Why is it important? +faq-why-important-a = + Speech is often the most natural way we communicate with each other and voice technologies are bringing that convenience to our computers and mobile devices. We want to empower developers to build amazing voice recognition applications like real-time translators and voice-enabled digital assistants. But right now most of the voice data required to build these kinds of apps is expensive and proprietary. We hope the Common Voice dataset will give developers what they need to innovate and make speech technology available in their own language. lorem ipsum again, not appropriate since we're not building public datasets... + + To make voice recognition even more universal, we're collecting voice samples in widely spoken languages as well as those with a smaller population of speakers often underserved by commercial speech recognition services. Publishing a diverse dataset of voices will empower developers, entrepreneurs, and entire speech communities to address this gap themselves. lorem ipsum + +faq-how-get-q = How can I get the Common Voice data? +faq-how-get-a = The Common Voice dataset is available for download under the CC0 license on our Datasets page. You can also download several other publicly available datasets from the same page. lorem ipsum do we customize all the FAQs? + +faq-when-release2-q = When will you release Common Voice data in other languages? +faq-when-release2-a = The multi-language version of the Common Voice dataset is currently undergoing community supported bundling and cleaning. If you would like to help us bring Common Voice to new languages, go check out the Sentence Collection Tool for adding new sentences to the dataset, and Mozilla Pontoon for translating the website itself. New languages are added to Common Voice for voice contribution when 5000 approved sentences have been collected. lorem ipsum + +faq-why-mission-q = Why is Common Voice part of the Mozilla mission? +faq-why-mission-a = Mozilla is dedicated to keeping the web open and accessible for everyone. To do that we need to empower web creators through projects like Common Voice. As voice technologies proliferate beyond niche applications, we believe they must serve all users equally. That means investing in more languages and accommodating diverse accents and demographics when building and testing voice technologies. Common Voice is a public resource available to everyone and Mozilla teams and developers around the world are already using it on our own projects as well. lorem ipsum + +faq-what-cv-and-deepspeech-q = What’s the difference between Common Voice and Deep Speech? +faq-what-cv-and-deepspeech-a = The Common Voice dataset complements Mozilla’s open source voice recognition engine Deep Speech. The first version of Deep Speech was released in November 2017 and has continued to evolve ever since. Together with the Common Voice dataset, we believe this open source voice recognition technology should be available to everybody. It’s our hope these technologies will enable developers to build a wave of innovative products and services. lorem ipsum + +faq-is-goal-assistant-q = Is the goal of Common Voice to build a voice assistant? +faq-is-goal-assistant-a = The goal of the Common Voice dataset is to enable anyone in the world to build speech recognition, speaker recognition, or any other type of application that requires voice data. A voice assistant is just one of many types of applications you could use the dataset to build. lorem ipsum + +faq-do-want-native-q = I am a non-native speaker and I speak with an accent, do you still want my voice? +faq-do-want-native-a = Yes, we especially want your voice! Part of the aim of Common Voice is to gather as many different accents as possible so that voice recognition services work equally well for everyone. This means donations from non-native speakers are particularly important. lorem ipsum + +faq-why-different-speakers-q = Why do you need so many different speakers per language? +faq-why-different-speakers-a = + Most speech databases are trained with an overrepresentation of certain demographics which results in a bias towards male and middle class. Accents and dialects that tend to be under-represented in training data sets are typically associated with groups of people who are already marginalised. Many machines also struggle to understand female voices. + This is why in our voice database we want variety! lorem ipsum + +faq-why-my-lang-q = Why is my language not included yet? +faq-why-my-lang-new-a = Mozilla doesn’t pick or favor any one language over another. Instead, Common Voice is a purely community-driven initiative, but it takes several steps to add a new language and begin collecting voice donations. First, the Common Voice website needs to be translated so community members can access the contributor experience in their own language. Next, we need a large collection of copyright-free sentences for people to read outloud. Once both of those requirements are satisfied a language is “launched” on Common Voice for people to start recording their voice and validating others donations. If you want to help launch a new language, head over to our sentence collection tool to get started. lorem ipsum + +faq-what-quality-q = What level of audio quality is required for a voice clip to be used in the dataset? +faq-what-quality-a = We want the Common Voice dataset to reflect the audio quality a speech-to-text engine will hear in the wild, so we’re looking for variety. In addition to a diverse community of speakers, a dataset with varying audio quality will teach the speech-to-text engine to handle various real-world situations, from background talking to car noise. As long as your voice clip is intelligible, it should be good enough for the dataset. lorem ipsum here we'll want to say we need high quality for TTS + +faq-why-10k-hours-q = Why is 10,000 validated hours the per language goal for capturing audio? +faq-why-10k-hours-a = This is approximately the number of hours required to train a production speech-to-text system. lorem ipsum + +faq-how-calc-hours-q = How does Common Voice calculate hours? +faq-how-calc-hours-a = We calculate hours by estimating the average length of each recording, and then multiplying that number by the total number of recordings across all languages. lorem ipsum + +faq-where-src-from-2-q = Where does the source text come from? +faq-where-src-from-2-a = + Our source text is made up of original contributor donations as well as dialogue from public domain movie scripts like It’s a Wonderful Life. + + You can view our source sentences in this GitHub folder. lorem ipsum I assume we'll be using closed source text... + +faq-why-not-ask-read-q = Why don’t you ask people to read from books or Wikipedia articles in different languages? +faq-why-not-ask-read-a = To make the Common Voice dataset as useful as possible we have decided to only allow source text that is available under a Creative Commons (CC0) license. Using the CC0 standard means its more difficult to find and collect source text, but allows anyone to use the resulting voice data without usage restrictions or authorization from Mozilla. Ultimately, we want to make the multi-language dataset as useful as possible to everyone, including researchers, universities, startups, governments, social purpose organizations, and hobbyists. lorem ipsum + +faq-why-account-q = Why should I sign up for an account? +faq-is-account-public-q = Is my account information public? + +faq-how-privacy-q = How do you ensure anonymity and privacy of the people who donated their voices? +faq-how-privacy-a = All voice clips in the dataset are scrubbed of personally identifying information. When a contributor provides demographic data via their profile, that information is de-identified from their voice clips before being bundled for download in the dataset and is never made public on their profile page. lorem ipsum + +faq-what-determine-identity-q = What does it mean that I can’t “determine the identity” of speakers in the Common Voice dataset? +faq-what-determine-identity-a = + The Common Voice dataset is an open and publicly available resource that can be used to train a wide variety of speech-enabled applications. To protect the security of our contributors, we ask everyone who downloads the Common Voice dataset to respect contributors’ privacy. + + All voice clips in the dataset are scrubbed of personally identifying information. When you download the dataset, you agree to not attempt to determine the identity of any contributor. That means you cannot try to link information in the dataset to a contributor’s personal information. You may, however, use the dataset to train speech recognition, speaker recognition, or other applications, by, for instance, linking information in the dataset to other information already in the dataset. + lorem ipsum + +faq-what-is-cv = What is Common Voice? +faq-using-cv = Using Common Voice +faq-description = Common Voice is part of Mozilla's initiative to help teach machines how real people speak. +faq-search-for-answers = + .label = Search for answers + +## ABOUT US +about-title = Why Common Voice for the Speech Generation for Indigenous Language Education (SGILE) project? +about-header-description-v2 = +

There are a lot of people working on the SGILE project, and maintaining a record of what needs to be recorded, and what has been recorded already is fairly complicated! We wanted to build a tool that simplified this process, and still protected our data.

+

Mozilla's Common Voice is a tool for crowd-sourcing recordings for Mozilla's speech technologies (mostly speech recognition). The tool is great, but it requires you to make your data open to the world, and this isn't appropriate for our project. So, we "forked" or copied the code base (legally, and with permission!) and made our own version of the website with the help of Indigenous web services company Ursa Creative. Our version is called the EveryVoice Recording Studio.

+

In the SGILE project, there are three main streams or work happening simultaneously - a text stream, where people are working to determine what text will be synthesized (some people are working on verb conjugators or dictionaries, or other models of the grammar). The second stream is the recording stream where we are recording examples of audio from text. The third stream is the modelling stream where people are helping teach computers about how to pronounce the languages given examples of the text and audio. All streams will use our instance of Common Voice. The people in the text stream will upload text to be recorded. The people in the recording stream will log in and record any unrecorded utterances, and the modelling stream will retrieve the audio and text from the website once recording has taken place. It's a single, unified place for keeping track of all of our text and audio, that remains private to our working group.

+ +how-does-it-work-title-v2 = How does Common Voice Indigenous work? +how-does-it-work-text = We’re crowdsourcing a lorem ipsum dataset of voices. Donate your voice, validate the accuracy of other people’s clips, make the dataset better for everyone. lorem ipsum + +## How does it work section +about-language-req-subtitle = Someone asks for a language to be added. +about-localization-title = Website Localization +about-localization-subtitle = The website text is translated into that language. +about-sentence-collection-title = Sentence Collection +about-sentence-collection-subtitle = Sentences are collected for people to read aloud. +about-new-lang-title = New Language Launch +about-new-lang-subtitle = We launch the Common Voice site in this language. +about-voice-contrib-title = Voice Contribution +about-voice-contrib-subtitle = People come and contribute their voices. +about-voice-validation-title = Voice Validation +about-voice-validation-subtitle = Other people validate those voice clips. +about-dataset-release-title = Dataset Release +about-dataset-release-subtitle = Lorem ipsum We release the dataset every 3 months. + +about-subscribe-text = Want to stay in touch with Common Voice? + +about-speak = Speak +about-speak-text = Contributors record voice clips by reading from a bank of donated sentences. +about-listen-queue = Listen-Queue +about-listen-queue-text = Voice clips are entered into a submission queue that readies them for listening. +about-listen = Listen +about-listen-text = Users validate the accuracy of donated clips, checking that the speaker read the sentence correctly. +about-is-it-valid = Is the clip valid? +about-is-it-valid-text = A voice clip is marked "valid" when a user gives it a Yes vote. +about-yes-votes = ≥ 2 Yes votes +about-yes-votes-text = To make it into the Common Voice dataset, a voice clip must be validated by two separate users. +about-no-votes = ≥ 2 No votes +about-no-votes-text = When a user rejects a voice clip it returns to the Queue. If rejected a second time, the voice clip is moved to the Clip Graveyard. +about-dataset-new = Common Voice Dataset +about-dataset-new-text = The Common Voice Dataset contains hundreds of thousands of voice samples that help developers build voice recognition tools. +about-clip-graveyard = Clip Graveyard +about-clip-graveyard-text = The Clip Graveyard consists of voice clips that didn't make it into the Common Voice dataset. Just like the dataset, the Clip Graveyard is available for download. + +about-partners = Partners +about-become-a-partner = Become a partner +about-partnership = Common Voice is a collaborative project, and we're depending on our community of partners and contributors to build the largest open-source dataset of voices ever. + + We would like to thank the following people and organizations for their help with the project: +about-get-involved = Get involved +about-get-involved-text-2 = Want to help make Common Voice even better? + Great! Get in touch via email or Discourse + forums, submit site issues via GitHub, or join the + Matrix community chat. + +about-stay-in-touch = How do I stay in touch? +about-stay-in-touch-text-1 = Sign up to our mailing list to learn how you can take part in campaigns, events and co-design features on Common Voice. +about-stay-in-touch-text-2 = You can meet others in the Mozilla language communities by joining Discourse for topical conversations, or Matrix for quick advice. + +about-nav-why-common-voice = Why ? +about-nav-how-it-works = How ? +about-nav-partners = Partners +about-nav-get-involved = Get involved + +about-nav-how-it-works-2 = How does Common Voice work? +about-nav-playbook = Learn how to take part + +## Community Playbook Content +## What is a language +about-playbook-what-is-language = What is a language on Common Voice? +about-playbook-what-is-language-content-1 = There are lots of ways to think about language. For the purposes of speech recognition models, Common Voice suggests focussing on ‘mutual intelligibility’, or ‘can speakers of this language mostly understand one another if they try to?’ +about-playbook-what-is-language-content-2 = We want speech models to be better at understanding a diverse range of speakers. For this to happen, a voice dataset must represent lots of different people. +about-playbook-what-is-language-content-3 = Some languages have enormous variation in grammar, vocabulary and pronunciation. For this reason, we are introducing ‘Variants’ in 2022. This gives communities a way to distinguish their languages within the larger dataset. + +## How do I add a language +about-playbook-how-add-language = How do I add a language? +about-playbook-how-add-language-content-1 = First, check if your language already exists. If it doesn’t you need to translate the site and collect sentences. +about-playbook-how-add-language-content-2 = To translate the site - get set up on Pontoon. Pontoon has lots of languages, but if it doesn’t have yours you can request it. Then ask via GitHub to have the Common Voice project made available for the language. See more on site translation. +about-playbook-how-add-language-content-3 = To collect sentences - set up on Sentence Collector. +about-playbook-how-add-language-content-4 = You can add small numbers of sentences here, or you can do bulk imports via a Github request. Remember that sentences need to be CC0 (or public domain), or you can write your own. See more on sentence collection. + +## How does localization work +about-playbook-how-localize = How does site localization work? +about-playbook-how-localize-content-1 = Translation of the Common Voice site happens on Pontoon. +about-playbook-how-localize-content-2 = Create an account if you don’t have one. Then, choose your language (‘Team’) and then choose the project, Common Voice. There will be files to translate. Click on one, then it shows words in English and a box to translate them. +about-playbook-how-localize-content-3 = Translation is from English, but you can see Suggestions in other languages. Click the Profile icon, then Settings link and add any languages you speak. At the bottom right-hand corner will be a list of translations called Locales. Translations show on the site after one day. +about-playbook-how-localize-content-4 = The site is ready to be launched when it reaches 75% completion. +about-playbook-how-localize-content-5 = Watch our video explainer to help + +## How to add sentences +about-playbook-how-add-sentences = How do I add sentences? +about-playbook-how-add-sentences-content-1 = Sentence Collector is a tool for collecting and validating public domain sentences. You will need to create an account. Then, add your language to your Profile. You can Add sentences or Review previously-added sentences. +about-playbook-how-add-sentences-content-2 = Sentences must be reviewed and accepted by two people to be included in Common Voice. You create guidelines for your language here. Sentences must be in the public domain and shorter than 15 words. You can ask the owner of a text to make it CC0 using our waiver process, and send to us on commonvoice@mozilla.com +about-playbook-how-add-sentences-content-3 = You can use the Sentence extractor to leverage short sentences from Wikipedia. +about-playbook-how-add-sentences-content-4 = Sentences that have been validated are exported on Wednesdays, and are available after the next release. + +## How to record quality +about-playbook-how-record-quality = How do I record a high quality voice clip? +about-playbook-how-record-content-1 = Speak in your normal voice! The way you speak is welcome here - we want your accent as it is, and we want your usual volume, style and intonation. +about-playbook-how-record-content-2 = Avoid too much background noise - it should be easy to hear you. +about-playbook-how-record-content-3 = Read the sentence carefully - don’t miss, change or add words. +about-playbook-how-record-content-4 = Make sure the platform is recording before you start speaking, and that it only stops once you’re finished. +about-playbook-how-record-content-5 = See more on accuracy criteria. + +## How to grow language +about-playbook-how-grow-language = How can we effectively grow a language on Common Voice? +about-playbook-how-grow-language-content-1 = Creating opportunities for a diversity of people to contribute to Common Voice ensures the dataset serves as many people as possible. We’ve created resources and templates that you can use! +about-playbook-how-grow-language-content-2 = Events +about-playbook-how-grow-language-content-3 = You can run events to help people contribute. It’s easier than you think. You could do it online with a videoconferencing tool, or in person if it’s safe. Check out our templates and resources for running events. +about-playbook-how-grow-language-content-4 = Social media +about-playbook-how-grow-language-content-5 = You could use social media platforms to get the message out. Share posts that explain why it matters, and get in touch with other people talking about issues like language rights, voice AI, or bias in tech. See more advice on running a social campaign, including content you can re-use. +about-playbook-how-grow-language-content-6 = Partnerships and networks +about-playbook-how-grow-language-content-7 = Find others who care. That could be universities, language schools, advocacy groups or data science communities. Reach out and explain clearly how they can help and why. See our template outreach emails. +about-playbook-how-grow-language-content-8 = Get creative! Your language community will be unique, and these are just a few ways to get started. + +## How to validate +about-playbook-how-validate = How do I know whether to approve a voice clip? +about-playbook-how-validate-content-1 = If you could hear them and understand them, it’s usually best to approve. +about-playbook-how-validate-content-2 = Do not reject clips where the speaker ‘has an accent’ that is different to your own - this is important for voice recognition to work better for everyone. +about-playbook-how-validate-content-3 = If you think the pronunciation makes it impossible to understand, or there’s a lot of background noise, or there are other people speaking too, then you should reject the clip. See more information in our accuracy criteria. +about-playbook-how-validate-content-4 = If a clip is rejected by 2 people, it is released in a different subset of the dataset. + +## How to access dataset +about-playbook-how-access-dataset = How do I access and use the dataset? +about-playbook-how-access-dataset-content-1 = You can go to the datasets page, select the version and language(s) you want, and download it! The files have associated metadata, such as demographic information and validation data. You’ll need to provide an email address to download the dataset. +about-playbook-how-access-dataset-content-2 = If you’re looking for tools to build ASR models, you can connect to other people in the community on Discourse. + + +## How are decisions made +about-playbook-how-project-governance = How are project decisions made? +about-playbook-how-project-governance-content-1 = Mozilla Common Voice is made possible by a diverse community of activists, linguists, data scientists, academics and software engineers from all over the world. The project is stewarded by the Mozilla Foundation. +about-playbook-how-project-governance-content-2 = Our governance is founded on the pillars of: +about-playbook-how-project-governance-content-3 = Privacy, security and transparency. +about-playbook-how-project-governance-content-4 = Community participation and decision making. +about-playbook-how-project-governance-content-5 = Value and recognition. +about-playbook-how-project-governance-content-6 = Mutual accountability. +about-playbook-how-project-governance-content-7 = Read more about how we're governed + + +mycroft-title = Mycroft Ai +mycroft-subtitle = Artificial intelligence +mycroft-description = Mycroft is the world’s first open source assistant. + Mycroft runs anywhere - on a desktop computer, inside an automobile, or on a Raspberry Pi. +mycroft-secondary-description = This is open source software which can be freely remixed, extended, and improved. Mycroft may be used in anything from a science project to an enterprise software application. + +## Glossary +glossary = Glossary +localization = Localization +localization-explanation = This is our process for translating and adapting our content for many locales (languages). +sentence-collection = Sentence Collection +sentence-collection-explanation = Collecting sentences from the public domain, or writing new ones for the public domain. +hours-recorded-explanation = The count of voice recording hours we have collected so far. +hours-validated-explanation = The count of voice recording hours that have been validated by 2 out of 3 users with a vote of “Yes”. These mark progress toward the overall project 10k hours goal. +sst = Speech-to-text (STT) +sst-explanation = Speech-to-text (STT) technologies convert voice data into text. +de-identified = De-identified +de-identified-explanation = The process by which a contributor’s profile information is obscured from their donated voice clips when packaged for download as a part of the dataset. + +## Error pages +error-title-404 = We couldn’t find that page for you +error-content-404 = Maybe our homepage will help? To ask a question, please join the Matrix community chat, monitor site issues via GitHub or visit our Discourse forums. +error-title-503 = We’re experiencing unexpected downtime +error-content-503 = The site will be back up as soon as possible. For the latest information, please join the Matrix community chat or visit GitHub or our Discourse forums to submit and monitor site experience issues. +error-code = Error { $code } + +## Data +data-download-button = Download Common Voice Data +data-download-yes = Yes +data-download-deny = No +data-download-license = License: CC-0 +data-download-modal = You are about to initiate a download of { $size }GB, proceed? +data-subtitle = We are building an open and publicly available dataset of voices that everyone can use to train speech-enabled applications. +data-explanatory-text = We believe that large and publicly available voice datasets foster innovation and healthy commercial competition in machine-learning based speech technology. This is a global effort and we invite everyone to participate. Our aim is to help speech technology be more inclusive, reflecting the diversity of voices from around the world. +data-get-started = Get Started with Speech Recognition +data-other-title = Other voice datasets… +data-other-goto = Go to { $name } +data-other-download = Download Data +data-bundle-button = Download Dataset Bundle +data-bundle-description = Common Voice data plus all other voice datasets above. +release-version = Version +dataset-date = Date +license = License: { $license } +license-mixed = Mixed +data-download-singleword-title = Download the Single Word Target Segment +data-download-singleword-callout-v2 = This is a use case driven segment containing data to power spoken digit recognition and yes / no detection. + +review-terms = By using Common Voice, you agree to our Terms and Privacy Notice +terms-agree = I agree +terms-disagree = I do not agree +review-aborted = Upload aborted. Do you want to delete your recordings? +review-submit-title = Review & Submit +review-submit-msg = Thank you for recording!Now review and submit your clips below. +review-recording = Review +review-rerecord = Re-record +review-cancel = Cancel Submission +review-keep-recordings = Keep the recordings +review-delete-recordings = Delete my recordings + +## Datasets Page +datasets-headline = We’re building an open source, multi-language dataset of voices that anyone can use to train speech-enabled applications. +datasets-positioning = + We believe that large, publicly available voice datasets will foster innovation and healthy commercial competition in machine-learning based speech technology. + + Common Voice’s multi-language dataset is already the largest publicly available voice dataset of its kind, but it’s not the only one. + + Look to this page as a reference hub for other open source voice datasets and, as Common Voice continues to grow, a home for our release updates. +language = Language +# File size in gigabytes +size = Size +validated-hr-total = Validated Hr. Total +overall-hr-total = Overall Hr. Total +cv-license = License +audio-format = Audio Format +number-of-voices = Number of Voices +splits = Splits +email-to-download = Enter Email to Download +why-email = Why an email? We may need to contact you in the future about changes to the dataset, an email provides us a point of contact. +confirm-size = You are prepared to initiate a download of { $size } +size-gigabyte = GB +size-megabyte = MB +confirm-no-identify = You agree to not attempt to determine the identity of speakers in the Common Voice dataset +download-language = Download { $language } +validated-hours = Validated Hours +recorded-hours = Recorded Hours +whats-inside = What’s inside the Common Voice dataset? +dataset-description-hours = + Each entry in the dataset consists of a unique MP3 and corresponding text file. Many of the { $total } recorded hours in the dataset also include demographic metadata like age, sex, and accent that can help train the accuracy of speech recognition engines. + + The dataset currently consists of { $valid } validated hours in { $languages } languages, but we’re always adding more voices and languages. Take a look at our Languages page to request a language or start contributing. +want-dataset-update = Want updates when we release a new version of the Common Voice dataset? Subscribe to our newsletter. +subscribe = Subscribe +get-started-speech = Get Started with Speech Recognition +other-datasets = Other Voice Datasets +feedback-q = Have Feedback? + +resource-nemo-info = NVIDIA NeMo™ is an open-source toolkit for researchers developing state-of-the-art conversational AI models. +resource-deepspeech-info = Mozilla’s open source voice recognition engine Deep Speech can be used to build speech recognition applications. Read our Github overview or join the DeepSpeech Discourse to learn how to get started. +resource-coqui-info = Coqui is dedicated to open speech technology. Their projects include deep learning based STT and TTS engines. +community-playbook = Community Playbook +resource-playbook-info = Find helpful guidance on the entire Common Voice journey, from localisation to dataset usage, as well as how to connect with our community. + +data-other-librispeech-description = LibriSpeech is a corpus of approximately 1000 hours of 16Khz read English speech derived from read audiobooks from the LibriVox project. +data-other-ted-name = TED-LIUM Corpus +data-other-ted-description = The TED-LIUM corpus was made from audio talks and their transcriptions available on the TED website. +data-other-voxforge-description = VoxForge was set up to collect transcribed speech for use with Free and Open Source Speech Recognition Engines. +data-other-tatoeba-description = Tatoeba is a large database of sentences, translations, and spoken audio for use in language learning. This download contains spoken English recorded by their community. +your-feedback = Do you have ideas on how we can make the Common Voice dataset better? Let us know on Discourse +go-discourse = Go to Discourse +missing-language = Don’t see your language reflected in the Dataset? To request a language head over to our Languages page. +go-languages-page = Go to Languages Page +ready-to-validate = Ready to help validate sentences? +more = More +close = Close +download = Download +dataset-version = Version + +## Download Modal +download-title = Your download has started. +download-helpus = Help us build a community around voice technology, stay in touch via email. +download-form-email = + .label = Enter your email + .value = Thank you, we'll be in touch. +download-back = Return to Common Voice Datasets +download-no = No Thanks + +## Contact Modal +contact-title = Contact Form +contact-form-name = + .label = Name +contact-form-message = + .label = Message +contact-required = *required + +## Request Language Modal +request-language-title = Language Request +request-language-form-language = + .label = Language +request-language-success-title = Language request successfully submitted, thank you. +request-language-success-content = We will be in touch with more information about how to add your language to Common Voice very soon. +select-language = Select a Language... +other-language = Other Language + +## Languages Overview +language-section-in-progress = In Progress +language-section-in-progress-new-description = These languages are currently under community development. The progress bars indicate how far each language is in the process of website localization and sentence collection. +language-section-launched = Launched +language-section-launched-description = For these launched languages the website has been successfully localized, and has enough sentences collected to allow for ongoing Speak and Listen contributions. +languages-show-more = See More +languages-show-less = See Less +language-meter-in-progress = Progress +language-total-progress = Total +language-search-input = + .placeholder = Search +language-speakers = Speakers +localized = Localized +sentences = Sentences +total-hours = Validated Hrs + +## Contribution +action-click = Click +action-tap = Tap +contribute = Contribute +listen = Listen +skip = Skip +shortcuts = Shortcuts +clips-with-count-pluralized = { $count -> + [one] { $count } Clip + *[other] { $count } Clips +} +goal-help-recording = You've helped Common Voice reach of our daily { $goalValue } recording goal! +goal-help-validation = You've helped Common Voice reach of our daily { $goalValue } validation goal! +contribute-more = + { $count -> + *[other] Ready to do { $count } more? + } +record-cta = Start recording +record-platform-not-supported = We’re sorry, your platform is not currently supported. +record-platform-not-supported-desktop = On desktop devices you can contribute by downloading… +record-platform-not-supported-ios-non-safari = On iOS please continue with Safari to enable recording… +record-must-allow-microphone = You must allow microphone access. +record-no-mic-found = No microphone found. +record-error-too-short = The recording was too short. +record-error-too-long = The recording was too long. +record-error-too-quiet = The recording was too quiet. +record-cancel = Cancel Re-recording +record-instruction = { $actionType } then read the sentence aloud +record-stop-instruction = { $actionType } when done +record-three-more-instruction = Three to go! +record-again-instruction = Great! Record your next clip +record-again-instruction2 = Keep it up, record again +record-last-instruction = Last one! +review-tooltip = Review & re-record clips here as you go +share-clip = Share your clip +share-common-voice = Share Common Voice +review-instruction = Review & re-record clips if needed +record-submit-tooltip = { $actionType } submit when ready +clips-uploaded = Clips Uploaded +record-abort-title = Finish recording first? +record-abort-text = Leaving now means you'll lose your progress +record-abort-submit = Submit clips +record-abort-continue = Finish recording +record-abort-delete = Exit & Delete clips +listen-instruction = { $actionType } did they accurately speak the sentence? +listen-again-instruction = Great work! Listen again when you're ready +listen-3rd-time-instruction = 2 down, keep it up! +listen-last-time-instruction = Last one! +listen-empty-state = We've run out of clips to validate in this language... +speak-empty-state = We've run out of sentences to record in this language... +speak-empty-state-cta = Contribute sentences +record-button-label = Record your voice +share-title-new = Help us find more voices +keep-track-profile = Keep track of your progress with a profile +login-to-get-started = Log in or sign up to get started +target-segment-first-card = You’re contributing to our first target segment +target-segment-generic-card = You’re contributing to a target segment +target-segment-first-banner = Help create Common Voice’s first target segment in { $locale } +target-segment-add-voice = Add Your Voice +target-segment-learn-more = Learn More + +## Reporting +report = Report +report-title = Submit a report +report-ask = What issues are you experiencing with this sentence? +report-offensive-language = Offensive language +report-offensive-language-detail = The sentence has disrespectful or offensive language. +report-grammar-or-spelling = Grammatical / spelling error +report-grammar-or-spelling-detail = The sentence has a grammatical or spelling error. +report-different-language = Different language +report-different-language-detail = It is written in a language different than what I’m speaking. +report-difficult-pronounce = Difficult to pronounce +report-difficult-pronounce-detail = It contains words or phrases that are hard to read or pronounce. +report-offensive-speech = Offensive speech +report-offensive-speech-detail = The clip has disrespectful or offensive language. +report-other-comment = + .placeholder = Comment +success = Success +continue = Continue +report-success = Report was passed successfully + + +## Goals +streaks = Streaks +days = { $count -> + [one] Day + *[other] Days +} +recordings = { $count -> + [one] Recording + *[other] Recordings +} +validations = { $count -> + [one] Validation + *[other] Validations +} + + +## Dashboard +your-languages = Your Languages +toward-next-goal = Toward next goal +goal-reached = Goal reached +clips-you-recorded = Clips You've Recorded +clips-you-validated = Clips You've Validated +todays-recorded-progress = Today's Common Voice progress on clips recorded +todays-validated-progress = Today's Common Voice progress on clips validated +stats = Stats +awards = Awards +you = You +everyone = Everyone +contribution-activity = Contribution Activity +top-contributors = Top Contributors +recorded-clips = Recorded Clips +validated-clips = Validated Clips +total-approved = Total Approved +overall-accuracy = Overall Accuracy +set-visibility = Set my visibility +visibility-explainer = This setting controls your leaderboard visibility. When hidden, your progress will be private. This means your image, user name and progress will not appear on the leaderboard. Note that leaderboard refresh takes ~{ $minutes }min to populate changes. +visibility-overlay-note = Note: When set to 'Visible', this setting can be changed from the Profile page +show-ranking = Show my ranking + +## Custom Goals +get-started-goals = Get started with goals +create-custom-goal = Create a Custom Goal +goal-type = What kind of goal do you want to build? +both-speak-and-listen = Both +both-speak-and-listen-long = Both (Speak and Listen) +daily-goal = Daily Goal +weekly-goal = Weekly Goal +easy-difficulty = Easy +average-difficulty = Average +difficult-difficulty = Difficult +pro-difficulty = Pro +lose-goal-progress-warning = By editing your goal, you may lose your existing progress. +want-to-continue = Do you want to continue? +finish-editing = Finish editing first? +lose-changes-warning = Leaving now means you’ll lose your changes +build-custom-goal = Build a custom goal +help-reach-hours-pluralized = Help reach { NUMBER($hours) -> +[one] {$hours} hour +*[other] {$hours} hours + } in { $language } with a personal goal +help-reach-hours-general-pluralized = Help Common Voice reach { NUMBER($hours) -> + [one] {$hours} hour + *[other] {$hours} hours + } in a language with a personal goal +set-a-goal = Set a goal +cant-decide = Can't decide? +activity-needed-calculation-plural = { NUMBER($totalHours) -> + [one] {$totalHours} hour + *[other] {$totalHours} hours + } is achievable in just over { NUMBER($periodMonths) -> + [one] {$periodMonths} month + *[other] {$periodMonths} months + } if { NUMBER($people) -> + [one] {$people} person + *[other] {$people} people + } record { NUMBER($clipsPerDay) -> + [one] {$clipsPerDay} clip + *[other] {$clipsPerDay} clips + } a day. +how-many-per-day = Great! How many clips per day? +how-many-a-week = Great! How many clips a week? +which-goal-type = Do you want to Speak, Listen or both? +receiving-emails-info = You're currently set to receive emails such as goal reminders, my + progress updates and newsletters about Common Voice +not-receiving-emails-info = You're currently set to NOT receive emails such as goal reminders, my + progress updates and newsletters about Common Voice +n-clips-pluralized = { NUMBER($count) -> + [one] {$count} clip + *[other] {$count} clips + } +help-share-goal = Help us find more voices, share your goal +confirm-goal = Confirm Goal +goal-interval-weekly = Weekly +# $type is one of share-goal-type-* +share-n-daily-contribution-goal = Share your { $count } Clip Daily Goal for { $type } +# $type is one of share-goal-type-* +share-n-weekly-contribution-goal = Share your { $count } Clip Weekly Goal for { $type } +share-goal-type-speak = Speaking +share-goal-type-listen = Listening +share-goal-type-both = Speaking and Listening +# LINK will be replaced with the current URL +goal-share-text = I just created a personal goal for voice donation to #CommonVoice -- join me and help teach machines how real people speak { $link } +weekly-goal-created = Your weekly goal has been created +daily-goal-created = Your daily goal has been created +track-progress = Track progress here and on your stats page. +return-to-edit-goal = Return here to edit your goal anytime. +share-goal = Share my goal + +## Profile Delete +delete-q = Would you like to request your voice recordings be deleted too, or do you prefer to keep them in the Common Voice dataset? +keep = Keep +remove = Remove +keep-info = Your anonymous voice recordings will remain in the Common Voice dataset. Once you delete your profile you will no longer be able to submit a request to remove your recordings from the dataset +remove-info = We will review your request to remove your voice recordings from the dataset. If your request is approved, we will contact those who have downloaded the dataset and request they remove your voice recordings as well. +why-delete-recordings = Common Voice recordings are used by academics, small businesses, and voice recognition enthusiasts to help train and grow publicly available resources like voice models. + + Can you let us know why you would like your recordings deleted? +profile-form-delete = Delete Profile + +## Profile Download +download-q = Need to download your data? +download-info = Tell us what you'd like to download: +download-profile-title = Profile +download-profile-info = Includes email, username & demographic info, available right away +download-profile-size = A few bytes +download-recordings-title = Recordings +download-recordings-info = Includes mp3s and related sentences, may take some time to prepare +download-recordings-size = Typically megabytes +download-recordings-unavailable = You cannot request your recordings while another request is already in progress. +download-recently-requested = You can request a new takeout of your recordings every { $days } days. +download-size = Size +download-selected = Selected +download-start = Download profile data +download-request = Request recordings +download-requests = Past recordings download requests +download-requests-info = When you request your recordings, we compile them into one or multiple ZIP files. Here are your past requests: +download-request-button = Download +download-request-title = { $created } +download-request-description = { $clipCount } voice clips, total archive size { $size }. Expires { $expires }. +download-request-archive-single = Single ZIP file containing +download-request-archive-multiple = Split into { $archiveCount } ZIP files containing +download-request-assembling-description = Your files are being assembled. Please check again later. +download-request-refresh-button = Refresh +download-request-modal-title = Download Links +download-request-modal-description = Here are the links to download your ZIP files. +download-request-link-text = Zip #{ $offset } of { $total } +download-request-metadata-link = Sentence text +download-request-link-single = You can also copy and paste the direct URLs into your favorite download manager. They will expire in 12 hours, but you can come back to this page to generate new ones any time. + +## Landing +welcome-staff = Welcome { $company } staff! +help-contribute = You can help build a diverse, open-source dataset by creating a Common Voice profile and contributing your voice. +login-company = Log In / Sign Up with { $company } email +profile-not-required = Make sure to sign up before contributing! +read-more-about = Read more on our About page + + +## DemoLayout +demo-get-started = Let's Get Started +demo-welcome = Welcome to Common Voice +demo-welcome-subheader = Interested in learning more and contributing to the project? + +## Demo Datasets +demo-language-select-card-header = Common Voice is the world’s largest publicly available, multi-language voice dataset. +demo-language-select-card-body = Thanks to contributions from over 259k people in over 50 languages, this data is being used to train speech-enabled applications to better respond to the human voice. +card-button-next = Next +card-button-back = Back +demo-language-select-label = Browse Languages +demo-eofy-header = 2019 End-of-Year Release +demo-eofy-sub_header = Voice Dataset, Ready for Download +demo-account = Account + +## Demo Account +demo-account-card-header = Having an account is not required to contribute, though it is helpful. +demo-account-card-body = To the right we outline the benefits and clarify what information we make public. Use the links below to get started with a Common Voice account on your own device. +demo-account-enter-email = +.label = Enter email to send a sign up link +demo-account-sign-up = Send sign up link + +## Demo Contribute +demo-contribute-card-header = Ready to add your voice or lend your ear? +demo-contribute-card-body-v2 = Now that you know a little bit more about Common Voice, why not try it out? Click on the microphone icon to start reading sentences aloud.

If you prefer to review other people's voice contributions, click on the play icon. You’ll help confirm that recordings match the sentences written on screen. +demo-listen-subtitle = Ready to contribute? + +## Demo Dashboard +demo-dashboard-card-header = Personal dashboards keep you up-to-date with individual and community progress. +demo-dashboard-card-body = For every voice clip donated, and every audio clip validated, your account dashboards are updated to reflect your latest progress in each language you contribute to. Yes, you can contribute to more than one!

Use dashboards to track your stats, see how you're doing alongside others in the community, and set daily or weekly contribution goals. + + + +## Validation criteria +contribution-criteria-nav = Criteria +contribution-criteria-link = Understand contribution criteria + +contribution-criteria-page-title = Contribution Criteria +contribution-criteria-page-description = Understand what to look for when listening to voice clips and help make your voice recordings richer too! +contribution-for-example = for example + +contribution-misreadings-title = Misreadings +contribution-misreadings-description = When listening, check very carefully that what has been recorded is exactly what has been written; reject if there are even minor errors.
Very common mistakes include: +contribution-misreadings-description-extended-list-1 = Missing 'A' or 'The' at the beginning of the recording. +contribution-misreadings-description-extended-list-2 = Missing an 's' at the end of a word. +contribution-misreadings-description-extended-list-3 = Reading contractions that aren't actually there, such as "We're" instead of "We are", or vice versa. +contribution-misreadings-description-extended-list-4 = Missing the end of the last word by cutting off the recording too quickly. +contribution-misreadings-description-extended-list-5 = Taking several attempts to read a word. + +contribution-misreadings-example-1-title = The giant dinosaurs of the Triassic. +contribution-misreadings-example-2-title = The giant dinosaur of the Triassic. +contribution-misreadings-example-2-explanation = [Should be ‘dinosaurs’] +contribution-misreadings-example-3-title = The giant dinosaurs of the Triassi-. +contribution-misreadings-example-3-explanation = [Recording cut off before the end of the last word] +contribution-misreadings-example-4-title = The giant dinosaurs of the Triassic. Yes. +contribution-misreadings-example-4-explanation = [More has been recorded than the required text] +contribution-misreadings-example-5-title = We are going out to get coffee. +contribution-misreadings-example-6-title = We’re going out to get coffee. +contribution-misreadings-example-6-explanation = [Should be “We are”] +contribution-misreadings-example-7-title = We are going out to get a coffee. +contribution-misreadings-example-7-explanation = [No ‘a’ in the original text] +contribution-misreadings-example-8-title = The bumblebee sped by. +contribution-misreadings-example-8-explanation = [Mismatched content] + +contribution-varying-pronunciations-title = Varying Pronunciations +contribution-varying-pronunciations-description = Be cautious before rejecting a clip on the ground that the reader has mispronounced a word, has put the stress in the wrong place, or has apparently ignored a question mark. There are a wide variety of pronunciations in use around the world, some of which you may not have heard in your local community. Please provide a margin of appreciation for those who may speak differently from you. +contribution-varying-pronunciations-description-extended = On the other hand, if you think that the reader has probably never come across the word before, and is simply making an incorrect guess at the pronunciation, please reject. If you are unsure, use the skip button. +contribution-varying-pronunciations-example-1-title = On his head he wore a beret. +contribution-varying-pronunciations-example-1-explanation = [‘Beret’ is OK whether with stress on the first syllable (UK) or the second (US)] +contribution-varying-pronunciations-example-2-title = His hand was rais-ed. +contribution-varying-pronunciations-example-2-explanation = [‘Raised’ in English is always pronounced as one syllable, not two] + +contribution-background-noise-title = Background Noise +contribution-background-noise-description = We want the machine learning algorithms to able to handle a variety of background noise, and even relatively loud noises can be accepted provided that they don’t prevent you from hearing the entirety of the text. Quiet background music is OK; music loud enough to prevent you from hearing each and every word is not. +contribution-background-noise-description-extended = If the recording breaks up, or has crackles, reject unless the entirety of the text can still be heard. +contribution-background-noise-example-1-fixed-title = [Sneeze] The giant dinosaurs of the [cough] Triassic. +contribution-background-noise-example-2-fixed-title = The giant dino [cough] the Triassic. +contribution-background-noise-example-2-explanation = [Part of the text can’t be heard] +contribution-background-noise-example-3-fixed-title = [Crackle] giant dinosaurs of [crackle] -riassic. + +contribution-background-voices-title = Background Voices +contribution-background-voices-description = A quiet background hubbub is OK, but we don’t want additional voices that may cause a machine algorithm to identify words that are not in the written text. If you can hear distinct words apart from those of the text, the clip should be rejected. Typically this happens where the TV has been left on, or where there is a conversation going on nearby. +contribution-background-voices-description-extended = If the recording breaks up, or has crackles, reject unless the entirety of the text can still be heard. +contribution-background-voices-example-1-title = The giant dinosaurs of the Triassic. [read by one voice] +contribution-background-voices-example-1-explanation = Are you coming? [called by another] + +contribution-volume-title = Volume +contribution-volume-description = There will be natural variations in volume between readers. Reject only if the volume is so high that the recording breaks up, or (more commonly) if it is so low that you can’t hear what is being said without reference to the written text. + +contribution-reader-effects-title = Reader Effects +contribution-reader-effects-description = Most recordings are of people talking in their natural voice. You can accept the occasional non-standard recording that is shouted, whispered, or obviously delivered in a ‘dramatic’ voice. Please reject sung recordings and those using a computer-synthesized voice. + +contribution-just-unsure-title = Just Unsure? +contribution-just-unsure-description = If you come across something that these guidelines don’t cover, please vote according to your best judgement. If you really can’t decide, use the skip button and go on to the next recording. + +see-more = See more +see-less = See less + +# Don't rename the following section, its contents are auto-inserted based on the name. These strings are +# automatically exported from Sentence Collector. +# [SentenceCollector] +## HEADER/FOOTER +sc-header-home = Home +sc-header-how-to = How-to +sc-header-add = Add +sc-header-review = Review +sc-header-rejected = Rejected Sentences +sc-header-my = My Sentences +sc-header-statistics = Statistics +sc-header-profile = Profile +sc-footer-discourse = Discourse +sc-footer-report-bugs = Report Bugs +sc-footer-translate = Translate this page +sc-footer-report-copyright = Report copyright issues +sc-footer-privacy = Privacy +sc-footer-terms = Terms +sc-footer-cookies = Cookies +sc-login-signup-button = Login / Signup +sc-logout-button = Logout + +## HOME +sc-home-title = Welcome to the Common Voice Sentence Collector +sc-home-intro = The Sentence Collector is part of Common Voice. It allows contributors to collect and validate sentences created by the community. You can use this tool also to import and clean-up small-to-medium-sized public domain corpus you have found or collected. All sentences need to be Public Domain. Approved sentences are exported every week to the Common Voice repository and are released on the Common Voice website on every new deployment. +sc-home-collect-title = Collect sentences +sc-home-collect-text = Help us by writing or collecting Public Domain sentences. +sc-home-review-title = Review sentences +sc-home-review-text = Help us by reviewing sentences for correctness according to the guidelines. + +## HOW-TO +sc-howto-title = How to +sc-howto-addlang-title = Adding languages to work with +sc-howto-addlang-text = Once logged in you can select your languages from the profile section. +sc-howto-addsen-title = Add new sentences +sc-howto-addsen-item-1 = All sentences you submit must be under Public Domain (CC-0) license. To support the inclusion of work not under public licence, we have created a Contributions Agreement template for works where the copyright owner would like to contribute the material to Common Voice. +sc-howto-addsen-item-2 = Numbers. There should be no digits in the source text because they can cause problems when read aloud. The way a number is read depends on context and might introduce confusion in the dataset. For example, the number “2409” could be accurately read as both “twenty-four zero nine” and “two thousand four hundred nine”. +sc-howto-addsen-item-3 = Abbreviations and Acronyms. Abbreviations and acronyms like “USA” or “ICE” should be avoided in the source text because they may be read in a way that does not coincide with their spelling. Additionally, there may be multiple accurate readings for a single abbreviation. For example, the acronym “ICE” could be pronounced “I-C-E” or as a single word. +sc-howto-addsen-item-4 = Punctuation. Special symbols and punctuation should only be included when absolutely necessary. For example, an apostrophe is included in English words like “don’t” and “we’re” and should be included in the source text, but it’s unlikely you’ll ever need a special symbol like “@” or “#.” +sc-howto-addsen-item-5 = Foreign letters. Letters must be valid in the language being spoken. For example, “ж” is a letter in the Russian alphabet but is never used in English and so should never appear in any English source text. +sc-howto-addsen-item-6 = Languages can have their own validation rules with additional requirements. If there is no specific validation file for a language, we are using the generic English rules. +sc-howto-addsen-post-1 = We prefer natural/conversational sentences. While phonetic diversity and different words in sentences is important, we are trying to make recording sentences as much fun as possible. Therefore it would be great if you could try to keep your sentences as natural/engaging as possible. +sc-howto-cite-title = How to Cite +sc-howto-cite-pre-1 = It's important that you reference where you found the public licence to avoid plagiarism and to allow for follow ups on copyright issues. Here are a few ways you can cite the work. +sc-howto-cite-item-1 = You could include the website, e.g "Common Voice - https://commonvoice.mozilla.org/" +sc-howto-cite-item-2 = You could use academic referencing style, e.g Harvard style "Mozilla (2021) Common Voice. Available at https://commonvoice.mozilla.org/ (Accessed: 15th September 2021)" +sc-howto-cite-item-3 = For public domain text not available online, you could use academic referencing style e.g Harvard style "Jess (2021) My Public licence poems" +sc-howto-review-title = Review Sentences +sc-howto-review-subtitle = Make sure the sentence meets the following criteria: +sc-howto-review-criteria-1 = The sentence must be spelled correctly. +sc-howto-review-criteria-2 = The sentence must be grammatically correct. +sc-howto-review-criteria-3 = The sentence must be speakable. +sc-howto-review-criteria-4 = If the sentence meets the criteria, click the "Approve" button. +sc-howto-review-criteria-5 = If the sentence does not meet the above criteria, click the "Reject" button. If you are unsure about the sentence, you may also skip it and move on to the next one. +sc-howto-review-criteria-6 = If you run out of sentences to review, please help us collect more sentences! +sc-howto-findpd-title = Finding existing sentences in the Public Domain +sc-howto-findpd-subtitle = Search for them on the Internet +sc-howto-findpd-text-2 = Remember that we need permission to publish those sentences, so always ensure that the text belongs to the public domain. If there is no explicit indication, reach out to the person that the text belongs to and ask if they want to contribute their text to the Public Domain. If they want to, help them go through the Contributions Agreement process. If they do not want to contribute the text, then you are not allowed to use that text. +sc-howto-findpd-tips = Here are some tips to find sentences: +sc-howto-findpd-tips-1 = The best sources you can look for are podcasts, transcripts, movie scripts and anything that potential can contain everyday conversations. +sc-howto-findpd-tips-2 = Government proceedings, books and articles are also great however since the text tends to be a little more formal they are less of a priority. +sc-howto-findpd-tips-3 = Unfortunately we can’t have Wikimedia articles yet. So do not copy paste from there. +sc-howto-findpd-subtitle-2 = Partner with local organizations or individuals +sc-howto-findpd-partner-1 = There are a lot of public organizations that might want to collaborate and already have a lot of texts they can donate as public domain. Reach out to local universities, Governments and open source organizations to talk about the project and ask for their help. +sc-howto-findpd-partner-2 = Expert linguists can also help, try to reach out to local linguistic universities (both teachers and students) and see if they can help to gather a diverse set of sound-diverse sentences in your language. + +## MY SENTENCES +sc-my-title = My Sentences +sc-my-description = This page gives you an overview of all your submitted sentences. You may also delete already submitted sentences if needed, by marking the checkbox next to it and clicking on "Delete selected sentences" at the bottom. Please only remove sentences if absolutely necessary, for example if you noticed after the fact that a sentence is copyright protected. +sc-my-loading = Loading your sentences… +sc-my-err-fetching = Error while fetching your sentences. Please try again. +sc-my-no-sentences = No sentences found! +# Variables: +# $batchId (String) - A unique ID identifying the submission of sentences - sentences uploaded together all have the same batch ID +sc-my-submission = Submission: { $batchId } +# Variables: +# $source (String) - Associated source the user filled out when uploading the sentence +sc-my-source = Source: { $source } +sc-my-delete = Delete selected sentences +sc-my-deleting = Deleting selected sentences… +sc-my-err-failed-delete = Failed to delete selected sentences… Please try again! + +## REJECTED +sc-rejected-title = Rejected Sentences +sc-rejected-loading = Loading rejected sentences… +sc-rejected-err-fetching = Error while fetching rejected sentences. Please try again. +sc-rejected-none-found = No rejected sentences found! + +## STATS +sc-stats-title = Statistics +# Variables: +# $lastUpdate (Date) - Localized date of last statistics update +sc-stats-last-update = Last Update: { $lastUpdate } +sc-stats-last-update-never = Last Update: never +sc-stats-updating = Updating… +# Variables: +# $sentenceCount (Number) - Total number of sentences uploaded through Sentence Collector +# $languageCount (Number) - Total number of languages these sentences represent +sc-stats-summary = The Common Voice Sentence Collector has collected { $sentenceCount } sentences in { $languageCount } languages! + +## ADD +sc-submit-err-select-lang = Please select a language. +sc-submit-err-add-sentences = Please add sentences. +sc-submit-err-add-source = Please add a source. +sc-submit-err-confirm-pd = Please confirm that these sentences are public domain. +sc-submit-prompt = + .message = Sentences not submitted, are you sure you want to leave? +sc-submit-title = Add Sentences +sc-submit-select-language = + .labelText = Select Language +sc-submit-add-sentences = Add public domain sentences +sc-submit-ph-one-per-line = + .placeholder = One sentence per line +sc-submit-from-where = Where are these public domain sentences from? +sc-submit-ph-read-how-to = + .placeholder = Read our How-to if unsure how to attribute +sc-submit-confirm = I confirm that these sentences are public domain and I have permission to upload them. +sc-submit-button = + .submitText = Submit +sc-submit-filtered = Filtered sentences due to requirements failing (please submit fixed versions as new sentences): +sc-submit-guidelines = Please check the guidelines. + +## ADD LANGUAGE +sc-add-lang-could-not-add = Could not add language +sc-add-lang-sec-label = Add a language you want to contribute to +sc-add-lang-sec-button = Add Language +sc-add-err-unexpected = Unexpected response returned from server +# Variables: +# $duplicates (Number) - Number of sentences which got rejected because they are duplicates +sc-add-result = + {$duplicates -> + [0] Submitted sentences. {$duplicates} sentences were rejected as duplicates. + [one] Submitted sentences. {$duplicates} sentence was rejected as duplicate. + *[other] Submitted sentences. {$duplicates} sentences were rejected as duplicates. + } +# Variables: +# $sentences (Number) - Number of sentences which failed to be saved to the database - could be several different reasons +sc-add-err-failed = + {$sentences -> + [0] No sentences failed + [one] 1 sentence failed + *[other] {$sentences} sentences failed + } +sc-add-err-submission = Submission Error +sc-add-lang-process-notice = If your language is not listed here, you can request it through this process. + +## ADD SENTENCES CONFIRMATION +sc-confirm-are-you-sure = + .message = Sentences not submitted, are you sure you want to leave? +sc-confirm-sentences-title = Confirm New Sentences +# Variables: +# $countOfSentences (Number) - Number of sentences the user has filled in the submission form +sc-confirm-sentences-found = + {$countOfSentences -> + [0] No sentences found. + [one] 1 sentence found. + *[other] {$countOfSentences} sentences found. + } +# Variables: +# $countOfInvalidated (Number) - Number of sentences the user rejected in the review form before submission +sc-confirm-rejected-by-you = { $countOfInvalidated } rejected by you +sc-confirm-already-reviewed = + {$countOfReviewed -> + [0] No sentence is already reviewed. + [one] 1 sentence is already reviewed. Great job! + *[other] {$countOfReviewed} sentences are already reviewed. Great job! + } +# Variables: +# $readyCount (Number) - Number of sentences ready to be uploaded +sc-confirm-ready = + {$readyCount -> + [0] No sentence ready for submission! + [one] 1 sentence ready for submission! + *[other] {$readyCount} sentences ready for submission! + } +# Variables: +# $countOfUnreviewed (Number) - Number of sentences unreviewed before the upload +sc-confirm-unreviewed = { $countOfUnreviewed } sentences are unreviewed. If you want, you can also review your sentences now before submitting them. +sc-confirm-button-text = Confirm +sc-confirm-uploading = Sentences are being uploaded. This can take several minutes depending on the number of sentences added. Please do not close this website. + +## LANGUAGE INFO +# Variables: +# $totalSentences (Number) - Number of sentences uploaded in total for this language +sc-lang-info-total = + {$totalSentences -> + [0] No total sentences. + [one] 1 total sentence. + *[other] {$totalSentences} total sentences. + } +# Variables: +# $totalInReview (Number) - Number of sentences currently in the review state for this language +sc-lang-info-in-review = + {$totalInReview -> + [0] No sentences in review. + [one] 1 sentence in review. + *[other] {$totalInReview} sentences in review. + } +# Variables: +# $unreviewedSentencesByYou (Number) - Number of sentences the user can still review +sc-lang-info-left-for-you = + {$unreviewedSentencesByYou -> + [0] No sentences left for you to review. + [one] 1 sentence left for you to review. + *[other] {$unreviewedSentencesByYou} sentences left for you to review. + } +sc-lang-info-review-now = Review now! +sc-lang-info-add-more = Add more sentences now! +# Variables: +# $validatedSentences (Number) - Number of sentences which have been approved for this language +sc-lang-info-validated = + {$validatedSentences -> + [0] No validated sentences. + [one] 1 validated sentence. + *[other] {$validatedSentences} validated sentences. + } +# Variables: +# $rejectedSentences (Number) - Number of sentences which have been rejected for this language +sc-lang-info-rejected = + {$rejectedSentences -> + [0] No rejected sentences. + [one] 1 rejected sentence. + *[other] {$rejectedSentences} rejected sentences. + } + +## LOGIN +sc-login-err-failed = Login failed +sc-login-err-try-again = Please try again. + +## PROFILE +# Variables: +# $username (String) - eMail address of the logged in user +sc-profile-title = Profile: { $username } +sc-personal-err-lang-not-found = Could not remove language: language not found +sc-personal-err-remove = Could not remove language +sc-personal-your-languages = Your languages: +sc-personal-remove-button = remove +# Variables: +# $sentences (Number) - Number of sentences that were added by the currently logged in user for this language +sc-personal-added-by-you = { $sentences } added by you +sc-personal-not-added = You have not added any languages yet. + +## REVIEW CRITERIA +sc-criteria-modal = ⓘ Review Criteria +sc-criteria-title = Review Criteria +sc-criteria-make-sure = Make sure the sentence meets the following criteria: +sc-criteria-item-1 = The sentence must be spelled correctly. +sc-criteria-item-2 = The sentence must be grammatically correct. +sc-criteria-item-3 = The sentence must be speakable. +sc-criteria-item-4 = If the sentence meets the criteria, click the "Approve" button on the right. +sc-criteria-item-5-2 = If the sentence does not meet the above criteria, click the "Reject" button on the left. If you are unsure about the sentence, you may also skip it and move on to the next one. +sc-criteria-item-6 = If you run out of sentences to review, please help us collect more sentences! + +## REVIEW +sc-review-lang-not-selected = You have not selected any languages. Please go to your Profile to select languages. +sc-review-title = Review Sentences +sc-review-loading = Loading sentences… +sc-review-select-language = Please select a language to review sentences. +sc-review-no-sentences = No sentences to review. Add more sentences now! +sc-review-form-prompt = + .message = Reviewed sentences not submitted, are sure? +sc-review-form-usage = Swipe right to approve the sentence. Swipe left to reject it. Swipe up to skip it. Do not forget to submit your review! +# Variables: +# $sentenceSource (Number) - Associated source the user filled out when uploading the sentence +sc-review-form-source = Source: { $sentenceSource } +sc-review-form-button-reject = Reject +sc-review-form-button-skip = Skip +sc-review-form-button-approve = Approve +# Keyboard shortcut to use to approve a sentence (sc-review-form-button-approve) +sc-review-form-button-approve-shortcut = Y +# Keyboard shortcut to use to reject a sentence (sc-review-form-button-reject) +sc-review-form-button-reject-shortcut = N +# Keyboard shortcut to use to skip a sentence (sc-review-form-button-skip) +sc-review-form-button-skip-shortcut = S +sc-review-form-keyboard-usage-custom = You can also use Keyboard Shortcuts: { sc-review-form-button-approve-shortcut } to Approve, { sc-review-form-button-reject-shortcut } to Reject, { sc-review-form-button-skip-shortcut } to Skip +sc-review-form-button-submit = + .submitText = Finish Review +# Variables: +# $sentences (Number) - Number of sentences the user has reviewed in this session +sc-review-form-reviewed-message = + {$sentences -> + [0] No sentences reviewed. + [one] 1 sentence reviewed. Thank you! + *[other] { $sentences } sentences reviewed. Thank you! + } +sc-review-form-review-failure = Review could not be saved. Please try again later. +sc-review-link = Review + +## SETTINGS +sc-settings-title = Settings +sc-settings-ui-language = Interface Language +sc-settings-language-translated-warning = The pages for this language might not be fully translated. You can help out with translation on Pontoon. +sc-settings-reset-skipped = Reset skipped sentences +sc-settings-skipped-decription = You previously skipped sentences while reviewing. Resetting skipped sentences will show all skipped sentences again. This is independent of the language. +sc-settings-show-all-button = Show all skipped sentences again +sc-settings-failed = Could not change settings. Please try again. + +# VALIDATION +sc-validation-number-of-words = Sentence must contain between 1 and 14 (inclusive) words +sc-validation-no-numbers = Sentence should not contain numbers +sc-validation-no-symbols = Sentence should not contain symbols +sc-validation-no-abbreviations = Sentence should not contain abbreviations + +# [/SentenceCollector] + +localization-select = + .label = Choose language/localization