From 4210e677ac7c50f8831c15b302bd270e2fc4cae9 Mon Sep 17 00:00:00 2001 From: Dale Lane Date: Mon, 25 Mar 2019 13:51:15 +0000 Subject: [PATCH] docs: Document storage implications for training data Contributes to: #172 Signed-off-by: Dale Lane --- public/components/help/help.html | 16 ++++++++++++++++ public/languages/de.json | 9 ++++++++- public/languages/en.json | 9 ++++++++- public/languages/es.json | 9 ++++++++- public/languages/fr.json | 9 ++++++++- public/languages/ko.json | 9 ++++++++- public/languages/nl-be.json | 9 ++++++++- public/languages/pt-br.json | 9 ++++++++- public/languages/si-lk.json | 9 ++++++++- public/languages/sv-se.json | 9 ++++++++- public/languages/tr.json | 9 ++++++++- public/languages/zh-cn.json | 9 ++++++++- 12 files changed, 104 insertions(+), 11 deletions(-) diff --git a/public/components/help/help.html b/public/components/help/help.html index 8754c3b98..a23a9052a 100644 --- a/public/components/help/help.html +++ b/public/components/help/help.html @@ -379,6 +379,22 @@

+
+
+

+ +

+
+
+
+

+

+

+

+

+
+
+
+ diff --git a/public/languages/de.json b/public/languages/de.json index 490a1fdaa..226d1d204 100644 --- a/public/languages/de.json +++ b/public/languages/de.json @@ -1007,7 +1007,14 @@ "Q4-A-6": "Allgemeine Information, die in allen Accounts gespeichert wird", "Q4-A-7": "Für das Benutzermanagement bei Machine Learnign for Kids wird der Service Auth0 genutzt. Auth0 speichert die IP Adresse und den Browser, den du benutzt.", "Q4-A-8": "Um Fehler im Webbrowser festzustellen, nutzt Machine Learning for Kids den Service Sentry. Wenn ein Fehler auftritt, werde der Benutzername, die IP Adresse, die Browserart und eine technische Beschreibung des Fehlers, gesammelt.", - "Q4-A-9": "Wir nutzen Google Analytics, um einen Überblick darüber zu erhalten, wie viele Nutzer unsere Plattform - Machine Learning for Kids - jeden Tag besuchen. Getrackte geographische Informationen sowie Informationen über den genutzten Browser werden nur in anonymisierter Form angezeigt." + "Q4-A-9": "Wir nutzen Google Analytics, um einen Überblick darüber zu erhalten, wie viele Nutzer unsere Plattform - Machine Learning for Kids - jeden Tag besuchen. Getrackte geographische Informationen sowie Informationen über den genutzten Browser werden nur in anonymisierter Form angezeigt.", + + "Q5": "What happens to training data created by students?", + "Q5-A-1": "A step in all machine learning projects that students do using this site is to create or collect training examples. For text projects, this can mean typing in short text passages. For image projects, this can mean drawing pictures onto an on-screen canvas or taking photos using the webcam. For numbers projects, this means typing in sets of numbers.", + "Q5-A-2": "All of these training examples are stored in a MySQL database hosted on IBM Cloud. 
As the database administrator, I have access to all of these training examples for all student projects; however, I do not use them for any purpose other than enabling students to access and work on their own projects. I do not publish the training data (either publicly or to individuals or third parties) or otherwise share it, with the two exceptions of submitting it to the IBM Watson APIs described below.", + "Q5-A-3": "Machine learning models for text projects are created using the IBM Watson Assistant cloud service, which means when students train a model, a copy of the training examples that they have entered will be submitted to IBM Watson. IBM Watson does not use these training examples for any other purposes. This is because Machine Learning for Kids requests an opt-out for student training examples being used by IBM to improve the service, as described in the Watson documentation.", + "Q5-A-4": "Machine learning models for image projects are created using the IBM Visual Recognition cloud service, which means when students train a model, a copy of their training images will be uploaded to IBM Watson. IBM Watson does not use these training examples for any other purposes. This is because Machine Learning for Kids requests an opt-out for student training examples being used by IBM to improve the service, as described in the Watson documentation.", + "Q5-A-5": "IBM Watson provides some general guidance for sharing training data with their services, which also applies to training data created and collected in Machine Learning for Kids. Specifically, students should be advised not to include personally identifiable information in the examples that they collect." 
} } } diff --git a/public/languages/en.json b/public/languages/en.json index 0bb3e8cf8..7e9f9df0e 100644 --- a/public/languages/en.json +++ b/public/languages/en.json @@ -1007,7 +1007,14 @@ "Q4-A-6": "General information stored about all accounts", "Q4-A-7": "User management for Machine Learning for Kids is implemented using the third party service, Auth0. They store the IP address that you last logged into Machine Learning for Kids from, and the type of browser you used. I've never found a reason to use that, but it is stored if I did want to go and look for it.", "Q4-A-8": "Errors that happen in the web browser are captured using the third party service, Sentry. If something goes wrong, it will capture information about the error, including your username, IP address, type of browser you were using, and a technical description of what went wrong.", - "Q4-A-9": "I use Google Analytics so that I know how many users visit Machine Learning for Kids each day. Although it captures information such as geographic location and browser type, this is only ever displayed to me in an anonymised aggregate way." + "Q4-A-9": "I use Google Analytics so that I know how many users visit Machine Learning for Kids each day. Although it captures information such as geographic location and browser type, this is only ever displayed to me in an anonymised aggregate way.", + + "Q5": "What happens to training data created by students?", + "Q5-A-1": "A step in all machine learning projects that students do using this site is to create or collect training examples. For text projects, this can mean typing in short text passages. For image projects, this can mean drawing pictures onto an on-screen canvas or taking photos using the webcam. For numbers projects, this means typing in sets of numbers.", + "Q5-A-2": "All of these training examples are stored in a MySQL database hosted on IBM Cloud. 
As the database administrator, I have access to all of these training examples for all student projects; however, I do not use them for any purpose other than enabling students to access and work on their own projects. I do not publish the training data (either publicly or to individuals or third parties) or otherwise share it, with the two exceptions of submitting it to the IBM Watson APIs described below.", + "Q5-A-3": "Machine learning models for text projects are created using the IBM Watson Assistant cloud service, which means when students train a model, a copy of the training examples that they have entered will be submitted to IBM Watson. IBM Watson does not use these training examples for any other purposes. This is because Machine Learning for Kids requests an opt-out for student training examples being used by IBM to improve the service, as described in the Watson documentation.", + "Q5-A-4": "Machine learning models for image projects are created using the IBM Visual Recognition cloud service, which means when students train a model, a copy of their training images will be uploaded to IBM Watson. IBM Watson does not use these training examples for any other purposes. This is because Machine Learning for Kids requests an opt-out for student training examples being used by IBM to improve the service, as described in the Watson documentation.", + "Q5-A-5": "IBM Watson provides some general guidance for sharing training data with their services, which also applies to training data created and collected in Machine Learning for Kids. Specifically, students should be advised not to include personally identifiable information in the examples that they collect." } } } diff --git a/public/languages/es.json b/public/languages/es.json index 9ddd3c024..806c7f2cb 100644 --- a/public/languages/es.json +++ b/public/languages/es.json @@ -1007,7 +1007,14 @@ "Q4-A-6": "Información general sobre todas las cuentas. 
", "Q4-A-7": "La gestión de usuarios de Machine Learning for Kids se lleva a cabo mediante un Servicio de terceros, Auth0. Almacenan la dirección IP del ultimo inicio de session y el tipo de navegador usado. Nunca he encontrado una razón para usarlo, pero se guarda por si resulta necesario..", "Q4-A-8": "Los errors del navegador se recogen mediante un servicio de tercerosa Sentry. Si algo falla, recogerá la información del error, incluyendo nombre de usurio, dirección IP, tipo de navegador y una descripción técnica de lo que ha fallado.", - "Q4-A-9": "Uso Google Analytics para saber cuántos usuarios visitan visit Machine Learning for Kids cada día. Aunque también recoge información geográfica o tipo de navegador, esto solo puedo verlo de forma agregada y anonimizada." + "Q4-A-9": "Uso Google Analytics para saber cuántos usuarios visitan visit Machine Learning for Kids cada día. Aunque también recoge información geográfica o tipo de navegador, esto solo puedo verlo de forma agregada y anonimizada.", + + "Q5": "What happens to training data created by students?", + "Q5-A-1": "A step in all machine learning projects that students do using this site is to create or collect training examples. For text projects, this can mean typing in short text passages. For image projects, this can means drawing pictures onto an on-screen canvas or taking photos using the webcam. For numbers projects, this means typing in sets of numbers", + "Q5-A-2": "All of these training examples are stored in a MySQL database hosted on IBM Cloud. As the database administrator, I have access to all of these training examples for all student projects, however I do not use it for any other purposes other than enabling students to access and work on their own projects. 
I do not publish the training data (either publicly or to individuals or third parties) or otherwise share it, with the two exceptions of submitting it to IBM Watson APIs described below.", + "Q5-A-3": "Machine learning models for text projects are created using the IBM Watson Assistant cloud service, which means when students train a model, a copy of the training examples that they have entered will be submitted to IBM Watson. IBM Watson does not use these training examples for any other purposes. This is because Machine Learning for Kids requests an opt-out for student training examples being used by IBM to improve the service, as described in the Watson documentation.", + "Q5-A-4": "Machine learning models for images projects are created using the IBM Visual Recognition cloud service, which means when students train a model, a copy of their training images will be uploaded to IBM Watson. IBM Watson does not use these training examples for any other purposes. This is because Machine Learning for Kids requests an opt-out for student training examples being used by IBM to improve the service, as described in the Watson documentation.", + "Q5-A-5": "IBM Watson provides some general guidance for sharing training data with their services, which also apply to training data created and collected in Machine Learning for Kids. Specifically, students should be advised not to include personally identifiable information in the examples that they collect." } } } diff --git a/public/languages/fr.json b/public/languages/fr.json index 43bc47afb..c2cf2e1d8 100644 --- a/public/languages/fr.json +++ b/public/languages/fr.json @@ -1007,7 +1007,14 @@ "Q4-A-6": "Informations générales stockées sur tous les comptes", "Q4-A-7": "La gestion des utilisateurs pour Machine Learning for Kids est implémentée en utilisant le service tiers, Auth0. 
Ils enregistrent l'adresse IP à partir de laquelle vous vous êtes connecté pour la dernière fois à Machine Learning for Kids et le type de navigateur que vous avez utilisé. Je n'ai jamais trouvé de raison de l'utiliser, mais il est stocké si je veux aller le chercher.", "Q4-A-8": "Les erreurs qui se produisent dans le navigateur Web sont capturées en utilisant le service tiers, Sentry. Si quelque chose ne va pas, il saisira des informations sur l'erreur, y compris votre nom d'utilisateur, votre adresse IP, le type de navigateur que vous utilisiez et une description technique de ce qui a dysfonctionné.", - "Q4-A-9": "J'utilise Google Analytics pour savoir combien d'utilisateurs visitent Machine Learning for Kids chaque jour. Bien qu'il capture des informations telles que l'emplacement géographique et le type de navigateur, il ne me les affiche uniquement que sous forme d'agrégat anonyme." + "Q4-A-9": "J'utilise Google Analytics pour savoir combien d'utilisateurs visitent Machine Learning for Kids chaque jour. Bien qu'il capture des informations telles que l'emplacement géographique et le type de navigateur, il ne me les affiche uniquement que sous forme d'agrégat anonyme.", + + "Q5": "What happens to training data created by students?", + "Q5-A-1": "A step in all machine learning projects that students do using this site is to create or collect training examples. For text projects, this can mean typing in short text passages. For image projects, this can means drawing pictures onto an on-screen canvas or taking photos using the webcam. For numbers projects, this means typing in sets of numbers", + "Q5-A-2": "All of these training examples are stored in a MySQL database hosted on IBM Cloud. As the database administrator, I have access to all of these training examples for all student projects, however I do not use it for any other purposes other than enabling students to access and work on their own projects. 
I do not publish the training data (either publicly or to individuals or third parties) or otherwise share it, with the two exceptions of submitting it to IBM Watson APIs described below.", + "Q5-A-3": "Machine learning models for text projects are created using the IBM Watson Assistant cloud service, which means when students train a model, a copy of the training examples that they have entered will be submitted to IBM Watson. IBM Watson does not use these training examples for any other purposes. This is because Machine Learning for Kids requests an opt-out for student training examples being used by IBM to improve the service, as described in the Watson documentation.", + "Q5-A-4": "Machine learning models for images projects are created using the IBM Visual Recognition cloud service, which means when students train a model, a copy of their training images will be uploaded to IBM Watson. IBM Watson does not use these training examples for any other purposes. This is because Machine Learning for Kids requests an opt-out for student training examples being used by IBM to improve the service, as described in the Watson documentation.", + "Q5-A-5": "IBM Watson provides some general guidance for sharing training data with their services, which also apply to training data created and collected in Machine Learning for Kids. Specifically, students should be advised not to include personally identifiable information in the examples that they collect." } } } diff --git a/public/languages/ko.json b/public/languages/ko.json index 78316f10d..ee5982a65 100644 --- a/public/languages/ko.json +++ b/public/languages/ko.json @@ -1007,7 +1007,14 @@ "Q4-A-6": "모든 계정에 대해 저장되는 일반 정보", "Q4-A-7": "아이들을 위한 머신러닝의 사용자 관리는 서드파티 서비스 인 Auth0를 사용합니다. 그들은 아이들을 위한 머신러닝에 마지막으로 로그인 한 IP 주소와 사용한 브라우저 유형을 저장합니다. 그 이유는 알지 못하지만 그 정보를 볼 수 있습니다.", "Q4-A-8": "웹 브라우저에서 발생하는 오류는 서드파티 서비스인 Sentry 를 사용하여 캡처됩니다. 
문제가 발생하면, 사용자 이름, IP 주소, 사용하고 있는 브라우저 유형 및 잘못된 점에 대한 기술적 설명을 포함하여 오류에 대한 정보를 캡처합니다.", - "Q4-A-9": " Google Analytics 를 사용하여 얼마나 많은 사람들이 아이들을 위한 머신러닝 사이트에 방문하는지 알고 있습니다. 지리적 위치 및 브라우저 유형과 같은 정보는 캡처되지만 이것은 익명의 통합 방식으로 표시됩니다." + "Q4-A-9": " Google Analytics 를 사용하여 얼마나 많은 사람들이 아이들을 위한 머신러닝 사이트에 방문하는지 알고 있습니다. 지리적 위치 및 브라우저 유형과 같은 정보는 캡처되지만 이것은 익명의 통합 방식으로 표시됩니다.", + + "Q5": "What happens to training data created by students?", + "Q5-A-1": "A step in all machine learning projects that students do using this site is to create or collect training examples. For text projects, this can mean typing in short text passages. For image projects, this can means drawing pictures onto an on-screen canvas or taking photos using the webcam. For numbers projects, this means typing in sets of numbers", + "Q5-A-2": "All of these training examples are stored in a MySQL database hosted on IBM Cloud. As the database administrator, I have access to all of these training examples for all student projects, however I do not use it for any other purposes other than enabling students to access and work on their own projects. I do not publish the training data (either publicly or to individuals or third parties) or otherwise share it, with the two exceptions of submitting it to IBM Watson APIs described below.", + "Q5-A-3": "Machine learning models for text projects are created using the IBM Watson Assistant cloud service, which means when students train a model, a copy of the training examples that they have entered will be submitted to IBM Watson. IBM Watson does not use these training examples for any other purposes. 
This is because Machine Learning for Kids requests an opt-out for student training examples being used by IBM to improve the service, as described in the Watson documentation.", + "Q5-A-4": "Machine learning models for images projects are created using the IBM Visual Recognition cloud service, which means when students train a model, a copy of their training images will be uploaded to IBM Watson. IBM Watson does not use these training examples for any other purposes. This is because Machine Learning for Kids requests an opt-out for student training examples being used by IBM to improve the service, as described in the Watson documentation.", + "Q5-A-5": "IBM Watson provides some general guidance for sharing training data with their services, which also apply to training data created and collected in Machine Learning for Kids. Specifically, students should be advised not to include personally identifiable information in the examples that they collect." } } } diff --git a/public/languages/nl-be.json b/public/languages/nl-be.json index b88559792..90729fcbe 100644 --- a/public/languages/nl-be.json +++ b/public/languages/nl-be.json @@ -1007,7 +1007,14 @@ "Q4-A-6": "Algemene informatie opgeslagen over alle accounts", "Q4-A-7": "Gebruikersmanagement voor Machine Learning voor Kids is geïmplementeerd door de derde partij service, Auth0. Zij slaan het IP adres op waarmee je laatst inlogde op Machine Learning voor Kids en het type browser dat je gebruikte. Ik ken hiervoor de reden niet.", "Q4-A-8": "Fouten die voorkomen in de webbrowser worden opgemerkt door de derde partij service, Sentry. Als er iets misloopt, wordt er informatie over de fout, inclusief je gebruikersnaam, IP adres en type browser dat je gebruikt opgeslagen, net als een technische beschrijving van wat er misliep.", - "Q4-A-9": "Ik gebruik Google Analytics zodat ik weet hoeveel bezoekers er elke dag komen op Machine Learning voor Kids. 
Ondanks dat informatie zoals geografische locatie en browsertype worden opgeslagen, wordt dit enkel op geanonimiseerde en gecombineerde wijze aan mij getoond. " + "Q4-A-9": "Ik gebruik Google Analytics zodat ik weet hoeveel bezoekers er elke dag komen op Machine Learning voor Kids. Ondanks dat informatie zoals geografische locatie en browsertype worden opgeslagen, wordt dit enkel op geanonimiseerde en gecombineerde wijze aan mij getoond. ", + + "Q5": "What happens to training data created by students?", + "Q5-A-1": "A step in all machine learning projects that students do using this site is to create or collect training examples. For text projects, this can mean typing in short text passages. For image projects, this can means drawing pictures onto an on-screen canvas or taking photos using the webcam. For numbers projects, this means typing in sets of numbers", + "Q5-A-2": "All of these training examples are stored in a MySQL database hosted on IBM Cloud. As the database administrator, I have access to all of these training examples for all student projects, however I do not use it for any other purposes other than enabling students to access and work on their own projects. I do not publish the training data (either publicly or to individuals or third parties) or otherwise share it, with the two exceptions of submitting it to IBM Watson APIs described below.", + "Q5-A-3": "Machine learning models for text projects are created using the IBM Watson Assistant cloud service, which means when students train a model, a copy of the training examples that they have entered will be submitted to IBM Watson. IBM Watson does not use these training examples for any other purposes. 
This is because Machine Learning for Kids requests an opt-out for student training examples being used by IBM to improve the service, as described in the Watson documentation.", + "Q5-A-4": "Machine learning models for images projects are created using the IBM Visual Recognition cloud service, which means when students train a model, a copy of their training images will be uploaded to IBM Watson. IBM Watson does not use these training examples for any other purposes. This is because Machine Learning for Kids requests an opt-out for student training examples being used by IBM to improve the service, as described in the Watson documentation.", + "Q5-A-5": "IBM Watson provides some general guidance for sharing training data with their services, which also apply to training data created and collected in Machine Learning for Kids. Specifically, students should be advised not to include personally identifiable information in the examples that they collect." } } } diff --git a/public/languages/pt-br.json b/public/languages/pt-br.json index 57905f525..0ed79ec26 100644 --- a/public/languages/pt-br.json +++ b/public/languages/pt-br.json @@ -1007,7 +1007,14 @@ "Q4-A-6": "Informação geral armazenada de todas as contas", "Q4-A-7": "A gestão de usuários para o Machine Learning for Kids é implementados usando um serviço de terceiros, Auth0. Eles armazenam endereço IP de onde você fez o seu último Login no Machine Learning for Kids, e que tipo de navegador você usou. Eu nunca tive razões para usar isso, mas isso é armazenado para caso eu quisesse procurar por esses dados.", "Q4-A-8": "Erros que acontecem no navegador são capturados por um serviço de terceiros, Sentry. Se algo dá errado, as informações do erro serão capturados, incluindo nome de usuário, endereço IP, tipo de navegador que você está usando, e uma descrição técnica do que aconteceu de errado.", - "Q4-A-9": "Eu uso Google Analytics para saber quantos usuários acessam Machine Learning for Kids todo dia. 
Embora eles tenham informações de localização geográfica e tipo de navegador, isso só me é exibido de forma agregada e anônima." + "Q4-A-9": "Eu uso Google Analytics para saber quantos usuários acessam Machine Learning for Kids todo dia. Embora eles tenham informações de localização geográfica e tipo de navegador, isso só me é exibido de forma agregada e anônima.", + + "Q5": "What happens to training data created by students?", + "Q5-A-1": "A step in all machine learning projects that students do using this site is to create or collect training examples. For text projects, this can mean typing in short text passages. For image projects, this can means drawing pictures onto an on-screen canvas or taking photos using the webcam. For numbers projects, this means typing in sets of numbers", + "Q5-A-2": "All of these training examples are stored in a MySQL database hosted on IBM Cloud. As the database administrator, I have access to all of these training examples for all student projects, however I do not use it for any other purposes other than enabling students to access and work on their own projects. I do not publish the training data (either publicly or to individuals or third parties) or otherwise share it, with the two exceptions of submitting it to IBM Watson APIs described below.", + "Q5-A-3": "Machine learning models for text projects are created using the IBM Watson Assistant cloud service, which means when students train a model, a copy of the training examples that they have entered will be submitted to IBM Watson. IBM Watson does not use these training examples for any other purposes. 
This is because Machine Learning for Kids requests an opt-out for student training examples being used by IBM to improve the service, as described in the Watson documentation.", + "Q5-A-4": "Machine learning models for images projects are created using the IBM Visual Recognition cloud service, which means when students train a model, a copy of their training images will be uploaded to IBM Watson. IBM Watson does not use these training examples for any other purposes. This is because Machine Learning for Kids requests an opt-out for student training examples being used by IBM to improve the service, as described in the Watson documentation.", + "Q5-A-5": "IBM Watson provides some general guidance for sharing training data with their services, which also apply to training data created and collected in Machine Learning for Kids. Specifically, students should be advised not to include personally identifiable information in the examples that they collect." } } } diff --git a/public/languages/si-lk.json b/public/languages/si-lk.json index cef8a9ec0..fb67ce0c7 100644 --- a/public/languages/si-lk.json +++ b/public/languages/si-lk.json @@ -1007,7 +1007,14 @@ "Q4-A-6": "General information stored about all accounts", "Q4-A-7": "User management for Machine Learning for Kids is implemented using the third party service, Auth0. They store the IP address that you last logged into Machine Learning for Kids from, and the type of browser you used. I've never found a reason to use that, but it is stored if I did want to go and look for it.", "Q4-A-8": "Errors that happen in the web browser are captured using the third party service, Sentry. If something goes wrong, it will capture information about the error, including your username, IP address, type of browser you were using, and a technical description of what went wrong.", - "Q4-A-9": "I use Google Analytics so that I know how many users visit Machine Learning for Kids each day. 
Although it captures information such as geographic location and browser type, this is only ever displayed to me in an anonymised aggregate way." + "Q4-A-9": "I use Google Analytics so that I know how many users visit Machine Learning for Kids each day. Although it captures information such as geographic location and browser type, this is only ever displayed to me in an anonymised aggregate way.", + + "Q5": "What happens to training data created by students?", + "Q5-A-1": "A step in all machine learning projects that students do using this site is to create or collect training examples. For text projects, this can mean typing in short text passages. For image projects, this can means drawing pictures onto an on-screen canvas or taking photos using the webcam. For numbers projects, this means typing in sets of numbers", + "Q5-A-2": "All of these training examples are stored in a MySQL database hosted on IBM Cloud. As the database administrator, I have access to all of these training examples for all student projects, however I do not use it for any other purposes other than enabling students to access and work on their own projects. I do not publish the training data (either publicly or to individuals or third parties) or otherwise share it, with the two exceptions of submitting it to IBM Watson APIs described below.", + "Q5-A-3": "Machine learning models for text projects are created using the IBM Watson Assistant cloud service, which means when students train a model, a copy of the training examples that they have entered will be submitted to IBM Watson. IBM Watson does not use these training examples for any other purposes. 
This is because Machine Learning for Kids requests an opt-out for student training examples being used by IBM to improve the service, as described in the Watson documentation.", + "Q5-A-4": "Machine learning models for images projects are created using the IBM Visual Recognition cloud service, which means when students train a model, a copy of their training images will be uploaded to IBM Watson. IBM Watson does not use these training examples for any other purposes. This is because Machine Learning for Kids requests an opt-out for student training examples being used by IBM to improve the service, as described in the Watson documentation.", + "Q5-A-5": "IBM Watson provides some general guidance for sharing training data with their services, which also apply to training data created and collected in Machine Learning for Kids. Specifically, students should be advised not to include personally identifiable information in the examples that they collect." } } } diff --git a/public/languages/sv-se.json b/public/languages/sv-se.json index 9c01b7c61..22ff16606 100644 --- a/public/languages/sv-se.json +++ b/public/languages/sv-se.json @@ -1007,7 +1007,14 @@ "Q4-A-6": "General information stored about all accounts", "Q4-A-7": "User management for Machine Learning for Kids is implemented using the third party service, Auth0. They store the IP address that you last logged into Machine Learning for Kids from, and the type of browser you used. I've never found a reason to use that, but it is stored if I did want to go and look for it.", "Q4-A-8": "Errors that happen in the web browser are captured using the third party service, Sentry. If something goes wrong, it will capture information about the error, including your username, IP address, type of browser you were using, and a technical description of what went wrong.", - "Q4-A-9": "I use Google Analytics so that I know how many users visit Machine Learning for Kids each day. 
Although it captures information such as geographic location and browser type, this is only ever displayed to me in an anonymised aggregate way." + "Q4-A-9": "I use Google Analytics so that I know how many users visit Machine Learning for Kids each day. Although it captures information such as geographic location and browser type, this is only ever displayed to me in an anonymised aggregate way.", + + "Q5": "What happens to training data created by students?", + "Q5-A-1": "A step in all machine learning projects that students do using this site is to create or collect training examples. For text projects, this can mean typing in short text passages. For image projects, this can means drawing pictures onto an on-screen canvas or taking photos using the webcam. For numbers projects, this means typing in sets of numbers", + "Q5-A-2": "All of these training examples are stored in a MySQL database hosted on IBM Cloud. As the database administrator, I have access to all of these training examples for all student projects, however I do not use it for any other purposes other than enabling students to access and work on their own projects. I do not publish the training data (either publicly or to individuals or third parties) or otherwise share it, with the two exceptions of submitting it to IBM Watson APIs described below.", + "Q5-A-3": "Machine learning models for text projects are created using the IBM Watson Assistant cloud service, which means when students train a model, a copy of the training examples that they have entered will be submitted to IBM Watson. IBM Watson does not use these training examples for any other purposes. 
This is because Machine Learning for Kids requests an opt-out for student training examples being used by IBM to improve the service, as described in the Watson documentation.", + "Q5-A-4": "Machine learning models for images projects are created using the IBM Visual Recognition cloud service, which means when students train a model, a copy of their training images will be uploaded to IBM Watson. IBM Watson does not use these training examples for any other purposes. This is because Machine Learning for Kids requests an opt-out for student training examples being used by IBM to improve the service, as described in the Watson documentation.", + "Q5-A-5": "IBM Watson provides some general guidance for sharing training data with their services, which also apply to training data created and collected in Machine Learning for Kids. Specifically, students should be advised not to include personally identifiable information in the examples that they collect." } } } diff --git a/public/languages/tr.json b/public/languages/tr.json index 10882ce4f..16eda38bf 100644 --- a/public/languages/tr.json +++ b/public/languages/tr.json @@ -963,7 +963,14 @@ "Q4-A-6": "General information stored about all accounts", "Q4-A-7": "User management for Machine Learning for Kids is implemented using the third party service, Auth0. They store the IP address that you last logged into Machine Learning for Kids from, and the type of browser you used. I've never found a reason to use that, but it is stored if I did want to go and look for it.", "Q4-A-8": "Errors that happen in the web browser are captured using the third party service, Sentry. If something goes wrong, it will capture information about the error, including your username, IP address, type of browser you were using, and a technical description of what went wrong.", - "Q4-A-9": "I use Google Analytics so that I know how many users visit Machine Learning for Kids each day. 
Although it captures information such as geographic location and browser type, this is only ever displayed to me in an anonymised aggregate way." + "Q4-A-9": "I use Google Analytics so that I know how many users visit Machine Learning for Kids each day. Although it captures information such as geographic location and browser type, this is only ever displayed to me in an anonymised aggregate way.", + + "Q5": "What happens to training data created by students?", + "Q5-A-1": "A step in all machine learning projects that students do using this site is to create or collect training examples. For text projects, this can mean typing in short text passages. For image projects, this can mean drawing pictures onto an on-screen canvas or taking photos using the webcam. For numbers projects, this means typing in sets of numbers.", + "Q5-A-2": "All of these training examples are stored in a MySQL database hosted on IBM Cloud. As the database administrator, I have access to all of these training examples for all student projects, however I do not use them for any purpose other than enabling students to access and work on their own projects. I do not publish the training data (either publicly or to individuals or third parties) or otherwise share it, with the two exceptions of submitting it to IBM Watson APIs described below.", + "Q5-A-3": "Machine learning models for text projects are created using the IBM Watson Assistant cloud service, which means when students train a model, a copy of the training examples that they have entered will be submitted to IBM Watson. IBM Watson does not use these training examples for any other purposes. 
This is because Machine Learning for Kids requests an opt-out for student training examples being used by IBM to improve the service, as described in the Watson documentation.", + "Q5-A-4": "Machine learning models for image projects are created using the IBM Visual Recognition cloud service, which means when students train a model, a copy of their training images will be uploaded to IBM Watson. IBM Watson does not use these training examples for any other purposes. This is because Machine Learning for Kids requests an opt-out for student training examples being used by IBM to improve the service, as described in the Watson documentation.", + "Q5-A-5": "IBM Watson provides some general guidance for sharing training data with their services, which also applies to training data created and collected in Machine Learning for Kids. Specifically, students should be advised not to include personally identifiable information in the examples that they collect." } } } diff --git a/public/languages/zh-cn.json b/public/languages/zh-cn.json index 8ea439f17..1949f1cde 100644 --- a/public/languages/zh-cn.json +++ b/public/languages/zh-cn.json @@ -1007,7 +1007,14 @@ "Q4-A-6": "General information stored about all accounts", "Q4-A-7": "User management for Machine Learning for Kids is implemented using the third party service, Auth0. They store the IP address that you last logged into Machine Learning for Kids from, and the type of browser you used. I've never found a reason to use that, but it is stored if I did want to go and look for it.", "Q4-A-8": "Errors that happen in the web browser are captured using the third party service, Sentry. If something goes wrong, it will capture information about the error, including your username, IP address, type of browser you were using, and a technical description of what went wrong.", - "Q4-A-9": "I use Google Analytics so that I know how many users visit Machine Learning for Kids each day. 
Although it captures information such as geographic location and browser type, this is only ever displayed to me in an anonymised aggregate way." + "Q4-A-9": "I use Google Analytics so that I know how many users visit Machine Learning for Kids each day. Although it captures information such as geographic location and browser type, this is only ever displayed to me in an anonymised aggregate way.", + + "Q5": "What happens to training data created by students?", + "Q5-A-1": "A step in all machine learning projects that students do using this site is to create or collect training examples. For text projects, this can mean typing in short text passages. For image projects, this can mean drawing pictures onto an on-screen canvas or taking photos using the webcam. For numbers projects, this means typing in sets of numbers.", + "Q5-A-2": "All of these training examples are stored in a MySQL database hosted on IBM Cloud. As the database administrator, I have access to all of these training examples for all student projects, however I do not use them for any purpose other than enabling students to access and work on their own projects. I do not publish the training data (either publicly or to individuals or third parties) or otherwise share it, with the two exceptions of submitting it to IBM Watson APIs described below.", + "Q5-A-3": "Machine learning models for text projects are created using the IBM Watson Assistant cloud service, which means when students train a model, a copy of the training examples that they have entered will be submitted to IBM Watson. IBM Watson does not use these training examples for any other purposes. 
This is because Machine Learning for Kids requests an opt-out for student training examples being used by IBM to improve the service, as described in the Watson documentation.", + "Q5-A-4": "Machine learning models for image projects are created using the IBM Visual Recognition cloud service, which means when students train a model, a copy of their training images will be uploaded to IBM Watson. IBM Watson does not use these training examples for any other purposes. This is because Machine Learning for Kids requests an opt-out for student training examples being used by IBM to improve the service, as described in the Watson documentation.", + "Q5-A-5": "IBM Watson provides some general guidance for sharing training data with their services, which also applies to training data created and collected in Machine Learning for Kids. Specifically, students should be advised not to include personally identifiable information in the examples that they collect." } } }