From 550443fbb03566f72ce1b422c4fc60a752da0a42 Mon Sep 17 00:00:00 2001
From: Xyyzzz11 <807817099@qq.com>
Date: Sun, 16 Feb 2020 22:27:39 -0500
Subject: [PATCH 1/2] part one

---
 Prediction.Rmd | 27 +++++++++++++++++++++++++++
 1 file changed, 27 insertions(+)
 create mode 100644 Prediction.Rmd

diff --git a/Prediction.Rmd b/Prediction.Rmd
new file mode 100644
index 0000000..ab9faab
--- /dev/null
+++ b/Prediction.Rmd
@@ -0,0 +1,27 @@
+---
+title: "prediction"
+output: html_document
+---
+
+```{r}
+library (dplyr)
+library(tidyr)
+#import dataset
+D1<- read.csv("vle.csv")
+D2<- read.csv("assessments.csv")
+D3<- read.csv("studentVle.csv")
+
+#Calculate the average daily number of clicks (site interactions) for each student from the `studentVle` dataset
+daily<-aggregate(D3$date,list(D3$id_student), mean)
+colnames(daily)<-c("id_student","average_daily_click")
+daily$average_daily_click<-round(daily$average_daily_click,2)
+
+#Calculate the average assessment score for each student from the `studentAssessment` dataset
+D2
+```
+
+
+
+
+
+

From ac1bbd3c90489c99b66c9bdc2d5f2eb35e90d2ea Mon Sep 17 00:00:00 2001
From: Xyyzzz11 <807817099@qq.com>
Date: Sun, 16 Feb 2020 23:21:28 -0500
Subject: [PATCH 2/2] Explore

---
Review note: the added lines were revised after this patch was generated, so
the post-image blob id on the index line below is stale; regenerate with
`git format-patch` before relying on it (e.g. for `git am --3way`).

 Prediction.Rmd | 43 +++++++++++++++++++++++++++++++++++++------
 1 file changed, 37 insertions(+), 6 deletions(-)

diff --git a/Prediction.Rmd b/Prediction.Rmd
index ab9faab..c3a75d7 100644
--- a/Prediction.Rmd
+++ b/Prediction.Rmd
@@ -7,19 +7,50 @@ output: html_document
 library (dplyr)
 library(tidyr)
 #import dataset
-D1<- read.csv("vle.csv")
-D2<- read.csv("assessments.csv")
+D1 <- read.csv("studentInfo.csv")
+D2 <- read.csv("studentAssessment.csv")
 D3<- read.csv("studentVle.csv")
 
 #Calculate the average daily number of clicks (site interactions) for each student from the `studentVle` dataset
-daily<-aggregate(D3$date,list(D3$id_student), mean)
-colnames(daily)<-c("id_student","average_daily_click")
-daily$average_daily_click<-round(daily$average_daily_click,2)
+# Sum clicks per student per day, then average those daily totals.
+# Assumes studentVle.csv provides a `sum_click` column -- TODO confirm.
+per_day <- aggregate(
+  D3$sum_click,
+  list(id_student = D3$id_student, date = D3$date),
+  sum
+)
+daily_click <- aggregate(per_day$x, list(per_day$id_student), mean)
+colnames(daily_click) <- c("id_student", "average_daily_click")
+daily_click$average_daily_click <- round(daily_click$average_daily_click, 2)
 
 #Calculate the average assessment score for each student from the `studentAssessment` dataset
-D2
+daily_score <- aggregate(D2$score, list(D2$id_student), mean)
+colnames(daily_score) <- c("id_student", "average_daily_score")
+daily_score$average_daily_score <- round(daily_score$average_daily_score, 2)
+
+# Merge your click and assessment score average values into the `studentInfo` dataset
+# merge() defaults to all = FALSE: only students in both tables are kept.
+D1 <- merge(D1, daily_click, by = "id_student")
+D1 <- merge(D1, daily_score, by = "id_student")
+```
+
+```{r}
+#Split your data into two new datasets, `TRAINING` and `TEST`, by **randomly** selecting 25% of the students for the `TEST` set
+# Fixed seed so the random split is the same every time the document is knit.
+set.seed(123)
+n_rows <- nrow(D1)
+number <- sample(seq_len(n_rows), size = round(.25 * n_rows), replace = FALSE)
+TEST <- D1[number, ]
+# setdiff() instead of D1[-number, ]: a negative index built from an empty
+# `number` would select zero rows rather than all of them.
+TRAINING <- D1[setdiff(seq_len(n_rows), number), ]
 ```
 
+```{r}
+# Generate summary statistics for the variable `final_result`
+TRAINING <- na.omit(TRAINING)
+Final_result_summary <- count(TRAINING, final_result)
+```
 
 
 