From bbed2039d1a52c70e5ccf3e29200b6444bf3305d Mon Sep 17 00:00:00 2001
From: lfaf373 <lfaf373@gmail.com>
Date: Wed, 28 Sep 2016 15:50:13 -0400
Subject: [PATCH 1/2] this is draft 1

---
 Assignment7class.R | 40 ++++++++++++++++++++++++++++++++++++++++
 cLASS7.Rproj       | 13 +++++++++++++
 2 files changed, 53 insertions(+)
 create mode 100644 Assignment7class.R
 create mode 100644 cLASS7.Rproj

diff --git a/Assignment7class.R b/Assignment7class.R
new file mode 100644
index 0000000..a1c7f4e
--- /dev/null
+++ b/Assignment7class.R
@@ -0,0 +1,40 @@
+#Opening data set
+data_wide <- read.table("C:/Users/lfaf373/Documents/RStudioProj/cLASS7/instructor_activity_wide.csv", sep = ",", header = TRUE)
+#Now view the data you have uploaded and notice how its structure: each variable is a date and each row is a type of measure.
+View(data_wide)
+# opening the library of these two packages to tidy data
+library(tidyr, dplyr)
+#R doesn't like having variable names that consist only of numbers so, as you can see, every variable starts with the letter "X". The numbers represent dates in the format year-month-day.
+#this converts wide to long->> by date
+data_long <- gather(data_wide, date, variables)
+#Rename the variables so we don't get confused about what is what!
+names(data_long) <- c("variables", "date", "measure")
+#Take a look at your new data, looks weird huh?
+View(data_long)
+# Converting long format into seperate columns, seperating by type of measure
+instructor_data <- spread(data_long, variables, measure)
+# upload student data
+student_data<- read.csv("C:/Users/lfaf373/Documents/RStudioProj/cLASS7/student_activity.csv")
+# first we have to make sure r knows to use dplyr command
+# Here we are only including data from the second clas
+student_data_2 <- dplyr::filter(student_data, date == 20160204)
+# Here we are only including data from students who sat at table 4
+# Subsetted from the original dataset
+student_data_3 <- dplyr::filter(student_data, variable == "table" & measure == 4)
+# usinging mutate to make a new variable, total sleep... which is lite plus deep sleep
+instructor_data <- dplyr::mutate(instructor_data, total_sleep = s_deep + s_light)
+#making a new data frame that only includes total_sleep 
+instructor_sleep<- dplyr::select(instructor_data, total_sleep)
+# create a grouping variable called week
+# for some reason, there are 8 days in week 1
+instructor_data <- dplyr::mutate(instructor_data, week = dplyr::ntile(date, 3))
+# Same as above but for stduent
+student_data <- dplyr::mutate(student_data, week = dplyr::ntile(date, 3))
+#
+# motivation <- dplyr::filter(student_data, variable == "motivation")
+# Summarize data
+dplyr::summarise(student_data, avg=mean(variable))
+
+#That isn't super interesting, so let's break it down by week:
+
+student_data %>% dplyr::group_by(date) %>% dplyr::summarise(mean(motivation))
diff --git a/cLASS7.Rproj b/cLASS7.Rproj
new file mode 100644
index 0000000..8e3c2eb
--- /dev/null
+++ b/cLASS7.Rproj
@@ -0,0 +1,13 @@
+Version: 1.0
+
+RestoreWorkspace: Default
+SaveWorkspace: Default
+AlwaysSaveHistory: Default
+
+EnableCodeIndexing: Yes
+UseSpacesForTab: Yes
+NumSpacesForTab: 2
+Encoding: UTF-8
+
+RnwWeave: Sweave
+LaTeX: pdfLaTeX

From 3293900f090d0e5ffd4add381d363035932facca Mon Sep 17 00:00:00 2001
From: lfaf373 <lfaf373@gmail.com>
Date: Fri, 30 Sep 2016 08:30:17 -0400
Subject: [PATCH 2/2] Final Assignment

---
 Assignment7class.R | 22 +++++++++++++++++++---
 1 file changed, 19 insertions(+), 3 deletions(-)

diff --git a/Assignment7class.R b/Assignment7class.R
index a1c7f4e..17c2b8b 100644
--- a/Assignment7class.R
+++ b/Assignment7class.R
@@ -14,13 +14,15 @@ View(data_long)
 # Converting long format into seperate columns, seperating by type of measure
 instructor_data <- spread(data_long, variables, measure)
 # upload student data
-student_data<- read.csv("C:/Users/lfaf373/Documents/RStudioProj/cLASS7/student_activity.csv")
+data_wide2<- read.csv("C:/Users/lfaf373/Documents/RStudioProj/cLASS7/student_activity.csv")
+#data_long2 <- gather(data_wide2, measure, variable)
+student_data <- spread(data_wide2, variable, measure)
 # first we have to make sure r knows to use dplyr command
 # Here we are only including data from the second clas
 student_data_2 <- dplyr::filter(student_data, date == 20160204)
 # Here we are only including data from students who sat at table 4
 # Subsetted from the original dataset
-student_data_3 <- dplyr::filter(student_data, variable == "table" & measure == 4)
+student_data_3 <- dplyr::filter(student_data, table == 4)
 # usinging mutate to make a new variable, total sleep... which is lite plus deep sleep
 instructor_data <- dplyr::mutate(instructor_data, total_sleep = s_deep + s_light)
 #making a new data frame that only includes total_sleep 
@@ -33,8 +35,22 @@ student_data <- dplyr::mutate(student_data, week = dplyr::ntile(date, 3))
 #
 # motivation <- dplyr::filter(student_data, variable == "motivation")
 # Summarize data
-dplyr::summarise(student_data, avg=mean(variable))
+student_data %>% dplyr::summarise(mean(motivation))
 
 #That isn't super interesting, so let's break it down by week:
 
 student_data %>% dplyr::group_by(date) %>% dplyr::summarise(mean(motivation))
+
+#Create two new data sets using this method. One that sumarizes average motivation for students for each week (student_week) 
+# and another than sumarizes "m_active_time" for the instructor per week (instructor_week).
+
+student_week<-student_data %>% dplyr::group_by(week) %>% dplyr::summarise(mean(motivation))
+instructor_week<-instructor_data %>% dplyr::group_by(week) %>% dplyr::summarise(mean(m_active_time))
+
+#merge these two data set
+merge <- dplyr::full_join(instructor_week, student_week, "week")
+
+# plot mean motivation with mean activity time
+names(merge) <- c("week", "m2", "m3")
+plotting<-cor(merge$m2, merge$m3)
+plot(merge$m2, merge$m3)