-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathrun_analysis.R
More file actions
49 lines (34 loc) · 1.86 KB
/
run_analysis.R
File metadata and controls
49 lines (34 loc) · 1.86 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
library(plyr)
library(dplyr)
if(!file.exists("datafile.zip")) {
Url <- "https://d396qusza40orc.cloudfront.net/getdata%2Fprojectfiles%2FUCI%20HAR%20Dataset.zip"
download.file(Url, destfile = "datafile.zip",method = "curl")
}
activity_labels<- read.table("UCI HAR Dataset/activity_labels.txt")
X_training <- read.table("UCI HAR Dataset/train/X_train.txt")
y_training <- read.table("UCI HAR Dataset/train/y_train.txt")
subject_train <- read.table("UCI HAR Dataset/train/subject_train.txt")
subject_test <- read.table("UCI HAR Dataset/test/subject_test.txt")
X_test <- read.table("UCI HAR Dataset/test/X_test.txt")
y_test <- read.table("UCI HAR Dataset/test/y_test.txt")
training_sensor <- rbind(subject_train,subject_test)
train_initial <- cbind(X_training, subject_train)
test_initial <- cbind(X_test, subject_test)
train_sensor <- cbind(train_initial,y_training)
test_sensor <- cbind(test_initial,y_test)
sensor_data <- rbind(train_sensor,test_sensor)
activity_labels <-dplyr::rename(activity_labels, Activity_ID = V1,Activity_name = V2)
features <- read.table("UCI HAR Dataset/features.txt")
features[,2] <- as.character(features[,2])
activity_labels[,2] <- as.character(activity_labels[,2])
sensor_labels_row <- rbind(features, c(562,"Subject"))
sensor_labels <- rbind(sensor_labels_row, c(563,"Activity_ID"))[,2]
names(sensor_data) <- sensor_labels
mean_data <- sensor_data[,grepl("mean",names(sensor_data))]
std_data <- sensor_data[,grepl("mean|std|Subject|Activity_ID", names(sensor_data))]
merged_data <- join(std_data, activity_labels , by = "Activity_ID", match = "first")
merged_data <- merged_data[,-1]
names(merged_data) <- tolower(names(merged_data))%s%
names(merged_data) <- gsub("_","",merged_data)
tidy_dataset <- ddply(merged_data,c("subject",Activity = "activity_name"), function(x) colMeans(x[ 1:66],na.rm= FALSE))
write.table(tidy_dataset,"tidy_dataset.txt")