datafest competition 2019
You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
 
 

146 lines
3.7 KiB

# Look at data
library(tidyverse)
library(DBI)
library(RSQLite)
gpsData <- read.csv("data/gps.csv")
gpsDataTibble <- as_tibble(gpsData)
#workingTibble <- head(gpsDataTibble, 500000)
workingTibble <- gpsDataTibble
playerIds <-unique(workingTibble$PlayerID)
cat("Number of Players: ", length(playerIds), sep="")
gameIds <- unique(workingTibble$GameID)
cat("Number of Games: ", length(gameIds), sep="")
playerIDMetrics <- c()
gameIDMetrics <- c()
averageSpeed <- c()
accelDistance <- c()
for(playerID in playerIds)
{
for(gameID in gameIds)
{
cat(playerID, gameID , '\n', sep=" ")
speedTibble <- subset(workingTibble, GameID == gameID & PlayerID == playerID)
# crunch average speed
averageSpeed <- c(averageSpeed, mean(speedTibble$Speed, na.rm = 0))
# average for accel value
accelDistance <- c(accelDistance, mean(sqrt(speedTibble$AccelX^2 + speedTibble$AccelY^2 + speedTibble$AccelZ^ 2), na.rm = 0))
# game and player id to vector
playerIDMetrics <- c(playerIDMetrics, playerID)
gameIDMetrics <- c(gameIDMetrics, gameID)
}
}
plot(accelDistance, averageSpeed)
compressedMetrics <- tibble(gameID = gameIDMetrics, playerID = playerIDMetrics, averageSpeed = averageSpeed, accelerationVector = accelDistance)
length(compressedMetrics$averageSpeed)
length(compressedMetrics$accelerationVector)
write.csv(compressedMetrics, "data/speedData.csv")
#putSQLiteHere <- "gpsData.sqlite" # could also be ":memory:"
#mySQLiteDB <- dbConnect(RSQLite::SQLite(),putSQLiteHere)
#dbWriteTable(mySQLiteDB, "gpsData", compressedMetrics, overwrite=TRUE)
#dbDisconnect(mySQLiteDB)
rpeData <- read.csv("./data/rpe.csv")
rpeDataTibble <- as_tibble(rpeData)
gameData <- read.csv("data/games.csv")
gameDataTibble <- as_tibble(gameData)
wellnessData <- read.csv("./data/wellness_na.csv")
wellnessDataTibble <- as_tibble(wellnessData)
wellnesPlayer1 <- subset(wellnessDataTibble, PlayerID == 1)
plot(wellnesPlayer1$Fatigue * wellnesPlayer1$Soreness * wellnesPlayer1$Irritability, wellnesPlayer1$SleepHours * wellnesPlayer1$SleepQuality)
wellnessCleaned <- as_tibble(read.csv("./cleaned/dirty_wellness.csv"))
ggplot(data = wellnessCleaned) +
theme(plot.title = element_text(hjust = 0.5)) +
ggtitle("Hours of Sleep Box Plot") +
geom_boxplot(na.rm = T, mapping = aes(y=SleepHours, group = PlayerID), outlier.colour = "red", outlier.shape = 1) +
labs(group = "Player ID", y = "Hours of Sleep") +
coord_flip() +
theme_bw()
ggplot(data = wellnessCleaned) +
theme(plot.title = element_text(hjust = 0.5)) +
ggtitle("Hours of Sleep Box Plot") +
geom_boxplot(na.rm = T, mapping = aes(y=Fatigue, group = PlayerID), outlier.colour = "red", outlier.shape = 1) +
labs(group = "Player ID", y = "Fatigue Score") +
coord_flip() +
theme_bw()
ggplot(data = wellnessCleaned) +
theme(plot.title = element_text(hjust = 0.5)) +
ggtitle("Sleep Quality Box Plot") +
geom_boxplot(na.rm = T, mapping = aes(y=SleepQuality, group = PlayerID), outlier.colour = "red", outlier.shape = 1) +
labs(group = "Player ID", y = "Sleep Quality") +
coord_flip() +
theme_bw()
ggplot(data = wellnessCleaned) +
theme(plot.title = element_text(hjust = 0.5)) +
ggtitle("Training Readiness Box Plot") +
geom_boxplot(na.rm = T, mapping = aes(y=TrainingReadinessNum, group = PlayerID), outlier.colour = "red", outlier.shape = 1) +
labs(group = "Player ID", y = "Training Readiness") +
coord_flip() +
theme_bw()
max(wellnessCleaned$SleepHours, na.rm = T)
min(wellnessCleaned$SleepHours, na.rm = T)
playerIdsWellness <-unique(wellnessCleaned$PlayerID)
cat("Number of Players: ", length(playerIdsWellness), sep="")
head(gpsData)