Difference between revisions of "Main Page/Research/MSB/Scripts/conflate timestamp.R"
From phurvitz
Phil Hurvitz (talk | contribs) |
Phil Hurvitz (talk | contribs) |
||
Line 38: | Line 38: | ||
# fix the new column name | # fix the new column name | ||
colnames(my.experience) <- c(colnames(my.experience)[1:ncol(my.experience)-1], "msb.seconds") | colnames(my.experience) <- c(colnames(my.experience)[1:ncol(my.experience)-1], "msb.seconds") | ||
+ | |||
+ | # output | ||
+ | output.file = paste(indir, "myexp_ts.csv", sep="/") | ||
+ | write.table(my.experience, file=output.file, row.names=F, col.names=F, sep=",", quote=F) | ||
+ | |||
+ | # function return | ||
return(my.experience) | return(my.experience) | ||
} | } | ||
</pre> | </pre> |
Revision as of 21:50, 11 October 2007
# timestamp fuzzy match
#
# Adds an "msb.seconds" column to the MyExperience table by matching each
# phone log record to MyExperience rows on subject and time window.
#
# For every phone log record, ALL MyExperience rows that have the same subject
# ID and a date.phone strictly within +/- minutes.offset minutes of the phone
# log timestamp receive that record's MSB seconds value. This is a window
# match, not a nearest-neighbour match: if a MyExperience row falls inside the
# window of several phone log records, the last such record in file order wins.
#
# Arguments:
#   indir           directory containing "phone_log.csv" and "myexper.csv";
#                   a trailing path separator is optional. An empty string
#                   means the current working directory.
#   minutes.offset  matching tolerance in minutes (default 10).
#
# Inputs read:
#   phone_log.csv   column 3 = MSB seconds, column 6 = timestamp, plus a
#                   column named "subject.num" (from processing of the mailman
#                   logs in read.msb_files.3.R)
#   myexper.csv     needs columns named "date.phone" and "sid"
#
# Side effect:
#   writes <indir>/myexp_ts.csv (comma separated, no header, no row names,
#   unquoted).
#
# Returns:
#   the MyExperience data frame with "msb.seconds" appended as its last
#   column (NA where no phone log record matched).
#
# NOTE: the function name keeps its original spelling ("timstamp") so that
# existing callers continue to work.
timstamp.match <- function(indir, minutes.offset = 10) {
  # offset for matching tolerance
  seconds.offset <- minutes.offset * 60

  # Treat indir as a directory for inputs AND output. The original code
  # required a trailing separator for reading but added its own for writing;
  # normalising once keeps all three paths consistent.
  if (nzchar(indir) && !grepl("[/\\\\]$", indir)) {
    indir <- paste0(indir, "/")
  }

  # read in the data sets
  phone.log.file <- paste0(indir, "phone_log.csv")
  phone.log <- read.csv(phone.log.file, stringsAsFactors = FALSE)
  my.experience.file <- paste0(indir, "myexper.csv")
  my.experience <- read.csv(my.experience.file, stringsAsFactors = FALSE)

  # Parse the MyExperience timestamps once instead of on every comparison.
  # A separate vector is used so the column written to the output file keeps
  # its original text.
  experience.times <- my.experience$date.phone
  if (is.character(experience.times)) {
    experience.times <- as.POSIXct(experience.times)
  }

  # Create the result column up front so that it exists (all NA) even when
  # nothing matches, and so that it is always the last column regardless of
  # how many columns the input file has.
  my.experience$msb.seconds <- rep(NA_real_, nrow(my.experience))

  # process each record in the phone log file
  # (seq_len() so an empty phone log is simply skipped)
  for (i in seq_len(nrow(phone.log))) {
    # get the timestamp from the current record
    timestamp <- as.POSIXct(phone.log[i, 6])
    # get the MSB seconds value from the current record
    msb.seconds <- as.numeric(phone.log[i, 3])
    # get the subject number from the current record
    subject.num <- phone.log$subject.num[i]

    # T/F vector: which MyExperience records are within the tolerance of the
    # current phone log timestamp AND have the same subject ID
    time.match <- (experience.times > (timestamp - seconds.offset)) &
      (experience.times < (timestamp + seconds.offset)) &
      (my.experience$sid == subject.num)

    # which() drops NA entries (missing timestamps / subject IDs), which
    # would otherwise make the assignment fail
    my.experience$msb.seconds[which(time.match)] <- msb.seconds
  }

  # output
  output.file <- paste0(indir, "myexp_ts.csv")
  write.table(my.experience, file = output.file, row.names = FALSE,
              col.names = FALSE, sep = ",", quote = FALSE)

  # function return
  return(my.experience)
}