[Blotter-commits] r726 - pkg/FinancialInstrument/sandbox

Wed Aug 10 22:45:51 CEST 2011

Author: braverock
Date: 2011-08-10 22:45:51 +0200 (Wed, 10 Aug 2011)
New Revision: 726

Modified:
   pkg/FinancialInstrument/sandbox/TRTH_BackFill.R
Log:
- minor improvements

Modified: pkg/FinancialInstrument/sandbox/TRTH_BackFill.R
===================================================================

--- pkg/FinancialInstrument/sandbox/TRTH_BackFill.R	2011-08-10 16:58:05 UTC (rev 725)
+++ pkg/FinancialInstrument/sandbox/TRTH_BackFill.R	2011-08-10 20:45:51 UTC (rev 726)
@@ -1,7 +1,8 @@
 ##############################################################################
 #                     Reuters Backfill Configuration Parameters              #         
 ##############################################################################
-config_file <- "/full/path/to/config.csv" # full path to the config file with instrument metadata in it
+instrument_file <- '/full/path/to/instruments.rda' #where your instrument metadata is stored
+
 archive_dir <- "/full/path/to/archives/" # where the split CSV, job reports, and gz files will be stored
 path.output <- "/full/path/to/output/" # root dir where the .rda files for the xts will be placed
 
@@ -27,6 +28,7 @@
 
 require(xts)
 require(quantmod)
+require(FinancialInstrument)
 require(doMC)
 #require(sendmailR) # for email on failure
 #error.codes<-read.csv('curl.errors.csv',stringsAsFactors=FALSE,header=TRUE,row.names=1)
@@ -51,12 +53,9 @@
         #sendmail(email_to,email_from,"error downloading Reuters file list",msg=tmpmsg)
         Sys.sleep(1800)
     } else listflag=TRUE
+    
 }
 
-# or to start from the file list
-#
-
-
 # now we're past the while loop, so we have a file list
 Reuters.report <- Reuters[grep("report",Reuters)]
 Reuters.output <-  Reuters[-c(grep("report",Reuters),grep("confirmation",Reuters))]
@@ -64,7 +63,11 @@
 
 Reuters.new <- Reuters.output[!(Reuters.output %in% Archive.output)]
 
+# or to start from the file list
+# Reuters.output <-  Archive.output[grep(job.name,Archive.output)]
+# Reuters.new <- Reuters.output
 
+
 for(i in 1:length(Reuters.new))
 {	
 	filename.gz <- Reuters.new[i]
@@ -188,16 +191,21 @@
 
 # now get instrument data
 files.xts$type<-rep(NA,nrow(files.xts))
+missing_i<-''
 instr_s<-unique(files.xts[,'name.new'])
 for(i in 1:length(instr_s)){
     instr<-getInstrument(instr_s[i])
     if(is.instrument(instr)){ 
-        files.xts['name.new'==instr_s,'type']<-as.character(instr$type[1])
+        files.xts[files.xts$name.new ==instr_s[i],]$type<-as.character(instr$type[1])
     } else {
         print(paste(instr_s[i], 'does not appear to be an instrument, setting it to', default_type))
-        files.xts['name.new'==instr_s,'type']<-default_type
+        files.xts[files.xts$name.new==instr_s[i],]$type<-default_type
+        missing_i<-c(missing_i,instr_s[i])
     }
 }
+missing_i<-missing_i[-1]
+missing_i<-data.frame(symbol=missing_i,type=default_type)
+write.csv(missing_i,file=paste(archive_dir,'missing_instruments.csv',sep='')) 
 
 ##If trying to fix a broken set:
 #files.csv<-'';for(dir in list.files(getwd(),pattern="20")) {files.csv<-c(files.csv,list.files(paste(getwd(),'/',dir,'/',sep=''),pattern=".csv"))}[-1]
@@ -205,6 +213,8 @@
 #for(l in 1:length(files.csv)) { rsplit<-as.vector(strsplit(files.csv[l],'.',fixed=TRUE)[[1]]); files.xts<-rbind(files.xts,cbind(rsplit[4],paste(rsplit[1],rsplit[2],rsplit[3],sep='.'))); print(files.xts[l,])}
 #colnames(files.xts)<-c('name.new','date.format')
 
+save(files.xts,file='files.xts.tmp.rda')
+
 H <- read.csv(paste(path.output,"Archives/#RIC.Date[G].csv",sep=""),header=FALSE,stringsAsFactors=FALSE)
 H <- H[nrow(H),]
 H <- make.names(H)
@@ -365,8 +375,9 @@
 files.rm <- files.rm[-grep(".csv.gz",files.rm)]
 files.rm <- files.rm[grep(".csv",files.rm)]
 file.remove(files.rm)
+file.remove('files.xts.tmp.rda')
 
-
+rm(missing_i)
 rm(Out)
 
 ###############################################################################