-
Notifications
You must be signed in to change notification settings - Fork 1
/
Copy pathNDTC27a_SpreadBaseLScenCompare.py
executable file
·361 lines (306 loc) · 16.3 KB
/
NDTC27a_SpreadBaseLScenCompare.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
# -*- coding: utf-8 -*-
# Welcome to the DataNitro Editor
# Use Cell(row,column).value, or Cell(name).value, to read or write to cells
# Cell(1,1) and Cell("A1") refer to the top-left cell in the spreadsheet
#
# Note: To run this file, save it and run it from Excel (click "Run from File")
# If you have trouble saving, try using a different directory
import numpy as np
#=====================
### CUSTOM FUNCTIONS FOR EACH TEST
#=====================
# FUNCTION TO GET THE LISTS OF NAMES AND VALUES OF SOURCE CELLS
def getSrcCellsValueRange( mainSheet, totalFields, valsCol, i, j=0, k=0, \
numProducts=0, numRates=0, spreadInd=0 ):
''' Returns lists of Values and Names of the Source cells
for the given i and j indices '''
src_RowIndices = np.zeros((2,1), dtype=int)
srcCells_Val = np.zeros((2, len( Cell( mainSheet, 2, valsCol).horizontal)) )
for row in range( 0, 2):
src_RowIndices[row] = row*(numProducts*totalFields)+ ((i-1)*totalFields)+ \
(spreadInd+1) + 1
srcCells_Val[row] = Cell( mainSheet, np.asscalar( src_RowIndices[row][0])\
, valsCol ).horizontal
srcCells = Cell( mainSheet, np.asscalar( src_RowIndices[1][0]) \
, valsCol ).horizontal_range
srcCells_Name = np.array( [ cell.name for cell in srcCells ] )
return srcCells_Val, srcCells_Name
# FUNCTION TO GET BAD CELLS' VALUE AND NAME USING A CRITERIA
def getBadCellsValueRange( srcCells_Val, srcCells_Name, thresh, bpsVar):
''' Returns the Values and Names of the Bad Cells based on the Criterion '''
# (We can equivalently use either the filter method or the list comprehensions)
# IMP: But with indexing, must convert numpy array into regular list!
# NOTE: Convert bps to % (divide by 100), then % to decimal (divide by 100)
# OR: Convert "rate difference" to % and then to bps
if ( len(srcCells_Val) > 0 ):
# CRITERION #
#var = abs((srcCells_Val[1] - srcCells_Val[0])*100*100 + bpsVar)/ \
#abs( bpsVar)* 100
var = -((srcCells_Val[1] - srcCells_Val[0])*100 + bpsVar/100.)/ \
(srcCells_Val[1]*100) *100
# OR: abs( (srcCells_Val[1] - srcCells_Val[0]) + bpsVar/100./100.)/ \
# abs( bpsVar/100./100.) > thresh/100.
var = np.array([ round(num, 2) for num in var])
badCells_Var = var[ abs(var)>thresh ].tolist()
badCells_Val = ( srcCells_Val[1][ abs(var) > thresh ] * 100 ).tolist()
badCells_Name = srcCells_Name[ abs(var) > thresh ].tolist()
else:
badCells_Var = badCells_Val = badCells_Name = []
return badCells_Var, badCells_Val, badCells_Name
# FUNCTION TO GET THE ADDRESSES FOR DESTINATION CELLS
def getDestCellsAdd( i, j, k, numProducts=0, totalFields=0, numBalance=0, \
destScenIndex=0, spreadFieldsInd=[] ):
''' Returns Addresses for the Prod, Rate, Stat, and Value Cells in Dest. Sheet'''
#Start with 3rd row, b/c 1st row has Test Title and 2nd row has Threshold
dest_RowIndex = ((destScenIndex-1)*(numProducts*3)) + \
((i-1)*3) + 1 + 1 + 1
destCells_Scen = Cell( dest_RowIndex, 1)
destCells_Prod = Cell( dest_RowIndex, 2)
destCells_Rate = Cell( dest_RowIndex, 3)
destCells_Stat = Cell( dest_RowIndex, 4)
destCells_Add = Cell( dest_RowIndex, 5)
destCells_Val = Cell( dest_RowIndex + 1, 5)
destCells_Var = Cell( dest_RowIndex + 2, 5)
return destCells_Scen, destCells_Prod, destCells_Rate, destCells_Stat, \
destCells_Add, destCells_Val, destCells_Var
#=====================
### GENERIC FUNCTIONS FOR ALL TESTS
#=====================
# FUNCTION TO GET NAMES OF BASELINE AND SCENARIO:
def getBaselineScenarioNames( mainSheet, scenCol, scenarioOnly ):
""" Returns a list of Scenario and Baseline's Names"""
scenarios = np.array( Cell( mainSheet, 2, scenCol).vertical )
scenarios = [ str.encode('ascii') for str in scenarios ]
seen = set()
scenarioList = [ item for item in scenarios \
if item not in seen and not seen.add(item) ];
# 'not in' operation on a set is twice as fast as on a List:
#scenarioList = []
#[scenarioList.append(item) for item in scenarios
# if item not in scenarioList];
numScenarios = len(scenarioList)
# COMMENT OUT BELOW IF YOU WANT ACTUAL NAMES OF BASELINE AND SCENARIO
if numScenarios == 1:
scenarioList = ['Baseline']
else:
if scenarioOnly == 1:
scenarioList = ['Scenario']
else:
scenarioList = ['Baseline', 'Scenario']
return scenarioList, numScenarios
# FUNCTION TO GET NAMES AND COUNT OF ALL PRODUCTS:
def getProdsNamesCount( mainSheet, prodCol ):
""" Returns a list of all Products' Names and their Count"""
allProducts = np.array( Cell( mainSheet, 2, prodCol).vertical )
allProducts = [ str.encode('ascii') for str in allProducts ]
seen = set()
prodsList = [ item for item in allProducts \
if item not in seen and not seen.add(item) ];
# 'not in' operation on a set is twice as fast as on a List:
#prodsList = []
#[prodsList.append(item) for item in allProducts
# if item not in prodsList];
numProducts = len(prodsList)
return prodsList, numProducts
# FUNCTION TO GET NAMES AND COUNTS OF ALL RATE FIELDS:
def getFieldsNamesCount( mainSheet, kpisCol ):
""" Returns a list of all Rate Fields' names and their Count"""
allFields = Cell( mainSheet, 2, kpisCol ).vertical
allFields = [ str.encode('ascii') for str in allFields ]
seen = set()
fieldsList = [ item for item in allFields \
if item not in seen and not seen.add(item) ]
totalFields = len(fieldsList)
return fieldsList, totalFields
# FUNCTION TO GET NAMES AND COUNTS OF ALL BALANCE FIELDS:
def getBalanceNamesCount( mainSheet, kpisCol, numRates, numBalance ):
""" Returns a list of all Rate Fields' names and their Count"""
balanceList = CellRange( mainSheet, (2+numRates,kpisCol), \
(2+numRates+numBalance-1,kpisCol) ).value
balanceList = [ str.encode('ascii') for str in balanceList ]
return balanceList
# FUNCTION TO GET THE ROW INDEX FOR A PRODUCT'S SPREAD
def getSpreadRelatedRowIndices( fieldsList ):
''' Returns the index for the Spread related attributes in the Fields list '''
fields = ['spread', 'ftp', 'published rate']
indices = []
for j in range(0, len(fields) ):
indices.extend( [i for i,item in enumerate( fieldsList ) \
if fields[j] in item.lower()] )
# ''.join(a.split(' '): eliminates all spaces (\n, \t) from the string
return indices[0], indices[1], indices[2]
# FUNCTION TO CONVERT SOURCE CELLS TO FLOAT TYPE
def convertSourceToFloat( srcCells_Val ):
''' Returns the Source Cells converted to Float type '''
if ( len(srcCells_Val) > 0 ):
if ( type( srcCells_Val[0].tolist() ) == unicode ):
srcCells_Val = np.array( [ float( re.sub('\D', '', a) ) \
for a in srcCells_Val ] )
# replace lstrip & replace w/ regular expression: a.encode('ascii').lstrip('R ').replace(',', '')
else:
if len(srcCells_Val.shape)>1:
for row in range(0, len(srcCells_Val)):
srcCells_Val[row] = np.array( [ float(a) for a in srcCells_Val[row] ] )
else:
srcCells_Val = np.array( [ float(a) for a in srcCells_Val ])
return srcCells_Val
# FUNCTION TO CONVERT DATE CELLS NAMES TO DATES
def convertDateCellsToDate( cells_Name ):
''' Returns a list of dates corresponding to the list of cell names '''
cells_Cols = [ re.sub('\d', '', cell) for cell in cells_Name ]
cells_1stRowCols = [ elem + '1' for elem in cells_Cols ]
cells_Date = [ Cell(elem).value.strftime(' %b-%y') \
for elem in cells_1stRowCols]
return cells_Date
# FUNCTION TO CREATE/CLEAR NDTC REPORT WORKSHEET
def createOrClearReportWorksheet(destSheet, i, j, k=0, destScenIndex=0, \
scenarioOnly=0):
""" Creates a new worksheet if not already present,
else Clears it if the script is being run again"""
if destSheet not in all_sheets():
new_sheet(destSheet)
elif scenarioOnly == 1: #if only scenario
if j == -1: #if only 1 parameter displayed
if i == 1:
clear_sheet(destSheet)
elif i == 1 and j == 1:
clear_sheet(destSheet)
elif j == -1:
if i == 1 and destScenIndex == 1:
clear_sheet(destSheet)
elif i == 1 and j == 1 and destScenIndex == 1:
clear_sheet(destSheet)
# FUNCTION TO GET THESHOLD FROM THE WORKSHEET
def getThresholdFromSheet( destSheet, thresh, bpsVar ):
'''Gets the User-entered Threshold value before Clearing the Sheet'''
if destSheet in all_sheets():
if Cell( destSheet, 2, 2) != None:
thresh = Cell( destSheet, 2, 2).value
if Cell( destSheet, 2, 4) != None:
bpsVar = Cell( destSheet, 2, 4).value
return thresh, bpsVar
# FUNCTION TO ENTER HOUSE-KEEPING DATA ONTO THE WORKSHEET
def printTitleAndThreshold( destSheet, testTile, thresh=None, bpsVar=None):
'''Prints Title of the test and Threshold on the Sheet before values'''
Cell(destSheet, 1, 1).value = testTitle
Cell(destSheet, 1, 1).font.bold = True
if thresh != None:
Cell(destSheet, 2, 1).value = 'Threshold:'
Cell(destSheet, 2, 1).font.bold = True
Cell(destSheet, 2, 2).value = thresh
Cell(destSheet, 2, 2).color = 'yellow'
if bpsVar != None:
Cell(destSheet, 2, 3).value = 'bps Var.:'
Cell(destSheet, 2, 3).font.bold = True
Cell(destSheet, 2, 4).value = bpsVar
Cell(destSheet, 2, 4).color = 'yellow'
active_sheet(all_sheets()[0])
# FUNCTION TO SET THE STATUS (WITH COLORS) OF EACH RATE FIELD
def setRatesStatus( destSheet, badCells_Val, destCells_Stat, statColor):
''' Sets the statuses of each of the Rate Field based on
the existence of any bad cells '''
if len(badCells_Val) == 0:
Cell( destSheet, destCells_Stat.name ).value = 'OK'
Cell( destSheet, destCells_Stat.name ).font.color = statColor[0]
else:
Cell( destSheet, destCells_Stat.name ).value = 'WARN'
Cell( destSheet, destCells_Stat.name ).font.color = statColor[1]
#=====================
### MAIN FUNCTION BODY
#=====================
def main( destSheet, testTitle, numRates, numBalance,\
kpisCol, prodsCol, valsCol, ignoreRate, scenarioOnly, thresh, bpsVar):
## MAIN SHEET: Get the name of the sheet containing data & Set it as active
mainSheet = ( all_sheets()[0] ).encode('ascii')
active_sheet(mainSheet)
# THRESHOLD EXTRACTION FROM SHEET
thresh, bpsVar = getThresholdFromSheet( destSheet, thresh, bpsVar)
## PRODUCTS: Get their count and enlist their names
# (We have total of 16 cells representing Rates and Balances)
prodsList, numProducts = getProdsNamesCount( mainSheet, prodCol )
## FIELDS: Get their count and enlist their names as strings
fieldsList, totalFields = getFieldsNamesCount( mainSheet, kpisCol )
## SPREAD: Get the Indices for Fields associated with Spread
spreadInd, ftpInd, pubRateInd = getSpreadRelatedRowIndices( fieldsList )
## SCENARIOS: Get names of baseline and scenario
scenarioList, numScenarios = getBaselineScenarioNames( mainSheet, \
scenCol, scenarioOnly )
# MUST HAVE BASELINE & SCENARIO:
if numScenarios == 1:
Cell( destSheet, 1,2).value = 'ERROR: Needs Both Baseline & Scenario'
Cell( destSheet, 1,2).font.color = 'red'
return
## SET COLORS: for products, rates, and statuses
scenColor = prodColor = fieldsColor = ['blue', 'black']
statColor = ['green', 'red']
# INDEX FOR PRINTING DEST. SCENARIO CELLS
destScenIndex = 1
## FOR EACH SCENARIO:
if (scenarioOnly == 0):
kstart = 1
else:
kstart = 2
for k in range( kstart, numScenarios+1):
## FOR EACH PRODUCT:
for i in range(1, numProducts+1):
## SOURCE CELLS: Get Values and Range of the Corresponding Cells
srcCells_Val, srcCells_Name = getSrcCellsValueRange( mainSheet, \
totalFields, \
valsCol, \
i, 0, 0,\
numProducts,\
numRates,\
spreadInd)
## BALANCE TYPE' CONVERSION: First convert all Balances into Float type
srcCells_Val = convertSourceToFloat( srcCells_Val )
## BAD CELLS INFO: Values and Names of the Outlier Cells
badCells_Var, badCells_Val, badCells_Name = getBadCellsValueRange( srcCells_Val, \
srcCells_Name, \
thresh, bpsVar)
badCells_Date = convertDateCellsToDate( badCells_Name)
## DESTINATION SHEET GENERATION & THRESHOLD EXTRACTION & PRINTING:
# j MUST BE -1 if only 1 parameter is displayed
createOrClearReportWorksheet( destSheet, i, -1, 0, \
destScenIndex, scenarioOnly)
printTitleAndThreshold( destSheet, testTitle, thresh, bpsVar)
## DESTINATION CELLS
destCells_Scen, destCells_Prod, destCells_Rate, destCells_Stat, \
destCells_Add, destCells_Val, destCells_Var = getDestCellsAdd( i, 0, 0,\
numProducts, 0,\
numBalance, destScenIndex,\
[])
## POPULATE DESTINATION CELLS:
if ( i == 1 ): #Scenario Name printed only once
Cell( destSheet, destCells_Scen.name ).value = scenarioList[destScenIndex-1]
Cell( destSheet, destCells_Scen.name ).font.color = scenColor[i%2]
Cell( destSheet, destCells_Prod.name ).value = prodsList[i-1]
Cell( destSheet, destCells_Prod.name ).font.color = prodColor[i%2]
Cell( destSheet, destCells_Rate.name ).value = fieldsList[spreadInd]
Cell( destSheet, destCells_Rate.name ).font.color = fieldsColor[i%2]
setRatesStatus( destSheet, badCells_Val, destCells_Stat, statColor);
Cell( destSheet, destCells_Add.name ).horizontal = badCells_Date
Cell( destSheet, destCells_Val.name ).horizontal = badCells_Val
Cell( destSheet, destCells_Var.name ).horizontal = badCells_Var
CellRange( destSheet, (destCells_Var.row, destCells_Var.col), \
(destCells_Var.row, destCells_Var.col+len(badCells_Var)) ).font.color = 'red'
# Increment the index for Scenario Destination Cell
destScenIndex += 1
#=====================
### SET PARAMETERS AND RUN
#=====================
numRates = 3
numBalance = 10
scenCol = 2
prodCol = 4
kpisCol = 5
valsCol = 6
destSheet = 'NDTC27a'
testTitle = "Spread should 'Increase/Decrease' by x-bps Respectively, "\
"if Published Rate of a Product 'Decreases/Increases' by x-bps Respectively!"
ignoreRate = 'Rate Discretion'
scenarioOnly = 1 #MUST BE 1 FOR COMPARING SCENARIO W/ BASELINE: 1 for Scenario only, 0 for Both Scenario and Baseline
thresh = 2.5
bpsVar = 20
main( destSheet, testTitle, numRates, numBalance,\
kpisCol, prodCol, valsCol, ignoreRate, scenarioOnly, thresh, bpsVar)
display_sheet( destSheet)