# NOTE: the star import stays first so that name resolution order is unchanged.
# ee, Slot and Schedule are not defined in this file and are expected to come from it.
from SchedBuilderClasses import *
import openpyxl as pyxl
import pandas as pd
import numpy as np
import sqlite3
from contextlib import closing

# Single place to change the sqlite database used by addTBL / viewTBL.
_DB_PATH = 'test14.db'

# Column names shared by the FTinfo, TempInfo and senRef tables.
_INFO_FIELDS = ['sen', 'crew', 'id', 'last', 'first', 'ytd', 'totref', 'totchrg', 'wtdOT']

# Upper bound (exclusive) used when scanning a worksheet for the end of its data.
_SCAN_LIMIT = 400


def addTBL(tblName, fields="", dTypes=None, data=None, addOn=False):
    """Create a table if it does not exist yet and optionally (re)populate it.

    tblName -- name of the table. Interpolated into the SQL text (identifiers
               cannot be bound as parameters), so it must come from trusted code.
    fields  -- list of column names. When left as "", columns are named
               'A', 'B', ... after the width of the first row of `data`.
    dTypes  -- optional list of sqlite type names, one per field.
    data    -- optional sequence of rows to insert; each row needs one value per field.
    addOn   -- when falsy (default) existing rows are deleted before inserting;
               when truthy the new rows are appended.

    Raises ValueError when the columns cannot be determined or when dTypes does
    not have exactly one entry per field.
    """
    hasData = data is not None and len(data) > 0
    if fields == "":
        if not hasData:
            raise ValueError("addTBL needs 'fields' or at least one row of 'data' to name the columns")
        fields = [chr(65 + i) for i in range(len(data[0]))]

    if dTypes is None:
        columns = list(fields)
    else:
        if len(dTypes) != len(fields):
            # zip() would silently drop the unmatched columns otherwise.
            raise ValueError("addTBL needs exactly one dType per field: got "
                             + str(len(dTypes)) + " dTypes for " + str(len(fields)) + " fields")
        columns = [name + ' ' + dType for name, dType in zip(fields, dTypes)]
    columnSpec = '(' + ', '.join(columns) + ')'

    # closing() guarantees the connection is released even if a statement fails;
    # nothing is committed in that case.
    with closing(sqlite3.connect(_DB_PATH)) as conn:
        c = conn.cursor()
        c.execute('CREATE TABLE IF NOT EXISTS ' + tblName + columnSpec)
        if not addOn:
            c.execute('DELETE FROM ' + tblName)
        if hasData:
            placeholders = ','.join('?' * len(fields))
            c.executemany('INSERT INTO ' + tblName + ' VALUES (' + placeholders + ')', data)
        conn.commit()


def isNumeric(n):
    """Return True when `n` can be converted with int() or float(), else False."""
    for cast in (int, float):
        try:
            cast(n)
        except (TypeError, ValueError, OverflowError):
            continue
        return True
    return False


def _filterClause(field, value):
    """Render one `field = value` condition for viewTBL as SQL text."""
    if value is None:
        return str(field) + ' IS NULL'
    if isNumeric(value):
        return str(field) + ' = ' + str(value)
    # Single quotes always denote a string literal in SQLite (double quotes are
    # tried as identifiers first); embedded quotes are escaped by doubling them.
    return str(field) + " = '" + str(value).replace("'", "''") + "'"


def viewTBL(tblName, fields=None, sortBy=None, filterOn=None, returnStatement=0):
    """Query a table and return its rows as a list of lists.

    fields   -- optional list of column names; all columns when omitted or empty.
    sortBy   -- optional [(field1, 'ASC'/'DESC'), (field2, ...), ...].
    filterOn -- optional [(field1, value), (field2, value), ...]; the conditions
                are combined with AND. Values accepted by isNumeric are compared
                as numbers, None is matched with IS NULL, anything else is
                compared as text.
    returnStatement -- when truthy the SQL statement is returned instead of
                being executed (for troubleshooting).

    Table and field names are interpolated into the SQL text and must come from
    trusted code.
    """
    columns = ', '.join(fields) if fields else '*'
    stmnt = 'SELECT ' + columns + ' FROM ' + tblName + ' '
    if filterOn:
        conditions = [_filterClause(f[0], f[1]) for f in filterOn]
        stmnt = stmnt + 'WHERE ' + ' AND '.join(conditions) + ' '
    if sortBy:
        stmnt = stmnt + 'ORDER BY ' + ', '.join(s[0] + ' ' + s[1] for s in sortBy)
    stmnt = stmnt + ';'

    if returnStatement:
        return stmnt
    with closing(sqlite3.connect(_DB_PATH)) as conn:
        rows = conn.execute(stmnt).fetchall()
    # sqlite3 returns tuples; callers edit the rows in place, so hand back lists.
    return [list(r) for r in rows]


def _lastDataRow(ws, firstRow):
    """Return the last row, scanning down column C from `firstRow`, before the first empty cell."""
    for rowNum in range(firstRow, _SCAN_LIMIT):
        # Column C holds the EEID; the first empty cell marks the end of the data.
        if ws['C' + str(rowNum)].internal_value is None:
            return rowNum - 1
    raise ValueError("No empty cell found in column C between rows "
                     + str(firstRow) + " and " + str(_SCAN_LIMIT - 1))


def _lastSkillCol(ws, anchor, marker):
    """Return the column offset from `anchor` of the cell just left of the one holding `marker`."""
    anchorCell = ws[anchor]
    for offset in range(0, _SCAN_LIMIT):
        if anchorCell.offset(0, offset).value == marker:
            return offset - 1
    raise ValueError("Header '" + marker + "' not found within " + str(_SCAN_LIMIT)
                     + " columns of " + anchor)


def _readSkills(ws, firstRow, btmRow, firstSkillCol, endCol, headerAnchor):
    """Return [eeid, jobName] pairs for every skills-matrix cell equal to 1.

    Column positions are offsets counted from column A; EEIDs are read from
    column C and job names from the row of `headerAnchor`.
    """
    headerCell = ws[headerAnchor]
    skills = []
    for rowNum in range(firstRow, btmRow + 1):
        idCell = ws['C' + str(rowNum)]
        eeid = idCell.value
        for c in range(firstSkillCol, endCol + 1):
            # c is counted from column A while idCell sits in column C, hence c - 2.
            if idCell.offset(0, c - 2).value == 1:
                skills.append([eeid, headerCell.offset(0, c).value])
    return skills


def FTbtRow(ws):
    """Return the excel row number of the bottom data row in the FT employee sheet.

    Data is scanned from row 5. Raises ValueError when no empty EEID cell is
    found before row 400.
    """
    return _lastDataRow(ws, 5)


def getFTinfo(flNm):
    """Return the FT employee info as a list of rows (lists of cell values).

    Reads columns A to I of sheet 'Hourly OT' in workbook `flNm`, from row 5
    down to the bottom data row.
    """
    ws = pyxl.load_workbook(flNm)['Hourly OT']
    btmRow = FTbtRow(ws)
    return [[cell.internal_value for cell in row] for row in ws['A5:I' + str(btmRow)]]


def FTendCol(ws):
    """Return the column offset (from column A) of the last skills-matrix column in the FT sheet.

    That is the column just left of the row-1 header 'Start-up'. Raises
    ValueError when the header is not found within 400 columns.
    """
    return _lastSkillCol(ws, 'A1', 'Start-up')


def getFTskills(flNm):
    """Return a list of [eeid, jobName] records, one per job an FT employee is trained in.

    Reads sheet 'Hourly OT' of workbook `flNm`: data rows start at row 5,
    skill columns start at offset 10 from column A and job names are taken
    from row 2.
    """
    ws = pyxl.load_workbook(flNm)['Hourly OT']
    endCol = FTendCol(ws)
    btmRow = FTbtRow(ws)
    return _readSkills(ws, 5, btmRow, 10, endCol, 'A2')


def TempbtRow(ws):
    """Return the excel row number of the bottom data row in the Temp employee sheet.

    Data is scanned from row 4. Raises ValueError when no empty EEID cell is
    found before row 400.
    """
    return _lastDataRow(ws, 4)


def getTempinfo(flNm):
    """Return the Temp employee info as a list of rows (lists of cell values).

    Reads columns A to I of sheet 'Temp Refusal' in workbook `flNm`, from row 4
    down to the bottom data row.
    """
    ws = pyxl.load_workbook(flNm)['Temp Refusal']
    btmRow = TempbtRow(ws)
    return [[cell.internal_value for cell in row] for row in ws['A4:I' + str(btmRow)]]


def TempendCol(ws):
    """Return the column offset (from column A) of the last skills-matrix column in the Temp sheet.

    That is the column just left of the row-2 header 'Start Up'. Raises
    ValueError when the header is not found within 400 columns.
    """
    return _lastSkillCol(ws, 'A2', 'Start Up')


def getTempskills(flNm):
    """Return a list of [eeid, jobName] records, one per job a Temp employee is trained in.

    Reads sheet 'Temp Refusal' of workbook `flNm`: data rows start at row 4,
    skill columns start at offset 11 from column A and job names are taken
    from row 3.
    """
    ws = pyxl.load_workbook(flNm)['Temp Refusal']
    endCol = TempendCol(ws)
    btmRow = TempbtRow(ws)
    return _readSkills(ws, 4, btmRow, 11, endCol, 'A3')


def imptXlTbl(XlFl, ShtNm, TblNm):
    """Return the rows of excel table `TblNm` on sheet `ShtNm` of workbook `XlFl`.

    The result is a list of lists of cell values; the first row of the table
    range (the headings) is dropped.
    """
    ws = pyxl.load_workbook(XlFl)[ShtNm]
    tblRef = ws.tables[TblNm].ref
    rows = [[cell.value for cell in row] for row in ws[tblRef]]
    return rows[1:]


def generateMasterPollTbl(pollDict):
    """Build the sqlite table 'allPollData' from the per-crew polling tables.

    pollDict maps a key to a polling table (list of records). For each record
    the first 4 values are kept, then entries 4..15 are each expanded into two
    slot flags ('n' when the entry is 'n', 'N' or None, otherwise 'y') because
    one polling entry covers two slots, and finally entry 16 (the comment) is
    appended. The resulting columns are eeid, lastNm, firstNm, ytdRefHrs,
    slot_1 .. slot_24, Comment. Any previous content of the table is replaced.
    """
    flds = ['eeid', 'lastNm', 'firstNm', 'ytdRefHrs']
    flds.extend('slot_' + str(i) for i in range(1, 25))
    flds.append('Comment')

    mPollTbl = []
    for tbl in pollDict.values():
        for rec in tbl:
            cmnt = rec[16]
            slotwise_polling = list(rec[:4])
            for answer in rec[4:16]:
                flag = 'n' if answer in ('n', 'N', None) else 'y'
                slotwise_polling.extend([flag, flag])
            slotwise_polling.append(cmnt)
            mPollTbl.append(slotwise_polling)
    addTBL('allPollData', fields=flds, data=mPollTbl, addOn=False)


def _pullTblsForCrews(FtBook, TempBook, AssnBook, PollBook, crews):
    """Shared implementation of pullTbls / pullSomeTbls for the given crew names."""
    a = getFTinfo(FtBook)
    b = [[int(rec[0]), rec[1]] for rec in getFTskills(FtBook)]  # cast EEID to a number
    c = getTempinfo(TempBook)
    d = [[int(rec[0]), rec[1]] for rec in getTempskills(TempBook)]  # cast EEID to a number
    e = imptXlTbl(AssnBook, 'Assignment_List', 'Assn_List')
    f = imptXlTbl(AssnBook, 'Slot_Legend', 'Slot_Legend')
    g = imptXlTbl(AssnBook, 'Job_Training_Crossref', 'TrainAssnMtx')

    # One voluntary-overtime polling table per crew and employee type.
    pollDict = {}
    for crew in crews:
        for eeType in ('FT', 'Temp'):
            keyNm = 'tbl_' + crew + eeType
            pollDict[keyNm] = imptXlTbl(PollBook, 'Sheet1', keyNm)
    h = imptXlTbl(AssnBook, 'All_Slots', 'All_Slots')

    # Master skills table: overwrite with the FT records, then append the temps.
    addTBL("sklMtx", fields=["EEID", "trnNm"], data=b, addOn=False)
    addTBL("sklMtx", fields=["EEID", "trnNm"], data=d, addOn=True)
    # Skill name cross reference used by dispToTrn / trnToDisp.
    addTBL("xRef", fields=["dispNm", "trnNm"], data=g, addOn=False)
    addTBL("FTinfo", fields=_INFO_FIELDS, data=a, addOn=False)
    addTBL("TempInfo", fields=_INFO_FIELDS, data=c, addOn=False)

    # Master seniority table: temps are renumbered in their 'sen' order starting
    # at an arbitrarily high value so they never interleave with full timers.
    senHiLoTemps = viewTBL('TempInfo', sortBy=[('sen', 'ASC')])
    for senNum, row in enumerate(senHiLoTemps, start=100000):
        row[0] = senNum
    addTBL("senRef", fields=_INFO_FIELDS, data=a, addOn=False)
    addTBL("senRef", fields=_INFO_FIELDS, data=senHiLoTemps, addOn=True)
    senList = viewTBL('senRef', sortBy=[('sen', 'ASC')])
    return a, b, c, d, e, f, g, pollDict, h, senList


def pullTbls(FtBook, TempBook, AssnBook, PollBook):
    """Read all workbooks, populate the sqlite tables and return every table at once.

    Polling tables are read for crews Blue, Bud and Rock.
    Returns (ftInfoTbl, ftSkillsMtx, tempInfoTbl, tempSkillsMtx, AssignmentsTbl,
    slot_Legend, JobTrnCrossRef, pollDict, All_Slots, senList).
    """
    return _pullTblsForCrews(FtBook, TempBook, AssnBook, PollBook, ['Blue', 'Bud', 'Rock'])


def dispToTrn(dispNm):
    """Return the trnNm paired with display name `dispNm` in sqlite table 'xRef'.

    When no entry exists an error message string is returned instead (callers
    receive it in place of a training name).
    """
    q = viewTBL('xRef', fields=['dispNm', 'trnNm'], filterOn=[('dispNm', dispNm)])
    if len(q) == 0:
        return "Custom func error 'dispToTrn' no entry found in xRef with dispNm=" + str(dispNm)
    return q[0][1]


def trnToDisp(trnNm):
    """Return the list of display names paired with training name `trnNm` in sqlite table 'xRef'.

    One training name can map to several display names, so a list is returned.
    When no entry exists an error message string is returned instead.
    """
    q = viewTBL('xRef', fields=['dispNm', 'trnNm'], filterOn=[('trnNm', trnNm)])
    if len(q) == 0:
        return "Custom func error 'trnToDisp' no entry found in xRef with trnNm=" + str(trnNm)
    return [rec[0] for rec in q]


def sklChk(eeid, dispNm):
    """Return True when `eeid` has a record in sqlite table 'sklMtx' for the job shown as `dispNm`."""
    trnNm = dispToTrn(dispNm)
    return len(viewTBL('sklMtx', filterOn=[('EEID', eeid), ('trnNm', trnNm)])) != 0


def makeEEdict(ftInfoTbl, tempInfoTbl, wkHrs):
    """Return a dictionary of ee objects keyed by their eeID attribute.

    One ee is built per row of the two info tables. Skills are the display
    names of every training name recorded for the employee in 'sklMtx', the
    seniority comes from 'senRef', and `wkHrs` is added to the row's last
    column (index 8).
    """
    eeDict = {}
    for dtaTbl in (ftInfoTbl, tempInfoTbl):
        for row in dtaTbl:
            trained = viewTBL('sklMtx', ['trnNm'], filterOn=[('EEID', row[2])])
            sk = []
            for rec in trained:
                dispNms = trnToDisp(rec[0])
                # trnToDisp returns an error *string* when the training name has
                # no xRef entry; extending with it would add single characters.
                if isinstance(dispNms, list):
                    sk.extend(dispNms)
            sen = viewTBL('senRef', fields=['sen'], filterOn=[('id', str(row[2]))])[0][0]
            anEE = ee(sen, row[1].lower().strip(), int(row[2]), row[3], row[4], row[5],
                      row[8] + wkHrs, skills=sk)
            eeDict[anEE.eeID] = anEE
    return eeDict


def makeSlots(eeDict, AllSlots):
    """Return a dictionary of unassigned Slot objects keyed by '<seqID>_<dispNm>'.

    Every record of AllSlots whose index 6 equals 1 yields one Slot per sequence
    number from record[0] to record[1] inclusive, for the job in record[2].
    Each slot's eligVol lists the EEIDs that answered 'y' for that slot in
    'allPollData' and have the job among their skills.
    """
    openSlots = {}
    for row in AllSlots:
        if row[6] != 1:  # only records flagged with 1 generate slots
            continue
        for i in range(row[0], row[1] + 1):
            sl = Slot(i, row[2], dispToTrn(row[2]))
            volunteers = viewTBL('allPollData', filterOn=[('slot_' + str(sl.seqID), 'y')])
            sl.eligVol = [rec[0] for rec in volunteers if sl.dispNm in eeDict[rec[0]].skills]
            openSlots[str(sl.seqID) + '_' + str(sl.dispNm)] = sl
    return openSlots


def preProcessData(Acrew, wkHrs, FtBook, TempBook, AssnBook, PollBook, pNT=False):
    """Load all input workbooks and return the Schedule object built from them.

    Populates the sqlite tables via pullTbls and generateMasterPollTbl, builds
    the employee dictionary and the unassigned slots, and passes everything to
    Schedule together with Acrew and pNT.
    """
    (ftInfoTbl, ftSkillsMtx, tempInfoTbl, tempSkillsMtx, AssignmentsTbl, slot_Legend,
     JobTrnCrossRef, pollDict, AllSlots, senList) = pullTbls(FtBook, TempBook, AssnBook, PollBook)
    # makeSlots queries 'allPollData', so the master poll table must exist first.
    generateMasterPollTbl(pollDict)
    eeDict = makeEEdict(ftInfoTbl, tempInfoTbl, wkHrs)
    allSlots = makeSlots(eeDict, AllSlots)
    return Schedule(Acrew, allSlots, eeDict, AssignmentsTbl, senList, pollDict, slot_Legend, pNT=pNT)


def pullSomeTbls(FtBook, TempBook, AssnBook, PollBook):
    """Same as pullTbls, but polling tables are read for crews Blue, Bud, Rock, Silver and Gold.

    Returns (ftInfoTbl, ftSkillsMtx, tempInfoTbl, tempSkillsMtx, AssignmentsTbl,
    slot_Legend, JobTrnCrossRef, pollDict, All_Slots, senList).
    """
    return _pullTblsForCrews(FtBook, TempBook, AssnBook, PollBook,
                             ['Blue', 'Bud', 'Rock', 'Silver', 'Gold'])