import sys
import docplex.mp


# This notebook requires pandas to work
from io import StringIO
import json
import pandas as pd
from pandas import DataFrame

# Make sure that xlrd package, which is a pandas optional dependency, is installed
# This package is required for Excel I/O
try:
    import xlrd
except:
    if hasattr(sys, 'real_prefix'):
        #we are in a virtual env.
        !pip install xlrd 
    else:
        !pip install --user xlrd


import requests
import io

# Use pandas to read the file, one tab for each table.
url="https://api.dataplatform.cloud.ibm.com/v2/gallery-assets/entries/2505b070a22403aac9f84884d315219e/data?accessKey=de4d953f2a766fbc0469723eba0b0e93"
# Bound the wait so a stalled connection cannot hang the notebook, and fail
# loudly on an HTTP error instead of handing an error page to the Excel parser.
response = requests.get(url, timeout=60)
response.raise_for_status()

# The workbook is parsed straight from the downloaded bytes (no temporary file)
nurse_xls_file = pd.ExcelFile(io.BytesIO(response.content))
# Each worksheet is parsed into its own DataFrame.
parse_sheet = nurse_xls_file.parse
df_skills = parse_sheet('Skills')
df_depts = parse_sheet('Departments')
df_shifts = parse_sheet('Shifts')
# Label the shifts index 'shiftId'
df_shifts.index.name = 'shiftId'

# Nurses are indexed by their first column (the nurse name)
df_nurses = parse_sheet('Nurses', header=0, index_col=0)
df_nurse_skilles = parse_sheet('NurseSkills')
df_vacations = parse_sheet('NurseVacations')
df_associations = parse_sheet('NurseAssociations')
df_incompatibilities = parse_sheet('NurseIncompatibilities')

# Report how many nurses, shifts and vacation entries were loaded
print("#nurses = {}".format(len(df_nurses)))
print("#shifts = {}".format(len(df_shifts)))
print("#vacations = {}".format(len(df_vacations)))

#nurses = 32
#shifts = 41
#vacations = 59


# maximum work time (in hours)
# Used further down as the upper bound of every nurse's worktime variable.
max_work_time = 40

# maximum number of shifts worked in a week.
# NOTE(review): not referenced by any constraint in the visible code -- confirm
# whether a cap on the number of shifts was meant to be enforced.
max_nb_shifts = 5


df_shifts


days = ["monday", "tuesday", "wednesday", "thursday", "friday", "saturday", "sunday"]
# lowercase day name -> position in the week (monday is 0, sunday is 6)
day_of_weeks = {day_name: position for position, day_name in enumerate(days)}


def day_to_day_of_week(day):
    """Return the 0..6 weekday index for a day name such as " Monday".

    Surrounding whitespace and letter case are ignored. A name that is not
    one of the seven entries of ``days`` raises KeyError.
    """
    normalized = day.strip().lower()
    return day_of_weeks[normalized]

# Day names are normalized (whitespace stripped, lowercased) before the lookup,
# e.g. " Monday" -> "monday" -> 0
df_shifts["dow"] = df_shifts["day"].apply(day_to_day_of_week)
df_shifts


# Absolute start time of each shift: 24 hours per elapsed day plus the start hour
df_shifts["wstart"] = 24 * df_shifts["dow"] + df_shifts["start_time"]


df_shifts


# an auxiliary function to calculate absolute end time of a shift
def calculate_absolute_endtime(row):
    """Return the end time of a shift in hours counted from the start of the week.

    ``row`` is read by position: 2 is the start time, 3 the end time and
    6 the day of week. An end time that is not later than the start time is
    taken to fall on the following day.
    """
    start_hour, end_hour, day_index = row[2], row[3], row[6]
    absolute_end = 24 * day_index + end_hour
    if start_hour >= end_hour:
        # the shift runs past midnight: push the end into the next day
        absolute_end += 24
    return absolute_end

# raw=True passes each row to the function as a plain array, which is why
# calculate_absolute_endtime reads its inputs by position
df_shifts["wend"] = df_shifts.apply(calculate_absolute_endtime, raw=True, axis=1)


# Length of each shift, from absolute start to absolute end
df_shifts["duration"] = df_shifts["wend"] - df_shifts["wstart"]


# Minimum demand expressed in nurse-hours
df_shifts["min_demand"] = df_shifts["min_req"] * df_shifts["duration"]

# Show the shifts table with all the derived columns
df_shifts


from docplex.mp.environment import Environment
# Print a summary of the execution environment (the cell output lists the
# system, Python, docplex, CPLEX and pandas versions)
env = Environment()
env.print_information()

* system is: Linux 64bit
* Python version 3.10.13, located at: /opt/conda/envs/Python-RT23.1-Premium/bin/python
* docplex is present, version is 2.25.236
* CPLEX library is present, version is 22.1.1.0, located at: /opt/conda/envs/Python-RT23.1-Premium/lib/python3.10/site-packages
* pandas is present, version is 1.5.3


from docplex.mp.model import Model
mdl = Model(name="nurses")


# Index labels of the nurses and shifts tables: the two key sets the
# decision variables range over
all_nurses = df_nurses.index.values
all_shifts = df_shifts.index.values

# One binary variable per (nurse, shift) pair, named assign_<nurse>_<shift>
assigned = mdl.binary_var_matrix(all_nurses, all_shifts, name="assign_%s_%s")


# Organize decision variables in a DataFrame
# The two index levels are named after the nurse and shift key sets
df_assigned = DataFrame({'assigned': assigned})
df_assigned.index.names=['all_nurses', 'all_shifts']

# Re-organize the Data Frame as a pivot table with nurses as row index and shifts as columns:
# NOTE(review): this result is overwritten by the pivot() call just below before it is read
df_assigned_pivot = df_assigned.unstack(level='all_shifts')

# Create a pivot using nurses and shifts index as dimensions
# The columns of this pivot are the shift ids themselves
df_assigned_pivot = df_assigned.reset_index().pivot(index='all_nurses', columns='all_shifts', values='assigned')

# Display first rows of the pivot table
df_assigned_pivot.head()


# Order the shifts by absolute start time (ties broken by duration), then keep
# only the three relevant columns: 'shiftId', 'wstart' and 'wend'.
# reset_index() turns 'shiftId' into a column and renumbers the rows in sorted order.
shifts_by_start = df_shifts.sort_values(['wstart', 'duration']).reset_index()
df_sorted_shifts = shifts_by_start[['shiftId', 'wstart', 'wend']]

# Peek at the first rows of the sorted table
df_sorted_shifts.head()


# For every pair of shifts that overlap in time, forbid each nurse from being
# assigned to both. The counter tracks how many constraints were posted.
number_of_incompatible_shift_constraints = 0
for shift in df_sorted_shifts.itertuples():
    # Iterate over following shifts
    # 'shift[0]' contains the index of the current shift in the df_sorted_shifts Data Frame
    for shift_2 in df_sorted_shifts.iloc[shift[0] + 1:].itertuples():
        if (shift_2.wstart < shift.wend):
            # Iterate over all nurses to forbid the double assignment for the current pair of overlapping shifts
            for nurse_assignments in df_assigned_pivot[[shift.shiftId, shift_2.shiftId]].itertuples():                
                # at most one of the two binary variables may be 1, i.e. NOT (a AND b)
                mdl.add_constraint(nurse_assignments[1] + nurse_assignments[2] <= 1)
                number_of_incompatible_shift_constraints += 1
        else:
            # No need to test overlap with following shifts:
            # they are sorted by 'wstart', so they start even later
            break
print("#incompatible shift constraints: {}".format(number_of_incompatible_shift_constraints))

#incompatible shift constraints: 640


# Vacations get the same 0..6 'dow' column as the shifts
df_vacations['dow'] = df_vacations['day'].apply(day_to_day_of_week)

# Build the list of 'forbidden' assignments with two joins:
#  1. vacations with shifts, on the column names the two frames share
#     ('shiftId' is first moved from the index to a column by reset_index());
#  2. the result with the assignment variables, matching ('nurse', 'shiftId')
#     against ('all_nurses', 'all_shifts'), which reset_index() likewise
#     exposes as columns of 'df_assigned'.
df_assigned_reindexed = df_assigned.reset_index()
shift_days = df_shifts.reset_index()[['dow', 'shiftId']]
vacation_shifts = df_vacations.merge(shift_days)
df_vacation_forbidden_assignments = vacation_shifts.merge(
    df_assigned_reindexed, left_on=['nurse', 'shiftId'], right_on=['all_nurses', 'all_shifts'])

# Peek at the first few rows of the joined table
df_vacation_forbidden_assignments.head()


# Forbidding an assignment amounts to fixing its variable to zero
for forbidden_var in df_vacation_forbidden_assignments['assigned']:
    mdl.add_constraint(forbidden_var == 0)
print("# vacation forbids: {} assignments".format(len(df_vacation_forbidden_assignments)))

# vacation forbids: 342 assignments


# Pair up the decision variables of associated nurses, shift by shift:
#  - the first merge attaches to each association every assignment row of 'nurse1';
#  - the second merge matches, for the same shift, the assignment row of 'nurse2'.
# Columns present on both sides of the second merge ('all_nurses' and 'assigned')
# receive the '_1' / '_2' suffixes.
association_nurse1_rows = df_associations.merge(
    df_assigned_reindexed, left_on='nurse1', right_on='all_nurses')
df_preferred_assign = association_nurse1_rows.merge(
    df_assigned_reindexed, left_on=['nurse2', 'all_shifts'], right_on=['all_nurses', 'all_shifts'],
    suffixes=('_1','_2'))

# Peek at the first few rows of the joined table
df_preferred_assign.head()


# Associated nurses must get exactly the same shifts
for var_1, var_2 in zip(df_preferred_assign['assigned_1'], df_preferred_assign['assigned_2']):
    mdl.add_constraint(var_1 == var_2)


# Same double join as for associations, this time driven by the
# incompatibilities table: each row pairs, for one shift, the assignment
# variable of 'nurse1' ('assigned_1') with that of 'nurse2' ('assigned_2').
incompatibility_nurse1_rows = df_incompatibilities.merge(
    df_assigned_reindexed, left_on='nurse1', right_on='all_nurses')
df_incompatible_assign = incompatibility_nurse1_rows.merge(
    df_assigned_reindexed, left_on=['nurse2', 'all_shifts'], right_on=['all_nurses', 'all_shifts'],
    suffixes=('_1','_2'))

# Peek at the first few rows of the joined table
df_incompatible_assign.head()


# Incompatible nurses may not both be assigned to the same shift
for var_1, var_2 in zip(df_incompatible_assign['assigned_1'], df_incompatible_assign['assigned_2']):
    mdl.add_constraint(var_1 + var_2 <= 1)


# auxiliary function to create worktime variable from a row
def make_var(row, varname_fmt):
    """Create a continuous model variable, bounded below by 0, for one row.

    The variable name is ``varname_fmt`` %-formatted with ``row.name``.
    """
    var_name = varname_fmt % row.name
    return mdl.continuous_var(lb=0, name=var_name)

# One worktime variable per nurse row, stored in a new 'worktime' column
df_nurses["worktime"] = df_nurses.apply(
    lambda nurse_row: make_var(nurse_row, "worktime_%s"),
    axis=1,
)

# Show the nurses table with its new column
df_nurses


# Tie each nurse's worktime variable to the hours actually assigned: the
# scalar product of the nurse's assignment variables with the shift durations
shift_durations = df_shifts["duration"]
for nurse, nurse_assignments in df_assigned.groupby(level='all_nurses'):
    assigned_hours = mdl.dot(nurse_assignments["assigned"], shift_durations)
    mdl.add_constraint(df_nurses["worktime"][nurse] == assigned_hours)

# Model summary: the continuous count should now include the 32 worktime variables
mdl.print_information()

Model: nurses
 - number of variables: 1344
   - binary=1312, integer=0, continuous=32
 - number of constraints: 1547
   - linear=1547
 - parameters: defaults
 - objective: none
 - problem type is: MILP


# we use pandas' apply() method to set an upper bound on all worktime variables.
def set_max_work_time(v):
    """Set the upper bound of variable ``v`` to ``max_work_time``.

    Returns a string of the form "<variable> <= <bound>", used only for a
    readable display of the bounds in the cell output.
    """
    v.ub = max_work_time
    # Optionally: return a string for fancy display of the constraint in the Output cell
    return str(v) + ' <= ' + str(v.ub)

# `convert_dtype` is deprecated in Series.apply and is not needed here: the
# function returns strings, which are stored with object dtype either way.
df_nurses["worktime"].apply(set_max_work_time)

name
Anne            worktime_Anne <= 40
Bethanie    worktime_Bethanie <= 40
Betsy          worktime_Betsy <= 40
Cathy          worktime_Cathy <= 40
Cecilia      worktime_Cecilia <= 40
Chris          worktime_Chris <= 40
Cindy          worktime_Cindy <= 40
David          worktime_David <= 40
Debbie        worktime_Debbie <= 40
Dee              worktime_Dee <= 40
Gloria        worktime_Gloria <= 40
Isabelle    worktime_Isabelle <= 40
Jane            worktime_Jane <= 40
Janelle      worktime_Janelle <= 40
Janice        worktime_Janice <= 40
Jemma          worktime_Jemma <= 40
Joan            worktime_Joan <= 40
Joyce          worktime_Joyce <= 40
Jude            worktime_Jude <= 40
Julie          worktime_Julie <= 40
Juliet        worktime_Juliet <= 40
Kate            worktime_Kate <= 40
Nancy          worktime_Nancy <= 40
Nathalie    worktime_Nathalie <= 40
Nicole        worktime_Nicole <= 40
Patricia    worktime_Patricia <= 40
Patrick      worktime_Patrick <= 40
Roberta      worktime_Roberta <= 40
Suzanne      worktime_Suzanne <= 40
Vickie        worktime_Vickie <= 40
Wendie        worktime_Wendie <= 40
Zoe              worktime_Zoe <= 40
Name: worktime, dtype: object


# Every shift must be staffed by at least its minimum required number of nurses
min_required = df_shifts["min_req"]
for shift, shift_nurses in df_assigned.groupby(level='all_shifts'):
    staffing = mdl.sum(shift_nurses["assigned"])
    mdl.add_constraint(staffing >= min_required[shift])


# Per-nurse salary expressions: worktime variable times pay rate
total_salary_series = df_nurses["worktime"] * df_nurses["pay_rate"]

# Summing the series with pandas yields a single DOcplex expression
# (DOcplex is fully compatible with pandas), which is registered as a KPI
total_salary_cost = total_salary_series.sum()
mdl.add_kpi(total_salary_cost, "Total salary cost")

DecisionKPI(name=Total salary cost,expr=25worktime_Anne+28worktime_Bethanie+17worktime_Betsy+17worktime_..)


# First objective: minimize the total salary cost, then print the model summary
mdl.minimize(total_salary_cost)
mdl.print_information()

Model: nurses
 - number of variables: 1344
   - binary=1312, integer=0, continuous=32
 - number of constraints: 1588
   - linear=1588
 - parameters: defaults
 - objective: minimize
 - problem type is: MILP


# Set Cplex mipgap to 1e-5 to enforce precision to be of the order of a unit (objective value magnitude is ~1e+5).
mdl.parameters.mip.tolerances.mipgap = 1e-5

# log_output=True echoes the solver log to the cell output
s = mdl.solve(log_output=True)
# stop here if the solve did not return a solution
assert s, "solve failed"
# print the objective and KPI values of the solution
mdl.report()

WARNING: Number of workers has been reduced to 2 to comply with platform limitations.
Version identifier: 22.1.1.0 | 2022-11-28 | 9160aff4d
CPXPARAM_Read_DataCheck                          1
CPXPARAM_Threads                                 2
CPXPARAM_MIP_Tolerances_MIPGap                   1.0000000000000001e-05
Tried aggregator 2 times.
MIP Presolve eliminated 997 rows and 379 columns.
MIP Presolve modified 90 coefficients.
Aggregator did 41 substitutions.
Reduced MIP has 550 rows, 922 columns, and 2862 nonzeros.
Reduced MIP has 892 binaries, 0 generals, 0 SOSs, and 0 indicators.
Presolve time = 0.02 sec. (3.66 ticks)
Probing time = 0.00 sec. (0.50 ticks)
Tried aggregator 1 time.
Detecting symmetries...
Reduced MIP has 550 rows, 922 columns, and 2862 nonzeros.
Reduced MIP has 892 binaries, 30 generals, 0 SOSs, and 0 indicators.
Presolve time = 0.01 sec. (2.01 ticks)
Probing time = 0.00 sec. (0.50 ticks)
Clique table members: 479.
MIP emphasis: balance optimality and feasibility.
MIP search method: dynamic search.
Parallel mode: deterministic, using up to 2 threads.
Root relaxation solution time = 0.02 sec. (4.73 ticks)

        Nodes                                         Cuts/
   Node  Left     Objective  IInf  Best Integer    Best Bound    ItCnt     Gap

      0     0    28824.0000    45                  28824.0000      499         
      0     0    28824.0000    42                    Cuts: 35      600         
      0     0    28824.0000    67                    Cuts: 91      730         
*     0+    0                        29290.0000    28824.0000             1.59%
      0     0    28824.0000    26    29290.0000      Cuts: 19      810    1.59%
      0     0    28824.0000    40    29290.0000      Cuts: 44      890    1.59%
*     0+    0                        29104.0000    28824.0000             0.96%
*     0+    0                        29020.0000    28824.0000             0.68%
      0     2    28824.0000     9    29020.0000    28824.0000      890    0.68%
Elapsed time = 0.36 sec. (140.76 ticks, tree = 0.02 MB, solutions = 3)
*    10+   10                        28988.0000    28824.0000             0.57%
*    20+   20                        28920.0000    28824.0000             0.33%
*    22+    1                        28842.0000    28824.0000             0.06%
*   634+  554                        28838.0000    28824.0000             0.05%
    831   713    28824.0000     4    28838.0000    28824.0000    14546    0.05%
*   841+  682                        28824.0000    28824.0000             0.00%

GUB cover cuts applied:  17
Cover cuts applied:  17
Flow cuts applied:  2
Mixed integer rounding cuts applied:  14
Zero-half cuts applied:  13
Lift and project cuts applied:  1
Gomory fractional cuts applied:  4

Root node processing (before b&c):
  Real time             =    0.37 sec. (140.55 ticks)
Parallel b&c, 2 threads:
  Real time             =    0.39 sec. (276.47 ticks)
  Sync time (average)   =    0.04 sec.
  Wait time (average)   =    0.00 sec.
                          ------------
Total (root+branch&cut) =    0.76 sec. (417.02 ticks)
* model nurses solved with objective = 28824.000
*  KPI: Total salary cost = 28824.000


# Solution value of every assignment variable, still indexed by (nurse, shift)
s_assigned = df_assigned["assigned"].apply(lambda var: var.solution_value)

# Spread the 'all_shifts' index level over the columns with "unstack":
# one row per nurse, one column per shift
df_res = s_assigned.unstack(level='all_shifts')

# Peek at the first few rows of the pivot table
df_res.head()


# Total minimum demand in nurse-hours, spread evenly over all nurses
s_demand = df_shifts["min_req"] * df_shifts["duration"]
total_demand = s_demand.sum()
nb_nurses = float(len(all_nurses))
avg_worktime = total_demand / nb_nurses
print("* theoretical average work time is {0:g} h".format(avg_worktime))

* theoretical average work time is 39 h


# Worktime of each nurse in the solution
s_worktime = df_nurses["worktime"].apply(lambda var: var.solution_value)

# Signed deviation of each nurse from the theoretical average ...
s_to_mean = s_worktime - avg_worktime

# ... and its absolute value
s_abs_to_mean = s_to_mean.apply(abs)


# Sum of the absolute deviations over all nurses
total_to_mean = s_abs_to_mean.sum()
print("* the sum of absolute deviations from mean is {}".format(total_to_mean))

* the sum of absolute deviations from mean is 58.0


import matplotlib.pyplot as plt
%matplotlib inline

# we can also plot as a histogram the distribution of worktimes
# (worktime values on the horizontal axis)
s_worktime.plot.hist(color='LightBlue')
plt.xlabel("worktime")

Text(0.5, 0, 'worktime')


# a pandas series of #shifts worked: row-wise sum over the shift columns
df_worked = df_res[all_shifts].sum(axis=1)
df_res["worked"] = df_worked

df_worked.plot.hist(color="gold", xlim=(0,10))
# The number of shifts worked is on the horizontal axis of the histogram;
# the vertical axis is the frequency, so the label belongs on x.
plt.xlabel("#shifts worked")

Text(0, 0.5, '#shifts worked')


# Expected average: total minimum staffing requirement divided by the number of nurses
total_min_req = df_shifts["min_req"].sum()
avg_worked = total_min_req / float(len(all_nurses))
print("-- expected avg #shifts worked is {}".format(avg_worked))

# Total absolute deviation of the shifts actually worked from that average
worked_to_avg = df_res["worked"] - avg_worked
abs_worked_to_avg = worked_to_avg.apply(abs)
total_to_mean = abs_worked_to_avg.sum()
print("-- total absolute deviation to mean #shifts is {}".format(total_to_mean))

-- expected avg #shifts worked is 6.875
-- total absolute deviation to mean #shifts is 14.5


# add three extra variables per nurse: the number of shifts worked, and the
# deviations above and below average
# ("worked_%s" uses the same '<prefix>_<nurse>' naming as the other variables)
df_nurses["worked"]      = df_nurses.apply(lambda r: make_var(r, "worked_%s"), axis=1)
df_nurses["overworked"]  = df_nurses.apply(lambda r: make_var(r, "overw_%s"), axis=1)
df_nurses["underworked"] = df_nurses.apply(lambda r: make_var(r, "underw_%s"), axis=1)


# Define each nurse's 'worked' variable as the number of shifts assigned to her/him
for nurse, nurse_assignments in df_assigned.groupby(level='all_nurses'):
    nb_assigned = mdl.sum(nurse_assignments["assigned"])
    mdl.add_constraint(df_nurses["worked"][nurse] == nb_assigned)

# Split 'worked' around the average: worked = average + over - under
for nurse_row in df_nurses.itertuples():
    mdl.add_constraint(
        nurse_row.worked == avg_worked + nurse_row.overworked - nurse_row.underworked
    )


# Totals of the above-average and below-average deviations over all nurses ...
total_overw = mdl.sum(df_nurses["overworked"])
total_underw = mdl.sum(df_nurses["underworked"])
# ... each registered as a KPI
mdl.add_kpi(total_overw, "Total over-worked")
mdl.add_kpi(total_underw, "Total under-worked")

DecisionKPI(name=Total under-worked,expr=underw_Anne+underw_Bethanie+underw_Betsy+underw_Cathy+underw_Cec..)


# New objective: salary cost plus both deviation totals
mdl.minimize(total_salary_cost + total_overw + total_underw)  # incorporate over_worked and under_worked in objective


# Re-solve the same model with the new objective
sol2 = mdl.solve(log_output=True)  # solve again and get a new solution
# stop here if the solve did not return a solution
assert sol2, "Solve failed"
# print the objective and KPI values of the new solution
mdl.report()

WARNING: Number of workers has been reduced to 2 to comply with platform limitations.
Version identifier: 22.1.1.0 | 2022-11-28 | 9160aff4d
CPXPARAM_Read_DataCheck                          1
CPXPARAM_Threads                                 2
CPXPARAM_MIP_Tolerances_MIPGap                   1.0000000000000001e-05
1 of 11 MIP starts provided solutions.
MIP start 'm1' defined initial solution with objective 28838.5000.
Tried aggregator 2 times.
MIP Presolve eliminated 997 rows and 379 columns.
MIP Presolve modified 90 coefficients.
Aggregator did 73 substitutions.
Reduced MIP has 582 rows, 986 columns, and 3859 nonzeros.
Reduced MIP has 892 binaries, 0 generals, 0 SOSs, and 0 indicators.
Presolve time = 0.02 sec. (4.32 ticks)
Probing time = 0.00 sec. (0.59 ticks)
Tried aggregator 1 time.
Detecting symmetries...
MIP Presolve eliminated 2 rows and 4 columns.
Reduced MIP has 580 rows, 982 columns, and 3814 nonzeros.
Reduced MIP has 892 binaries, 30 generals, 0 SOSs, and 0 indicators.
Presolve time = 0.01 sec. (2.39 ticks)
Probing time = 0.00 sec. (0.58 ticks)
Clique table members: 479.
MIP emphasis: balance optimality and feasibility.
MIP search method: dynamic search.
Parallel mode: deterministic, using up to 2 threads.
Root relaxation solution time = 0.02 sec. (10.52 ticks)

        Nodes                                         Cuts/
   Node  Left     Objective  IInf  Best Integer    Best Bound    ItCnt     Gap

*     0+    0                        28838.5000        0.0000           100.00%
      0     0    28827.9167    72    28838.5000    28827.9167      756    0.04%
      0     0    28829.2500    58    28838.5000      Cuts: 63      868    0.03%
      0     0    28830.3438    59    28838.5000     Cuts: 125     1107    0.03%
      0     0    28831.0000    57    28838.5000      Cuts: 55     1260    0.03%
      0     0    28831.0000    28    28838.5000      Cuts: 10     1352    0.03%
      0     0    28831.0000    31    28838.5000      Cuts: 34     1399    0.03%
      0     2    28831.0000     5    28838.5000    28831.0000     1399    0.03%
Elapsed time = 0.34 sec. (171.74 ticks, tree = 0.02 MB, solutions = 1)
*    88    63      integral     0    28831.0000    28831.0000     3415    0.00%

GUB cover cuts applied:  16
Cover cuts applied:  8
Flow cuts applied:  22
Mixed integer rounding cuts applied:  62
Zero-half cuts applied:  11
Lift and project cuts applied:  2
Gomory fractional cuts applied:  11

Root node processing (before b&c):
  Real time             =    0.35 sec. (171.38 ticks)
Parallel b&c, 2 threads:
  Real time             =    0.09 sec. (60.15 ticks)
  Sync time (average)   =    0.01 sec.
  Wait time (average)   =    0.00 sec.
                          ------------
Total (root+branch&cut) =    0.43 sec. (231.53 ticks)
* model nurses solved with objective = 28831.000
*  KPI: Total salary cost  = 28824.000
*  KPI: Total over-worked  = 3.500
*  KPI: Total under-worked = 3.500


# Solution value of every assignment variable after the second solve
s_assigned2 = df_assigned["assigned"].apply(lambda var: var.solution_value)

# One row per nurse, one column per shift ("unstack" of the 'all_shifts' level)
df_res2 = s_assigned2.unstack(level='all_shifts')

# Number of shifts worked by each nurse: row-wise sum over the shift columns
df_res2["worked"] = df_res2[all_shifts].sum(axis=1)

# The total absolute deviation from average is read directly from the two KPI expressions
new_total_to_mean = total_overw.solution_value + total_underw.solution_value
print("-- total absolute deviation to mean #shifts is now {0} down from {1}".format(new_total_to_mean, total_to_mean))

# Peek at the first few rows of the result table
df_res2.head()

-- total absolute deviation to mean #shifts is now 7.0 down from 14.5


# Histogram of the number of shifts worked per nurse in the second solution
df_res2["worked"].plot.hist(color="gold", xlim=(3,8))

<Axes: ylabel='Frequency'>


# Fairness-only objective: minimize the total deviation from the average
mdl.minimize(total_overw + total_underw)
# Keep the solve call outside the assert: assert statements are removed when
# Python runs with -O, which would silently skip the solve itself.
sol_fair = mdl.solve()
assert sol_fair, "solve failed"
mdl.report()

* model nurses solved with objective = 4.000
*  KPI: Total salary cost  = 29606.000
*  KPI: Total over-worked  = 4.000
*  KPI: Total under-worked = 0.000


# Solution value of every assignment variable after the fairness-only solve
s_assigned_fair = df_assigned["assigned"].apply(lambda var: var.solution_value)

# One row per nurse, one column per shift ("unstack" of the 'all_shifts' level)
df_res_fair = s_assigned_fair.unstack(level='all_shifts')

# Number of shifts worked by each nurse, stored under both column names
shifts_worked_fair = df_res_fair[all_shifts].sum(axis=1)
df_res_fair["solution_value_fair"] = shifts_worked_fair
df_res_fair["worked"] = shifts_worked_fair
df_res_fair["worked"].plot.hist(color="plum", xlim=(3,8))

<Axes: ylabel='Frequency'>

all_shifts	0	1	2	3	4	5	6	7	8	9	...	31	32	33	34	35	36	37	38	39	40
all_nurses
Anne	assign_Anne_0	assign_Anne_1	assign_Anne_2	assign_Anne_3	assign_Anne_4	assign_Anne_5	assign_Anne_6	assign_Anne_7	assign_Anne_8	assign_Anne_9	...	assign_Anne_31	assign_Anne_32	assign_Anne_33	assign_Anne_34	assign_Anne_35	assign_Anne_36	assign_Anne_37	assign_Anne_38	assign_Anne_39	assign_Anne_40
Bethanie	assign_Bethanie_0	assign_Bethanie_1	assign_Bethanie_2	assign_Bethanie_3	assign_Bethanie_4	assign_Bethanie_5	assign_Bethanie_6	assign_Bethanie_7	assign_Bethanie_8	assign_Bethanie_9	...	assign_Bethanie_31	assign_Bethanie_32	assign_Bethanie_33	assign_Bethanie_34	assign_Bethanie_35	assign_Bethanie_36	assign_Bethanie_37	assign_Bethanie_38	assign_Bethanie_39	assign_Bethanie_40
Betsy	assign_Betsy_0	assign_Betsy_1	assign_Betsy_2	assign_Betsy_3	assign_Betsy_4	assign_Betsy_5	assign_Betsy_6	assign_Betsy_7	assign_Betsy_8	assign_Betsy_9	...	assign_Betsy_31	assign_Betsy_32	assign_Betsy_33	assign_Betsy_34	assign_Betsy_35	assign_Betsy_36	assign_Betsy_37	assign_Betsy_38	assign_Betsy_39	assign_Betsy_40
Cathy	assign_Cathy_0	assign_Cathy_1	assign_Cathy_2	assign_Cathy_3	assign_Cathy_4	assign_Cathy_5	assign_Cathy_6	assign_Cathy_7	assign_Cathy_8	assign_Cathy_9	...	assign_Cathy_31	assign_Cathy_32	assign_Cathy_33	assign_Cathy_34	assign_Cathy_35	assign_Cathy_36	assign_Cathy_37	assign_Cathy_38	assign_Cathy_39	assign_Cathy_40
Cecilia	assign_Cecilia_0	assign_Cecilia_1	assign_Cecilia_2	assign_Cecilia_3	assign_Cecilia_4	assign_Cecilia_5	assign_Cecilia_6	assign_Cecilia_7	assign_Cecilia_8	assign_Cecilia_9	...	assign_Cecilia_31	assign_Cecilia_32	assign_Cecilia_33	assign_Cecilia_34	assign_Cecilia_35	assign_Cecilia_36	assign_Cecilia_37	assign_Cecilia_38	assign_Cecilia_39	assign_Cecilia_40

The Nurse Assignment Problem¶

Describe the business problem¶

How Decision Optimization can help¶

Use Decision Optimization¶

Step 1: Import the DOcplex package¶

Step 2: Model the data¶

Loading data from Excel with pandas¶

Step 3: Prepare the data¶

Sub-step #1¶

Sub-step #2 : Compute the absolute start time of each shift.¶

Sub-Step #3 : Compute the absolute end time of each shift.¶

Sub-step #4 : Compute the duration of each shift.¶

Sub-step #5 : Compute the minimum demand for each shift.¶

Step 4: Set up the prescriptive model¶

Create the DOcplex model¶

Define the decision variables¶

Express the business constraints¶

Overlapping shifts¶

Vacations¶

Associations¶

Incompatibilities¶

Constraints on work time¶

Define total work time¶

Maximum work time¶

Minimum requirement for shifts¶

Express the objective¶

Minimizing salary cost¶

Solve with the Decision Optimization solve service¶

Step 5: Investigate the solution and run an example analysis¶

Analyzing how worktime is distributed¶

How shifts are distributed¶

Introducing a fairness goal¶

Step #1 : Introduce three new variables per nurse to model the number of shifts worked and its deviations above and below the average.¶

Step #2 : Post the constraint that links these variables together.¶

Step #3 : Define KPIs to measure the result after solve.¶

Analyzing new results¶

The breakdown of shifts over nurses is much closer to the average than it was in the previous version.¶

But what would be the minimal fairness level?¶

Summary¶

References¶

	department	day	start_time	end_time	min_req	max_req
shiftId
0	Emergency	Monday	2	8	3	5
1	Emergency	Monday	8	12	4	7
2	Emergency	Monday	12	18	2	5
3	Emergency	Monday	18	2	3	7
4	Consultation	Monday	8	12	10	13
5	Consultation	Monday	12	18	8	12
6	Cardiac Care	Monday	8	12	10	13
7	Cardiac Care	Monday	12	18	8	12
8	Emergency	Tuesday	8	12	4	7
9	Emergency	Tuesday	12	18	2	5
10	Emergency	Tuesday	18	2	3	7
11	Consultation	Tuesday	8	12	10	13
12	Consultation	Tuesday	12	18	8	12
13	Cardiac Care	Tuesday	8	12	4	7
14	Cardiac Care	Tuesday	12	18	2	5
15	Cardiac Care	Tuesday	18	2	3	7
16	Emergency	Wednesday	2	8	3	5
17	Emergency	Wednesday	8	12	4	7
18	Emergency	Wednesday	12	18	2	5
19	Emergency	Wednesday	18	2	3	7
20	Consultation	Wednesday	8	12	10	13
21	Consultation	Wednesday	12	18	8	12
22	Emergency	Thursday	2	8	3	5
23	Emergency	Thursday	8	12	4	7
24	Emergency	Thursday	12	18	2	5
25	Emergency	Thursday	18	2	3	7
26	Consultation	Thursday	8	12	10	13
27	Consultation	Thursday	12	18	8	12
28	Emergency	Friday	2	8	3	5
29	Emergency	Friday	8	12	4	7
30	Emergency	Friday	12	18	2	5
31	Emergency	Friday	18	2	3	7
32	Consultation	Friday	8	12	10	13
33	Consultation	Friday	12	18	8	12
34	Emergency	Saturday	2	12	5	7
35	Emergency	Saturday	12	20	7	9
36	Emergency	Saturday	20	2	12	12
37	Emergency	Sunday	2	12	5	7
38	Emergency	Sunday	12	20	7	9
39	Emergency	Sunday	20	2	8	12
40	Geriatrics	Sunday	8	10	2	5

	nurse1	nurse2	all_nurses_1	all_shifts	assigned_1	all_nurses_2	assigned_2
0	Isabelle	Dee	Isabelle	0	assign_Isabelle_0	Dee	assign_Dee_0
1	Isabelle	Dee	Isabelle	1	assign_Isabelle_1	Dee	assign_Dee_1
2	Isabelle	Dee	Isabelle	2	assign_Isabelle_2	Dee	assign_Dee_2
3	Isabelle	Dee	Isabelle	3	assign_Isabelle_3	Dee	assign_Dee_3
4	Isabelle	Dee	Isabelle	4	assign_Isabelle_4	Dee	assign_Dee_4

	nurse1	nurse2	all_nurses_1	all_shifts	assigned_1	all_nurses_2	assigned_2
0	Patricia	Patrick	Patricia	0	assign_Patricia_0	Patrick	assign_Patrick_0
1	Patricia	Patrick	Patricia	1	assign_Patricia_1	Patrick	assign_Patrick_1
2	Patricia	Patrick	Patricia	2	assign_Patricia_2	Patrick	assign_Patrick_2
3	Patricia	Patrick	Patricia	3	assign_Patricia_3	Patrick	assign_Patrick_3
4	Patricia	Patrick	Patricia	4	assign_Patricia_4	Patrick	assign_Patrick_4

	seniority	qualification	pay_rate	worktime
name
Anne	11	1	25	worktime_Anne
Bethanie	4	5	28	worktime_Bethanie
Betsy	2	2	17	worktime_Betsy
Cathy	2	2	17	worktime_Cathy
Cecilia	9	5	38	worktime_Cecilia
Chris	11	4	38	worktime_Chris
Cindy	5	2	21	worktime_Cindy
David	1	2	15	worktime_David
Debbie	7	2	24	worktime_Debbie
Dee	3	3	21	worktime_Dee
Gloria	8	2	25	worktime_Gloria
Isabelle	3	1	16	worktime_Isabelle
Jane	3	4	23	worktime_Jane
Janelle	4	3	22	worktime_Janelle
Janice	2	2	17	worktime_Janice
Jemma	2	4	22	worktime_Jemma
Joan	5	3	24	worktime_Joan
Joyce	8	3	29	worktime_Joyce
Jude	4	3	22	worktime_Jude
Julie	6	2	22	worktime_Julie
Juliet	7	4	31	worktime_Juliet
Kate	5	3	24	worktime_Kate
Nancy	8	4	32	worktime_Nancy
Nathalie	9	5	38	worktime_Nathalie
Nicole	0	2	14	worktime_Nicole
Patricia	1	1	13	worktime_Patricia
Patrick	6	1	19	worktime_Patrick
Roberta	3	5	26	worktime_Roberta
Suzanne	5	1	18	worktime_Suzanne
Vickie	7	1	20	worktime_Vickie
Wendie	5	2	21	worktime_Wendie
Zoe	8	3	29	worktime_Zoe

all_shifts	0	1	2	3	4	5	6	7	8	9	...	31	32	33	34	35	36	37	38	39	40
all_nurses
Anne	0.0	0.0	0.0	1.0	1.0	0.0	0.0	0.0	0.0	0.0	...	0.0	0.0	0.0	0.0	0.0	0.0	0.0	0.0	0.0	0.0
Bethanie	0.0	1.0	0.0	0.0	0.0	0.0	0.0	1.0	0.0	0.0	...	1.0	0.0	1.0	0.0	0.0	0.0	0.0	0.0	0.0	0.0
Betsy	0.0	0.0	0.0	0.0	0.0	0.0	0.0	0.0	0.0	0.0	...	1.0	1.0	1.0	0.0	0.0	0.0	0.0	0.0	1.0	0.0
Cathy	1.0	0.0	0.0	0.0	0.0	0.0	1.0	1.0	0.0	0.0	...	0.0	1.0	1.0	0.0	1.0	1.0	0.0	0.0	0.0	0.0
Cecilia	0.0	0.0	1.0	0.0	0.0	0.0	1.0	0.0	1.0	0.0	...	0.0	0.0	0.0	0.0	0.0	0.0	0.0	0.0	0.0	0.0

all_shifts	0	1	2	3	4	5	6	7	8	9	...	32	33	34	35	36	37	38	39	40	worked
all_nurses
Anne	0.0	0.0	0.0	0.0	1.0	0.0	0.0	1.0	0.0	0.0	...	0.0	0.0	0.0	0.0	0.0	0.0	0.0	0.0	0.0	7.0
Bethanie	0.0	0.0	0.0	0.0	1.0	0.0	0.0	0.0	0.0	0.0	...	0.0	1.0	0.0	0.0	0.0	1.0	0.0	0.0	0.0	7.0
Betsy	0.0	0.0	0.0	0.0	0.0	0.0	0.0	0.0	0.0	0.0	...	0.0	0.0	0.0	0.0	0.0	0.0	1.0	0.0	0.0	7.0
Cathy	0.0	0.0	0.0	0.0	1.0	1.0	0.0	0.0	0.0	0.0	...	1.0	1.0	0.0	0.0	1.0	1.0	0.0	0.0	0.0	7.0
Cecilia	0.0	0.0	0.0	0.0	1.0	0.0	0.0	1.0	1.0	0.0	...	0.0	0.0	0.0	0.0	1.0	0.0	0.0	0.0	0.0	6.0