1
|
|
|
module Scheduling |
2
|
|
|
|
3
|
|
|
# A set of sessions which can be scored against a particular schedule. |
4
|
|
|
# |
5
|
|
|
# This can represent either the set of sessions an attendee is interested in seeing, |
6
|
|
|
# or the set a presenter is presenting. Either way, we want sessions booked in |
7
|
|
|
# nonoverlapping timeslots. |
8
|
|
|
# |
9
|
|
|
class SessionSet |
10
|
|
|
def initialize(ctx, superset: nil, penalty_callback: ->(*args) { 0 }) |
11
|
|
|
@ctx = ctx |
12
|
|
|
@superset = superset |
13
|
|
|
@penalty_callback = penalty_callback |
14
|
|
|
|
15
|
|
|
@sessions = Set.new |
16
|
|
|
end |
17
|
|
|
|
18
|
|
|
def add(session_id) |
19
|
|
|
@sessions << session_id |
20
|
|
|
@superset.add(session_id) if @superset |
21
|
|
|
end |
22
|
|
|
|
23
|
|
|
# The score if sessions are evenly distributed among all available timeslots. |
24
|
|
|
# |
25
|
|
|
def best_possible_score |
26
|
|
|
return 1 if empty? |
27
|
|
|
|
28
|
|
|
@best_possible_score ||= begin |
29
|
|
|
slot_count = @ctx.timeslots.size |
30
|
|
|
even_split_floor = size / slot_count |
31
|
|
|
big_slots = size % slot_count |
32
|
|
|
small_slots = slot_count - big_slots |
33
|
|
|
[ |
34
|
|
|
small_slots * slot_value(even_split_floor) + |
35
|
|
|
big_slots * slot_value(even_split_floor + 1), |
36
|
|
|
1.0 |
37
|
|
|
].min |
38
|
|
|
end |
39
|
|
|
end |
40
|
|
|
|
41
|
|
|
# The score if everything is in the same timeslot. |
42
|
|
|
# |
43
|
|
|
def worst_possible_score |
44
|
|
|
return 1 if empty? |
45
|
|
|
1.0 / size |
46
|
|
|
end |
47
|
|
|
|
48
|
|
|
# The average score of a randomly assigned schedule. This is a good baseline |
49
|
|
|
# for what the scheduler is trying to improve on — more so than worst_possible_score, |
50
|
|
|
# which tends to be far worse than any actual schedule would generate. |
51
|
|
|
# |
52
|
|
|
def random_schedule_score |
53
|
|
|
return 1 if empty? |
54
|
|
|
|
55
|
|
|
slot_count = @ctx.timeslots.size |
56
|
|
|
|
57
|
|
|
@@random_schedule_scores ||= {} |
|
|
|
|
58
|
|
|
@@random_schedule_scores[[slot_count, size]] ||= begin |
59
|
|
|
# Someone more knowledgeable than me can probably find |
60
|
|
|
# a closed form for this. But brute force works! |
61
|
|
|
trials = 1000 |
62
|
|
|
total = 0 |
63
|
|
|
trials.times do |
64
|
|
|
counts = [0] * slot_count |
65
|
|
|
size.times { counts[rand(slot_count)] += 1 } |
66
|
|
|
total += counts.sum { |c| slot_value(c) } |
67
|
|
|
end |
68
|
|
|
total / trials.to_f |
69
|
|
|
end |
70
|
|
|
end |
71
|
|
|
|
72
|
|
|
def score(schedule) |
73
|
|
|
return 1 if empty? |
74
|
|
|
|
75
|
|
|
slot_session_count = Hash.new(0) |
76
|
|
|
penalty = 0 |
77
|
|
|
|
78
|
|
|
@sessions.each do |session| |
79
|
|
|
slot = schedule.slot_id_for(session) |
80
|
|
|
slot_session_count[slot] += 1 |
81
|
|
|
penalty += @penalty_callback.call(slot) |
82
|
|
|
end |
83
|
|
|
|
84
|
|
|
satisfaction = slot_session_count.values.sum do |k| |
85
|
|
|
slot_value(k) |
86
|
|
|
end |
87
|
|
|
|
88
|
|
|
satisfaction - penalty / size.to_f |
89
|
|
|
end |
90
|
|
|
|
91
|
|
|
def size |
92
|
|
|
@sessions.size |
93
|
|
|
end |
94
|
|
|
|
95
|
|
|
def empty? |
96
|
|
|
@sessions.empty? |
97
|
|
|
end |
98
|
|
|
|
99
|
|
|
private |
100
|
|
|
|
101
|
|
|
# Assume each attendee has some ranking of all the sessions in which they expressed interest. |
102
|
|
|
# (Not an unreasonable assumption.) Further assume that the attendee values their sessions of interest |
103
|
|
|
# linearly: least interested=1,2,3...N=most interested. (That's more of a stretch, but likely bears |
104
|
|
|
# some resemblance to reality.) |
105
|
|
|
# |
106
|
|
|
# In each timeslot, assume the attendee will choose the session they're most interested in. We don't |
107
|
|
|
# know attendee's actual ranking, so assume sessions of interest are distributed randomly in the schedule. |
108
|
|
|
# The expected maximum of a slot in which there are k sessions is v_slot = k(N+1)/(k+1). The total |
109
|
|
|
# value of all sessions is v_total = N(N+1)/2. The expected fraction of total value in one slot is |
110
|
|
|
# thus v_slot / v_total = 2k/(N(k+1)). Sum that over all slots to get the attendee's overall satisfaction. |
111
|
|
|
# |
112
|
|
|
# A similar logic applies to presenters avoiding double-booking. |
113
|
|
|
# |
114
|
|
|
# (The old scheduling algorithm didn't take into account how deep the overlap ran within a given slot, |
115
|
|
|
# essentially set v_slot = {1/N if any sessions of interest, 0 otherwise}.) |
116
|
|
|
# |
117
|
|
|
def slot_value(k) |
118
|
|
|
2 * k / (size.to_f * (k + 1)) |
119
|
|
|
end |
120
|
|
|
|
121
|
|
|
end |
122
|
|
|
end |
123
|
|
|
|