-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathpreprocess.py
More file actions
28 lines (21 loc) · 801 Bytes
/
preprocess.py
File metadata and controls
28 lines (21 loc) · 801 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
import xlrd
import numpy
# Initial Data
# Build a firm-by-student 0/1 matrix from the interview spreadsheet.
#
# Worksheet layout as read by this script: row 0 supplies one entry per
# column (used as the firm names); every later row supplies, per column, a
# value that is treated as a student meeting that column's firm. Falsy
# (empty) cells are skipped.
#
# NOTE(review): xlrd 2.0+ dropped support for .xlsx workbooks; this call
# presumably relies on xlrd < 2.0 -- confirm the pinned version.

# Open the workbook and define the worksheet
book = xlrd.open_workbook("input/StudentList2.xlsx")
sheet = book.sheet_by_name("Initial Interviews by Firm")

firmNames = sheet.row_values(0)

# Read the data rows once so both passes below work on the same values.
dataRows = [sheet.row_values(rx) for rx in range(1, sheet.nrows)]

# Assign student indices in first-seen order (row by row, left to right).
# Deriving the order from a set made the column order of `meetings` change
# between runs, because string hashing is randomised per process.
studentNames = []
studentMap = {}
for row in dataRows:
    for cell in row:
        if cell and cell not in studentMap:
            studentMap[cell] = len(studentNames)
            studentNames.append(cell)

# Kept for backward compatibility with code that expects the set of students.
studentSet = set(studentNames)

# meetings[i, j] == 1 when student j appears in column i of the worksheet.
meetings = numpy.zeros((len(firmNames), len(studentNames)), dtype=numpy.dtype(int))
for row in dataRows:
    for i, cell in enumerate(row):
        if cell:
            meetings[i, studentMap[cell]] = 1

print(meetings)