How We Matched You to Your CodeLabs Team

Julie Cover, SRND

https://codeday.to/codelabs-matching-slides

Watch the slides live on your device!

The Problem, and

Others Like It

Phase 1: Priorities and Recommendations

Phase 2: Placement

# Placement passes. Every helper call returns the updated
# (all_project_data, student_placements) pair, which is rebound right away so
# the next call receives the latest state.

# Pass 1: projects whose remaining capacity exactly equals their number of
# first-choice students; the helper is called with choice 1.
for project_id, project in all_project_data.items():
    if project["proj_size_remaining"] == project["num_first_choice"]:
        all_project_data, student_placements = place_students_of_choice(
            all_project_data,
            student_placements,
            project_id,
            1,
            project["proj_size_remaining"],
        )

# Pass 2: projects with at least as much remaining capacity as first-choice
# students; again called with choice 1.
for project_id, project in all_project_data.items():
    if project["proj_size_remaining"] >= project["num_first_choice"]:
        all_project_data, student_placements = place_students_of_choice(
            all_project_data,
            student_placements,
            project_id,
            1,
            project["proj_size_remaining"],
        )

# From here on each pass iterates over a deep-copied snapshot, so the values
# read from `project` are those from the start of the pass, not the ones the
# helper produces while the pass is running.

# Pass 3: balanced placement with the choice list [2, 15].
# NOTE(review): the later passes hand over explicit choice lists ([1, 2],
# [i, ..., i + 3]); confirm whether [2, 15] means "choices 2 and 15" or was
# meant as a range.
_all_project_data = deepcopy(all_project_data)
for project_id, project in _all_project_data.items():
    if project["proj_size_remaining"] >= project["num_first_choice"]:
        all_project_data, student_placements = place_students_of_choice_balanced(
            all_project_data,
            student_placements,
            project_id,
            [2, 15],
            project["proj_size_remaining"],
        )

# Pass 4: balanced placement with choices 1 and 2 for every project
# (no capacity condition on this pass).
_all_project_data = deepcopy(all_project_data)
for project_id, project in _all_project_data.items():
    all_project_data, student_placements = place_students_of_choice_balanced(
        all_project_data,
        student_placements,
        project_id,
        [1, 2],
        project["proj_size_remaining"],
    )

# Pass 5: balanced placement over windows of four choices; i takes the values
# 3, 7, 11 and 15, giving the lists [3..6], [7..10], [11..14] and [15..18].
for i in range(3, 16, 4):
    _all_project_data = deepcopy(all_project_data)
    for project_id, project in _all_project_data.items():
        if project["proj_size_remaining"] >= project["num_first_choice"]:
            all_project_data, student_placements = place_students_of_choice_balanced(
                all_project_data,
                student_placements,
                project_id,
                [i, i + 1, i + 2, i + 3],
                project["proj_size_remaining"],
            )

How We Matched You to Your CodeLabs Team — Julie Cover, SRND — https://codeday.to/codelabs-matching-slides — Watch the slides live on your device!

	// Shape of a mentor/project record. The values are placeholders that show
	// the type of each field.
	const mentorSchema = {
		mentor_id: "",
		name: "",
		company: "",
		bio: "",
		backgroundRural: true,
		preferStudentUnderRep: 2, // allowed values: 0-2
		okExtended: true,
		timezone: -7,
		preferToolExistingKnowledge: true,
		proj_id: "",
		proj_description: "",
		proj_tags: [""],
		studentsSelected: 2,
	};

	// Shape of a student record. The values are placeholders that show the
	// type of each field.
	const studentSchema = {
		// Identity
		id: "",
		name: "",

		// Background flags
		rural: false,
		underrepresented: false,

		// Scheduling
		requireExtended: true,
		timezone: -3,

		// Interests used for matching
		interestCompanies: [""],
		interestTags: [""],

		// Experience level
		beginner: true,
	};

	# Wrap the existing combined_query in a function_score query with a single
	# script_score function that rates how well the mentor's timezone fits the
	# student's. The student's timezone is passed in as the script parameter
	# student_tz. The script returns:
	#   - mentor's okTimezoneDifference is true: 1 if student_tz > 0, else 0.75
	#   - otherwise: 1 if |student_tz - mentor_tz| <= 2, 0.75 if it is 3, else 0
	# A missing 'timezone' value is treated as 0 and a missing
	# 'okTimezoneDifference' value as false.
	# With boost_mode="multiply" the function result multiplies the query
	# score, so a result of 0 zeroes the hit's score.
	# NOTE(review): the first branch tests student_tz > 0 rather than diff,
	# although its comment speaks of a "large time difference" -- confirm that
	# this is intended.
	# NOTE(review): mentorSchema in this deck lists okExtended, while the
	# script reads okTimezoneDifference -- confirm the indexed field name.
	combined_query = Q(
	"function_score",
	query=combined_query,
	functions=[
	SF(
	"script_score",
	script={
	"source": """
	int student_tz = params.student_tz;
	int mentor_tz = 0;
	// Null check. Even though timezone is required, somehow some null rows snuck in and bamboozled me
	if (doc['timezone'].size() == 0) {
	mentor_tz = 0;
	} else {
	mentor_tz = (int)doc['timezone'].value;
	}
	int diff = (int)Math.abs(student_tz - mentor_tz);

	boolean mentor_ok_tz_diff = false;
	if (doc['okTimezoneDifference'].size() == 0) {
	mentor_ok_tz_diff = false;
	} else {
	mentor_ok_tz_diff = doc['okTimezoneDifference'].value;
	}

	if (mentor_ok_tz_diff == true) {
	if (student_tz > 0) {
	// Mentor is OK with the time difference and student has a large time difference
	return 1;
	} else {
	// Mentor is ok with time difference and student has a normal time
	return 0.75;
	}
	} else {
	if (diff <= 2) {
	// Mentor is not ok with time difference and student has normal time
	return 1;
	} else if (diff == 3) {
	return 0.75;
	} else {
	// Mentor is not ok with time difference and student has weird time
	return 0;
	}
	}
	""",
	"params": {"student_tz": student["timezone"]},
	},
	)
	],
	boost_mode="multiply",
	score_mode="sum",
	)

	@app.route("/matches/<student_data>", methods=["GET"])
	def matches(student_data):
		"""Return scored project matches for a JWT-encoded student as a JSON string.

		Args:
			student_data: JWT taken from the URL path; it is decoded with the
				app's jwt_key using HS256.

		Returns:
			A JSON array of {"score": ..., "project": ...} objects, one per
			Elasticsearch hit returned by evaluate_score.

		Raises:
			Unauthorized: if the token cannot be decoded.
		"""
		try:
			data = decode(student_data, current_app.jwt_key, algorithms=["HS256"])
		except exceptions.DecodeError as err:
			# Chain the original error so the root cause stays visible in logs.
			raise Unauthorized("Something is wrong with your JWT Encoding.") from err
		# The third argument is passed straight to evaluate_score
		# (presumably the number of hits to return -- confirm).
		ela_resp = evaluate_score(data, current_app.elasticsearch, 25)
		resp = [
			{"score": hit._score, "project": hit._source.to_dict()}
			for hit in ela_resp.hits.hits
		]
		return json.dumps(resp)

	# Put the parent directory at the front of sys.path so that the other
	# libraries can import database; Python does not look in the parent
	# directory otherwise.
	currentdir = os.path.split(
		os.path.abspath(inspect.getfile(inspect.currentframe()))
	)[0]
	parentdir = os.path.split(currentdir)[0]
	sys.path.insert(0, parentdir)

How We Matched You to Your CodeLabs Team

The Problem, and

Others Like It

Phase 1: Priorities and Recommendations

Phase 2: Placement

Stable Roommates Problem

Stable Marriage Problem

Stable Roommates Problem

Stable Marriage Problem

My Solution

Phase 0: Data

Phase 1: Matching w/ Elastic

Phase 1: Matching w/ Elastic

Phase 1: Matching w/ Elastic

Phase 1: Matching w/ Elastic

Phase 1: Matching w/ Elastic

Phase 1: Matching w/ Elastic

Elastic - What's Your Point?

Phase 2: APIs n' Stuff

Phase 2: APIs n' Stuff

Phase 2: APIs n' Stuff

Phase 3: Placement Algorithm

Phase 3: Placement Algorithm

Phase 4: Manual Cleanup - Sometimes

Speed Round

Thanks for Watching!

	# Store any Object on the App object!!
	app.elasticsearch = Elasticsearch(elastic_host)
	# os.getenv returns None when JWT_KEY is not set in the environment.
	app.jwt_key = os.getenv("JWT_KEY")
	# ----------------- reading the stored objects back -----------------
	from flask import current_app
	# Demo output only: this prints the signing key.
	print(current_app.jwt_key)

	# Sample GET request input
	# NOTE(review): studentSchema in this deck declares a boolean "beginner"
	# field, while this sample sends "track" -- confirm which one the API expects.
	requestData = {
		"id": str(uuid.uuid4()),
		"name": "John Peter",
		"rural": True,
		"underrepresented": False,
		"timezone": -4,
		"interestCompanies": ["Microsoft", "Google"],
		"interestTags": ["Backend", "Data", "python", "php"],
		"requireExtended": False,
		"track": "Advanced",
	}