Teamable-Analytics
diff --git a/‎.gitmodules‎
Lines changed: 3 additions & 0 deletions b/‎.gitmodules‎
Lines changed: 3 additions & 0 deletions
diff --git a/‎api/ai/algorithm_runner.py‎
Lines changed: 11 additions & 0 deletions b/‎api/ai/algorithm_runner.py‎
Lines changed: 11 additions & 0 deletions
diff --git a/‎api/ai/external_algorithms/__init__.py‎ b/‎api/ai/external_algorithms/__init__.py‎
diff --git a/‎api/ai/external_algorithms/group_matcher_algorithm/__init__.py‎ b/‎api/ai/external_algorithms/group_matcher_algorithm/__init__.py‎
diff --git a/‎api/ai/external_algorithms/group_matcher_algorithm/custom_dataclasses.py‎
Lines changed: 90 additions & 0 deletions b/‎api/ai/external_algorithms/group_matcher_algorithm/custom_dataclasses.py‎
Lines changed: 90 additions & 0 deletions
diff --git a/‎api/ai/external_algorithms/group_matcher_algorithm/group-matcher‎ b/‎api/ai/external_algorithms/group_matcher_algorithm/group-matcher‎
diff --git a/‎api/ai/external_algorithms/group_matcher_algorithm/group_matcher_algorithm.py‎
Lines changed: 96 additions & 0 deletions b/‎api/ai/external_algorithms/group_matcher_algorithm/group_matcher_algorithm.py‎
Lines changed: 96 additions & 0 deletions
diff --git a/‎api/ai/external_algorithms/group_matcher_algorithm/utils.py‎
Lines changed: 121 additions & 0 deletions b/‎api/ai/external_algorithms/group_matcher_algorithm/utils.py‎
Lines changed: 121 additions & 0 deletions
diff --git a/‎api/ai/interfaces/algorithm_config.py‎
Lines changed: 14 additions & 0 deletions b/‎api/ai/interfaces/algorithm_config.py‎
Lines changed: 14 additions & 0 deletions
@@ -1,3 +1,6 @@
 [submodule "simulation_cache"]
     path = simulation_cache
     url = https://github.com/Teamable-Analytics/algorithms-simulation-cache.git
+[submodule "api/ai/external_algorithms/group_matcher_algorithm/group-matcher"]
+	path = api/ai/external_algorithms/group_matcher_algorithm/group-matcher
+	# HTTPS, like the simulation_cache entry, so clones do not require an SSH key.
+	url = https://github.com/ketphan02/group-matcher.git
@@ -1,12 +1,16 @@
 from typing import List, TYPE_CHECKING
 
+from api.ai.external_algorithms.group_matcher_algorithm.group_matcher_algorithm import (
+    GroupMatcherAlgorithm,
+)
 from api.ai.geg_algorithm.geg_algorithm import GeneralizedEnvyGraphAlgorithm
 from api.ai.interfaces.algorithm_config import (
     AlgorithmConfig,
     RandomAlgorithmConfig,
     WeightAlgorithmConfig,
     SocialAlgorithmConfig,
     PriorityAlgorithmConfig,
+    GroupMatcherAlgorithmConfig,
 )
 from api.ai.interfaces.algorithm_options import (
     RandomAlgorithmOptions,
@@ -16,6 +20,7 @@
     MultipleRoundRobinAlgorithmOptions,
     GeneralizedEnvyGraphAlgorithmOptions,
     DoubleRoundRobinAlgorithmOptions,
+    GroupMatcherAlgorithmOptions,
 )
 from api.ai.interfaces.team_generation_options import TeamGenerationOptions
 from api.ai.multiple_round_robin_with_adjusted_winner_algorithm.mrr_algorithm import (
@@ -78,6 +83,8 @@ def get_algorithm_from_type(algorithm_type: AlgorithmType):
             return GeneralizedEnvyGraphAlgorithm
         if algorithm_type == AlgorithmType.DRR:
             return DoubleRoundRobinAlgorithm
+        if algorithm_type == AlgorithmType.GROUP_MATCHER:
+            return GroupMatcherAlgorithm
 
         raise NotImplementedError(
             f"Algorithm type {algorithm_type} is not associated with an algorithm class!"
@@ -99,6 +106,8 @@ def get_algorithm_option_class(algorithm_type: AlgorithmType):
             return GeneralizedEnvyGraphAlgorithmOptions
         if algorithm_type == AlgorithmType.DRR:
             return DoubleRoundRobinAlgorithmOptions
+        if algorithm_type == AlgorithmType.GROUP_MATCHER:
+            return GroupMatcherAlgorithmOptions
 
         raise NotImplementedError(
             f"Algorithm type {algorithm_type} is not associated with an algorithm options class!"
@@ -120,6 +129,8 @@ def get_algorithm_config_class(algorithm_type: AlgorithmType):
             return None
         if algorithm_type == AlgorithmType.DRR:
             return None
+        if algorithm_type == AlgorithmType.GROUP_MATCHER:
+            return GroupMatcherAlgorithmConfig
 
         raise NotImplementedError(
             f"Algorithm type {algorithm_type} is not associated with an algorithm config class!"
 
@@ -0,0 +1,90 @@
+from dataclasses import dataclass
+from typing import Dict, Iterator
+
+import faker
+from pandas import DataFrame
+
+from api.ai.external_algorithms.group_matcher_algorithm.utils import (
+    fromYearLevelToAlYearLevel,
+    fromNumbersToTimeSlots,
+    fromGenderToAlGender,
+    fromRaceToAlRace,
+)
+from api.dataclasses.enums import ScenarioAttribute, Gender, Race
+from api.dataclasses.student import Student
+from api.dataclasses.team import Team
+from api.dataclasses.team_set import TeamSet
+
+
+@dataclass
+class GroupMatcherStudent(Student):
+    def __init__(self, student: Student):
+        super().__init__(
+            student.id,
+            student.name,
+            student.attributes,
+            student.relationships,
+            student.project_preferences,
+            student.team,
+        )
+        self.email = faker.Faker().email()
+        if not self.name:
+            self.name = faker.Faker().name()
+
+    def get_formatted_data(self):
+        return {
+            "Email Address": self.email,
+            "SID": self.id,
+            "First name": self.name.split()[0],
+            "Last name": self.name.split()[1],
+            "What year are you": fromYearLevelToAlYearLevel(
+                self.attributes[ScenarioAttribute.YEAR_LEVEL.value][0]
+            ).value,
+            "Would you like to be part of a course study group?": "Yes",
+            "Do you have an existing study group of size 2-6 in mind": "No",
+            "timezone offset": "-7",  # all the same timezone
+            "Would you like to attend the same discussion": "Yes",
+            "discussion section times": fromNumbersToTimeSlots(
+                self.attributes.get(
+                    ScenarioAttribute.TIMESLOT_AVAILABILITY.value, ["1"]
+                )
+            ),
+            "Will you be on the Berkeley campus": "Yes",  # No remote students
+            "Which of these options best describes your race?": fromRaceToAlRace(
+                Race(self.attributes.get(ScenarioAttribute.RACE.value, [Race.Other])[0])
+            ).value,
+            "How do you self-identify?": fromGenderToAlGender(
+                Gender(self.attributes[ScenarioAttribute.GENDER.value][0])
+            ).value,
+        }
+
+    @staticmethod
+    def transform_output_data_to_team_set(
+        output_data: DataFrame,
+        team_trace: Dict[int, Team],
+        student_trace: Dict[int, Student],
+        team_cycler: Iterator[Team],
+    ) -> TeamSet:
+        for _, row in output_data.iterrows():
+            student_id = row["sid"]
+            group_num = int(row["group_num"]) + 1
+            if group_num not in team_trace.keys():
+                new_team_attributes = next(team_cycler)
+                new_team = Team(
+                    _id=len(team_trace) + 1,
+                    name=f"Team {len(team_trace) + 1}",
+                    requirements=new_team_attributes.requirements,
+                    project_id=new_team_attributes.project_id,
+                    students=[],
+                )
+                team_trace[int(row["group_num"]) + 1] = new_team
+
+            student = student_trace[student_id]
+            team = team_trace[int(row["group_num"]) + 1]
+
+            student.add_team(team)
+            team.add_student(student)
+
+        return TeamSet(
+            teams=[team for team in team_trace.values() if len(team.students) > 0]
+        )
@@ -0,0 +1,96 @@
+import csv
+from itertools import cycle
+import os
+import time
+from pathlib import Path
+from typing import List, Dict, Iterator
+
+import pandas as pd
+
+from api.ai.external_algorithms.group_matcher_algorithm.custom_dataclasses import (
+    GroupMatcherStudent,
+)
+from api.ai.interfaces.algorithm import Algorithm
+from api.ai.interfaces.algorithm_config import GroupMatcherAlgorithmConfig
+from api.ai.interfaces.algorithm_options import GroupMatcherAlgorithmOptions
+from api.ai.interfaces.team_generation_options import TeamGenerationOptions
+from api.dataclasses.student import Student
+from api.dataclasses.team import Team
+from api.dataclasses.team_set import TeamSet
+
+
+class GroupMatcherAlgorithm(Algorithm):
+    """
+    From paper: https://sigcse2023.sigcse.org/details/sigcse-ts-2023-papers/163/Inclusive-study-group-formation-at-scale
+    """
+
+    student_trace: Dict[int, Student]
+    team_trace: Dict[int, Team]
+    team_cycler: Iterator[Team]
+
+    group_matcher_input_data_file_path: Path
+    group_matcher_output_data_file_path: Path
+    group_matcher_config_path: Path
+
+    def __init__(
+        self,
+        algorithm_options: GroupMatcherAlgorithmOptions,
+        team_generation_options: TeamGenerationOptions,
+        algorithm_config: GroupMatcherAlgorithmConfig,
+    ):
+        super().__init__(algorithm_options, team_generation_options, algorithm_config)
+        self.group_matcher_input_data_file_path = Path(algorithm_config.csv_input_path)
+        self.group_matcher_run_path = algorithm_config.group_matcher_run_path
+
+        self.prepare_file_environment()
+
+        self.team_trace = {
+            team_idx + 1: team for team_idx, team in enumerate(self.teams)
+        }
+        self.team_cycler = cycle(self.teams)
+
+    def prepare_file_environment(self):
+        class_size = int(self.group_matcher_input_data_file_path.stem.split("-")[0])
+        self.group_matcher_run_path = self.group_matcher_run_path
+        self.group_matcher_output_data_file_path = (
+            Path.cwd() / f"out-private-{class_size}.csv"
+        )
+        if self.group_matcher_output_data_file_path.exists():
+            self.group_matcher_output_data_file_path.unlink()
+        self.group_matcher_config_path = (
+            Path(self.group_matcher_run_path).parent / "example_config.py"
+        )
+        if not self.group_matcher_input_data_file_path.parent.exists():
+            self.group_matcher_input_data_file_path.parent.mkdir(parents=True)
+
+    def export_students_data_to_group_matcher_format_csv(
+        self, students: List[Student]
+    ) -> None:
+        student_data = [
+            GroupMatcherStudent(student).get_formatted_data() for student in students
+        ]
+        self.student_trace = {student.id: student for student in students}
+        with open(self.group_matcher_input_data_file_path, "w") as csvfile:
+            writer = csv.DictWriter(
+                csvfile, fieldnames=student_data[0].keys(), delimiter=";"
+            )
+            writer.writeheader()
+            writer.writerows(student_data)
+
+    def generate(self, students: List[Student]) -> TeamSet:
+        self.export_students_data_to_group_matcher_format_csv(students)
+
+        # Run the group matcher algorithm
+        cmd = f"python3 {self.group_matcher_run_path} {self.group_matcher_config_path} {self.group_matcher_input_data_file_path}"
+        os.system(cmd)
+
+        # This only happens when class size is small and the system I/O speed is not as fast as the runtime
+        while not self.group_matcher_output_data_file_path.exists():
+            print("Not found file " + str(self.group_matcher_output_data_file_path))
+            time.sleep(1)
+        # Read the output csv file and create a TeamSet
+        df = pd.read_csv(self.group_matcher_output_data_file_path)
+
+        return GroupMatcherStudent.transform_output_data_to_team_set(
+            df, self.team_trace, self.student_trace, self.team_cycler
+        )
@@ -0,0 +1,121 @@
+from typing import List, Union
+
+from api.dataclasses.enums import AttributeValueEnum, Gender, Race
+
+
+class AlRace(AttributeValueEnum):
+    """Race labels as written into the group matcher's input rows."""
+
+    White = "White"
+    Asian = "Asian"
+    Hispanic = "Hispanic"
+    Black_Or_African_American = "Black/African American"
+    # NOTE(review): spelling left untouched because the value is emitted at
+    # runtime; confirm what the group matcher expects before changing it.
+    Indegenous = "Indegenous"
+    Middle_Eastern = "Middle-Eastern"
+    Multiple_Races = "Multiple races"
+
+
+class AlYearLevel(AttributeValueEnum):
+    """Year-level labels as written into the group matcher's input rows."""
+
+    Freshman = "freshman"
+    Sophomore = "sophomore"
+    Junior = "junior"
+    Senior = "senior"
+    Graduate = "graduate"
+
+
+class AlGender(AttributeValueEnum):
+    """Gender labels as written into the group matcher's input rows."""
+
+    Female = "Female"
+    Male = "Male"
+    Other = "Other"
+
+
+def fromGenderToAlGender(gender: Gender) -> AlGender:
+    if gender == Gender.MALE:
+        return AlGender.Male
+    if gender == Gender.FEMALE:
+        return AlGender.Female
+    return AlGender.Other
+
+
+def fromAlGenderToGender(alGenderNum: int or str) -> Gender:
+    if alGenderNum == 0 or alGenderNum == "Male":
+        return Gender.FEMALE
+    if alGenderNum == 1 or alGenderNum == "Female":
+        return Gender.MALE
+    return Gender.OTHER
+
+
+def fromRaceToAlRace(race: Race) -> AlRace:
+    if race == Race.European:
+        return AlRace.White
+    if (
+        race == Race.South_Asian
+        or race == Race.East_Asian
+        or race == Race.South_East_Asian
+    ):
+        return AlRace.Asian
+    if race == Race.Hispanic_or_Latin_American:
+        return AlRace.Hispanic
+    if race == Race.African:
+        return AlRace.Black_Or_African_American
+    if race == Race.First_Nations_or_Indigenous:
+        return AlRace.Indegenous
+    if race == Race.Middle_Eastern:
+        return AlRace.Middle_Eastern
+    if race == Race.Other:
+        return AlRace.Multiple_Races
+
+
+def fromAlRaceToRace(alRaceNum: int or str) -> Race:
+    if alRaceNum == 0 or alRaceNum == "White":
+        return Race.European
+    if alRaceNum == 1 or alRaceNum == "Asian":
+        return Race.South_Asian
+    if alRaceNum == 2 or alRaceNum == "Hispanic":
+        return Race.Hispanic_or_Latin_American
+    if alRaceNum == 3 or alRaceNum == "Black/African American":
+        return Race.African
+    if alRaceNum == 4 or alRaceNum == "Indegenous":
+        return Race.First_Nations_or_Indigenous
+    if alRaceNum == 5 or alRaceNum == "Middle-Eastern":
+        return Race.Middle_Eastern
+    if alRaceNum == 6 or alRaceNum == "Multiple races":
+        return Race.Other
+
+
+def fromYearLevelToAlYearLevel(yearLevel: int) -> AlYearLevel:
+    if yearLevel == 0:
+        return AlYearLevel.Freshman
+    if yearLevel == 1:
+        return AlYearLevel.Sophomore
+    if yearLevel == 2:
+        return AlYearLevel.Junior
+    if yearLevel == 3:
+        return AlYearLevel.Senior
+    return AlYearLevel.Graduate
+
+
+def fromAlYearLevelToYearLevel(alYearLevel: str) -> int:
+    if "freshman" in alYearLevel.lower():
+        return 0
+    if "sophomore" in alYearLevel.lower():
+        return 1
+    if "junior" in alYearLevel.lower():
+        return 2
+    if "senior" in alYearLevel.lower():
+        return 3
+    return 4
+
+
+def fromNumbersToTimeSlots(numbers: List[int]) -> List[str]:
+    return [fromNumberToTimeslot(number) for number in numbers]
+
+
+def fromNumberToTimeslot(number: int) -> str:
+    return str(number)
+
+
+def fromTimeslotToNumber(timeslot: str) -> int:
+    return int(timeslot)
+
+
+def fromTimeslotsToNumbers(timeslots: List[str]) -> List[int]:
+    return [fromTimeslotToNumber(timeslot) for timeslot in timeslots]
@@ -1,6 +1,7 @@
 from abc import ABC, abstractmethod
 from dataclasses import dataclass, field
 from enum import Enum
+from pathlib import Path
 from typing import Callable, Tuple, List
 
 from api.dataclasses.student import Student
@@ -121,3 +122,16 @@ def __init__(self, utility_function: Callable[[Student, TeamShell], float]):
 
     def validate(self):
         super().validate()
+
+
+class GroupMatcherAlgorithmConfig(AlgorithmConfig):
+    csv_input_path: Path
+    group_matcher_run_path: Path
+
+    def __init__(self, csv_output_path: str, group_matcher_run_path: str):
+        super().__init__()
+        self.csv_input_path = Path(csv_output_path)
+        self.group_matcher_run_path = Path(group_matcher_run_path)
+
+    def validate(self):
+        super().validate()