From b05600605dea5af231569caba7b30cddbc8d4ada Mon Sep 17 00:00:00 2001
From: dvitel <viteldmitry@gmail.com>
Date: Thu, 23 Feb 2023 13:44:18 -0500
Subject: [PATCH] sampling quiz model

---
 .vscode/launch.json           |  41 +++++-
 evopie/cli.py                 |  17 ++-
 evopie/deca.py                |  22 +--
 evopie/pphc_quiz_model.py     |   9 +-
 evopie/quiz_model.py          |  17 ++-
 evopie/rand_quiz_model.py     |  15 +-
 evopie/sampling_quiz_model.py | 254 ++++++++++++++++++++++++++++++++++
 experiment.sh                 |  34 ++++-
 8 files changed, 377 insertions(+), 32 deletions(-)
 create mode 100644 evopie/sampling_quiz_model.py

diff --git a/.vscode/launch.json b/.vscode/launch.json
index fd35d53..5d70ae4 100644
--- a/.vscode/launch.json
+++ b/.vscode/launch.json
@@ -160,6 +160,27 @@
                 "--random-seed", "17"
             ]
         },
+        {
+            "name": "CLI: quiz run deca-pphc Sampling",
+            "type": "python",
+            "request": "launch",
+            "module" : "flask",
+            "env" : {
+                "FLASK_APP" : "app.py",
+                "FLASK_ENV" : "development",
+                "FLASK_DEBUG" : "1",
+                // "EVOPIE_DATABASE_LOG": "db.log" 
+            },
+            "args" : [
+                "quiz",
+                "run",
+                "-q", "1",
+                "-s", "STEP1",
+                "--algo", "evopie.sampling_quiz_model.SamplingQuizModel", "--algo-params", "{ \"n\": 3, \"min_num_evals\": 1, \"group_size\": 2, \"strategy\": \"non_domination\"}",
+                "--evo-output", "algo/s-nond.json", "--archive-output", "algo/a.csv",
+                "--random-seed", "17"
+            ]
+        },
         {
             "name": "CLI: deca init",
             "type": "python",
@@ -238,7 +259,7 @@
                 "--result-folder", "data/data-8/results",
                 "--figure-folder", "figures",
                 "--file-name-pattern", ".*_20-\\d+.csv",
-                "-p", "dim_coverage_with_spanned", "--group-by-space"
+                "--group-by-space"
             ]
         },
         {
@@ -280,6 +301,24 @@
             ],
             "console": "internalConsole"
         },
+        {
+            "name": "CLI: quiz deca-experiment Sampling",
+            "type": "python",
+            "request": "launch",
+            "module": "flask",
+            "env" : {
+                "FLASK_APP" : "app.py",
+                "FLASK_ENV" : "development",
+                "FLASK_DEBUG" : "1"
+            },
+            "args" : [
+                "quiz", "deca-experiment",
+                "--deca-input", "deca-spaces/space-4_4_4_4-s_4-0.json",
+                "--num-runs", "2",
+                "--algo", "{ \"id\": \"s-nond\", \"algo\":\"evopie.sampling_quiz_model.SamplingQuizModel\", \"n\": 3, \"min_num_evals\": 1, \"group_size\": 2, \"strategy\": \"non_domination\"}"
+            ],
+            "console": "internalConsole"
+        },
         {
             "name": "CLI: quiz deca-experiment RAND",
             "type": "python",
diff --git a/evopie/cli.py b/evopie/cli.py
index 58bf614..9cc3128 100644
--- a/evopie/cli.py
+++ b/evopie/cli.py
@@ -455,12 +455,13 @@ def export_student_knowledge(output):
 
 KNOWLEDGE_SELECTION_CHANCE = "KNOWLEDGE_SELECTION_CHANCE"
 KNOWLEDGE_SELECTION_WEIGHT = "KNOWLEDGE_SELECTION_WEIGHT"
+KNOWLEDGE_SELECTION_STRENGTH = "KNOWLEDGE_SELECTION_STRENGTH"
 
 @quiz_cli.command("run")
 @click.option('-q', '--quiz', type=int, required=True)
 @click.option('-s', '--step', default = [QUIZ_STEP1], multiple=True)
 @click.option('-n', '--n-times', type=int, default=1)
-@click.option('-kns', '--knowledge-selection', default = KNOWLEDGE_SELECTION_WEIGHT)
+@click.option('-kns', '--knowledge-selection', default = KNOWLEDGE_SELECTION_STRENGTH)
 @click.option('-i', '--instructor', default='i@usf.edu')
 @click.option('-p', '--password', default='pwd') 
 @click.option('--no-algo', is_flag=True) #randomize student order
@@ -537,6 +538,12 @@ def simulate_step(step):
                                             for sums in [np.cumsum(weights)]
                                             for level in [(rnd_state.rand() * sums[-1]) if len(sums) > 0 else None]
                                             for selected_d_index in [next((i for i, s in enumerate(sums) if s > level), None)]}
+                elif knowledge_selection == KNOWLEDGE_SELECTION_STRENGTH:
+                    responses = {qid:sorted(ds, key=lambda x: x[1])[-1][0]
+                                            for qid, distractors in attempt.alternatives_map.items() 
+                                            for distractor_strength in [student_knowledge.get(qid, {}) ]
+                                            for ds_distr in [[(alt, distractor_strength[d]) for alt, d in enumerate(distractors) if d in distractor_strength]] 
+                                            for ds in [ds_distr if any(ds_distr) else [(alt,1) for alt, d in enumerate(distractors) if d == -1]]}
                 else: 
                     responses = {}
 
@@ -573,17 +580,19 @@ def simulate_step(step):
                 if quiz_model is None:
                     sys.stdout.write(f"[{run_idx + 1}/{n_times}] Step1 quiz {quiz} finished\n")            
                 else:
-                    model_state = quiz_model.get_model_state()
+                    settings = quiz_model.get_model_state()
+                    best_distractors = quiz_model.get_best_quiz()
 
                     if archive_output is not None: 
                         quiz_model.to_csv(archive_output.format(run_idx))
                     
                     search_space_size = quiz_model.get_search_space_size()
                     explored_search_space_size = quiz_model.get_explored_search_space_size()
-                    sys.stdout.write(f"EVO algo: {quiz_model.__class__}\nEVO settings: {model_state}\n")
+                    sys.stdout.write(f"EVO algo: {quiz_model.__class__}\nEVO settings: {settings}\n")
                     if evo_output: 
                         with open(evo_output, 'w') as evo_output_json_file:
-                            evo_output_json_file.write(json.dumps({**model_state, "algo": quiz_model.__class__.__name__, 
+                            evo_output_json_file.write(json.dumps({"settings": settings, "distractors": best_distractors, 
+                                                        "algo": quiz_model.__class__.__name__, 
                                                         "explored_search_space_size": explored_search_space_size,
                                                         "search_space_size": search_space_size}, indent=4))
                     sys.stdout.write(f"[{run_idx + 1}/{n_times}] Step1 quiz {quiz} finished\n{quiz_model.to_dataframe()}\n")
diff --git a/evopie/deca.py b/evopie/deca.py
index 030fd43..440b16e 100644
--- a/evopie/deca.py
+++ b/evopie/deca.py
@@ -260,12 +260,12 @@ def unique_question_per_axis_constraint(space):
 def gen_test_distractor_mapping_knowledge(space): 
     ''' Generates knowledge in format similar to cli student init -k flag. Use this to init StudentKnowledge database 
     '''
-    knowledge = [*[ {"sid": point['cfs'], "qid": qid, "did": did, "chance": 1 } 
+    knowledge = [*[ {"sid": point['cfs'], "qid": qid, "did": did, "chance": 100 + int(point_id) } 
                     for _, points in space['axes'].items()
-                    for _, point in points.items() 
+                    for point_id, point in points.items() 
                     for qid, did in point['dids']],
-                 *[ {"sid": point['cfs'], "qid": qid, "did": did, "chance": 1 } 
-                    for _, point in space['spanned'].items()
+                 *[ {"sid": point['cfs'], "qid": qid, "did": did, "chance": 100 * len(axes_ids) + len(point['dids']) } 
+                    for axes_ids, point in space['spanned'].items()
                     for qid, did in point['dids']]]
     return knowledge
 
@@ -282,8 +282,8 @@ def dimension_coverage(space, population_distractors):
     spanned_axes = {axis_id for spanned_id, point in space['spanned'].items() for _, did in point['dids'] if did in population_distractors for axis_id, _ in spanned_id}
     did_axes = {axis_id for axis_id, points in space["axes"].items() for point in points.values() for _, did in point["dids"] if did in population_distractors}    
     dim_coverage = len(did_axes) / len(space["axes"])
-    dim_coverage_with_spanned = len(did_axes.union(spanned_axes)) / len(space["axes"])
-    return {"dim_coverage":dim_coverage, "dim_coverage_with_spanned": dim_coverage_with_spanned}
+    # dim_coverage_with_spanned = len(did_axes.union(spanned_axes)) / len(space["axes"])
+    return {"dim_coverage":dim_coverage} # "dim_coverage_with_spanned": dim_coverage_with_spanned}
 
 # dimension_coverage(space, [5,6,14])
 
@@ -301,10 +301,10 @@ def avg_rank_of_repr(space, population_distractors):
                                                                         if did in population_distractors], key = lambda x: x[0])}
     arr_axes = [axes_rank[axis_id] / len(space['axes'][axis_id]) for axis_id in space['axes'] if axis_id in axes_rank]
     arr = np.average(arr_axes) if len(arr_axes) > 0 else 0 
-    arr_with_spanned_axes = [max([axes_rank.get(axis_id, 0), spanned_ranks.get(axis_id, 0)]) / len(space['axes'][axis_id]) 
-                                for axis_id in space['axes'] if axis_id in axes_rank or axis_id in spanned_ranks]
-    arr_with_spanned = np.average(arr_with_spanned_axes) if len(arr_with_spanned_axes) > 0 else 0 
-    return {"arr": arr, "arr_with_spanned": arr_with_spanned}
+    # arr_with_spanned_axes = [max([axes_rank.get(axis_id, 0), spanned_ranks.get(axis_id, 0)]) / len(space['axes'][axis_id]) 
+    #                             for axis_id in space['axes'] if axis_id in axes_rank or axis_id in spanned_ranks]
+    # arr_with_spanned = np.average(arr_with_spanned_axes) if len(arr_with_spanned_axes) > 0 else 0 
+    return {"arr": arr}#, "arr_with_spanned": arr_with_spanned}
 
 # avg_rank_of_repr(space, [5,6,14])
 
@@ -314,7 +314,7 @@ def redundancy(space, population_distractors):
     population_spanned_distractors = [did for _, point in space['spanned'].items() for _, did in point['dids'] if did in population_distractors]
     pop_r = len(population_spanned_distractors) / len(population_distractors) 
     deca_r = len(space['spanned']) / (len(space['spanned']) + sum([len(points) for points in space["axes"].values()]))
-    return {"population_redundancy":pop_r, "deca_redundancy":deca_r, 'num_spanned': len(space['spanned']) }
+    return {"population_redundancy":pop_r, "deca_redundancy":deca_r} #, 'num_spanned': len(space['spanned']) }
 
 # redundancy(space, [5,6,14])
 
diff --git a/evopie/pphc_quiz_model.py b/evopie/pphc_quiz_model.py
index e3cd955..c48d9c9 100644
--- a/evopie/pphc_quiz_model.py
+++ b/evopie/pphc_quiz_model.py
@@ -260,8 +260,6 @@ def prepare_for_evaluation(self, evaluator_id: int) -> 'list[tuple[int, list[int
         return question_distractors
 
     def get_model_state(self):
-        population = [self.archive.get(genotype_id) for genotype_id in self.population]
-        distractors = [d for genotype in population for (_, dids) in genotype for d in dids ] 
         archive = [ {"genotype_id": genotype_id, "genotype": r.g.g, "objectives": {c: r[c] for c in r[r.notnull()].index if c != "g" }}
                                             for genotype_id, r in self.archive.items() ]
         settings = { "pop_size": self.pop_size, "gen": self.gen, "seed": self.seed,
@@ -271,7 +269,12 @@ def get_model_state(self):
                     "population": self.population, 
                     "objectives": self.objectives,
                     "archive": archive}   
-        return {"population": population, "distractors": distractors, "settings": settings}
+        return settings
+
+    def get_best_quiz(self):
+        population = [self.archive.get(genotype_id) for genotype_id in self.population]
+        distractors = [d for genotype in population for (_, dids) in genotype for d in dids ] 
+        return distractors
 
     def update_fitness(self, ind: int, evaluator_id: int, result: 'dict[int, int]') -> None:  
         # cur_score = self.archive.loc[ind, evaluator_id]
diff --git a/evopie/quiz_model.py b/evopie/quiz_model.py
index cfa2e40..0dd404f 100644
--- a/evopie/quiz_model.py
+++ b/evopie/quiz_model.py
@@ -52,19 +52,24 @@ def evaluate(self, evaluator_id: int, result: 'dict[int, int]') -> None:
         self.save()
     def save(self) -> None:
         ''' preserve state in persistent storage'''
-        impl_state = self.get_model_state().get("settings", {})
+        impl_state = self.get_model_state()
         self.process.impl = self.__class__ .__module__ + '.' + self.__class__.__name__
         self.process.impl_state = impl_state
         models.DB.session.commit()         
-    def to_csv(self, file_name) -> None: 
-        ''' save state to csv file '''
-        pass 
     def to_dataframe(self) -> Optional[DataFrame]: 
         return None
+    def to_csv(self, file_name) -> None: 
+        ''' save state to csv file '''
+        df = self.to_dataframe()
+        if df is not None:
+            df.to_csv(file_name)
+    def get_best_quiz(self):
+        ''' Should return known best quiz distractors '''
+        return []
 
-from evopie.pphc_quiz_model import PphcQuizModel
+from evopie.sampling_quiz_model import SamplingQuizModel
 class QuizModelBuilder():
-    default_quiz_model_class = PphcQuizModel
+    default_quiz_model_class = SamplingQuizModel
     default_settings = {}
 
     def get_quiz(self, quiz_or_id: 'models.Quiz | int') -> models.Quiz: 
diff --git a/evopie/rand_quiz_model.py b/evopie/rand_quiz_model.py
index 5f6fca0..4287129 100644
--- a/evopie/rand_quiz_model.py
+++ b/evopie/rand_quiz_model.py
@@ -2,6 +2,7 @@
 from evopie import models
 import numpy as np
 from evopie.quiz_model import QuizModel
+from pandas import DataFrame
 
 class RandomQuizModel(QuizModel):
     ''' Implements dummy choice of quiz questions - random questions at start '''
@@ -26,12 +27,18 @@ def get_sampling_size(self):
         return self.n
 
     def get_model_state(self) -> Any: #depends on impl, returns population for Evo models
-        population = [self.quiz_model]
-        distractors = [d for genotype in population for (_, dids) in genotype for d in dids ] 
-        return {"settings": {'n':self.n, 'seed': self.seed, 'quiz_model': self.quiz_model}, "population": population, "distractors": distractors}
+        return {'n':self.n, 'seed': self.seed, 'quiz_model': self.quiz_model}
         
     def prepare_for_evaluation(self, evaluator_id: int) -> 'list[tuple[int, list[int]]]':
         return [(q, list(ds)) for [q, ds] in self.quiz_model]
 
     def evaluate_internal(self, evaluator_id: int, result: 'dict[int, int]'):
-        self.interactions[str(evaluator_id)] = sum([1 if result.get(qid, -1) in genes else 0 for qid, genes in self.quiz_model ])
\ No newline at end of file
+        self.interactions[str(evaluator_id)] = sum([1 if result.get(qid, -1) in genes else 0 for qid, genes in self.quiz_model ])
+
+    def to_dataframe(self):
+        return DataFrame(data = [{'g': self.quiz_model, **self.interactions}])
+
+    def get_best_quiz(self):
+        population = [self.quiz_model]
+        distractors = [d for genotype in population for (_, dids) in genotype for d in dids ] 
+        return distractors
diff --git a/evopie/sampling_quiz_model.py b/evopie/sampling_quiz_model.py
new file mode 100644
index 0000000..fabea76
--- /dev/null
+++ b/evopie/sampling_quiz_model.py
@@ -0,0 +1,254 @@
+''' Modification of pphc which considers Pareto domination on level of distractors '''
+''' Note that archive is changed to be of level of distractor '''
+import numpy as np
+
+from evopie import models
+from evopie.utils import groupby
+from evopie.quiz_model import QuizModel
+from pandas import DataFrame
+
+#NOTE:
+# 1. DECA knowledge contains candidates and tests 
+#       candidates are students while tests are quiz question in a form of [d1, ... dn] 
+#           where n is number of alternatives and d is distractor from question pool
+#       di could also be * meaning any possible distractor. Example [*, d2, *] requires only d2 be present to fail student 
+#       Current DECA implementation allocates one distractor dx which is equivalent to [*, dx, *] set - ignoring distractor context 
+#       One DECA point could have several distractors [*, da, *] and [*, db, *] - if any schema of current student matches current quiz - simulated student will fail the quiz
+#    Lets look onto example DECA knowledge for 1 question quiz 
+#      DECA: 2 axis with 2 points (excluding origin) on each and 1 spanned points selected:
+#               Axis 1. point1 students: {s1}, distractors {d1}; point2 students {s1, s2}, distractors {d2}
+#               Axis 2. point1 students: {s3}, distractors {d3}; point2 students {s3, s4}, distractors {d4}
+#               Spanned at (2, 2): students {s1, s2, s3, s4}, distractor {d5}
+#               Origin d6
+# 2. Simulation is already organized in this way. It randombly picks matched distractor and assign it as an answer.
+# 3. Sampling algo obtains result with picked answer per question - which defines did current model fail student or not.
+# First goal of sampling algo is to give each distractor to students at least k=1 times
+# Then, it will use DECA analysis on low level interactions to sample distractors
+#       HIGH LEVEL interaction is between model and student. Per question it looks like (given knowledge above):
+#        question   | s1    | s2    | s3    | s4    | ...
+#        [d1*d2 d3 ]| 1     | *     | *     | *     |
+#        [d4 d5*d6 ]| *     | 1     | *     | *     |
+#        [d1 d5*d4*]| *     | *     | 1     | 1     | 
+#        []
+#       ....
+#       where we have question as it was given to student and fail 1, not-fail 0 result 
+#       LOW LEVEL interaction is between distractor and student and is used for sampling of next model 
+#       distractor  | s1    | s2    | s3    | s4    | ...
+#       d1          | 1,1   | *     | 1,0   | 1     |
+#       d2          | 1,0   | *     | *     | *     |
+#       d3          | 1,0   | *     | *     | 1     |
+#       d4          | *     | 1,0   | 1,1   | 1     |
+#       d5          | *     | 1,1   | 1,1,0 | 1     |
+#       d6          | *     | 1,0   | *     | 1     |
+#       values in the matrics - first number == to number from HIGH LEVEL matrix, second is real student selection. 
+#       QUESTION: Can high/low level iteraction have some distractor di expressed as sum(dj, j >= 2)?
+#           In a case when fully defined (no *) is required
+#           1. We need to have common columns (students), at least 2 to conclude the composition. 
+#           2. We are going to give to these students same set of distractors [da, db, dc] where we check that da = db + dc or similar.
+#           3. But each student still selects only one distractor among da, db, dc: We can have same result for all students. Say:
+#               d | s1 | s2     d | s1 | s2
+#               da| 0  | 0      da| 0  | 0
+#               db| 1  | 1      db| 1  | 0
+#               dc| 0  | 0      dc| 0  | 1
+#           Neither High no low level interactions will not be able to conclude da = db + dc. Student can pick only one answer. 
+#           Though for first case we assume that db has bigger strength and therefore we go to definition of strength:
+#NOTE: Distractor strength relation on DECA space:
+#       from DECA space above we can assume next natural ordering on distractor strength d1 < d2 for student s1
+#       1. Distractors d1 and d2 could not be on different axes if they fail s1 - student s1 is assigned to one axis point and/or spanned points
+#       2. if d1 and d2 on an axis - d2 is stronger if it is closer to axis end (fails more student)
+#       3. if d2 is spanned and d1 is on axis, d1 < d2 always (even if d2 at end of axis) - assuming that d2 represents a combination of misconcepts which makes it stronger
+#       4. if d2 and d1 are spanned - their strength is defined by number of axis they combine. If number of axis is same, number of failed students is used. 
+# We can build our algo assuming this relation and base our simulation on it.
+#IMPORTANT: SIMULATION should work according to defined strength.
+#       
+#           During sampling we should consider diversity - if we have same pattern like in prev first table - we should penalize db
+#           unless we meet some evaluation which different.
+#           So we have two forces. 
+#           1. To avoid spanning points we should prefer diversity in outcomes when we select distractor 
+#           2. To avoid origin and go towards axis, in oposite we would prefer quality during selection 
+# We can define 2 hyperparameters: quality_n and diversity_n - numbers of distractors to sample according to quality and according to diversity. 
+#IDEA: go to Shenon's Entropy to estimate perplexity of decision. Check entropy and perplexity as potential metrics.  
+#   Qulaity_N - number of distractors to sample according to quality characteristics.
+#       Quality is the force that pushes us towards end of axis. 
+#       In prev example we still can prefer db to be selected because even though it looks like spanned point - some unknown evaluations could be 0 for it
+#           and therefore it could be good axis point. 
+#       The danger of quality that the selection will always dominate the decision. 
+#   Diversity_N - number of distractors to sample for diversity - 1 0 or 0 1 transitions are prefered. 
+#THOUGHT: imagine quiz with 2 distractors. 1 is trivial and another is very but not absolutely hard. All but 1 student fails the second distractor.
+#           this corresponds to 1 axis DECA space with 1 axis point where all but one students are placed. 
+#           Does discovering this point make sense? Yes. 
+#
+#PROPOSITION: probabilistic selection is based on number of 1 0/0 1 for any two common students
+#               for each distractor we compute # of 1 0 and 0 1 transitions unique to it (not present in other distractors)
+#                   when same number - pick with biggest # of 1. 
+#   Probability value - low for all 0, a bit better for all 1, even better for present 0s and 1s (defined by unique 0 1 present) 
+# 
+#   did: {cfs:{student ids}, css: {student ids}} - candidate fail and success sets
+#   did1: cfs1, did2: cfs2  --> cfs1 - sum(cfs_others)
+
+class SamplingQuizModel(QuizModel): 
+    ''' Samples n distractors from interactions. Does not change sampling for group_size interactions '''
+    default_settings = { "n": 3, "min_num_evals": 1, "group_size": 2, "strategy": "non_domination"}
+
+    def __init__(self, quiz_id: int, process: models.EvoProcess, distractors_per_question: 'dict[int, list[int]]'):
+        super(SamplingQuizModel, self).__init__(quiz_id, process, distractors_per_question)
+        settings = {**SamplingQuizModel.default_settings, **process.impl_state}
+        self.seed = settings.get("seed", None)
+        self.rnd = np.random.RandomState(self.seed)
+        self.n: int = settings.get("n", SamplingQuizModel.default_settings["n"])
+        self.min_num_evals: int = settings.get("min_num_evals", SamplingQuizModel.default_settings["min_num_evals"])
+        self.group_size: int = settings.get("group_size", SamplingQuizModel.default_settings["group_size"])
+        self.cur_iter: int = settings.get("cur_iter", 0)
+        self.quiz = settings.get("quiz", []) #question distractors sampled to be present
+        self.strategy = settings.get("strategy", SamplingQuizModel.default_settings["strategy"])
+        #NOTE: we need  to maintain interactions in both forms but store only one form
+        self.interactions: dict = {**settings.get("interactions", {})} #dict student_id:{quiz:[(qid1, [dids]), ...], result:{did:0/1}}
+        # self.strength: dict = settings.get("strength", {}) #graph in a form of linked list did-to-did defines link from weaker to stronger distractor. did: {stronger:{dids}, weaker:{dids}}
+        self.inverted_interactions: dict = self.invert_interactions()
+        self.sample_best_one = False
+
+        self.sample_strategy = getattr(self, self.strategy)
+        
+    def invert_interactions(self):
+        return {int(did):{sid:result for (_, sid, result) in plain_ints} 
+                    for (did, plain_ints) in 
+                        groupby([(did, sid, result) for sid, interaction in self.interactions.items() 
+                                    for (did, result) in interaction.get('result', {}).items() ],
+                            key=lambda x: x[0])}
+
+    def get_explored_search_space_size(self) -> int:
+        tried_models = set(str(interaction['quiz']) for interaction in self.interactions.values())
+        return len(tried_models)
+
+    def get_sampling_size(self):
+        return self.n
+
+    def evaluate_internal(self, evaluator_id: int, result: 'dict[int, int]') -> None:
+        interaction = self.interactions.get(str(evaluator_id), None)
+        given_quiz = interaction['quiz']
+        interaction['result'] = {str(did):1 if did == result.get(qid, -1) else 0 for qid, dids in given_quiz for did in dids }            
+        for qid, dids in given_quiz:
+            selected_did = result.get(qid, -1)
+            for did in dids:
+                self.inverted_interactions.setdefault(int(did), {})[str(evaluator_id)] = 1 if did == selected_did else 0
+            # if selected_did != -1:
+            #     weaker_dids = [did for did in dids if did != selected_did]
+            #     self.strength[selected_did].setdefault("weaker", set()).update(weaker_dids)
+            #     for did in weaker_dids:
+            #         self.strength[did].setdefault("stronger", set()).add(selected_did)
+        self.cur_iter += 1
+
+    def prepare_for_evaluation(self, evaluator_id: int) -> 'list[tuple[int, list[int]]]':
+        if (len(self.quiz) == 0) or (self.cur_iter >= self.group_size): 
+            self.quiz = self.sample_quiz()      
+            self.cur_iter = 0          
+        interaction = self.interactions.setdefault(str(evaluator_id), {})  
+        interaction['quiz'] = self.quiz
+        quiz_to_return = [ (qid, list(dids)) for qid, dids in self.quiz ] #copy from model
+        return quiz_to_return
+
+    def get_model_state(self):
+        settings = { "seed": self.seed, "n": self.n, "min_num_evals": self.min_num_evals, "group_size": self.group_size,
+                    "cur_iter": self.cur_iter, "quiz": self.quiz, "interactions":  self.interactions, "strategy": self.strategy }
+        return settings
+
+    def get_best_quiz(self):
+        self.sample_best_one = True 
+        quiz = self.sample_quiz()
+        population = [quiz]
+        distractors = [d for _, dids in quiz for d in dids ] 
+        self.sample_best_one = False 
+        return distractors
+
+    def to_dataframe(self):
+        return DataFrame(data = self.inverted_interactions.values(), index = [int(did) for did in self.inverted_interactions.keys()])
+
+    #strategies should have signatures as next dids -> blocked_dids -> selection
+    def pick_random(self, dids, blocked_dids, num = None):
+        return [int(d) for d in self.rnd.choice(dids, num or self.n, raplce = False)] if len(dids) > (num or self.n) else dids          
+
+    def sample_by_score(self, dids, scores):
+        total_score = sum(scores)
+        weights = [s / total_score for s in scores]
+        selected_did = max(zip(dids, weights), key=lambda x: x[1])[0] if self.sample_best_one else self.rnd.choice(dids, p=weights)
+        return int(selected_did)
+
+    def max_difficulty(self, dids, blocked_dids):        
+        #first for fare game we give each distractor to students at least ones:
+        high_priority = [did for did in dids if len(self.inverted_interactions.get(int(did), {})) < self.min_num_evals]
+        selected = self.pick_random(self, high_priority, self.n)
+
+        did_scores = {}
+        def did_score(did):
+            if did not in did_scores:
+                did_scores[did] = sum(self.inverted_interactions.get(int(did), {}).values()) #more 1's - better score
+            return did_scores[did]
+
+        for i in range(len(selected), self.n):
+            scores = [0 if did in selected else did_score(did) for did in dids]
+            selected_did = self.sample_by_score(dids, scores)
+            selected.append(selected_did)
+        return selected 
+
+    def block_similar(self, selected_did, blocked_dids):
+        selected_did_students = self.inverted_interactions.get(selected_did, {})
+        for did, did_students in self.inverted_interactions.items():
+            common_students = set.intersection(set(did_students.keys()), set(selected_did_students.keys()))
+            if len(common_students) > 2 and all(did_students[sid] == selected_did_students[sid] for sid in common_students):
+                blocked_dids[did] = 0.1 #penalty for same behavior
+
+    def non_domination(self, dids, blocked_dids):                
+        did_relations = {did:(non_domination, domination)
+                            for did in dids                             
+                            for s in [self.inverted_interactions.get(int(did), {})]
+                            for non_domination in [[did1 for did1 in dids 
+                                if did1 != did
+                                for s1 in [self.inverted_interactions.get(int(did1), {})]
+                                for common_students in [set.intersection(set(s.keys()), set(s1.keys()))]
+                                for s_lst in [[s[sid] for sid in common_students]]
+                                for s1_lst in [[s1[sid] for sid in common_students]]
+                                if any(v1 > v2 for v1, v2 in zip(s_lst, s1_lst)) and any(v1 < v2 for v1, v2 in zip(s_lst, s1_lst))]] 
+                            for domination in [[did1 for did1 in dids 
+                                if did1 != did
+                                for s1 in [self.inverted_interactions.get(int(did1), {})]
+                                for common_students in [set.intersection(set(s.keys()), set(s1.keys()))]
+                                for s_lst in [[s[sid] for sid in common_students]]
+                                for s1_lst in [[s1[sid] for sid in common_students]]
+                                if s_lst != s1_lst and any(v1 > v2 for v1, v2 in zip(s_lst, s1_lst))]]}
+        selected = []
+        for i in range(len(selected), self.n):
+            scores = [0 if did in selected else blocked_dids.get(did, 1) * (0.1 + 100 * len(non_dominated) / len(dids) * len(dominated) / (2 * len(dids)) * len(self.interactions) / (2 * int_len) * (1 if len(cfs) == 0 else len(self.interactions) / (2 * len(cfs)))) if int_len > 0 else 100
+                        for did, (non_dominated, dominated) in did_relations.items() 
+                        for interations in [self.inverted_interactions.get(int(did), {})]
+                        for int_len in [len(interations)]
+                        for cfs in [[s for s, r in interations.items() if r == 1]]]
+            selected_did = self.sample_by_score(dids, scores)
+            self.block_similar(selected_did, blocked_dids)
+            selected.append(selected_did)
+        return selected         
+    
+    # def default_strategy(self, dids, blocked_dids):        
+    #     #first for fare game we give each distractor to students at least ones:
+    #     high_priority = [did for did in dids if len(self.inverted_interactions.get(did, {})) < self.min_num_evals]
+    #     selected = self.pick_random(self, high_priority, self.n)
+    #     def did_score(did):
+    #         score = 0.5 if did in blocked_dids else 1.0 
+    #         unknown_pairing_dids = set(dids) - self.strength[did]["weaker"] - self.strength[did]["stronger"]
+    #         score *= len(unknown_pairing_dids)
+    #         return score 
+    #     for i in range(len(selected), self.n): #we need to build prob distribution
+    #         #we base selection on positive scores for each possible dids
+    #         #blocked_dids gives penalty. in this strategy blocked dids have same interactions as some from previous questions            
+
+    #         scores = {did: 1.0 if dids not in blocked_dids else 0.5 for did in dids}
+            
+    #         res = None 
+    #         selected.append(res)
+    #     return selected 
+
+    def sample_quiz(self) -> 'list[tuple[int, list[int]]]':
+        ''' Sample based on interactions and strategy '''
+        blocked_dids = {} #some info to block same concept distractors across questions
+        return [[qid, sorted(self.sample_strategy(dids, blocked_dids))] for qid, dids in self.distractors_per_question.items()]        
+
+
diff --git a/experiment.sh b/experiment.sh
index 774be8c..2aed9a6 100755
--- a/experiment.sh
+++ b/experiment.sh
@@ -22,7 +22,31 @@ flask deca init-many -ns 100 -nq 4 -nd 25 \
     --best-students-percent 0.3 \
     --noninfo 0.3 \
     --timeout 1000 --random-seed 17
- 
+
+# local experimentation on 1 space
+flask deca init-many -ns 100 -nq 4 -nd 25 \
+    -an 10 \
+    -as 5 \
+    --num-spanned 10 \
+    --num-spaces 1 \
+    --best-students-percent 0.05 \
+    --noninfo 0.1 \
+    --timeout 1000 --random-seed 17
+
+    # --algo '{ "id": "rand-5", "algo":"evopie.rand_quiz_model.RandomQuizModel", "n": 5}' \
+    # --algo '{ "id": "pphc-1-2-1-3", "algo":"evopie.pphc_quiz_model.PphcQuizModel", "pop_size": 1, "pareto_n": 2, "child_n": 1, "gene_size": 3}' \
+
+flask quiz deca-experiments \
+    --deca-spaces deca-spaces \
+    --algo-folder algo \
+    --results-folder results \
+    --random-seed 23 --num-runs 10 \
+    --algo '{ "id": "rand-3", "algo":"evopie.rand_quiz_model.RandomQuizModel", "n": 3}' \
+    --algo '{ "id": "s-nond-1", "algo":"evopie.sampling_quiz_model.SamplingQuizModel", "n": 3, "min_num_evals": 1, "group_size": 2, "strategy": "non_domination"}' \
+    --algo '{ "id": "s-nond-2", "algo":"evopie.sampling_quiz_model.SamplingQuizModel", "n": 3, "min_num_evals": 1, "group_size": 2, "strategy": "non_domination"}' \
+    --algo '{ "id": "s-nond-3", "algo":"evopie.sampling_quiz_model.SamplingQuizModel", "n": 3, "min_num_evals": 1, "group_size": 3, "strategy": "non_domination"}'
+
+
 flask quiz deca-experiments \
     --random-seed 23 --num-runs 3 \
     --algo '{ "id": "pphc-1-2-1-3", "algo":"evopie.pphc_quiz_model.PphcQuizModel", "pop_size": 1, "pareto_n": 2, "child_n": 1, "gene_size": 3}'
@@ -31,6 +55,10 @@ flask quiz deca-experiment --deca-input deca-spaces/space-1_1_1_1_1_1_1_1-s_20-3
     --num-runs 3 \
     --algo '{ "id": "pphc-1-2-1-3", "algo":"evopie.pphc_quiz_model.PphcQuizModel", "pop_size": 1, "pareto_n": 2, "child_n": 1, "gene_size": 3}'
 
+flask quiz deca-experiment --deca-input deca-spaces/space-1_1_1_1_1_1_1_1-s_20-3.json \
+    --num-runs 3 \
+    --algo '{ "id": "s-nond", "algo":"evopie.sampling_quiz_model.SamplingQuizModel", "n": 3, "min_num_evals": 1, "group_size": 2, "strategy": "non_domination"}'
+
 flask quiz deca-experiment --deca-input deca-spaces/space-1_1_1-s_0-2.json \
     --num-runs 2 \
     --algo '{ "id": "pphc-1-2-1-3", "algo":"evopie.pphc_quiz_model.PphcQuizModel", "pop_size": 1, "pareto_n": 2, "child_n": 1, "gene_size": 3}'
@@ -52,7 +80,7 @@ flask deca result --algo-input algo/pphc-1-2-1-3.json --deca-space deca-spaces/s
 # flask quiz post-process --result-folder results --figure-folder figures -p dim_coverage
 
 flask quiz post-process --result-folder data/data-8/results --figure-folder figures --file-name-pattern '.*_20-\d+.csv' \
-  -p dim_coverage -p dim_coverage_with_spanned -p arr -p arr_with_spanned -p population_redundancy -p deca_redundancy -p num_spanned \
+  -p dim_coverage -p arr -p population_redundancy -p deca_redundancy -p num_spanned \
   -p deca_duplication -p population_duplication -p noninfo \
   --group-by-space
 
@@ -61,7 +89,7 @@ flask quiz post-process --result-folder data/data-2/results --figure-folder figu
 
 
 flask quiz post-process --result-folder data/data-2022-08-08/data-2/results --figure-folder figures --file-name-pattern '.*_0-\d+.csv' \
-  -p dim_coverage -p dim_coverage_with_spanned -p arr -p arr_with_spanned -p population_redundancy -p deca_redundancy -p num_spanned \
+  -p dim_coverage -p arr -p population_redundancy -p deca_redundancy -p num_spanned \
   -p deca_duplication -p population_duplication -p noninfo
 
 flask quiz post-process --result-folder data/data-2022-08-08/data-2/results --figure-folder figures --file-name-pattern '.*_0-\d+.csv' \