ls1intum · maximiliansoelch · Dec 5, 2024 · May 10, 2024 · May 11, 2024 · May 12, 2024
diff --git a/athena/pyproject.toml b/athena/pyproject.toml
@@ -13,6 +13,7 @@ httpx = "^0.24.1"
 gitpython = "^3.1.41"
 sqlalchemy = {extras = ["mypy"], version = "^2.0.21"}
 psycopg2 = "^2.9.9"
+pydantic = "1.10.13"
 
 [tool.poetry.group.dev.dependencies]
 types-requests = "^2.31.0.8"

diff --git a/docker-compose.prod.yml b/docker-compose.prod.yml
@@ -71,6 +71,14 @@ services:
       - postgres
     image: ls1tum/athena_module_programming_apted:${ATHENA_TAG:-develop}
 
+  module_programming_winnowing:
+    hostname: module-programming-winnowing
+    env_file:
+      - ${ATHENA_ENV_DIR:-./env_example}/module_programming_winnowing.env
+    depends_on:
+      - postgres
+    image: ls1tum/athena_module_programming_winnowing:${ATHENA_TAG:-develop}
+
   module_modeling_llm:
     hostname: module-modeling-llm
     env_file:

diff --git a/docker-compose.yml b/docker-compose.yml
@@ -82,3 +82,11 @@ services:
       - llm_core
     ports:
       - "5008:5008"
+
+  module_programming_winnowing:
+    hostname: module-programming-winnowing
+    build: ./module_programming_winnowing
+    depends_on:
+      - athena
+    ports:
+      - "5009:5009"
diff --git a/env_example/module_programming_winnowing.env b/env_example/module_programming_winnowing.env
@@ -0,0 +1,3 @@
+PRODUCTION=1
+SECRET=12345abcdef
+DATABASE_URL=postgresql://postgres:password@postgres:5432/athena
diff --git a/modules/__init__.py b/modules/__init__.py
diff --git a/modules/programming/__init__.py b/modules/programming/__init__.py
diff --git a/modules/programming/module_example/module_example/__main__.py b/modules/programming/module_example/module_example/__main__.py
@@ -1,5 +1,5 @@
 """
-Entry point for the module_example module.
+Entry point for the module_example.
 """
 import random
 from typing import List, Any
@@ -13,7 +13,7 @@
 
 @config_schema_provider
 class Configuration(BaseModel):
-    """Example configuration for the module_example module."""
+    """Example configuration for the module_example."""
     debug: bool = Field(False, description="Whether the module is in **debug mode**. This is an example config option.")
 
 

diff --git a/modules/programming/module_programming_apted/pyproject.toml b/modules/programming/module_programming_apted/pyproject.toml
@@ -13,6 +13,7 @@ athena = { git = "https://github.com/ls1intum/Athena.git", rev = "ccd00cf8346e76
 apted = "^1.0.3"
 antlr4-python3-runtime = "^4.13.1"
 javalang = {git = "https://github.com/c2nes/javalang"}
+pydantic = "1.10.13"
 
 [tool.poetry.group.dev.dependencies]
 types-requests = "^2.31.0.8"

diff --git a/modules/programming/module_programming_winnowing/.dockerignore b/modules/programming/module_programming_winnowing/.dockerignore
@@ -0,0 +1,4 @@
+.venv
+.vscode
+__pycache__
+.DS_Store
diff --git a/modules/programming/module_programming_winnowing/.vscode/settings.json b/modules/programming/module_programming_winnowing/.vscode/settings.json
@@ -0,0 +1,4 @@
+{
+  "python.pythonPath": "./.venv/bin/python",
+  "python.analysis.typeCheckingMode": "basic",
+}
diff --git a/modules/programming/module_programming_winnowing/Dockerfile b/modules/programming/module_programming_winnowing/Dockerfile
@@ -0,0 +1,30 @@
+# syntax=docker/dockerfile:1
+
+# This is the Dockerfile for the module_programming_winnowing.
+
+FROM python:3.11
+LABEL org.opencontainers.image.source=https://github.com/ls1intum/Athena
+
+# Disable Python output buffering so logs show up immediately in the container
+ENV PYTHONUNBUFFERED=1
+
+WORKDIR /code
+
+# Poetry
+RUN pip install --no-cache-dir poetry==1.5.0
+
+# Dependencies
+COPY pyproject.toml poetry.lock ./
+# athena module (from the Dockerfile in the athena folder)
+COPY --from=athena /code /athena
+COPY --from=module_programming_apted /code /module_programming_apted
+# install dependencies
+RUN poetry config virtualenvs.create true \
+    && poetry config virtualenvs.in-project true \
+    && poetry install --no-interaction --no-ansi
+
+# Project files
+COPY . ./
+
+# poetry scripts don't work here
+CMD poetry run python -m module_*
diff --git a/modules/programming/module_programming_winnowing/README.md b/modules/programming/module_programming_winnowing/README.md
@@ -0,0 +1,8 @@
+# Start Directly
+`poetry run module`
+
+# Start with Docker
+`docker-compose up --build`
+
+# Start with Docker in Production Mode
+`docker-compose --env-file .env.production up --build`
diff --git a/modules/programming/module_programming_winnowing/__init__.py b/modules/programming/module_programming_winnowing/__init__.py
diff --git a/modules/programming/module_programming_winnowing/module.conf b/modules/programming/module_programming_winnowing/module.conf
@@ -0,0 +1,4 @@
+[module]
+name = module_programming_winnowing
+type = programming
+port = 5009
diff --git a/modules/programming/module_programming_winnowing/module_programming_winnowing/__init__.py b/modules/programming/module_programming_winnowing/module_programming_winnowing/__init__.py
diff --git a/modules/programming/module_programming_winnowing/module_programming_winnowing/__main__.py b/modules/programming/module_programming_winnowing/module_programming_winnowing/__main__.py
@@ -0,0 +1,171 @@
+"""
+Entry point for the module_programming_winnowing module.
+"""
+import random
+from typing import List, Any, cast
+from pydantic import BaseModel, Field
+
+from athena import app, config_schema_provider, submissions_consumer, submission_selector, feedback_consumer, feedback_provider, evaluation_provider, emit_meta
+from athena.programming import Exercise, Submission, Feedback, get_stored_feedback_suggestions, \
+    count_stored_submissions, get_stored_submissions
+from athena.logger import logger
+from athena.storage import store_exercise, store_submissions, store_feedback, store_feedback_suggestions
+from module_programming_winnowing.convert_code_to_ast.get_feedback_methods import get_feedback_method
+from module_programming_winnowing.feedback_suggestions.feedback_suggestions import create_feedback_suggestions
+from module_programming_winnowing.feedback_suggestions.remove_overlapping import filter_overlapping_suggestions
+from module_programming_winnowing.feedback_suggestions.remove_suspicious import filter_suspicious
+
+
+# Configuration model of this module; it is handed to athena's `config_schema_provider` decorator.
+@config_schema_provider
+class Configuration(BaseModel):
+    """Example configuration for the module_programming_winnowing module."""
+    # Within this file the flag is only read by `receive_submissions`, which emits extra metadata when it is set.
+    debug: bool = Field(False, description="Whether the module is in **debug mode**. This is an example config option.")
+
+
+@submissions_consumer
+def receive_submissions(exercise: Exercise, submissions: List[Submission], module_config: Configuration):
+    """Log the received submissions, attach example metadata and store exercise and submissions."""
+    logger.info("receive_submissions: Received %d submissions for exercise %d", len(submissions), exercise.id)
+    for received in submissions:
+        logger.info("- Submission %d", received.id)
+        # log every file contained in the submission zip
+        for file_name in received.get_zip().namelist():
+            logger.info("  - %s", file_name)
+    # Placeholder for the actual processing of the submissions
+    logger.info("Doing stuff")
+
+    # Example usage of the module config
+    # (drop `module_config` from the signature if the module does not need it)
+    logger.info("Config: %s", module_config)
+    if module_config.debug:
+        for meta_key, meta_value in (('debug', True), ('comment', 'You can add any metadata you want here')):
+            emit_meta(meta_key, meta_value)
+
+    # Attach example data to the exercise
+    exercise.meta["some_data"] = "some_value"
+    logger.info("- Exercise meta: %s", exercise.meta)
+
+    # Attach example data to every submission
+    for received in submissions:
+        received.meta["some_data"] = "some_value"
+        logger.info("- Submission %d meta: %s", received.id, received.meta)
+
+    # Persist exercise first, then the submissions
+    store_exercise(exercise)
+    store_submissions(submissions)
+
+
+@submission_selector
+def select_submission(exercise: Exercise, submissions: List[Submission]) -> Submission:
+    """Log the candidate submissions and return the first one as the next to assess."""
+    logger.info("select_submission: Received %d submissions for exercise %d", len(submissions), exercise.id)
+    for candidate in submissions:
+        logger.info("- Submission %d", candidate.id)
+    # Placeholder strategy: always pick the first submission in the list
+    next_submission = submissions[0]
+    return next_submission
+
+
+@feedback_consumer
+def process_incoming_feedback(exercise: Exercise, submission: Submission, feedbacks: List[Feedback]):
+    """
+    Enrich incoming feedback with method metadata and store feedback suggestions derived from it.
+
+    Nothing is consumed unless the exercise language is Java or Python. Feedback without a
+    file path or start line, and feedback for which `get_feedback_method` finds no method,
+    is dropped. The remaining feedbacks are passed to `create_feedback_suggestions` together
+    with all stored submissions of the exercise; the resulting suggestions and the enriched
+    feedbacks are then stored.
+    """
+    logger.info("process_feedback: Received %d feedbacks for submission %d of exercise %d", len(feedbacks),
+                submission.id, exercise.id)
+    logger.info("process_feedback: Feedbacks: %s", feedbacks)
+
+    programming_language = exercise.programming_language.lower()
+    # Currently only works with Java and Python - can be extended with more languages if the grammar is available
+    if programming_language not in ["java", "python"]:
+        logger.info("The winnowing module currently only works with Java and Python. Not consuming feedback.")
+        return
+
+    # Remove unreferenced feedbacks
+    feedbacks = [f for f in feedbacks if f.file_path is not None and f.line_start is not None]
+
+    # Add method metadata to feedbacks
+    feedbacks_with_method = []
+    for feedback in feedbacks:
+        feedback_method = get_feedback_method(submission, feedback, programming_language)
+        if feedback_method is None:
+            # don't consider feedback without a method
+            continue
+        logger.debug("Feedback #%d: Found method %s", feedback.id, feedback_method.name)
+        feedback.meta["method_name"] = feedback_method.name
+        feedback.meta["method_code"] = feedback_method.source_code
+        feedback.meta["method_line_start"] = feedback_method.line_start
+        feedback.meta["method_line_end"] = feedback_method.line_end
+        feedback.meta["method_ast"] = feedback_method.ast
+        feedbacks_with_method.append(feedback)
+    feedbacks = feedbacks_with_method
+
+    # find all submissions for this exercise
+    exercise_submissions = cast(List[Submission], list(get_stored_submissions(exercise.id)))
+
+    # create feedback suggestions
+    logger.info("Creating feedback suggestions for %d feedbacks", len(feedbacks))
+    feedback_suggestions = create_feedback_suggestions(exercise_submissions, feedbacks, programming_language)
+
+    # additionally, store metadata about how impactful each feedback was, i.e. how many suggestions were given based on it
+    # count the suggestions per original feedback in one pass instead of rescanning the list for every feedback
+    suggestion_counts: dict = {}
+    for suggestion in feedback_suggestions:
+        original_id = suggestion.meta["original_feedback_id"]
+        suggestion_counts[original_id] = suggestion_counts.get(original_id, 0) + 1
+    for feedback in feedbacks:
+        feedback.meta["n_feedback_suggestions"] = suggestion_counts.get(feedback.id, 0)
+    # store the information on the suggestions as well for quicker access later
+    # (only for suggestions that originate from one of the feedbacks processed here)
+    processed_feedback_ids = {feedback.id for feedback in feedbacks}
+    for suggestion in feedback_suggestions:
+        original_id = suggestion.meta["original_feedback_id"]
+        if original_id in processed_feedback_ids:
+            suggestion.meta["n_feedback_suggestions"] = suggestion_counts[original_id]
+
+    # save to database
+    # the ignore comment has to sit on the call itself; on a line of its own it has no effect on the call
+    store_feedback_suggestions(feedback_suggestions)  # type: ignore
+    for feedback in feedbacks:
+        store_feedback(feedback)
+
+    logger.debug("Feedbacks processed")
+
+
+@feedback_provider
+def suggest_feedback(exercise: Exercise, submission: Submission, is_graded: bool, module_config: Configuration) -> List[Feedback]:
+    """Return the stored feedback suggestions for the submission after removing suspicious and overlapping ones."""
+    logger.info("suggest_feedback: Suggestions for submission %d of exercise %d were requested", submission.id,
+                exercise.id)
+    # The winnowing module currently only works with Java and Python
+    supported_languages = ["java", "python"]
+    if exercise.programming_language.lower() not in supported_languages:
+        logger.info("The Winnowing module currently only works with Java and Python. Returning no suggestions.")
+        return []
+
+    # Load everything that was stored for this submission
+    stored_suggestions = cast(List[Feedback], list(get_stored_feedback_suggestions(exercise.id, submission.id)))
+    logger.debug("Found %d feedback suggestions (unfiltered)", len(stored_suggestions))
+
+    # First filter: suspicious suggestions (the filter also gets the number of stored submissions)
+    without_suspicious = filter_suspicious(stored_suggestions, count_stored_submissions(exercise.id))
+    logger.debug("Found %d feedback suggestions (removed suspicious suggestions)", len(without_suspicious))
+
+    # Second filter: overlapping suggestions
+    without_overlaps = filter_overlapping_suggestions(without_suspicious)
+    logger.debug("Found %d feedback suggestions (removed overlapping suggestions)", len(without_overlaps))
+
+    logger.info("Suggesting %d filtered feedback suggestions", len(without_overlaps))
+    logger.debug("Suggested Feedback suggestions: %s", without_overlaps)
+
+    return without_overlaps
+
+
+# Only if it makes sense for a module (Optional)
+@evaluation_provider
+def evaluate_feedback(exercise: Exercise, submission: Submission, true_feedbacks: List[Feedback], predicted_feedbacks: List[Feedback]) -> Any:
+    """Return an example evaluation entry, built from random numbers, for every predicted feedback."""
+    logger.info(
+        "evaluate_feedback: Evaluation for submission %d of exercise %d was requested with %d true and %d predicted feedbacks",
+        submission.id, exercise.id, len(true_feedbacks), len(predicted_feedbacks)
+    )
+
+    # Example only: random numbers stand in for real feedback embeddings
+    reference_embeddings = [random.random() for _ in true_feedbacks]
+    candidate_embeddings = [random.random() for _ in predicted_feedbacks]
+
+    # One result per predicted feedback; it "matches" if any reference embedding is closer than 0.1
+    return [
+        {
+            "feedback_id": predicted.id,
+            "embedding": candidate,
+            "has_match": any(abs(reference - candidate) < 0.1 for reference in reference_embeddings),
+            "correctness": random.random(),
+        }
+        for predicted, candidate in zip(predicted_feedbacks, candidate_embeddings)
+    ]
+
+
+# Start the athena app when the package is executed as a script (e.g. via `python -m`)
+if __name__ == "__main__":
+    app.start()
diff --git a/...module_programming_winnowing/module_programming_winnowing/convert_code_to_ast/__init__.py b/...module_programming_winnowing/module_programming_winnowing/convert_code_to_ast/__init__.py
diff --git a/...ming_winnowing/module_programming_winnowing/convert_code_to_ast/extract_method_and_ast.py b/...ming_winnowing/module_programming_winnowing/convert_code_to_ast/extract_method_and_ast.py
@@ -0,0 +1,65 @@
+from antlr4 import CommonTokenStream, InputStream
+from antlr4.tree.Tree import ParseTreeWalker
+from module_programming_apted.convert_code_to_ast.languages.python.Python3Lexer import Python3Lexer
+from module_programming_apted.convert_code_to_ast.languages.python.Python3Parser import Python3Parser
+from module_programming_apted.convert_code_to_ast.languages.java.JavaLexer import JavaLexer
+from module_programming_apted.convert_code_to_ast.languages.java.JavaParser import JavaParser
+from module_programming_apted.convert_code_to_ast.languages.python.Python3MethodParserListener import \
+    MethodParserListener as PythonMethodParserListener
+from module_programming_apted.convert_code_to_ast.languages.java.JavaMethodParserListener import \
+    MethodParserListener as JavaMethodParserListener
+
+# TODO: Check whether the to_ast method is still needed.
+
+# Grammars for programming languages have different parse rules
+JAVA_PARSE_RULE = "compilationUnit"
+PYTHON_PARSE_RULE = "file_input"
+
+def parse_java_file(source_code: str):
+    """Parse Java source code and return the methods collected by the Java listener."""
+    return parse_file(
+        source_code,
+        lexer_class=JavaLexer,
+        parser_class=JavaParser,
+        parse_rule=JAVA_PARSE_RULE,
+        listener_class=JavaMethodParserListener,
+    )
+
+
+def parse_python_file(source_code: str):
+    """Parse Python source code and return the methods collected by the Python listener."""
+    return parse_file(
+        source_code,
+        lexer_class=Python3Lexer,
+        parser_class=Python3Parser,
+        parse_rule=PYTHON_PARSE_RULE,
+        listener_class=PythonMethodParserListener,
+    )
+
+
+def parse_file(source_code, lexer_class, parser_class, parse_rule, listener_class):
+    """
+    Parse source code with the given ANTLR classes and return the methods the listener collected.
+
+    :param source_code: the source code text itself (it is wrapped in an `InputStream`, not opened as a path)
+    :param lexer_class: lexer class that is instantiated with the input stream
+    :param parser_class: parser class that is instantiated with the token stream
+    :param parse_rule: name of the parser method that is called to produce the parse tree
+    :param listener_class: listener class that is instantiated with the parser and provides `methods` after the walk
+    :return: a copy of the listener's `methods`
+    """
+    input_stream = InputStream(source_code)
+    lexer = lexer_class(input_stream)
+    stream = CommonTokenStream(lexer)
+    parser = parser_class(stream)
+    # the entry rule differs per grammar, so it is looked up by name
+    tree = getattr(parser, parse_rule)()
+
+    listener = listener_class(parser)
+    walker = ParseTreeWalker()
+    walker.walk(listener, tree)
+
+    # return a copy so callers cannot modify the listener's own collection
+    return listener.methods.copy()
+
+
+def parse(source_code: str, programming_language: str):
+    """Parse the source code with the parser for the given language ("java" or "python")."""
+    language_parsers = {
+        "java": parse_java_file,
+        "python": parse_python_file,
+    }
+    language_parser = language_parsers.get(programming_language)
+    if language_parser is None:
+        raise ValueError(f"Unsupported programming language: {programming_language}")
+    return language_parser(source_code)
+
+
+# Manual smoke test: parses a small Python snippet twice when this file is run directly.
+if __name__ == "__main__":
+    # NOTE: parse_java_file takes source code text, so the commented-out call below
+    # would have to read the file first instead of passing its path.
+    # file_path2 = "../test_files/test_java_1.java"
+    # parse_java_file(file_path2)
+
+    code = """def process_numbers(numbers):
+    total = 0
+    for number in numbers:
+        if number % 2 == 1:
+            total += number
+        else:
+            total -= number
+    if total > 0:
+        print("Positive total:", total)
+    else:
+        print("Non-positive total:", total)"""
+    # both calls parse the same snippet; the results are not used any further
+    code1 = parse_python_file(code)
+    code2 = parse_python_file(code)
diff --git a/...amming_winnowing/module_programming_winnowing/convert_code_to_ast/get_feedback_methods.py b/...amming_winnowing/module_programming_winnowing/convert_code_to_ast/get_feedback_methods.py
@@ -0,0 +1,27 @@
+from typing import Optional
+
+from athena.programming import Submission, Feedback
+from module_programming_apted.convert_code_to_ast.extract_method_and_ast import parse
+from module_programming_apted.convert_code_to_ast.method_node import MethodNode
+from athena.logger import logger
+
+
+def get_feedback_method(submission: Submission, feedback: Feedback, programming_language: str) -> Optional[MethodNode]:
+    """Return the first parsed method that spans all lines of the feedback, or None if there is none."""
+    # unreferenced feedback cannot belong to a method
+    if feedback.file_path is None or feedback.line_start is None:
+        return None
+
+    try:
+        code = submission.get_code(feedback.file_path)
+    except UnicodeDecodeError:
+        logger.warning("File %s in submission %d is not UTF-8 encoded.", feedback.file_path, submission.id)
+        return None
+
+    # fall back to the start line when the feedback has no end line
+    last_feedback_line = feedback.line_start if feedback.line_end is None else feedback.line_end
+
+    for method in parse(code, programming_language):
+        if method.line_start is None or method.line_end is None:
+            continue
+        # the method has to start at or before the feedback and end at or after it
+        if method.line_start <= feedback.line_start and method.line_end >= last_feedback_line:
+            return method
+    return None
diff --git a/...gramming_winnowing/module_programming_winnowing/convert_code_to_ast/languages/__init__.py b/...gramming_winnowing/module_programming_winnowing/convert_code_to_ast/languages/__init__.py