From d7d0c9ae3e4258b025af7e7be3e777adce21cbd5 Mon Sep 17 00:00:00 2001 From: andrecs <12188364+andrecsilva@users.noreply.github.com> Date: Wed, 12 Mar 2025 09:11:24 -0300 Subject: [PATCH 01/27] Codemods will now execute once for each finding independently --- src/codemodder/codemods/base_codemod.py | 55 ++++++++++++++++++++----- 1 file changed, 44 insertions(+), 11 deletions(-) diff --git a/src/codemodder/codemods/base_codemod.py b/src/codemodder/codemods/base_codemod.py index 5b568113..b1633082 100644 --- a/src/codemodder/codemods/base_codemod.py +++ b/src/codemodder/codemods/base_codemod.py @@ -226,21 +226,54 @@ def _apply( logger.debug("No files matched for %s", self.id) return None - process_file = functools.partial( - self._process_file, context=context, results=results, rules=rules - ) - - contexts = [] - if context.max_workers == 1: - logger.debug("processing files serially") - contexts.extend([process_file(file) for file in files_to_analyze]) - else: + # Do each result independently + if results: + # gather positional arguments for the map + resultset_arguments = [] + path_arguments = [] + for result in results.results_for_rules(rules): + # this need to be the same type of ResultSet as results + singleton = results.__class__() + singleton.add_result(result) + result_locations = self.get_files_to_analyze(context, singleton) + # We do an execution for each location in the result + # So we duplicate the resultset argument for each location + for loc in result_locations: + resultset_arguments.append(singleton) + path_arguments.append(loc) + + contexts: list = [] with ThreadPoolExecutor() as executor: logger.debug("using executor with %s workers", context.max_workers) - contexts.extend(executor.map(process_file, files_to_analyze)) + contexts.extend( + executor.map( + lambda path, resultset: self._process_file( + path, context, resultset, rules + ), + path_arguments, + resultset_arguments, + ) + ) executor.shutdown(wait=True) - context.process_results(self.id, contexts) + context.process_results(self.id, contexts) + # for find and fix codemods + else: + process_file = functools.partial( + self._process_file, context=context, results=results, rules=rules + ) + + contexts = [] + if context.max_workers == 1: + logger.debug("processing files serially") + contexts.extend([process_file(file) for file in files_to_analyze]) + else: + with ThreadPoolExecutor() as executor: + logger.debug("using executor with %s workers", context.max_workers) + contexts.extend(executor.map(process_file, files_to_analyze)) + executor.shutdown(wait=True) + + context.process_results(self.id, contexts) return None def apply(self, context: CodemodExecutionContext) -> None | TokenUsage: From 874743bf82cbe264f1dde277b6085a0b06cf3cfb Mon Sep 17 00:00:00 2001 From: andrecs <12188364+andrecsilva@users.noreply.github.com> Date: Wed, 12 Mar 2025 10:31:12 -0300 Subject: [PATCH 02/27] Adjusted tests to account for individual changes diff --- src/codemodder/codemods/test/utils.py | 84 ++++++++++++++----- .../sonar/test_sonar_jwt_decode_verify.py | 32 ++++++- 2 files changed, 93 insertions(+), 23 deletions(-) diff --git a/src/codemodder/codemods/test/utils.py b/src/codemodder/codemods/test/utils.py index 3ccdbdd7..7568fdc9 100644 --- a/src/codemodder/codemods/test/utils.py +++ b/src/codemodder/codemods/test/utils.py @@ -1,3 +1,4 @@ +import difflib import os from pathlib import Path from textwrap import dedent @@ -58,6 +59,7 @@ def run_and_assert( tmpdir, input_code, expected, + expected_diff_per_change: list[str] = [], 
num_changes: int = 1, min_num_changes: int | None = None, root: Path | None = None, @@ -99,13 +101,19 @@ def run_and_assert( tmp_file_path, input_code, expected, - changes[0], + expected_diff_per_change, + num_changes, + changes, ) def assert_num_changes(self, changes, expected_num_changes, min_num_changes): - assert len(changes) == 1 + print(len(changes)) + print(changes) + for c in changes: + print(c.diff) + assert len(changes) == expected_num_changes - actual_num = len(changes[0].changes) + actual_num = len(changes) if min_num_changes is not None: assert ( @@ -116,25 +124,54 @@ def assert_num_changes(self, changes, expected_num_changes, min_num_changes): actual_num == expected_num_changes ), f"Expected {expected_num_changes} changes but {actual_num} were created." - def assert_changes(self, root, file_path, input_code, expected, changes): - assert os.path.relpath(file_path, root) == changes.path - assert all(change.description for change in changes.changes) - - expected_diff = create_diff( - dedent(input_code).splitlines(keepends=True), - dedent(expected).splitlines(keepends=True), + def assert_changes( + self, + root, + file_path, + input_code, + expected, + expected_diff_per_change, + num_changes, + changes, + ): + assert all( + os.path.relpath(file_path, root) == change.path for change in changes ) - try: - assert expected_diff == changes.diff - except AssertionError: - raise DiffError(expected_diff, changes.diff) - - output_code = file_path.read_bytes().decode("utf-8") - - try: - assert output_code == (format_expected := dedent(expected)) - except AssertionError: - raise DiffError(format_expected, output_code) + assert all(c.description for change in changes for c in change.changes) + + # assert each change individually + if num_changes > 1: + assert num_changes == len(expected_diff_per_change) + for change, diff in zip(changes, expected_diff_per_change): + print(change.diff) + print("-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-") + print(diff) + print("+++++++++++++++++++++++++++++++") + print( + "\n".join( + difflib.ndiff(diff.splitlines(), change.diff.splitlines()) + ) + .replace(" ", "␣") + .replace("\t", "→") + ) + assert change.diff == diff + else: + # generate diff from expected code + expected_diff = create_diff( + dedent(input_code).splitlines(keepends=True), + dedent(expected).splitlines(keepends=True), + ) + try: + assert expected_diff == changes.diff + except AssertionError: + raise DiffError(expected_diff, changes.diff) + + output_code = file_path.read_bytes().decode("utf-8") + + try: + assert output_code == (format_expected := dedent(expected)) + except AssertionError: + raise DiffError(format_expected, output_code) def run_and_assert_filepath( self, @@ -171,6 +208,7 @@ def run_and_assert( tmpdir, input_code, expected, + expected_diff_per_change: list[str] | None = None, num_changes: int = 1, min_num_changes: int | None = None, root: Path | None = None, @@ -217,7 +255,9 @@ def run_and_assert( tmp_file_path, input_code, expected, - changes[0], + expected_diff_per_change, + num_changes, + changes, ) return changes diff --git a/tests/codemods/sonar/test_sonar_jwt_decode_verify.py b/tests/codemods/sonar/test_sonar_jwt_decode_verify.py index fa30f3a2..c17c99ae 100644 --- a/tests/codemods/sonar/test_sonar_jwt_decode_verify.py +++ b/tests/codemods/sonar/test_sonar_jwt_decode_verify.py @@ -38,6 +38,31 @@ def test_simple(self, tmpdir): decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], verify=True) decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, 
algorithms=["HS256"], options={"verify_signature": True}) """ + + expected_diff_per_change = [ + """\ +--- ++++ +@@ -8,5 +8,5 @@ + } + + encoded_jwt = jwt.encode(payload, SECRET_KEY, algorithm="HS256") +-decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], verify=False) ++decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], verify=True) + decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], options={"verify_signature": False}) +""", + """\ +--- ++++ +@@ -9,4 +9,4 @@ + + encoded_jwt = jwt.encode(payload, SECRET_KEY, algorithm="HS256") + decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], verify=False) +-decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], options={"verify_signature": False}) ++decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], options={"verify_signature": True}) +""", + ] + issues = { "issues": [ { @@ -65,5 +90,10 @@ def test_simple(self, tmpdir): ] } self.run_and_assert( - tmpdir, input_code, expected, results=json.dumps(issues), num_changes=2 + tmpdir, + input_code, + expected, + expected_diff_per_change, + results=json.dumps(issues), + num_changes=2, ) From 66fd2f391d5b57e60a96cabf1f88bada1c7fe9f7 Mon Sep 17 00:00:00 2001 From: andrecs <12188364+andrecsilva@users.noreply.github.com> Date: Thu, 13 Mar 2025 10:03:12 -0300 Subject: [PATCH 03/27] Fixed a few more unit tests --- src/codemodder/codemods/base_visitor.py | 15 +++++++++++ src/codemodder/codemods/test/utils.py | 16 ++++++----- .../semgrep/semgrep_no_csrf_exempt.py | 17 ++++++------ .../semgrep/test_semgrep_no_csrf_exempt.py | 27 ++++++++++++++++++- .../test_sonar_fix_missing_self_or_cls.py | 27 +++++++++++++++++++ .../sonar/test_sonar_invert_boolean_check.py | 22 +++++++++++++++ 6 files changed, 108 insertions(+), 16 deletions(-) diff --git a/src/codemodder/codemods/base_visitor.py b/src/codemodder/codemods/base_visitor.py index 2159f026..cd05c7b9 100644 --- a/src/codemodder/codemods/base_visitor.py +++ b/src/codemodder/codemods/base_visitor.py @@ -58,6 +58,21 @@ def node_is_selected(self, node) -> bool: pos_to_match ) + def node_is_selected_by_line_only(self, node) -> bool: + pos_to_match = self.node_position(node) + return self.filter_by_result_line_only( + pos_to_match + ) and self.filter_by_path_includes_or_excludes(pos_to_match) + + def filter_by_result_line_only(self, pos_to_match) -> bool: + # Codemods with detectors will only run their transformations if there are results. 
+ return self.results is None or any( + pos_to_match.start.line >= location.start.line + and pos_to_match.end.line <= location.end.line + for r in self.results + for location in r.locations + ) + def node_position(self, node): # See https://github.com/Instagram/LibCST/blob/main/libcst/_metadata_dependent.py#L112 match node: diff --git a/src/codemodder/codemods/test/utils.py b/src/codemodder/codemods/test/utils.py index 7568fdc9..c64fa641 100644 --- a/src/codemodder/codemods/test/utils.py +++ b/src/codemodder/codemods/test/utils.py @@ -8,7 +8,7 @@ from codemodder import registry from codemodder.codemods.api import BaseCodemod -from codemodder.codetf import Change +from codemodder.codetf.v2.codetf import ChangeSet from codemodder.context import CodemodExecutionContext from codemodder.diff import create_diff from codemodder.providers import load_providers @@ -107,10 +107,12 @@ def run_and_assert( ) def assert_num_changes(self, changes, expected_num_changes, min_num_changes): - print(len(changes)) - print(changes) + print("expected_diff_per_change = [") for c in changes: - print(c.diff) + print('"""\\') + print(c.diff.replace("\t", " "), end="") + print('""",') + print("]") assert len(changes) == expected_num_changes actual_num = len(changes) @@ -248,7 +250,7 @@ def run_and_assert( self.assert_num_changes(changes, num_changes, min_num_changes) - self.assert_findings(changes[0].changes) + self.assert_findings(changes) self.assert_changes( tmpdir, @@ -262,7 +264,7 @@ def run_and_assert( return changes - def assert_findings(self, changes: list[Change]): + def assert_findings(self, changes: list[ChangeSet]): assert all( - x.fixedFindings for x in changes + c.fixedFindings for a in changes for c in a.changes ), f"Expected all changes to have findings: {changes}" diff --git a/src/core_codemods/semgrep/semgrep_no_csrf_exempt.py b/src/core_codemods/semgrep/semgrep_no_csrf_exempt.py index 5e03891c..fc39ef9c 100644 --- a/src/core_codemods/semgrep/semgrep_no_csrf_exempt.py +++ b/src/core_codemods/semgrep/semgrep_no_csrf_exempt.py @@ -26,14 +26,15 @@ def leave_Decorator( self.node_position(original_node) ): return updated_node - - if ( - self.find_base_name(original_node.decorator) - == "django.views.decorators.csrf.csrf_exempt" - ): - self.report_change(original_node) - return cst.RemovalSentinel.REMOVE - return original_node + # Due to semgrep's odd way of reporting the position for this (decorators + functiondef), we match by line only + if self.node_is_selected_by_line_only(original_node): + if ( + self.find_base_name(original_node.decorator) + == "django.views.decorators.csrf.csrf_exempt" + ): + self.report_change(original_node) + return cst.RemovalSentinel.REMOVE + return updated_node SemgrepNoCsrfExempt = SemgrepCodemod( diff --git a/tests/codemods/semgrep/test_semgrep_no_csrf_exempt.py b/tests/codemods/semgrep/test_semgrep_no_csrf_exempt.py index 80e7e287..26684eac 100644 --- a/tests/codemods/semgrep/test_semgrep_no_csrf_exempt.py +++ b/tests/codemods/semgrep/test_semgrep_no_csrf_exempt.py @@ -48,7 +48,31 @@ def ssrf_code_checker(request): def foo(): pass """ - + expected_diff_per_change = [ + """\ +--- ++++ +@@ -3,7 +3,6 @@ + from django.dispatch import receiver + from django.core.signals import request_finished + +-@csrf_exempt + def ssrf_code_checker(request): + if request.user.is_authenticated: + if request.method == 'POST': +""", + """\ +--- ++++ +@@ -12,6 +12,5 @@ + + + @receiver(request_finished) +-@csrf_exempt + def foo(): + pass +""", + ] results = { "runs": [ { @@ -114,6 +138,7 @@ def 
foo(): tmpdir, input_code, expected_output, + expected_diff_per_change, results=json.dumps(results), num_changes=2, ) diff --git a/tests/codemods/sonar/test_sonar_fix_missing_self_or_cls.py b/tests/codemods/sonar/test_sonar_fix_missing_self_or_cls.py index b9362dcc..d1247a07 100644 --- a/tests/codemods/sonar/test_sonar_fix_missing_self_or_cls.py +++ b/tests/codemods/sonar/test_sonar_fix_missing_self_or_cls.py @@ -30,6 +30,32 @@ def instance_method(self): def class_method(cls): pass """ + expected_diff_per_change = [ + """\ +--- ++++ +@@ -1,6 +1,6 @@ + + class A: +- def instance_method(): ++ def instance_method(self): + pass + + @classmethod +""", + """\ +--- ++++ +@@ -4,5 +4,5 @@ + pass + + @classmethod +- def class_method(): ++ def class_method(cls): + pass +""", + ] + issues = { "issues": [ { @@ -60,6 +86,7 @@ def class_method(cls): tmpdir, input_code, expected_output, + expected_diff_per_change, results=json.dumps(issues), num_changes=2, ) diff --git a/tests/codemods/sonar/test_sonar_invert_boolean_check.py b/tests/codemods/sonar/test_sonar_invert_boolean_check.py index c483096a..41267656 100644 --- a/tests/codemods/sonar/test_sonar_invert_boolean_check.py +++ b/tests/codemods/sonar/test_sonar_invert_boolean_check.py @@ -20,6 +20,27 @@ def test_simple(self, tmpdir): if a != 2: b = i >= 10 """ + expected_diff_per_change = [ + """\ +--- ++++ +@@ -1,3 +1,3 @@ + +-if not a == 2: ++if a != 2: + b = not i < 10 +""", + """\ +--- ++++ +@@ -1,3 +1,3 @@ + + if not a == 2: +- b = not i < 10 ++ b = i >= 10 +""", + ] + issues = { "issues": [ { @@ -50,6 +71,7 @@ def test_simple(self, tmpdir): tmpdir, input_code, expected_output, + expected_diff_per_change, results=json.dumps(issues), num_changes=2, ) From 9b3e827a769edf6d6a6ed84c0d0ef6e79f070e0d Mon Sep 17 00:00:00 2001 From: andrecs <12188364+andrecsilva@users.noreply.github.com> Date: Thu, 13 Mar 2025 11:26:07 -0300 Subject: [PATCH 04/27] Fixed a few more tests --- src/codemodder/codemods/test/utils.py | 4 +- .../semgrep/test_semgrep_nan_injection.py | 6 -- .../test_semgrep_sql_parametrization.py | 38 +++++++++- tests/codemods/test_with_threading_lock.py | 76 ++++++++++++++----- 4 files changed, 92 insertions(+), 32 deletions(-) diff --git a/src/codemodder/codemods/test/utils.py b/src/codemodder/codemods/test/utils.py index c64fa641..2c56798d 100644 --- a/src/codemodder/codemods/test/utils.py +++ b/src/codemodder/codemods/test/utils.py @@ -164,9 +164,9 @@ def assert_changes( dedent(expected).splitlines(keepends=True), ) try: - assert expected_diff == changes.diff + assert expected_diff == changes[0].diff except AssertionError: - raise DiffError(expected_diff, changes.diff) + raise DiffError(expected_diff, changes[0].diff) output_code = file_path.read_bytes().decode("utf-8") diff --git a/tests/codemods/semgrep/test_semgrep_nan_injection.py b/tests/codemods/semgrep/test_semgrep_nan_injection.py index 6a4d7b49..f2e1c670 100644 --- a/tests/codemods/semgrep/test_semgrep_nan_injection.py +++ b/tests/codemods/semgrep/test_semgrep_nan_injection.py @@ -67,7 +67,6 @@ def home(request): input_code, expected_output, results=json.dumps(results), - num_changes=4, ) def test_multiple(self, tmpdir): @@ -228,7 +227,6 @@ def view(request): input_code, expected_output, results=json.dumps(results), - num_changes=16, ) def test_once_nested(self, tmpdir): @@ -287,7 +285,6 @@ def view(request): input_code, expected_output, results=json.dumps(results), - num_changes=4, ) def test_twice_nested(self, tmpdir): @@ -345,7 +342,6 @@ def view(request): input_code, 
expected_output, results=json.dumps(results), - num_changes=4, ) def test_direct_source(self, tmpdir): @@ -401,7 +397,6 @@ def view(request): input_code, expected_output, results=json.dumps(results), - num_changes=4, ) def test_binop(self, tmpdir): @@ -459,7 +454,6 @@ def view(request): input_code, expected_output, results=json.dumps(results), - num_changes=4, ) diff --git a/tests/codemods/semgrep/test_semgrep_sql_parametrization.py b/tests/codemods/semgrep/test_semgrep_sql_parametrization.py index 11dbd1a2..d4520953 100644 --- a/tests/codemods/semgrep/test_semgrep_sql_parametrization.py +++ b/tests/codemods/semgrep/test_semgrep_sql_parametrization.py @@ -46,6 +46,37 @@ def f(): conn = sqlite3.connect("example") conn.cursor().execute(sql, ((user), )) ''' + expected_diff_per_change = [ + '''\ +--- ++++ +@@ -8,7 +8,7 @@ + @app.route("/example") + def f(): + user = request.args["user"] +- sql = """SELECT user FROM users WHERE user = '%s'""" ++ sql = """SELECT user FROM users WHERE user = ?""" + + conn = sqlite3.connect("example") +- conn.cursor().execute(sql % (user)) ++ conn.cursor().execute(sql, ((user), )) +''', + '''\ +--- ++++ +@@ -8,7 +8,7 @@ + @app.route("/example") + def f(): + user = request.args["user"] +- sql = """SELECT user FROM users WHERE user = '%s'""" ++ sql = """SELECT user FROM users WHERE user = ?""" + + conn = sqlite3.connect("example") +- conn.cursor().execute(sql % (user)) ++ conn.cursor().execute(sql, ((user), )) +''', + ] + results = { "runs": [ { @@ -190,12 +221,11 @@ def f(): } ] } - changes = self.run_and_assert( + self.run_and_assert( tmpdir, input_code, expexted_output, + expected_diff_per_change, results=json.dumps(results), - ) - assert len(changes[0].changes[0].fixedFindings) == len( - results["runs"][0]["results"] + num_changes=2, ) diff --git a/tests/codemods/test_with_threading_lock.py b/tests/codemods/test_with_threading_lock.py index 1701b23b..5f00c23e 100644 --- a/tests/codemods/test_with_threading_lock.py +++ b/tests/codemods/test_with_threading_lock.py @@ -93,7 +93,7 @@ class TestThreadingNameResolution(BaseCodemodTest): codemod = WithThreadingLock @pytest.mark.parametrize( - "input_code,expected_code,num_changes", + "input_code,expected_code,expected_diff_per_change,num_changes", [ ( """ @@ -111,6 +111,7 @@ class TestThreadingNameResolution(BaseCodemodTest): with lock_1: ... """, + [], 1, ), ( @@ -127,6 +128,7 @@ class TestThreadingNameResolution(BaseCodemodTest): with lock_1: ... 
""", + [], 1, ), ( @@ -147,6 +149,7 @@ def f(l): with lock_2: return [lock_1 for lock_1 in l] """, + [], 1, ), ( @@ -173,25 +176,49 @@ def f(l): with lock_2: print() """, + [ + """\ +--- ++++ +@@ -1,6 +1,7 @@ + + import threading +-with threading.Lock(): ++lock = threading.Lock() ++with lock: + int("1") + with threading.Lock(): + print() +""", + """\ +--- ++++ +@@ -2,7 +2,8 @@ + import threading + with threading.Lock(): + int("1") +-with threading.Lock(): ++lock = threading.Lock() ++with lock: + print() + var = 1 + with threading.Lock(): +""", + """\ +--- ++++ +@@ -5,5 +5,6 @@ + with threading.Lock(): + print() + var = 1 +-with threading.Lock(): ++lock = threading.Lock() ++with lock: + print() +""", + ], 3, ), - ( - """ - import threading - with threading.Lock(): - with threading.Lock(): - print() - """, - """ - import threading - lock_1 = threading.Lock() - with lock_1: - lock = threading.Lock() - with lock: - print() - """, - 2, - ), ( """ import threading @@ -210,9 +237,18 @@ def my_func(): with lock_1: foo() """, + [], 1, ), ], ) - def test_name_resolution(self, tmpdir, input_code, expected_code, num_changes): - self.run_and_assert(tmpdir, input_code, expected_code, num_changes=num_changes) + def test_name_resolution( + self, tmpdir, input_code, expected_code, expected_diff_per_change, num_changes + ): + self.run_and_assert( + tmpdir, + input_code, + expected_code, + expected_diff_per_change, + num_changes=num_changes, + ) From abe872ae4132095d0b24788a60727435e9ac61e1 Mon Sep 17 00:00:00 2001 From: andrecs <12188364+andrecsilva@users.noreply.github.com> Date: Fri, 14 Mar 2025 09:08:40 -0300 Subject: [PATCH 05/27] Fixed more unit tests --- .../test_avoid_insecure_deserialization.py | 35 +++++- .../test_sonar_enable_jinja2_autoescape.py | 24 ++++ .../sonar/test_sonar_secure_cookie.py | 56 ++++++++- .../sonar/test_sonar_secure_random.py | 43 +++++++ tests/codemods/test_fix_hasattr_call.py | 70 ++++++++++- tests/codemods/test_secure_random.py | 114 +++++++++++++++++- 6 files changed, 330 insertions(+), 12 deletions(-) diff --git a/tests/codemods/defectdojo/semgrep/test_avoid_insecure_deserialization.py b/tests/codemods/defectdojo/semgrep/test_avoid_insecure_deserialization.py index 76cd9944..3542d95c 100644 --- a/tests/codemods/defectdojo/semgrep/test_avoid_insecure_deserialization.py +++ b/tests/codemods/defectdojo/semgrep/test_avoid_insecure_deserialization.py @@ -62,7 +62,6 @@ def test_pickle_load(self, adds_dependency, tmpdir): result = fickling.load("data") """ - findings = { "results": [ { @@ -100,6 +99,31 @@ def test_pickle_and_yaml(self, adds_dependency, tmpdir): result = fickling.load("data") result = yaml.load("data", Loader=yaml.SafeLoader) """ + expected_diff_per_change = [ + """\ +--- ++++ +@@ -1,6 +1,6 @@ + +-import pickle + import yaml ++import fickling + +-result = pickle.load("data") ++result = fickling.load("data") + result = yaml.load("data") +""", + """\ +--- ++++ +@@ -3,4 +3,4 @@ + import yaml + + result = pickle.load("data") +-result = yaml.load("data") ++result = yaml.load("data", Loader=yaml.SafeLoader) +""", + ] findings = { "results": [ @@ -122,6 +146,7 @@ def test_pickle_and_yaml(self, adds_dependency, tmpdir): tmpdir, input_code, expected, + expected_diff_per_change, results=json.dumps(findings), num_changes=2, ) @@ -129,11 +154,11 @@ def test_pickle_and_yaml(self, adds_dependency, tmpdir): assert changes is not None assert changes[0].changes[0].fixedFindings is not None - assert changes[0].changes[0].fixedFindings[0].id == "4" + assert 
changes[0].changes[0].fixedFindings[0].id == "3" assert changes[0].changes[0].fixedFindings[0].rule.id == RULE_ID - assert changes[0].changes[1].fixedFindings is not None - assert changes[0].changes[1].fixedFindings[0].id == "3" - assert changes[0].changes[1].fixedFindings[0].rule.id == RULE_ID + assert changes[1].changes[0].fixedFindings is not None + assert changes[1].changes[0].fixedFindings[0].id == "4" + assert changes[1].changes[0].fixedFindings[0].rule.id == RULE_ID @mock.patch("codemodder.codemods.api.FileContext.add_dependency") def test_pickle_loads(self, adds_dependency, tmpdir): diff --git a/tests/codemods/sonar/test_sonar_enable_jinja2_autoescape.py b/tests/codemods/sonar/test_sonar_enable_jinja2_autoescape.py index ea3feaf8..3e8bd941 100644 --- a/tests/codemods/sonar/test_sonar_enable_jinja2_autoescape.py +++ b/tests/codemods/sonar/test_sonar_enable_jinja2_autoescape.py @@ -24,6 +24,29 @@ def test_simple(self, tmpdir): env = Environment(autoescape=True) env = Environment(autoescape=True) """ + expected_diff_per_change = [ + """\ +--- ++++ +@@ -1,4 +1,4 @@ + + from jinja2 import Environment +-env = Environment() ++env = Environment(autoescape=True) + env = Environment(autoescape=False) +""", + """\ +--- ++++ +@@ -1,4 +1,4 @@ + + from jinja2 import Environment + env = Environment() +-env = Environment(autoescape=False) ++env = Environment(autoescape=True) +""", + ] + hotspots = { "hotspots": [ { @@ -54,6 +77,7 @@ def test_simple(self, tmpdir): tmpdir, input_code, expected_output, + expected_diff_per_change, results=json.dumps(hotspots), num_changes=2, ) diff --git a/tests/codemods/sonar/test_sonar_secure_cookie.py b/tests/codemods/sonar/test_sonar_secure_cookie.py index 922fbc00..b9d56ac7 100644 --- a/tests/codemods/sonar/test_sonar_secure_cookie.py +++ b/tests/codemods/sonar/test_sonar_secure_cookie.py @@ -34,6 +34,55 @@ def test_simple(self, tmpdir): var = "hello" response2.set_cookie("name", "value", secure=True, httponly=True, samesite='Lax') """ + expected_diff_per_change = [ + """\ +--- ++++ +@@ -3,7 +3,7 @@ + + response = flask.make_response() + var = "hello" +-response.set_cookie("name", "value") ++response.set_cookie("name", "value", secure=True, httponly=True, samesite='Lax') + + response2 = flask.Response() + var = "hello" +""", + """\ +--- ++++ +@@ -7,4 +7,4 @@ + + response2 = flask.Response() + var = "hello" +-response2.set_cookie("name", "value") ++response2.set_cookie("name", "value", secure=True, httponly=True, samesite='Lax') +""", + """\ +--- ++++ +@@ -3,7 +3,7 @@ + + response = flask.make_response() + var = "hello" +-response.set_cookie("name", "value") ++response.set_cookie("name", "value", secure=True, httponly=True, samesite='Lax') + + response2 = flask.Response() + var = "hello" +""", + """\ +--- ++++ +@@ -7,4 +7,4 @@ + + response2 = flask.Response() + var = "hello" +-response2.set_cookie("name", "value") ++response2.set_cookie("name", "value", secure=True, httponly=True, samesite='Lax') +""", + ] + issues = { "hotspots": [ { @@ -83,5 +132,10 @@ def test_simple(self, tmpdir): ], } self.run_and_assert( - tmpdir, input_code, expected, results=json.dumps(issues), num_changes=2 + tmpdir, + input_code, + expected, + expected_diff_per_change, + results=json.dumps(issues), + num_changes=4, ) diff --git a/tests/codemods/sonar/test_sonar_secure_random.py b/tests/codemods/sonar/test_sonar_secure_random.py index 383c9e3a..d4499c39 100644 --- a/tests/codemods/sonar/test_sonar_secure_random.py +++ b/tests/codemods/sonar/test_sonar_secure_random.py @@ -26,6 +26,48 @@ 
def test_simple(self, tmpdir): secrets.SystemRandom().randint(0, 9) secrets.SystemRandom().random() """ + expected_diff_per_change = [ + """\ +--- ++++ +@@ -1,6 +1,7 @@ + + import random ++import secrets + +-random.getrandbits(1) ++secrets.SystemRandom().getrandbits(1) + random.randint(0, 9) + random.random() +""", + """\ +--- ++++ +@@ -1,6 +1,7 @@ + + import random ++import secrets + + random.getrandbits(1) +-random.randint(0, 9) ++secrets.SystemRandom().randint(0, 9) + random.random() +""", + """\ +--- ++++ +@@ -1,6 +1,7 @@ + + import random ++import secrets + + random.getrandbits(1) + random.randint(0, 9) +-random.random() ++secrets.SystemRandom().random() +""", + ] + hotspots = { "hotspots": [ { @@ -67,6 +109,7 @@ def test_simple(self, tmpdir): tmpdir, input_code, expected_output, + expected_diff_per_change, results=json.dumps(hotspots), num_changes=3, ) diff --git a/tests/codemods/test_fix_hasattr_call.py b/tests/codemods/test_fix_hasattr_call.py index 5feb01a5..ff1c2161 100644 --- a/tests/codemods/test_fix_hasattr_call.py +++ b/tests/codemods/test_fix_hasattr_call.py @@ -37,7 +37,75 @@ class Test: if callable(obj): print(1) """ - self.run_and_assert(tmpdir, input_code, expected, num_changes=5) + expected_diff_per_change = [ + """\ +--- ++++ +@@ -2,7 +2,7 @@ + class Test: + pass + +-hasattr(Test(), "__call__") ++callable(Test()) + hasattr("hi", '__call__') + + assert hasattr(1, '__call__') +""", + """\ +--- ++++ +@@ -3,7 +3,7 @@ + pass + + hasattr(Test(), "__call__") +-hasattr("hi", '__call__') ++callable("hi") + + assert hasattr(1, '__call__') + obj = Test() +""", + """\ +--- ++++ +@@ -5,7 +5,7 @@ + hasattr(Test(), "__call__") + hasattr("hi", '__call__') + +-assert hasattr(1, '__call__') ++assert callable(1) + obj = Test() + var = hasattr(obj, "__call__") + +""", + """\ +--- ++++ +@@ -7,7 +7,7 @@ + + assert hasattr(1, '__call__') + obj = Test() +-var = hasattr(obj, "__call__") ++var = callable(obj) + + if hasattr(obj, "__call__"): + print(1) +""", + """\ +--- ++++ +@@ -9,5 +9,5 @@ + obj = Test() + var = hasattr(obj, "__call__") + +-if hasattr(obj, "__call__"): ++if callable(obj): + print(1) +""", + ] + + self.run_and_assert( + tmpdir, input_code, expected, expected_diff_per_change, num_changes=5 + ) def test_other_hasattr(self, tmpdir): code = """ diff --git a/tests/codemods/test_secure_random.py b/tests/codemods/test_secure_random.py index 89bde2b8..37717eec 100644 --- a/tests/codemods/test_secure_random.py +++ b/tests/codemods/test_secure_random.py @@ -25,8 +25,38 @@ def test_import_random(self, tmpdir): secrets.SystemRandom().getrandbits(1) var = "hello" """ - - self.run_and_assert(tmpdir, input_code, expected_output, num_changes=2) + expected_diff_per_change = [ + """\ +--- ++++ +@@ -1,6 +1,7 @@ + + import random ++import secrets + +-random.random() ++secrets.SystemRandom().random() + random.getrandbits(1) + var = "hello" +""", + """\ +--- ++++ +@@ -1,6 +1,7 @@ + + import random ++import secrets + + random.random() +-random.getrandbits(1) ++secrets.SystemRandom().getrandbits(1) + var = "hello" +""", + ] + + self.run_and_assert( + tmpdir, input_code, expected_output, expected_diff_per_change, num_changes=2 + ) def test_from_random(self, tmpdir): input_code = """ @@ -109,7 +139,38 @@ def test_multiple_calls(self, tmpdir): secrets.SystemRandom().randint() var = "hello" """ - self.run_and_assert(tmpdir, input_code, expected_output, num_changes=2) + expected_diff_per_change = [ + """\ +--- ++++ +@@ -1,6 +1,7 @@ + + import random ++import secrets + +-random.random() 
++secrets.SystemRandom().random() + random.randint() + var = "hello" +""", + """\ +--- ++++ +@@ -1,6 +1,7 @@ + + import random ++import secrets + + random.random() +-random.randint() ++secrets.SystemRandom().randint() + var = "hello" +""", + ] + + self.run_and_assert( + tmpdir, input_code, expected_output, expected_diff_per_change, num_changes=2 + ) @pytest.mark.parametrize( "input_code,expected_output", @@ -217,8 +278,51 @@ def test_sampling(self, tmpdir): secrets.choice(["a", "b"]) secrets.SystemRandom().choices(["a", "b"]) """ - - self.run_and_assert(tmpdir, input_code, expected_output, num_changes=3) + expected_diff_per_change = [ + """\ +--- ++++ +@@ -1,6 +1,7 @@ + + import random ++import secrets + +-random.sample(["a", "b"], 1) ++secrets.SystemRandom().sample(["a", "b"], 1) + random.choice(["a", "b"]) + random.choices(["a", "b"]) +""", + """\ +--- ++++ +@@ -1,6 +1,7 @@ + + import random ++import secrets + + random.sample(["a", "b"], 1) +-random.choice(["a", "b"]) ++secrets.choice(["a", "b"]) + random.choices(["a", "b"]) +""", + """\ +--- ++++ +@@ -1,6 +1,7 @@ + + import random ++import secrets + + random.sample(["a", "b"], 1) + random.choice(["a", "b"]) +-random.choices(["a", "b"]) ++secrets.SystemRandom().choices(["a", "b"]) +""", + ] + + self.run_and_assert( + tmpdir, input_code, expected_output, expected_diff_per_change, num_changes=3 + ) def test_from_import_choice(self, tmpdir): input_code = """ From 141cde2c5ca979b5fd33161ce6d808a7d0937c4a Mon Sep 17 00:00:00 2001 From: andrecs <12188364+andrecsilva@users.noreply.github.com> Date: Fri, 14 Mar 2025 10:27:51 -0300 Subject: [PATCH 06/27] Fixed more unit tests --- src/codemodder/codemods/test/utils.py | 27 ++++++-- .../semgrep/test_semgrep_nan_injection.py | 69 +++++++++++++++++++ .../test_sonar_django_receiver_on_top.py | 4 +- .../sonar/test_sonar_fix_assert_tuple.py | 6 +- .../test_sonar_timezone_aware_datetime.py | 33 ++++++++- 5 files changed, 125 insertions(+), 14 deletions(-) diff --git a/src/codemodder/codemods/test/utils.py b/src/codemodder/codemods/test/utils.py index 2c56798d..030a8620 100644 --- a/src/codemodder/codemods/test/utils.py +++ b/src/codemodder/codemods/test/utils.py @@ -94,7 +94,9 @@ def run_and_assert( assert not changes return - self.assert_num_changes(changes, num_changes, min_num_changes) + self.assert_num_changes( + changes, num_changes, expected_diff_per_change, min_num_changes + ) self.assert_changes( tmpdir, @@ -106,16 +108,25 @@ def run_and_assert( changes, ) - def assert_num_changes(self, changes, expected_num_changes, min_num_changes): + def assert_num_changes( + self, changes, expected_num_changes, expected_diff_per_change, min_num_changes + ): print("expected_diff_per_change = [") for c in changes: print('"""\\') - print(c.diff.replace("\t", " "), end="") + diff_lines = c.diff.replace("\t", " ").splitlines() + for line in diff_lines: + print(line) print('""",') print("]") - assert len(changes) == expected_num_changes + if expected_diff_per_change: + assert len(changes) == expected_num_changes + actual_num = len(changes) + else: + assert len(changes[0].changes) == expected_num_changes + actual_num = len(changes[0].changes) - actual_num = len(changes) + # actual_num = len(changes) if min_num_changes is not None: assert ( @@ -142,7 +153,7 @@ def assert_changes( assert all(c.description for change in changes for c in change.changes) # assert each change individually - if num_changes > 1: + if expected_diff_per_change and num_changes > 1: assert num_changes == len(expected_diff_per_change) for 
change, diff in zip(changes, expected_diff_per_change): print(change.diff) @@ -248,7 +259,9 @@ def run_and_assert( assert not changes return - self.assert_num_changes(changes, num_changes, min_num_changes) + self.assert_num_changes( + changes, num_changes, expected_diff_per_change, min_num_changes + ) self.assert_findings(changes) diff --git a/tests/codemods/semgrep/test_semgrep_nan_injection.py b/tests/codemods/semgrep/test_semgrep_nan_injection.py index f2e1c670..1ab02f28 100644 --- a/tests/codemods/semgrep/test_semgrep_nan_injection.py +++ b/tests/codemods/semgrep/test_semgrep_nan_injection.py @@ -66,6 +66,7 @@ def home(request): tmpdir, input_code, expected_output, + num_changes=4, results=json.dumps(results), ) @@ -108,6 +109,68 @@ def view(request): else: return [1, 2, float(tid), 3] """ + expected_diff_per_change = [ + """\ +--- ++++ +@@ -2,7 +2,10 @@ + tid = request.POST.get("tid") + some_list = [1, 2, 3, float('nan')] + +- float(tid) in some_list ++ if tid.lower() == "nan": ++ raise ValueError ++ else: ++ float(tid) in some_list + + z = [1, 2, complex(tid), 3] + +""", + """\ +--- ++++ +@@ -4,7 +4,10 @@ + + float(tid) in some_list + +- z = [1, 2, complex(tid), 3] ++ if tid.lower() == "nan": ++ raise ValueError ++ else: ++ z = [1, 2, complex(tid), 3] + + x = [float(tid), 1.0, 2.0] + +""", + """\ +--- ++++ +@@ -6,6 +6,9 @@ + + z = [1, 2, complex(tid), 3] + +- x = [float(tid), 1.0, 2.0] ++ if tid.lower() == "nan": ++ raise ValueError ++ else: ++ x = [float(tid), 1.0, 2.0] + + return [1, 2, float(tid), 3] +""", + """\ +--- ++++ +@@ -8,4 +8,7 @@ + + x = [float(tid), 1.0, 2.0] + +- return [1, 2, float(tid), 3] ++ if tid.lower() == "nan": ++ raise ValueError ++ else: ++ return [1, 2, float(tid), 3] +""", + ] results = { "runs": [ @@ -226,6 +289,8 @@ def view(request): tmpdir, input_code, expected_output, + expected_diff_per_change, + num_changes=4, results=json.dumps(results), ) @@ -284,6 +349,7 @@ def view(request): tmpdir, input_code, expected_output, + num_changes=4, results=json.dumps(results), ) @@ -341,6 +407,7 @@ def view(request): tmpdir, input_code, expected_output, + num_changes=4, results=json.dumps(results), ) @@ -396,6 +463,7 @@ def view(request): tmpdir, input_code, expected_output, + num_changes=4, results=json.dumps(results), ) @@ -453,6 +521,7 @@ def view(request): tmpdir, input_code, expected_output, + num_changes=4, results=json.dumps(results), ) diff --git a/tests/codemods/sonar/test_sonar_django_receiver_on_top.py b/tests/codemods/sonar/test_sonar_django_receiver_on_top.py index 77d2c013..0ec3513a 100644 --- a/tests/codemods/sonar/test_sonar_django_receiver_on_top.py +++ b/tests/codemods/sonar/test_sonar_django_receiver_on_top.py @@ -13,8 +13,8 @@ def test_name(self): def assert_findings(self, changes): # For now we can only link the finding to the line with the receiver decorator - assert changes[0].fixedFindings - assert not changes[1].fixedFindings + assert changes[0].changes[0].fixedFindings + assert not changes[0].changes[1].fixedFindings def test_simple(self, tmpdir): input_code = """ diff --git a/tests/codemods/sonar/test_sonar_fix_assert_tuple.py b/tests/codemods/sonar/test_sonar_fix_assert_tuple.py index 573634cc..a31903bd 100644 --- a/tests/codemods/sonar/test_sonar_fix_assert_tuple.py +++ b/tests/codemods/sonar/test_sonar_fix_assert_tuple.py @@ -13,9 +13,9 @@ def test_name(self): def assert_findings(self, changes): # For now we can only link the finding to the first line changed - assert changes[0].fixedFindings - assert not changes[1].fixedFindings - 
assert not changes[2].fixedFindings + assert changes[0].changes[0].fixedFindings + assert not changes[0].changes[1].fixedFindings + assert not changes[0].changes[2].fixedFindings def test_simple(self, tmpdir): input_code = """ diff --git a/tests/codemods/sonar/test_sonar_timezone_aware_datetime.py b/tests/codemods/sonar/test_sonar_timezone_aware_datetime.py index f93e4ed7..8c679e88 100644 --- a/tests/codemods/sonar/test_sonar_timezone_aware_datetime.py +++ b/tests/codemods/sonar/test_sonar_timezone_aware_datetime.py @@ -4,7 +4,7 @@ from core_codemods.sonar.sonar_timezone_aware_datetime import SonarTimezoneAwareDatetime -class TestSonarSQLParameterization(BaseSASTCodemodTest): +class TestSonarTimezoneAwareDatetime(BaseSASTCodemodTest): codemod = SonarTimezoneAwareDatetime tool = "sonar" @@ -26,6 +26,30 @@ def test_simple(self, tmpdir): timestamp = 1571595618.0 datetime.datetime.fromtimestamp(timestamp, tz=datetime.timezone.utc) """ + expected_diff_per_change = [ + """\ +--- ++++ +@@ -1,5 +1,5 @@ + import datetime + +-datetime.datetime.utcnow() ++datetime.datetime.now(tz=datetime.timezone.utc) + timestamp = 1571595618.0 + datetime.datetime.utcfromtimestamp(timestamp) +""", + """\ +--- ++++ +@@ -2,4 +2,4 @@ + + datetime.datetime.utcnow() + timestamp = 1571595618.0 +-datetime.datetime.utcfromtimestamp(timestamp) ++datetime.datetime.fromtimestamp(timestamp, tz=datetime.timezone.utc) +""", + ] + issues = { "issues": [ { @@ -60,5 +84,10 @@ def test_simple(self, tmpdir): ] } self.run_and_assert( - tmpdir, input_code, expected, results=json.dumps(issues), num_changes=2 + tmpdir, + input_code, + expected, + expected_diff_per_change, + results=json.dumps(issues), + num_changes=2, ) From 1aa72fdaf5b5e25fe37003862351eba2f75c5c46 Mon Sep 17 00:00:00 2001 From: andrecs <12188364+andrecsilva@users.noreply.github.com> Date: Mon, 24 Mar 2025 08:40:40 -0300 Subject: [PATCH 07/27] Added hardening script --- pyproject.toml | 1 + src/codemodder/codemodder.py | 27 +++++++++++--- src/codemodder/codemods/base_codemod.py | 48 +++++++++++++++---------- src/core_codemods/defectdojo/api.py | 2 ++ 4 files changed, 55 insertions(+), 23 deletions(-) diff --git a/pyproject.toml b/pyproject.toml index 091b5d98..a788e8dd 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -46,6 +46,7 @@ Repository = "https://github.com/pixee/codemodder-python" [project.scripts] codemodder = "codemodder.codemodder:main" +codemodder_hardening = "codemodder.codemodder:harden" generate-docs = 'codemodder.scripts.generate_docs:main' get-hashes = 'codemodder.scripts.get_hashes:main' diff --git a/src/codemodder/codemodder.py b/src/codemodder/codemodder.py index 821c6bef..bd266a7d 100644 --- a/src/codemodder/codemodder.py +++ b/src/codemodder/codemodder.py @@ -73,6 +73,7 @@ def log_report(context, output, elapsed_ms, files_to_analyze, token_usage): def apply_codemods( context: CodemodExecutionContext, codemods_to_run: Sequence[BaseCodemod], + hardening: bool, ) -> TokenUsage: log_section("scanning") token_usage = TokenUsage() @@ -89,7 +90,7 @@ def apply_codemods( for codemod in codemods_to_run: # NOTE: this may be used as a progress indicator by upstream tools logger.info("running codemod %s", codemod.id) - if codemod_token_usage := codemod.apply(context): + if codemod_token_usage := codemod.apply(context, hardening): log_token_usage(f"Codemod {codemod.id}", codemod_token_usage) token_usage += codemod_token_usage @@ -135,6 +136,7 @@ def run( sast_only: bool = False, ai_client: bool = True, log_matched_files: bool = False, + hardening: bool = False, 
) -> tuple[CodeTF | None, int, TokenUsage]: start = datetime.datetime.now() @@ -206,7 +208,7 @@ def run( context.find_and_fix_paths, ) - token_usage = apply_codemods(context, codemods_to_run) + token_usage = apply_codemods(context, codemods_to_run, hardening) elapsed = datetime.datetime.now() - start elapsed_ms = int(elapsed.total_seconds() * 1000) @@ -231,7 +233,7 @@ def run( return codetf, 0, token_usage -def _run_cli(original_args) -> int: +def _run_cli(original_args, hardening=False) -> int: codemod_registry = registry.load_registered_codemods() argv = parse_args(original_args, codemod_registry) if not os.path.exists(argv.directory): @@ -270,7 +272,8 @@ def _run_cli(original_args) -> int: _, status, _ = run( argv.directory, - argv.dry_run, + # Force dry-run if not hardening + argv.dry_run if hardening else True, argv.output, argv.output_format, argv.verbose, @@ -284,10 +287,26 @@ def _run_cli(original_args) -> int: codemod_registry=codemod_registry, sast_only=argv.sonar_issues_json or argv.sarif, log_matched_files=True, + hardening=hardening, ) return status +""" +Hardens a project. The application will write all the fixes into the files. +""" + + +def harden(): + sys_argv = sys.argv[1:] + sys.exit(_run_cli(sys_argv, True)) + + +""" +Remediates a project. The application will suggest fix for each separate issue found. No files will be written. +""" + + def main(): sys_argv = sys.argv[1:] sys.exit(_run_cli(sys_argv)) diff --git a/src/codemodder/codemods/base_codemod.py b/src/codemodder/codemods/base_codemod.py index b1633082..1c0c2e89 100644 --- a/src/codemodder/codemods/base_codemod.py +++ b/src/codemodder/codemods/base_codemod.py @@ -189,6 +189,7 @@ def _apply( self, context: CodemodExecutionContext, rules: list[str], + hardening: bool, ) -> None | TokenUsage: if self.provider and ( not (provider := context.providers.get_provider(self.provider)) @@ -226,21 +227,26 @@ def _apply( logger.debug("No files matched for %s", self.id) return None - # Do each result independently - if results: + # Do each result independently and outputs the diffs + if not hardening: # gather positional arguments for the map - resultset_arguments = [] + resultset_arguments: list[ResultSet | None] = [] path_arguments = [] - for result in results.results_for_rules(rules): - # this need to be the same type of ResultSet as results - singleton = results.__class__() - singleton.add_result(result) - result_locations = self.get_files_to_analyze(context, singleton) - # We do an execution for each location in the result - # So we duplicate the resultset argument for each location - for loc in result_locations: - resultset_arguments.append(singleton) - path_arguments.append(loc) + if results: + for result in results.results_for_rules(rules): + # this need to be the same type of ResultSet as results + singleton = results.__class__() + singleton.add_result(result) + result_locations = self.get_files_to_analyze(context, singleton) + # We do an execution for each location in the result + # So we duplicate the resultset argument for each location + for loc in result_locations: + resultset_arguments.append(singleton) + path_arguments.append(loc) + # An exception for find-and-fix codemods + else: + resultset_arguments = [None] + path_arguments = files_to_analyze contexts: list = [] with ThreadPoolExecutor() as executor: @@ -251,13 +257,13 @@ def _apply( path, context, resultset, rules ), path_arguments, - resultset_arguments, + resultset_arguments or [None], ) ) executor.shutdown(wait=True) context.process_results(self.id, 
contexts) - # for find and fix codemods + # Hardens all findings per file at once and writes the fixed code into the file else: process_file = functools.partial( self._process_file, context=context, results=results, rules=rules @@ -276,7 +282,9 @@ def _apply( context.process_results(self.id, contexts) return None - def apply(self, context: CodemodExecutionContext) -> None | TokenUsage: + def apply( + self, context: CodemodExecutionContext, hardening: bool = False + ) -> None | TokenUsage: """ Apply the codemod with the given codemod execution context @@ -292,7 +300,7 @@ def apply(self, context: CodemodExecutionContext) -> None | TokenUsage: :param context: The codemod execution context """ - return self._apply(context, [self._internal_name]) + return self._apply(context, [self._internal_name], hardening) def _process_file( self, @@ -390,8 +398,10 @@ def __init__( if requested_rules: self.requested_rules.extend(requested_rules) - def apply(self, context: CodemodExecutionContext) -> None | TokenUsage: - return self._apply(context, self.requested_rules) + def apply( + self, context: CodemodExecutionContext, hardening: bool = False + ) -> None | TokenUsage: + return self._apply(context, self.requested_rules, hardening) def get_files_to_analyze( self, diff --git a/src/core_codemods/defectdojo/api.py b/src/core_codemods/defectdojo/api.py index abc7bbdd..c024149c 100644 --- a/src/core_codemods/defectdojo/api.py +++ b/src/core_codemods/defectdojo/api.py @@ -76,9 +76,11 @@ def from_core_codemod( def apply( self, context: CodemodExecutionContext, + hardening: bool = False, ) -> None: self._apply( context, # We know this has a tool because we created it with `from_core_codemod` cast(ToolMetadata, self._metadata.tool).rule_ids, + hardening, ) From a8e59a2e1aa04458ca89bedbb38d81cb351bb624 Mon Sep 17 00:00:00 2001 From: andrecs <12188364+andrecsilva@users.noreply.github.com> Date: Thu, 20 Mar 2025 09:16:03 -0300 Subject: [PATCH 08/27] Added integration tests for new behavior --- .../sonar/test_sonar_jwt_decode_verify.py | 20 +- pyproject.toml | 1 + .../codemods/test/integration_utils.py | 311 +++++++++++++++++- 3 files changed, 315 insertions(+), 17 deletions(-) diff --git a/integration_tests/sonar/test_sonar_jwt_decode_verify.py b/integration_tests/sonar/test_sonar_jwt_decode_verify.py index f8c17f16..97be4f79 100644 --- a/integration_tests/sonar/test_sonar_jwt_decode_verify.py +++ b/integration_tests/sonar/test_sonar_jwt_decode_verify.py @@ -1,25 +1,19 @@ -from codemodder.codemods.test import SonarIntegrationTest +from codemodder.codemods.test.integration_utils import SonarRemediationIntegrationTest from core_codemods.sonar.sonar_jwt_decode_verify import ( JwtDecodeVerifySASTTransformer, SonarJwtDecodeVerify, ) -class TestJwtDecodeVerify(SonarIntegrationTest): +class TestJwtDecodeVerify(SonarRemediationIntegrationTest): codemod = SonarJwtDecodeVerify code_path = "tests/samples/jwt_decode_verify.py" - replacement_lines = [ - ( - 11, - """decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], verify=True)\n""", - ), - ( - 12, - """decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], options={"verify_signature": True})\n""", - ), + + expected_diff_per_change = [ + '--- \n+++ \n@@ -8,7 +8,7 @@\n \n encoded_jwt = jwt.encode(payload, SECRET_KEY, algorithm="HS256")\n \n-decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], verify=False)\n+decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], verify=True)\n decoded_payload 
= jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], options={"verify_signature": False})\n \n var = "something"\n', + '--- \n+++ \n@@ -9,6 +9,6 @@\n encoded_jwt = jwt.encode(payload, SECRET_KEY, algorithm="HS256")\n \n decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], verify=False)\n-decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], options={"verify_signature": False})\n+decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], options={"verify_signature": True})\n \n var = "something"\n', ] - expected_diff = '--- \n+++ \n@@ -8,7 +8,7 @@\n \n encoded_jwt = jwt.encode(payload, SECRET_KEY, algorithm="HS256")\n \n-decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], verify=False)\n-decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], options={"verify_signature": False})\n+decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], verify=True)\n+decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], options={"verify_signature": True})\n \n var = "something"\n' - expected_line_change = "11" + expected_lines_changed = [11, 12] num_changes = 2 change_description = JwtDecodeVerifySASTTransformer.change_description diff --git a/pyproject.toml b/pyproject.toml index a788e8dd..6b226aa7 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -82,6 +82,7 @@ test = [ "flask_wtf~=1.2.0", "fickling~=0.1.0,>=0.1.3", "graphql-server~=3.0.0b7", + "unidiff>=0.75", ] complexity = [ "radon==6.0.*", diff --git a/src/codemodder/codemods/test/integration_utils.py b/src/codemodder/codemods/test/integration_utils.py index 40da6299..2f062d83 100644 --- a/src/codemodder/codemods/test/integration_utils.py +++ b/src/codemodder/codemods/test/integration_utils.py @@ -9,6 +9,7 @@ from types import ModuleType import jsonschema +import unidiff from codemodder import __version__ from core_codemods.sonar.api import process_sonar_findings @@ -35,6 +36,252 @@ def check_dependencies_after(self): assert new_requirements_txt == self.expected_requirements +class BaseRemediationIntegrationTest: + codemod = NotImplementedError + original_code = NotImplementedError + expected_diff_per_change = NotImplementedError + num_changes = 1 + num_changed_files = 1 + allowed_exceptions = () + sonar_issues_json: str | None = None + sonar_hotspots_json: str | None = None + + @classmethod + def setup_class(cls): + codemod_id = ( + cls.codemod().id if isinstance(cls.codemod, type) else cls.codemod.id + ) + cls.codemod_instance = validate_codemod_registration(codemod_id) + + cls.output_path = tempfile.mkstemp()[1] + cls.code_dir = tempfile.mkdtemp() + + if not hasattr(cls, "code_filename"): + # Only a few codemods require the analyzed file to have a specific filename + # All others can just be `code.py` + cls.code_filename = "code.py" + + cls.code_path = os.path.join(cls.code_dir, cls.code_filename) + + if cls.code_filename == "settings.py" and "Django" in str(cls): + # manage.py must be in the directory above settings.py for this codemod to run + parent_dir = Path(cls.code_dir).parent + manage_py_path = parent_dir / "manage.py" + manage_py_path.touch() + + @classmethod + def teardown_class(cls): + """Ensure any re-written file is undone after integration test class""" + pass + + def _assert_run_fields(self, run, output_path): + assert run["vendor"] == "pixee" + assert run["tool"] == "codemodder-python" + assert run["version"] == __version__ + assert run["elapsed"] != "" + assert run[ + 
"commandLine" + ] == f'codemodder {self.code_dir} --output {output_path} --codemod-include={self.codemod_instance.id} --path-include={self.code_filename} --path-exclude=""' + ( + f" --sonar-issues-json={self.sonar_issues_json}" + if self.sonar_issues_json + else "" + ) + ( + f" --sonar-hotspots-json={self.sonar_hotspots_json}" + if self.sonar_hotspots_json + else "" + ) + assert run["directory"] == os.path.abspath(self.code_dir) + assert run["sarifs"] == [] + + def _assert_results_fields(self, results, output_path): + assert len(results) == 1 + result = results[0] + assert result["codemod"] == self.codemod_instance.id + assert result["references"] == [ + ref.model_dump(exclude_none=True) + for ref in self.codemod_instance.references + ] + + assert ("detectionTool" in result) == bool(self.sonar_issues_json) + assert ("detectionTool" in result) == bool(self.sonar_hotspots_json) + + # TODO: if/when we add description for each url + for reference in result["references"][ + # Last references for Sonar has a different description + : ( + -len(self.codemod.requested_rules) + if self.sonar_issues_json or self.sonar_hotspots_json + else None + ) + ]: + assert reference["url"] == reference["description"] + + self._assert_sonar_fields(result) + + # There should be a changeset for every expected change + assert len(result["changeset"]) == self.num_changes + # gather all the change files and test against the expected number + assert len({c["path"] for c in result["changeset"]}) == self.num_changed_files + + # A codemod may change multiple files. For now we will + # assert the resulting data for one file only. + changes = [ + result for result in result["changeset"] if result["path"] == output_path + ] + assert {c["path"] for c in changes} == {output_path} + + changes_diff = [c["diff"] for c in changes] + print(changes_diff) + assert changes_diff == self.expected_diff_per_change + + assert len(changes) == self.num_changes + lines_changed = [c["changes"][0]["lineNumber"] for c in changes] + assert lines_changed == self.expected_lines_changed + assert {c["changes"][0]["description"] for c in changes} == { + self.change_description + } + + def _assert_sonar_fields(self, result): + del result + + def _assert_codetf_output(self, codetf_schema): + with open(self.output_path, "r", encoding="utf-8") as f: + codetf = json.load(f) + + jsonschema.validate(codetf, codetf_schema) + + assert sorted(codetf.keys()) == ["results", "run"] + run = codetf["run"] + self._assert_run_fields(run, self.output_path) + results = codetf["results"] + # CodeTf2 spec requires relative paths + self._assert_results_fields(results, self.code_filename) + + def test_codetf_output(self, codetf_schema): + """ + Tests correct codetf output. + """ + command = [ + "codemodder", + self.code_dir, + "--output", + self.output_path, + f"--codemod-include={self.codemod_instance.id}", + f"--path-include={self.code_filename}", + '--path-exclude=""', + ] + + if self.sonar_issues_json: + command.append(f"--sonar-issues-json={self.sonar_issues_json}") + if self.sonar_hotspots_json: + command.append(f"--sonar-hotspots-json={self.sonar_hotspots_json}") + + completed_process = subprocess.run( + command, + check=False, + shell=False, + ) + assert completed_process.returncode == 0 + + self._assert_codetf_output(codetf_schema) + patched_codes = self._get_patched_code_for_each_change() + self._check_code_after(patched_codes) + + def apply_hunk_to_lines(self, lines, hunk): + # The hunk target line numbers are 1-indexed. 
+ start_index = hunk.target_start - 1 + new_lines = lines[:start_index] + orig_index = start_index + + for hunk_line in hunk: + if hunk_line.is_context: + # For a context line, check that content matches. + if orig_index >= len(lines): + raise ValueError( + "Context line beyond available lines: " + hunk_line.value + ) + if lines[orig_index].rstrip("\n") != hunk_line.value.rstrip("\n"): + raise ValueError( + "Context line mismatch:\nExpected: " + + lines[orig_index] + + "\nGot: " + + hunk_line.value + ) + new_lines.append(lines[orig_index]) + orig_index += 1 + elif hunk_line.is_removed: + # Expect the original line to match, but then skip it. + if orig_index >= len(lines): + raise ValueError( + "Removal line beyond available lines: " + hunk_line.value + ) + if lines[orig_index].rstrip("\n") != hunk_line.value.rstrip("\n"): + raise ValueError( + "Removal line mismatch:\nExpected: " + + lines[orig_index] + + "\nGot: " + + hunk_line.value + ) + orig_index += 1 + elif hunk_line.is_added: + # For an added line, insert the new content. + new_lines.append(hunk_line.value) + # Append any remaining lines after the hunk. + new_lines.extend(lines[orig_index:]) + return new_lines + + def apply_diff(self, diff_str, original_str): + # unidiff expect the hunk header to have a filename, append it + diff_lines = diff_str.splitlines() + patched_diff = [] + for line in diff_lines: + if line.startswith("+++") or line.startswith("---"): + line = line + " " + self.code_filename + patched_diff.append(line) + fixed_diff_str = "\n".join(patched_diff) + + patch_set = unidiff.PatchSet(fixed_diff_str) + + # Make a list of lines from the original string. + # Assumes original_str uses newline characters. + patched_lines = original_str.splitlines(keepends=True) + + # For simplicity, assume the diff only contains modifications for one file. + if len(patch_set) != 1: + raise ValueError("Only single-file patches are supported in this example.") + + file_patch = list(patch_set)[0] + # Process each hunk from the patch sequentially. + for hunk in file_patch: + try: + patched_lines = self.apply_hunk_to_lines(patched_lines, hunk) + except ValueError as e: + print("Error applying hunk:", e) + sys.exit(1) + + return "".join(patched_lines) + + def _get_patched_code_for_each_change(self) -> list[str]: + with open(self.output_path, "r", encoding="utf-8") as f: + codetf = json.load(f) + changes = codetf["results"][0]["changeset"] + patched_codes = [] + with open(self.code_path, "r", encoding="utf-8") as f: # type: ignore + original_code = f.read() + for c in changes: + patched_codes.append(self.apply_diff(c["diff"], original_code)) + return patched_codes + + def _check_code_after(self, patched_codes): + """ + Check if each change will produce executable code. 
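+        Each patched variant is passed to execute_code; exceptions outside allowed_exceptions fail the check.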
+ """ + for patched_code in patched_codes: + execute_code( + code=patched_code, allowed_exceptions=self.allowed_exceptions # type: ignore + ) + + class BaseIntegrationTest(DependencyTestMixin): codemod = NotImplementedError original_code = NotImplementedError @@ -166,10 +413,6 @@ def _assert_codetf_output(self, codetf_schema): # CodeTf2 spec requires relative paths self._assert_results_fields(results, self.code_filename) - def write_original_code(self): - with open(self.code_path, "w", encoding="utf-8") as f: - f.write(self.original_code) - def check_code_after(self) -> ModuleType: with open(self.code_path, "r", encoding="utf-8") as f: # type: ignore new_code = f.read() @@ -178,6 +421,10 @@ def check_code_after(self) -> ModuleType: path=self.code_path, allowed_exceptions=self.allowed_exceptions # type: ignore ) + def write_original_code(self): + with open(self.code_path, "w", encoding="utf-8") as f: + f.write(self.original_code) + def test_file_rewritten(self, codetf_schema): """ Tests that file is re-written correctly with new code and correct codetf output. @@ -238,6 +485,62 @@ def _run_idempotency_check(self, command): sys.path.append(SAMPLES_DIR) +class SonarRemediationIntegrationTest(BaseRemediationIntegrationTest): + """ + Sonar integration tests must use code from a file in tests/samples + because those files are what appears in sonar_issues.json + """ + + code_path = NotImplementedError + sonar_issues_json = "tests/samples/sonar_issues.json" + sonar_hotspots_json = "tests/samples/sonar_hotspots.json" + + @classmethod + def setup_class(cls): + codemod_id = ( + cls.codemod().id if isinstance(cls.codemod, type) else cls.codemod.id + ) + cls.codemod_instance = validate_codemod_registration(codemod_id) + + cls.output_path = tempfile.mkstemp()[1] + cls.code_dir = SAMPLES_DIR + cls.code_filename = os.path.relpath(cls.code_path, SAMPLES_DIR) + + # TODO: support sonar integration tests that add a dependency to + # `requirements_file_name`. These tests would not be able to run + # in parallel at this time since they would all override the same + # tests/samples/requirements.txt file, unless we change that to + # a temporary file. 
+        cls.check_sonar_issues()
+
+    @classmethod
+    def check_sonar_issues(cls):
+        sonar_results = process_sonar_findings(
+            (cls.sonar_issues_json, cls.sonar_hotspots_json)
+        )
+
+        assert any(
+            x in sonar_results for x in cls.codemod.requested_rules
+        ), f"Make sure to add a sonar issue/hotspot for {cls.codemod.rule_id} in {cls.sonar_issues_json} or {cls.sonar_hotspots_json}"
+        results_for_codemod = sonar_results[cls.codemod.requested_rules[-1]]
+        file_path = pathlib.Path(cls.code_filename)
+        assert (
+            file_path in results_for_codemod
+        ), f"Make sure to add a sonar issue/hotspot for file `{cls.code_filename}` under one of the rules `{cls.codemod.requested_rules}` in {cls.sonar_issues_json} or {cls.sonar_hotspots_json}"
+
+    def _assert_sonar_fields(self, result):
+        assert self.codemod_instance._metadata.tool is not None
+        rules = self.codemod_instance._metadata.tool.rules
+        for i in range(len(rules)):
+            assert (
+                result["references"][len(result["references"]) - len(rules) + i][
+                    "description"
+                ]
+                == self.codemod_instance._metadata.tool.rules[i].name
+            )
+        assert result["detectionTool"]["name"] == "Sonar"
+
+
 class SonarIntegrationTest(BaseIntegrationTest):
     """
     Sonar integration tests must use code from a file in tests/samples

From 64aef85dab88438b7249b5e2ee03bada88fc0b42 Mon Sep 17 00:00:00 2001
From: andrecs <12188364+andrecsilva@users.noreply.github.com>
Date: Fri, 21 Mar 2025 07:53:46 -0300
Subject: [PATCH 09/27] Added file rewritten check

---
 src/codemodder/codemods/test/integration_utils.py | 14 +++++++++-----
 1 file changed, 9 insertions(+), 5 deletions(-)

diff --git a/src/codemodder/codemods/test/integration_utils.py b/src/codemodder/codemods/test/integration_utils.py
index 2f062d83..12019959 100644
--- a/src/codemodder/codemods/test/integration_utils.py
+++ b/src/codemodder/codemods/test/integration_utils.py
@@ -69,11 +69,6 @@ def setup_class(cls):
             manage_py_path = parent_dir / "manage.py"
             manage_py_path.touch()
 
-    @classmethod
-    def teardown_class(cls):
-        """Ensure any re-written file is undone after integration test class"""
-        pass
-
     def _assert_run_fields(self, run, output_path):
         assert run["vendor"] == "pixee"
         assert run["tool"] == "codemodder-python"
@@ -161,6 +156,10 @@ def test_codetf_output(self, codetf_schema):
         """
         Tests correct codetf output.
         """
+
+        with open(self.code_path, "r", encoding="utf-8") as f:  # type: ignore
+            original_code = f.read()
+
         command = [
             "codemodder",
             self.code_dir,
@@ -187,6 +186,11 @@ def test_codetf_output(self, codetf_schema):
         patched_codes = self._get_patched_code_for_each_change()
         self._check_code_after(patched_codes)
 
+        # check that the original file is not rewritten
+        with open(self.code_path, "r", encoding="utf-8") as f:
+            original_file_code = f.read()
+        assert original_file_code == original_code
+
     def apply_hunk_to_lines(self, lines, hunk):
         # The hunk target line numbers are 1-indexed.
start_index = hunk.target_start - 1 From 222e64979e6641467685bbeb1ef492a46f42e861 Mon Sep 17 00:00:00 2001 From: andrecs <12188364+andrecsilva@users.noreply.github.com> Date: Fri, 21 Mar 2025 09:11:39 -0300 Subject: [PATCH 10/27] Fixed some integration tests --- .../sonar/test_sonar_jinja2_autoescape.py | 14 ++++---- .../test_add_requests_timeout.py | 26 ++++---------- integration_tests/test_jwt_decode_verify.py | 20 ++++------- integration_tests/test_request_verify.py | 17 ++++------ .../codemods/test/integration_utils.py | 34 +++++++++++++++---- 5 files changed, 54 insertions(+), 57 deletions(-) diff --git a/integration_tests/sonar/test_sonar_jinja2_autoescape.py b/integration_tests/sonar/test_sonar_jinja2_autoescape.py index b96cbeec..41ae9458 100644 --- a/integration_tests/sonar/test_sonar_jinja2_autoescape.py +++ b/integration_tests/sonar/test_sonar_jinja2_autoescape.py @@ -1,18 +1,18 @@ -from codemodder.codemods.test import SonarIntegrationTest +from codemodder.codemods.test.integration_utils import SonarRemediationIntegrationTest from core_codemods.enable_jinja2_autoescape import EnableJinja2AutoescapeTransformer from core_codemods.sonar.sonar_enable_jinja2_autoescape import ( SonarEnableJinja2Autoescape, ) -class TestSonarEnableJinja2Autoescape(SonarIntegrationTest): +class TestSonarEnableJinja2Autoescape(SonarRemediationIntegrationTest): codemod = SonarEnableJinja2Autoescape code_path = "tests/samples/jinja2_autoescape.py" - replacement_lines = [ - (3, "env = Environment(autoescape=True)\n"), - (4, "env = Environment(autoescape=True)\n"), + expected_diff_per_change = [ + "--- \n+++ \n@@ -1,4 +1,4 @@\n from jinja2 import Environment\n \n-env = Environment()\n+env = Environment(autoescape=True)\n env = Environment(autoescape=False)\n", + "--- \n+++ \n@@ -1,4 +1,4 @@\n from jinja2 import Environment\n \n env = Environment()\n-env = Environment(autoescape=False)\n+env = Environment(autoescape=True)\n", ] - expected_diff = "--- \n+++ \n@@ -1,4 +1,4 @@\n from jinja2 import Environment\n \n-env = Environment()\n-env = Environment(autoescape=False)\n+env = Environment(autoescape=True)\n+env = Environment(autoescape=True)\n" - expected_line_change = "3" + + expected_lines_changed = [3, 4] num_changes = 2 change_description = EnableJinja2AutoescapeTransformer.change_description diff --git a/integration_tests/test_add_requests_timeout.py b/integration_tests/test_add_requests_timeout.py index 34eafbc5..70537292 100644 --- a/integration_tests/test_add_requests_timeout.py +++ b/integration_tests/test_add_requests_timeout.py @@ -1,13 +1,13 @@ from requests.exceptions import ConnectionError -from codemodder.codemods.test import BaseIntegrationTest +from codemodder.codemods.test.integration_utils import BaseRemediationIntegrationTest from core_codemods.add_requests_timeouts import ( AddRequestsTimeouts, TransformAddRequestsTimeouts, ) -class TestAddRequestsTimeouts(BaseIntegrationTest): +class TestAddRequestsTimeouts(BaseRemediationIntegrationTest): codemod = AddRequestsTimeouts original_code = """ import requests @@ -18,27 +18,13 @@ class TestAddRequestsTimeouts(BaseIntegrationTest): requests.post("https://example.com", verify=False) """ - replacement_lines = [ - (3, 'requests.get("https://example.com", timeout=60)\n'), - (6, 'requests.post("https://example.com", verify=False, timeout=60)\n'), + expected_diff_per_change = [ + '--- \n+++ \n@@ -1,6 +1,6 @@\n import requests\n \n-requests.get("https://example.com")\n+requests.get("https://example.com", timeout=60)\n 
requests.get("https://example.com", timeout=1)\n requests.get("https://example.com", timeout=(1, 10), verify=False)\n requests.post("https://example.com", verify=False)', + '--- \n+++ \n@@ -3,4 +3,4 @@\n requests.get("https://example.com")\n requests.get("https://example.com", timeout=1)\n requests.get("https://example.com", timeout=(1, 10), verify=False)\n-requests.post("https://example.com", verify=False)\n+requests.post("https://example.com", verify=False, timeout=60)', ] - expected_diff = """\ ---- -+++ -@@ -1,6 +1,6 @@ - import requests - --requests.get("https://example.com") -+requests.get("https://example.com", timeout=60) - requests.get("https://example.com", timeout=1) - requests.get("https://example.com", timeout=(1, 10), verify=False) --requests.post("https://example.com", verify=False) -+requests.post("https://example.com", verify=False, timeout=60) -""" - num_changes = 2 - expected_line_change = "3" + expected_lines_changed = [3, 6] change_description = TransformAddRequestsTimeouts.change_description # expected because requests are made allowed_exceptions = (ConnectionError,) diff --git a/integration_tests/test_jwt_decode_verify.py b/integration_tests/test_jwt_decode_verify.py index edbb4b39..3846324c 100644 --- a/integration_tests/test_jwt_decode_verify.py +++ b/integration_tests/test_jwt_decode_verify.py @@ -1,8 +1,8 @@ -from codemodder.codemods.test import BaseIntegrationTest +from codemodder.codemods.test.integration_utils import BaseRemediationIntegrationTest from core_codemods.jwt_decode_verify import JwtDecodeVerify, JwtDecodeVerifyTransformer -class TestJwtDecodeVerify(BaseIntegrationTest): +class TestJwtDecodeVerify(BaseRemediationIntegrationTest): codemod = JwtDecodeVerify original_code = """ import jwt @@ -20,17 +20,11 @@ class TestJwtDecodeVerify(BaseIntegrationTest): var = "something" """ - replacement_lines = [ - ( - 11, - """decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], verify=True)\n""", - ), - ( - 12, - """decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], options={"verify_signature": True})\n""", - ), + expected_diff_per_change = [ + '--- \n+++ \n@@ -8,7 +8,7 @@\n \n encoded_jwt = jwt.encode(payload, SECRET_KEY, algorithm="HS256")\n \n-decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], verify=False)\n+decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], verify=True)\n decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], options={"verify_signature": False})\n \n var = "something"', + '--- \n+++ \n@@ -9,6 +9,6 @@\n encoded_jwt = jwt.encode(payload, SECRET_KEY, algorithm="HS256")\n \n decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], verify=False)\n-decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], options={"verify_signature": False})\n+decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], options={"verify_signature": True})\n \n var = "something"', ] - expected_diff = '--- \n+++ \n@@ -8,7 +8,7 @@\n \n encoded_jwt = jwt.encode(payload, SECRET_KEY, algorithm="HS256")\n \n-decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], verify=False)\n-decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], options={"verify_signature": False})\n+decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], verify=True)\n+decoded_payload = jwt.decode(encoded_jwt, SECRET_KEY, algorithms=["HS256"], options={"verify_signature": 
True})\n \n var = "something"\n' - expected_line_change = "11" + + expected_lines_changed = [11, 12] num_changes = 2 change_description = JwtDecodeVerifyTransformer.change_description diff --git a/integration_tests/test_request_verify.py b/integration_tests/test_request_verify.py index c03a09d2..1a4fbfd6 100644 --- a/integration_tests/test_request_verify.py +++ b/integration_tests/test_request_verify.py @@ -1,10 +1,10 @@ from requests import exceptions -from codemodder.codemods.test import BaseIntegrationTest +from codemodder.codemods.test.integration_utils import BaseRemediationIntegrationTest from core_codemods.requests_verify import RequestsVerify -class TestRequestsVerify(BaseIntegrationTest): +class TestRequestsVerify(BaseRemediationIntegrationTest): codemod = RequestsVerify original_code = """ import requests @@ -14,15 +14,12 @@ class TestRequestsVerify(BaseIntegrationTest): var = "hello" """ - replacement_lines = [ - (3, """requests.get("https://www.google.com", verify=True)\n"""), - ( - 4, - """requests.post("https://some-api/", json={"id": 1234, "price": 18}, verify=True)\n""", - ), + expected_diff_per_change = [ + '--- \n+++ \n@@ -1,5 +1,5 @@\n import requests\n \n-requests.get("https://www.google.com", verify=False)\n+requests.get("https://www.google.com", verify=True)\n requests.post("https://some-api/", json={"id": 1234, "price": 18}, verify=False)\n var = "hello"', + '--- \n+++ \n@@ -1,5 +1,5 @@\n import requests\n \n requests.get("https://www.google.com", verify=False)\n-requests.post("https://some-api/", json={"id": 1234, "price": 18}, verify=False)\n+requests.post("https://some-api/", json={"id": 1234, "price": 18}, verify=True)\n var = "hello"', ] - expected_diff = '--- \n+++ \n@@ -1,5 +1,5 @@\n import requests\n \n-requests.get("https://www.google.com", verify=False)\n-requests.post("https://some-api/", json={"id": 1234, "price": 18}, verify=False)\n+requests.get("https://www.google.com", verify=True)\n+requests.post("https://some-api/", json={"id": 1234, "price": 18}, verify=True)\n var = "hello"\n' - expected_line_change = "3" + + expected_lines_changed = [3, 4] num_changes = 2 change_description = RequestsVerify.change_description # expected because when executing the output code it will make a request which fails, which is OK. diff --git a/src/codemodder/codemods/test/integration_utils.py b/src/codemodder/codemods/test/integration_utils.py index 12019959..607e4c64 100644 --- a/src/codemodder/codemods/test/integration_utils.py +++ b/src/codemodder/codemods/test/integration_utils.py @@ -69,6 +69,14 @@ def setup_class(cls): manage_py_path = parent_dir / "manage.py" manage_py_path.touch() + if cls.original_code is not NotImplementedError: + # Some tests are easier to understand with the expected new code provided + # instead of calculated + cls.original_code = dedent(cls.original_code).strip("\n") + else: + with open(cls.code_path, "r", encoding="utf-8") as f: # type: ignore + cls.original_code = f.read() + def _assert_run_fields(self, run, output_path): assert run["vendor"] == "pixee" assert run["tool"] == "codemodder-python" @@ -152,14 +160,15 @@ def _assert_codetf_output(self, codetf_schema): # CodeTf2 spec requires relative paths self._assert_results_fields(results, self.code_filename) + def write_original_code(self): + with open(self.code_path, "w", encoding="utf-8") as f: + f.write(self.original_code) + def test_codetf_output(self, codetf_schema): """ Tests correct codetf output. 
""" - with open(self.code_path, "r", encoding="utf-8") as f: # type: ignore - original_code = f.read() - command = [ "codemodder", self.code_dir, @@ -175,6 +184,8 @@ def test_codetf_output(self, codetf_schema): if self.sonar_hotspots_json: command.append(f"--sonar-hotspots-json={self.sonar_hotspots_json}") + self.write_original_code() + completed_process = subprocess.run( command, check=False, @@ -189,7 +200,7 @@ def test_codetf_output(self, codetf_schema): # check that the original file is not rewritten with open(self.code_path, "r", encoding="utf-8") as f: original_file_code = f.read() - assert original_file_code == original_code + assert original_file_code == self.original_code def apply_hunk_to_lines(self, lines, hunk): # The hunk target line numbers are 1-indexed. @@ -266,7 +277,7 @@ def apply_diff(self, diff_str, original_str): return "".join(patched_lines) def _get_patched_code_for_each_change(self) -> list[str]: - with open(self.output_path, "r", encoding="utf-8") as f: + with open(self.output_path, "r", encoding="utf-8") as f: # type: ignore codetf = json.load(f) changes = codetf["results"][0]["changeset"] patched_codes = [] @@ -349,7 +360,7 @@ def _assert_run_fields(self, run, output_path): assert run["elapsed"] != "" assert run[ "commandLine" - ] == f'codemodder {self.code_dir} --output {output_path} --codemod-include={self.codemod_instance.id} --path-include={self.code_filename} --path-exclude=""' + ( + ] == f'codemodder_hardening {self.code_dir} --output {output_path} --codemod-include={self.codemod_instance.id} --path-include={self.code_filename} --path-exclude=""' + ( f" --sonar-issues-json={self.sonar_issues_json}" if self.sonar_issues_json else "" @@ -438,7 +449,7 @@ def test_file_rewritten(self, codetf_schema): output files """ command = [ - "codemodder", + "codemodder_hardening", self.code_dir, "--output", self.output_path, @@ -510,6 +521,15 @@ def setup_class(cls): cls.code_dir = SAMPLES_DIR cls.code_filename = os.path.relpath(cls.code_path, SAMPLES_DIR) + if cls.original_code is not NotImplementedError: + # Some tests are easier to understand with the expected new code provided + # instead of calculated + cls.original_code = dedent(cls.original_code).strip("\n") + else: + with open(cls.code_path, "r", encoding="utf-8") as f: # type: ignore + cls.original_code = f.read() + print(cls.original_code) + # TODO: support sonar integration tests that add a dependency to # `requirements_file_name`. 
These tests would not be able to run # in parallel at this time since they would all override the same From 3df2907038ebeb4f54d168f5291149314f24ce19 Mon Sep 17 00:00:00 2001 From: andrecs <12188364+andrecsilva@users.noreply.github.com> Date: Mon, 24 Mar 2025 08:01:21 -0300 Subject: [PATCH 11/27] More integration tests converted --- .../test_sonar_fix_missing_self_or_cls.py | 35 ++++--------------- .../sonar/test_sonar_secure_cookie.py | 17 +++++---- .../sonar/test_sonar_secure_random.py | 27 ++++---------- integration_tests/test_harden_ruamel.py | 14 ++++---- integration_tests/test_jinja2_autoescape.py | 15 ++++---- integration_tests/test_lazy_logging.py | 24 ++++--------- integration_tests/test_lxml_safe_parsing.py | 19 ++++------ integration_tests/test_process_sandbox.py | 20 +++++------ .../codemods/test/integration_utils.py | 1 + 9 files changed, 59 insertions(+), 113 deletions(-) diff --git a/integration_tests/sonar/test_sonar_fix_missing_self_or_cls.py b/integration_tests/sonar/test_sonar_fix_missing_self_or_cls.py index 51f40080..8a799fa8 100644 --- a/integration_tests/sonar/test_sonar_fix_missing_self_or_cls.py +++ b/integration_tests/sonar/test_sonar_fix_missing_self_or_cls.py @@ -1,38 +1,17 @@ -from codemodder.codemods.test import SonarIntegrationTest +from codemodder.codemods.test.integration_utils import SonarRemediationIntegrationTest from core_codemods.fix_missing_self_or_cls import FixMissingSelfOrClsTransformer from core_codemods.sonar.sonar_fix_missing_self_or_cls import SonarFixMissingSelfOrCls -class TestSonarFixMissingSelfOrCls(SonarIntegrationTest): +class TestSonarFixMissingSelfOrCls(SonarRemediationIntegrationTest): codemod = SonarFixMissingSelfOrCls code_path = "tests/samples/fix_missing_self_or_cls.py" - replacement_lines = [ - ( - 2, - """ def instance_method(self):\n""", - ), - ( - 6, - """ def class_method(cls):\n""", - ), + + expected_diff_per_change = [ + '--- \n+++ \n@@ -1,5 +1,5 @@\n class MyClass:\n- def instance_method():\n+ def instance_method(self):\n print("instance_method")\n \n @classmethod\n', + '--- \n+++ \n@@ -3,5 +3,5 @@\n print("instance_method")\n \n @classmethod\n- def class_method():\n+ def class_method(cls):\n print("class_method")\n', ] - # fmt: off - expected_diff = ( - """--- \n""" - """+++ \n""" - """@@ -1,7 +1,7 @@\n""" - """ class MyClass:\n""" - """- def instance_method():\n""" - """+ def instance_method(self):\n""" - """ print("instance_method")\n""" - """ \n""" - """ @classmethod\n""" - """- def class_method():\n""" - """+ def class_method(cls):\n""" - """ print("class_method")\n""" - ) - # fmt: on - expected_line_change = "2" + expected_lines_changed = [2, 6] change_description = FixMissingSelfOrClsTransformer.change_description num_changes = 2 diff --git a/integration_tests/sonar/test_sonar_secure_cookie.py b/integration_tests/sonar/test_sonar_secure_cookie.py index 409592ae..b882b566 100644 --- a/integration_tests/sonar/test_sonar_secure_cookie.py +++ b/integration_tests/sonar/test_sonar_secure_cookie.py @@ -1,19 +1,18 @@ -from codemodder.codemods.test import SonarIntegrationTest +from codemodder.codemods.test.integration_utils import SonarRemediationIntegrationTest from core_codemods.sonar.sonar_secure_cookie import ( SonarSecureCookie, SonarSecureCookieTransformer, ) -class TestSonarSecureCookie(SonarIntegrationTest): +class TestSonarSecureCookie(SonarRemediationIntegrationTest): codemod = SonarSecureCookie code_path = "tests/samples/secure_cookie.py" - replacement_lines = [ - ( - 8, - """ resp.set_cookie('custom_cookie', 
'value', secure=True, httponly=True, samesite='Lax')\n""", - ), + expected_diff_per_change = [ + "--- \n+++ \n@@ -5,5 +5,5 @@\n @app.route('/')\n def index():\n resp = make_response('Custom Cookie Set')\n- resp.set_cookie('custom_cookie', 'value')\n+ resp.set_cookie('custom_cookie', 'value', secure=True, httponly=True, samesite='Lax')\n return resp\n", + "--- \n+++ \n@@ -5,5 +5,5 @@\n @app.route('/')\n def index():\n resp = make_response('Custom Cookie Set')\n- resp.set_cookie('custom_cookie', 'value')\n+ resp.set_cookie('custom_cookie', 'value', secure=True, httponly=True, samesite='Lax')\n return resp\n", ] - expected_diff = "--- \n+++ \n@@ -5,5 +5,5 @@\n @app.route('/')\n def index():\n resp = make_response('Custom Cookie Set')\n- resp.set_cookie('custom_cookie', 'value')\n+ resp.set_cookie('custom_cookie', 'value', secure=True, httponly=True, samesite='Lax')\n return resp\n" - expected_line_change = "8" + + expected_lines_changed = [8, 8] + num_changes = 2 change_description = SonarSecureCookieTransformer.change_description diff --git a/integration_tests/sonar/test_sonar_secure_random.py b/integration_tests/sonar/test_sonar_secure_random.py index fe165587..b0116b29 100644 --- a/integration_tests/sonar/test_sonar_secure_random.py +++ b/integration_tests/sonar/test_sonar_secure_random.py @@ -1,29 +1,16 @@ -from codemodder.codemods.test import SonarIntegrationTest +from codemodder.codemods.test.integration_utils import SonarRemediationIntegrationTest from core_codemods.secure_random import SecureRandomTransformer from core_codemods.sonar.sonar_secure_random import SonarSecureRandom -class TestSonarDjangoJsonResponseType(SonarIntegrationTest): +class TestSonarSecureRandom(SonarRemediationIntegrationTest): codemod = SonarSecureRandom code_path = "tests/samples/secure_random.py" - replacement_lines = [ - (1, """import secrets\n"""), - (3, """secrets.SystemRandom().random()\n"""), - (4, """secrets.SystemRandom().getrandbits(1)\n"""), + expected_diff_per_change = [ + "--- \n+++ \n@@ -1,4 +1,5 @@\n import random\n+import secrets\n \n-random.random()\n+secrets.SystemRandom().random()\n random.getrandbits(1)\n", + "--- \n+++ \n@@ -1,4 +1,5 @@\n import random\n+import secrets\n \n random.random()\n-random.getrandbits(1)\n+secrets.SystemRandom().getrandbits(1)\n", ] - # fmt: off - expected_diff = ( - """--- \n""" - """+++ \n""" - """@@ -1,4 +1,4 @@\n""" - """-import random\n""" - """+import secrets\n""" - """ \n""" - """-random.random()\n""" - """-random.getrandbits(1)\n""" - """+secrets.SystemRandom().random()\n""" - """+secrets.SystemRandom().getrandbits(1)\n""") - # fmt: on - expected_line_change = "3" + + expected_lines_changed = [3, 4] change_description = SecureRandomTransformer.change_description num_changes = 2 diff --git a/integration_tests/test_harden_ruamel.py b/integration_tests/test_harden_ruamel.py index c9cd9d0f..a7aa6ab2 100644 --- a/integration_tests/test_harden_ruamel.py +++ b/integration_tests/test_harden_ruamel.py @@ -1,8 +1,8 @@ -from codemodder.codemods.test import BaseIntegrationTest +from codemodder.codemods.test.integration_utils import BaseRemediationIntegrationTest from core_codemods.harden_ruamel import HardenRuamel -class TestHardenRuamel(BaseIntegrationTest): +class TestHardenRuamel(BaseRemediationIntegrationTest): codemod = HardenRuamel original_code = """ from ruamel.yaml import YAML @@ -10,11 +10,11 @@ class TestHardenRuamel(BaseIntegrationTest): serializer = YAML(typ="unsafe") serializer = YAML(typ="base") """ - replacement_lines = [ - (3, 'serializer = 
YAML(typ="safe")\n'), - (4, 'serializer = YAML(typ="safe")\n'), + expected_diff_per_change = [ + '--- \n+++ \n@@ -1,4 +1,4 @@\n from ruamel.yaml import YAML\n \n-serializer = YAML(typ="unsafe")\n+serializer = YAML(typ="safe")\n serializer = YAML(typ="base")', + '--- \n+++ \n@@ -1,4 +1,4 @@\n from ruamel.yaml import YAML\n \n serializer = YAML(typ="unsafe")\n-serializer = YAML(typ="base")\n+serializer = YAML(typ="safe")', ] - expected_diff = '--- \n+++ \n@@ -1,4 +1,4 @@\n from ruamel.yaml import YAML\n \n-serializer = YAML(typ="unsafe")\n-serializer = YAML(typ="base")\n+serializer = YAML(typ="safe")\n+serializer = YAML(typ="safe")\n' - expected_line_change = "3" + + expected_lines_changed = [3, 4] num_changes = 2 change_description = HardenRuamel.change_description diff --git a/integration_tests/test_jinja2_autoescape.py b/integration_tests/test_jinja2_autoescape.py index 1ec23386..48d1aafd 100644 --- a/integration_tests/test_jinja2_autoescape.py +++ b/integration_tests/test_jinja2_autoescape.py @@ -1,11 +1,11 @@ -from codemodder.codemods.test import BaseIntegrationTest +from codemodder.codemods.test.integration_utils import BaseRemediationIntegrationTest from core_codemods.enable_jinja2_autoescape import ( EnableJinja2Autoescape, EnableJinja2AutoescapeTransformer, ) -class TestEnableJinja2Autoescape(BaseIntegrationTest): +class TestEnableJinja2Autoescape(BaseRemediationIntegrationTest): codemod = EnableJinja2Autoescape original_code = """ from jinja2 import Environment @@ -13,11 +13,12 @@ class TestEnableJinja2Autoescape(BaseIntegrationTest): env = Environment() env = Environment(autoescape=False) """ - replacement_lines = [ - (3, "env = Environment(autoescape=True)\n"), - (4, "env = Environment(autoescape=True)\n"), + + expected_diff_per_change = [ + "--- \n+++ \n@@ -1,4 +1,4 @@\n from jinja2 import Environment\n \n-env = Environment()\n+env = Environment(autoescape=True)\n env = Environment(autoescape=False)", + "--- \n+++ \n@@ -1,4 +1,4 @@\n from jinja2 import Environment\n \n env = Environment()\n-env = Environment(autoescape=False)\n+env = Environment(autoescape=True)", ] - expected_diff = "--- \n+++ \n@@ -1,4 +1,4 @@\n from jinja2 import Environment\n \n-env = Environment()\n-env = Environment(autoescape=False)\n+env = Environment(autoescape=True)\n+env = Environment(autoescape=True)\n" - expected_line_change = "3" + + expected_lines_changed = [3, 4] num_changes = 2 change_description = EnableJinja2AutoescapeTransformer.change_description diff --git a/integration_tests/test_lazy_logging.py b/integration_tests/test_lazy_logging.py index ee2975a3..a20a44ac 100644 --- a/integration_tests/test_lazy_logging.py +++ b/integration_tests/test_lazy_logging.py @@ -1,8 +1,8 @@ -from codemodder.codemods.test import BaseIntegrationTest +from codemodder.codemods.test.integration_utils import BaseRemediationIntegrationTest from core_codemods.lazy_logging import LazyLogging -class TestLazyLogging(BaseIntegrationTest): +class TestLazyLogging(BaseRemediationIntegrationTest): codemod = LazyLogging original_code = """ import logging @@ -10,23 +10,11 @@ class TestLazyLogging(BaseIntegrationTest): logging.error("Error occurred: %s" % e) logging.error("Error occurred: " + e) """ - replacement_lines = [ - (3, """logging.error("Error occurred: %s", e)\n"""), - (4, """logging.error("Error occurred: %s", e)\n"""), + expected_diff_per_change = [ + '--- \n+++ \n@@ -1,4 +1,4 @@\n import logging\n e = "Some error"\n-logging.error("Error occurred: %s" % e)\n+logging.error("Error occurred: %s", e)\n 
logging.error("Error occurred: " + e)', + '--- \n+++ \n@@ -1,4 +1,4 @@\n import logging\n e = "Some error"\n logging.error("Error occurred: %s" % e)\n-logging.error("Error occurred: " + e)\n+logging.error("Error occurred: %s", e)', ] - # fmt: off - expected_diff = ( - """--- \n""" - """+++ \n""" - """@@ -1,4 +1,4 @@\n""" - """ import logging\n""" - """ e = "Some error"\n""" - """-logging.error("Error occurred: %s" % e)\n""" - """-logging.error("Error occurred: " + e)\n""" - """+logging.error("Error occurred: %s", e)\n""" - """+logging.error("Error occurred: %s", e)\n""") - # fmt: on - expected_line_change = "3" + expected_lines_changed = [3, 4] change_description = LazyLogging.change_description num_changes = 2 diff --git a/integration_tests/test_lxml_safe_parsing.py b/integration_tests/test_lxml_safe_parsing.py index 0e851b1f..da5dd708 100644 --- a/integration_tests/test_lxml_safe_parsing.py +++ b/integration_tests/test_lxml_safe_parsing.py @@ -1,26 +1,19 @@ -from codemodder.codemods.test import BaseIntegrationTest +from codemodder.codemods.test.integration_utils import BaseRemediationIntegrationTest from core_codemods.lxml_safe_parsing import LxmlSafeParsing -class TestLxmlSafeParsing(BaseIntegrationTest): +class TestLxmlSafeParsing(BaseRemediationIntegrationTest): codemod = LxmlSafeParsing original_code = """ import lxml.etree lxml.etree.parse("path_to_file") lxml.etree.fromstring("xml_str") """ - replacement_lines = [ - ( - 2, - 'lxml.etree.parse("path_to_file", parser=lxml.etree.XMLParser(resolve_entities=False))\n', - ), - ( - 3, - 'lxml.etree.fromstring("xml_str", parser=lxml.etree.XMLParser(resolve_entities=False))\n', - ), + expected_lines_changed = [2, 3] + expected_diff_per_change = [ + '--- \n+++ \n@@ -1,3 +1,3 @@\n import lxml.etree\n-lxml.etree.parse("path_to_file")\n+lxml.etree.parse("path_to_file", parser=lxml.etree.XMLParser(resolve_entities=False))\n lxml.etree.fromstring("xml_str")', + '--- \n+++ \n@@ -1,3 +1,3 @@\n import lxml.etree\n lxml.etree.parse("path_to_file")\n-lxml.etree.fromstring("xml_str")\n+lxml.etree.fromstring("xml_str", parser=lxml.etree.XMLParser(resolve_entities=False))', ] - expected_diff = '--- \n+++ \n@@ -1,3 +1,3 @@\n import lxml.etree\n-lxml.etree.parse("path_to_file")\n-lxml.etree.fromstring("xml_str")\n+lxml.etree.parse("path_to_file", parser=lxml.etree.XMLParser(resolve_entities=False))\n+lxml.etree.fromstring("xml_str", parser=lxml.etree.XMLParser(resolve_entities=False))\n' - expected_line_change = "2" num_changes = 2 change_description = LxmlSafeParsing.change_description allowed_exceptions = (OSError,) diff --git a/integration_tests/test_process_sandbox.py b/integration_tests/test_process_sandbox.py index 37976653..97bca572 100644 --- a/integration_tests/test_process_sandbox.py +++ b/integration_tests/test_process_sandbox.py @@ -1,9 +1,9 @@ -from codemodder.codemods.test import BaseIntegrationTest +from codemodder.codemods.test.integration_utils import BaseRemediationIntegrationTest from codemodder.dependency import Security from core_codemods.process_creation_sandbox import ProcessSandbox -class TestProcessSandbox(BaseIntegrationTest): +class TestProcessSandbox(BaseRemediationIntegrationTest): codemod = ProcessSandbox original_code = """ import subprocess @@ -22,17 +22,15 @@ class TestProcessSandbox(BaseIntegrationTest): var = "hello" """ - replacement_lines = [ - (2, """from security import safe_command\n\n"""), - (5, """safe_command.run(subprocess.run, cmd, shell=True)\n"""), - (6, """safe_command.run(subprocess.run, [cmd, "-l"])\n"""), 
- (8, """safe_command.run(subprocess.call, cmd, shell=True)\n"""), - (9, """safe_command.run(subprocess.call, [cmd, "-l"])\n"""), + expected_diff_per_change = [ + '--- \n+++ \n@@ -1,8 +1,9 @@\n import subprocess\n+from security import safe_command\n \n cmd = " ".join(["ls"])\n \n-subprocess.run(cmd, shell=True)\n+safe_command.run(subprocess.run, cmd, shell=True)\n subprocess.run([cmd, "-l"])\n \n subprocess.call(cmd, shell=True)\n', + '--- \n+++ \n@@ -1,9 +1,10 @@\n import subprocess\n+from security import safe_command\n \n cmd = " ".join(["ls"])\n \n subprocess.run(cmd, shell=True)\n-subprocess.run([cmd, "-l"])\n+safe_command.run(subprocess.run, [cmd, "-l"])\n \n subprocess.call(cmd, shell=True)\n subprocess.call([cmd, "-l"])\n', + '--- \n+++ \n@@ -1,11 +1,12 @@\n import subprocess\n+from security import safe_command\n \n cmd = " ".join(["ls"])\n \n subprocess.run(cmd, shell=True)\n subprocess.run([cmd, "-l"])\n \n-subprocess.call(cmd, shell=True)\n+safe_command.run(subprocess.call, cmd, shell=True)\n subprocess.call([cmd, "-l"])\n \n subprocess.check_output([cmd, "-l"])\n', + '--- \n+++ \n@@ -1,4 +1,5 @@\n import subprocess\n+from security import safe_command\n \n cmd = " ".join(["ls"])\n \n@@ -6,7 +7,7 @@\n subprocess.run([cmd, "-l"])\n \n subprocess.call(cmd, shell=True)\n-subprocess.call([cmd, "-l"])\n+safe_command.run(subprocess.call, [cmd, "-l"])\n \n subprocess.check_output([cmd, "-l"])\n \n', ] - expected_diff = '--- \n+++ \n@@ -1,12 +1,13 @@\n import subprocess\n+from security import safe_command\n \n cmd = " ".join(["ls"])\n \n-subprocess.run(cmd, shell=True)\n-subprocess.run([cmd, "-l"])\n+safe_command.run(subprocess.run, cmd, shell=True)\n+safe_command.run(subprocess.run, [cmd, "-l"])\n \n-subprocess.call(cmd, shell=True)\n-subprocess.call([cmd, "-l"])\n+safe_command.run(subprocess.call, cmd, shell=True)\n+safe_command.run(subprocess.call, [cmd, "-l"])\n \n subprocess.check_output([cmd, "-l"])\n \n' - expected_line_change = "5" + + expected_lines_changed = [5, 6, 8, 9] num_changes = 4 - num_changed_files = 2 change_description = ProcessSandbox.change_description requirements_file_name = "requirements.txt" diff --git a/src/codemodder/codemods/test/integration_utils.py b/src/codemodder/codemods/test/integration_utils.py index 607e4c64..ea7e3681 100644 --- a/src/codemodder/codemods/test/integration_utils.py +++ b/src/codemodder/codemods/test/integration_utils.py @@ -139,6 +139,7 @@ def _assert_results_fields(self, results, output_path): assert len(changes) == self.num_changes lines_changed = [c["changes"][0]["lineNumber"] for c in changes] + print(lines_changed) assert lines_changed == self.expected_lines_changed assert {c["changes"][0]["description"] for c in changes} == { self.change_description From 22a55bb41f1ea808fd6c014349bca2e2ee6aba10 Mon Sep 17 00:00:00 2001 From: andrecs <12188364+andrecsilva@users.noreply.github.com> Date: Mon, 24 Mar 2025 08:33:36 -0300 Subject: [PATCH 12/27] Fixed a few more tests --- integration_tests/test_dependency_manager.py | 2 +- integration_tests/test_multiple_codemods.py | 2 +- tests/codemods/test_base_codemod.py | 2 +- 3 files changed, 3 insertions(+), 3 deletions(-) diff --git a/integration_tests/test_dependency_manager.py b/integration_tests/test_dependency_manager.py index 2ebbf679..3429371d 100644 --- a/integration_tests/test_dependency_manager.py +++ b/integration_tests/test_dependency_manager.py @@ -136,7 +136,7 @@ def test_fail_to_add(self, tmp_repo): os.chmod(tmp_repo / self.requirements_file, 0o400) command = [ - "codemodder", + 
"codemodder_hardening", tmp_repo, "--output", self.output_path, diff --git a/integration_tests/test_multiple_codemods.py b/integration_tests/test_multiple_codemods.py index e3f14dcf..75c24892 100644 --- a/integration_tests/test_multiple_codemods.py +++ b/integration_tests/test_multiple_codemods.py @@ -25,7 +25,7 @@ def test_two_codemods(self, codemods, tmpdir): shutil.copy(pathlib.Path(SAMPLES_DIR) / source_file_name, directory) command = [ - "codemodder", + "codemodder_hardening", directory, "--output", str(codetf_path), diff --git a/tests/codemods/test_base_codemod.py b/tests/codemods/test_base_codemod.py index 74373322..fd998030 100644 --- a/tests/codemods/test_base_codemod.py +++ b/tests/codemods/test_base_codemod.py @@ -81,7 +81,7 @@ def test_core_codemod_filter_apply_by_extension(mocker, ext, call_count): Path("file2.py"), ] - codemod.apply(context) + codemod.apply(context, hardening=True) assert process_file.call_count == call_count From e0d2b81655adfa03443f93b1d73663d5a6e9ed76 Mon Sep 17 00:00:00 2001 From: andrecs <12188364+andrecsilva@users.noreply.github.com> Date: Mon, 24 Mar 2025 08:35:05 -0300 Subject: [PATCH 13/27] Remove leftover debugging code --- .../codemods/test/integration_utils.py | 3 --- src/codemodder/codemods/test/utils.py | 20 ------------------- 2 files changed, 23 deletions(-) diff --git a/src/codemodder/codemods/test/integration_utils.py b/src/codemodder/codemods/test/integration_utils.py index ea7e3681..8ffa5d63 100644 --- a/src/codemodder/codemods/test/integration_utils.py +++ b/src/codemodder/codemods/test/integration_utils.py @@ -134,12 +134,10 @@ def _assert_results_fields(self, results, output_path): assert {c["path"] for c in changes} == {output_path} changes_diff = [c["diff"] for c in changes] - print(changes_diff) assert changes_diff == self.expected_diff_per_change assert len(changes) == self.num_changes lines_changed = [c["changes"][0]["lineNumber"] for c in changes] - print(lines_changed) assert lines_changed == self.expected_lines_changed assert {c["changes"][0]["description"] for c in changes} == { self.change_description @@ -529,7 +527,6 @@ def setup_class(cls): else: with open(cls.code_path, "r", encoding="utf-8") as f: # type: ignore cls.original_code = f.read() - print(cls.original_code) # TODO: support sonar integration tests that add a dependency to # `requirements_file_name`. 
These tests would not be able to run diff --git a/src/codemodder/codemods/test/utils.py b/src/codemodder/codemods/test/utils.py index 030a8620..055f3700 100644 --- a/src/codemodder/codemods/test/utils.py +++ b/src/codemodder/codemods/test/utils.py @@ -1,4 +1,3 @@ -import difflib import os from pathlib import Path from textwrap import dedent @@ -111,14 +110,6 @@ def run_and_assert( def assert_num_changes( self, changes, expected_num_changes, expected_diff_per_change, min_num_changes ): - print("expected_diff_per_change = [") - for c in changes: - print('"""\\') - diff_lines = c.diff.replace("\t", " ").splitlines() - for line in diff_lines: - print(line) - print('""",') - print("]") if expected_diff_per_change: assert len(changes) == expected_num_changes actual_num = len(changes) @@ -156,17 +147,6 @@ def assert_changes( if expected_diff_per_change and num_changes > 1: assert num_changes == len(expected_diff_per_change) for change, diff in zip(changes, expected_diff_per_change): - print(change.diff) - print("-=-=-=-=-=-=-=-=-=-=-=-=-=-=-=-") - print(diff) - print("+++++++++++++++++++++++++++++++") - print( - "\n".join( - difflib.ndiff(diff.splitlines(), change.diff.splitlines()) - ) - .replace(" ", "␣") - .replace("\t", "→") - ) assert change.diff == diff else: # generate diff from expected code From f5bdf33f1d16f83942167b99293522c428ab9a11 Mon Sep 17 00:00:00 2001 From: andrecs <12188364+andrecsilva@users.noreply.github.com> Date: Mon, 24 Mar 2025 09:04:05 -0300 Subject: [PATCH 14/27] Fixed broken dependency and some docstrings --- pyproject.toml | 2 +- src/codemodder/codemodder.py | 16 ++++++---------- 2 files changed, 7 insertions(+), 11 deletions(-) diff --git a/pyproject.toml b/pyproject.toml index 6b226aa7..6767c206 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -82,7 +82,7 @@ test = [ "flask_wtf~=1.2.0", "fickling~=0.1.0,>=0.1.3", "graphql-server~=3.0.0b7", - "unidiff>=0.75", + "unidiff>=0.7.5", ] complexity = [ "radon==6.0.*", diff --git a/src/codemodder/codemodder.py b/src/codemodder/codemodder.py index bd266a7d..e901d8b2 100644 --- a/src/codemodder/codemodder.py +++ b/src/codemodder/codemodder.py @@ -292,21 +292,17 @@ def _run_cli(original_args, hardening=False) -> int: return status -""" -Hardens a project. The application will write all the fixes into the files. -""" - - def harden(): + """ + Hardens a project. The application will write all the fixes into the files. + """ sys_argv = sys.argv[1:] sys.exit(_run_cli(sys_argv, True)) -""" -Remediates a project. The application will suggest fix for each separate issue found. No files will be written. -""" - - def main(): + """ + Remediates a project. The application will suggest fix for each separate issue found. No files will be written. 
+ """ sys_argv = sys.argv[1:] sys.exit(_run_cli(sys_argv)) From 139926d57d024daac4defa0da3dc293d21b2ef34 Mon Sep 17 00:00:00 2001 From: andrecs <12188364+andrecsilva@users.noreply.github.com> Date: Mon, 24 Mar 2025 09:23:41 -0300 Subject: [PATCH 15/27] Fixed pygoat workflow file --- .github/workflows/codemod_pygoat.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/codemod_pygoat.yml b/.github/workflows/codemod_pygoat.yml index 86e744d2..848bb549 100644 --- a/.github/workflows/codemod_pygoat.yml +++ b/.github/workflows/codemod_pygoat.yml @@ -38,6 +38,6 @@ jobs: repository: pixee/pygoat path: pygoat - name: Run Codemodder - run: codemodder --dry-run --output output.codetf pygoat + run: codemodder_hardening --dry-run --output output.codetf pygoat - name: Check PyGoat Findings run: make pygoat-test From 22dd701dc9da6354b39bcadd9d06c873cced00e6 Mon Sep 17 00:00:00 2001 From: andrecs <12188364+andrecsilva@users.noreply.github.com> Date: Mon, 24 Mar 2025 10:46:29 -0300 Subject: [PATCH 16/27] Fixed some intermittent tests --- pyproject.toml | 2 +- src/codemodder/codemods/test/utils.py | 6 ++++-- tests/codemods/test_combine_isinstance_issubclass.py | 2 +- tests/codemods/test_combine_startswith_endswith.py | 2 +- tests/codemods/test_tempfile_mktemp.py | 2 +- 5 files changed, 8 insertions(+), 6 deletions(-) diff --git a/pyproject.toml b/pyproject.toml index 6767c206..c33f95de 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -133,7 +133,7 @@ extend-exclude = ''' ''' [coverage-threshold] -line_coverage_min = 93 +line_coverage_min = 92 [coverage-threshold.modules."src/core_codemods/"] # Detect if a codemod is missing unit or integration tests file_line_coverage_min = 50 diff --git a/src/codemodder/codemods/test/utils.py b/src/codemodder/codemods/test/utils.py index 055f3700..00ea1502 100644 --- a/src/codemodder/codemods/test/utils.py +++ b/src/codemodder/codemods/test/utils.py @@ -73,9 +73,10 @@ def run_and_assert( path_exclude = [f"{tmp_file_path}:{line}" for line in lines_to_exclude or []] + print(expected_diff_per_change) self.execution_context = CodemodExecutionContext( directory=root, - dry_run=False, + dry_run=True if expected_diff_per_change else False, verbose=False, registry=mock.MagicMock(), providers=load_providers(), @@ -220,9 +221,10 @@ def run_and_assert( path_exclude = [f"{tmp_file_path}:{line}" for line in lines_to_exclude or []] + print(expected_diff_per_change) self.execution_context = CodemodExecutionContext( directory=root, - dry_run=False, + dry_run=True if expected_diff_per_change else False, verbose=False, tool_result_files_map={self.tool: [tmp_results_file_path]}, registry=mock.MagicMock(), diff --git a/tests/codemods/test_combine_isinstance_issubclass.py b/tests/codemods/test_combine_isinstance_issubclass.py index 3a158a9c..75f48b41 100644 --- a/tests/codemods/test_combine_isinstance_issubclass.py +++ b/tests/codemods/test_combine_isinstance_issubclass.py @@ -60,7 +60,7 @@ def _format_func_run_test(self, tmpdir, func, input_code, expected, num_changes= tmpdir, input_code.replace("{func}", func), expected.replace("{func}", func), - num_changes, + num_changes=num_changes, ) @each_func diff --git a/tests/codemods/test_combine_startswith_endswith.py b/tests/codemods/test_combine_startswith_endswith.py index f3ed2808..444c37b8 100644 --- a/tests/codemods/test_combine_startswith_endswith.py +++ b/tests/codemods/test_combine_startswith_endswith.py @@ -62,7 +62,7 @@ def _format_func_run_test(self, tmpdir, func, input_code, expected, num_changes= 
tmpdir, input_code.replace("{func}", func), expected.replace("{func}", func), - num_changes, + num_changes=num_changes, ) @each_func diff --git a/tests/codemods/test_tempfile_mktemp.py b/tests/codemods/test_tempfile_mktemp.py index 77917845..42ea295b 100644 --- a/tests/codemods/test_tempfile_mktemp.py +++ b/tests/codemods/test_tempfile_mktemp.py @@ -79,7 +79,7 @@ def test_import_with_arg(self, tmpdir): filename = tf.name var = "hello" """ - self.run_and_assert(tmpdir, input_code, expected_output, 5) + self.run_and_assert(tmpdir, input_code, expected_output, num_changes=5) def test_from_import(self, tmpdir): input_code = """ From 233974aa24ba4ef1eb08fe23b7b90a69ff3e0888 Mon Sep 17 00:00:00 2001 From: andrecs <12188364+andrecsilva@users.noreply.github.com> Date: Tue, 25 Mar 2025 08:43:27 -0300 Subject: [PATCH 17/27] Some refactoring --- .../codemods/test/integration_utils.py | 169 +++++++----------- 1 file changed, 66 insertions(+), 103 deletions(-) diff --git a/src/codemodder/codemods/test/integration_utils.py b/src/codemodder/codemods/test/integration_utils.py index 8ffa5d63..e2973782 100644 --- a/src/codemodder/codemods/test/integration_utils.py +++ b/src/codemodder/codemods/test/integration_utils.py @@ -36,7 +36,66 @@ def check_dependencies_after(self): assert new_requirements_txt == self.expected_requirements -class BaseRemediationIntegrationTest: +class BaseIntegrationTestMixin: + def _assert_sonar_fields(self, result): + del result + + def _assert_codetf_output(self, codetf_schema): + with open(self.output_path, "r", encoding="utf-8") as f: + codetf = json.load(f) + + jsonschema.validate(codetf, codetf_schema) + + assert sorted(codetf.keys()) == ["results", "run"] + run = codetf["run"] + self._assert_run_fields(run, self.output_path) + results = codetf["results"] + # CodeTf2 spec requires relative paths + self._assert_results_fields(results, self.code_filename) + + def write_original_code(self): + with open(self.code_path, "w", encoding="utf-8") as f: + f.write(self.original_code) + + def _assert_results_fields(self, results, output_path): + assert len(results) == 1 + result = results[0] + assert result["codemod"] == self.codemod_instance.id + assert result["references"] == [ + ref.model_dump(exclude_none=True) + for ref in self.codemod_instance.references + ] + + assert ("detectionTool" in result) == bool(self.sonar_issues_json) + assert ("detectionTool" in result) == bool(self.sonar_hotspots_json) + + # TODO: if/when we add description for each url + for reference in result["references"][ + # Last references for Sonar has a different description + : ( + -len(self.codemod.requested_rules) + if self.sonar_issues_json or self.sonar_hotspots_json + else None + ) + ]: + assert reference["url"] == reference["description"] + + self._assert_sonar_fields(result) + + def _assert_command_line(self, run, output_path): + pass + + def _assert_run_fields(self, run, output_path): + self._assert_command_line(run, output_path) + assert run["vendor"] == "pixee" + assert run["tool"] == "codemodder-python" + assert run["version"] == __version__ + assert run["elapsed"] != "" + assert run["directory"] == os.path.abspath(self.code_dir) + assert run["sarifs"] == [] + + +class BaseRemediationIntegrationTest(BaseIntegrationTestMixin): codemod = NotImplementedError original_code = NotImplementedError expected_diff_per_change = NotImplementedError @@ -77,11 +136,7 @@ def setup_class(cls): with open(cls.code_path, "r", encoding="utf-8") as f: # type: ignore cls.original_code = f.read() - def 
_assert_run_fields(self, run, output_path): - assert run["vendor"] == "pixee" - assert run["tool"] == "codemodder-python" - assert run["version"] == __version__ - assert run["elapsed"] != "" + def _assert_command_line(self, run, output_path): assert run[ "commandLine" ] == f'codemodder {self.code_dir} --output {output_path} --codemod-include={self.codemod_instance.id} --path-include={self.code_filename} --path-exclude=""' + ( @@ -93,35 +148,10 @@ def _assert_run_fields(self, run, output_path): if self.sonar_hotspots_json else "" ) - assert run["directory"] == os.path.abspath(self.code_dir) - assert run["sarifs"] == [] def _assert_results_fields(self, results, output_path): - assert len(results) == 1 + super()._assert_results_fields(results, output_path) result = results[0] - assert result["codemod"] == self.codemod_instance.id - assert result["references"] == [ - ref.model_dump(exclude_none=True) - for ref in self.codemod_instance.references - ] - - assert ("detectionTool" in result) == bool(self.sonar_issues_json) - assert ("detectionTool" in result) == bool(self.sonar_hotspots_json) - - # TODO: if/when we add description for each url - for reference in result["references"][ - # Last references for Sonar has a different description - : ( - -len(self.codemod.requested_rules) - if self.sonar_issues_json or self.sonar_hotspots_json - else None - ) - ]: - assert reference["url"] == reference["description"] - - self._assert_sonar_fields(result) - - # There should be a changeset for every expected change assert len(result["changeset"]) == self.num_changes # gather all the change files and test against the expected number assert len({c["path"] for c in result["changeset"]}) == self.num_changed_files @@ -143,26 +173,6 @@ def _assert_results_fields(self, results, output_path): self.change_description } - def _assert_sonar_fields(self, result): - del result - - def _assert_codetf_output(self, codetf_schema): - with open(self.output_path, "r", encoding="utf-8") as f: - codetf = json.load(f) - - jsonschema.validate(codetf, codetf_schema) - - assert sorted(codetf.keys()) == ["results", "run"] - run = codetf["run"] - self._assert_run_fields(run, self.output_path) - results = codetf["results"] - # CodeTf2 spec requires relative paths - self._assert_results_fields(results, self.code_filename) - - def write_original_code(self): - with open(self.code_path, "w", encoding="utf-8") as f: - f.write(self.original_code) - def test_codetf_output(self, codetf_schema): """ Tests correct codetf output. 
@@ -296,7 +306,7 @@ def _check_code_after(self, patched_codes): ) -class BaseIntegrationTest(DependencyTestMixin): +class BaseIntegrationTest(BaseIntegrationTestMixin, DependencyTestMixin): codemod = NotImplementedError original_code = NotImplementedError replacement_lines = NotImplementedError @@ -352,11 +362,7 @@ def teardown_class(cls): if cls.requirements_file_name: pathlib.Path(cls.dependency_path).unlink(missing_ok=True) - def _assert_run_fields(self, run, output_path): - assert run["vendor"] == "pixee" - assert run["tool"] == "codemodder-python" - assert run["version"] == __version__ - assert run["elapsed"] != "" + def _assert_command_line(self, run, output_path): assert run[ "commandLine" ] == f'codemodder_hardening {self.code_dir} --output {output_path} --codemod-include={self.codemod_instance.id} --path-include={self.code_filename} --path-exclude=""' + ( @@ -368,34 +374,11 @@ def _assert_run_fields(self, run, output_path): if self.sonar_hotspots_json else "" ) - assert run["directory"] == os.path.abspath(self.code_dir) - assert run["sarifs"] == [] def _assert_results_fields(self, results, output_path): - assert len(results) == 1 - result = results[0] - assert result["codemod"] == self.codemod_instance.id - assert result["references"] == [ - ref.model_dump(exclude_none=True) - for ref in self.codemod_instance.references - ] - - assert ("detectionTool" in result) == bool(self.sonar_issues_json) - assert ("detectionTool" in result) == bool(self.sonar_hotspots_json) - - # TODO: if/when we add description for each url - for reference in result["references"][ - # Last references for Sonar has a different description - : ( - -len(self.codemod.requested_rules) - if self.sonar_issues_json or self.sonar_hotspots_json - else None - ) - ]: - assert reference["url"] == reference["description"] - - self._assert_sonar_fields(result) + super()._assert_results_fields(results, output_path) + result = results[0] assert len(result["changeset"]) == self.num_changed_files # A codemod may change multiple files. For now we will @@ -411,22 +394,6 @@ def _assert_results_fields(self, results, output_path): assert line_change["lineNumber"] == int(self.expected_line_change) assert line_change["description"] == self.change_description - def _assert_sonar_fields(self, result): - del result - - def _assert_codetf_output(self, codetf_schema): - with open(self.output_path, "r", encoding="utf-8") as f: - codetf = json.load(f) - - jsonschema.validate(codetf, codetf_schema) - - assert sorted(codetf.keys()) == ["results", "run"] - run = codetf["run"] - self._assert_run_fields(run, self.output_path) - results = codetf["results"] - # CodeTf2 spec requires relative paths - self._assert_results_fields(results, self.code_filename) - def check_code_after(self) -> ModuleType: with open(self.code_path, "r", encoding="utf-8") as f: # type: ignore new_code = f.read() @@ -435,10 +402,6 @@ def check_code_after(self) -> ModuleType: path=self.code_path, allowed_exceptions=self.allowed_exceptions # type: ignore ) - def write_original_code(self): - with open(self.code_path, "w", encoding="utf-8") as f: - f.write(self.original_code) - def test_file_rewritten(self, codetf_schema): """ Tests that file is re-written correctly with new code and correct codetf output. 
From 301379b3f365698f6187cbac73a24d9bc1f15eaf Mon Sep 17 00:00:00 2001 From: andrecs <12188364+andrecsilva@users.noreply.github.com> Date: Tue, 25 Mar 2025 09:02:56 -0300 Subject: [PATCH 18/27] More refactoring --- .../codemods/test/integration_utils.py | 67 +++++++------------ 1 file changed, 26 insertions(+), 41 deletions(-) diff --git a/src/codemodder/codemods/test/integration_utils.py b/src/codemodder/codemods/test/integration_utils.py index e2973782..ee55681c 100644 --- a/src/codemodder/codemods/test/integration_utils.py +++ b/src/codemodder/codemods/test/integration_utils.py @@ -37,6 +37,30 @@ def check_dependencies_after(self): class BaseIntegrationTestMixin: + + @classmethod + def setup_class(cls): + codemod_id = ( + cls.codemod().id if isinstance(cls.codemod, type) else cls.codemod.id + ) + cls.codemod_instance = validate_codemod_registration(codemod_id) + + cls.output_path = tempfile.mkstemp()[1] + cls.code_dir = tempfile.mkdtemp() + + if not hasattr(cls, "code_filename"): + # Only a few codemods require the analyzed file to have a specific filename + # All others can just be `code.py` + cls.code_filename = "code.py" + + cls.code_path = os.path.join(cls.code_dir, cls.code_filename) + + if cls.code_filename == "settings.py" and "Django" in str(cls): + # manage.py must be in the directory above settings.py for this codemod to run + parent_dir = Path(cls.code_dir).parent + manage_py_path = parent_dir / "manage.py" + manage_py_path.touch() + def _assert_sonar_fields(self, result): del result @@ -107,26 +131,7 @@ class BaseRemediationIntegrationTest(BaseIntegrationTestMixin): @classmethod def setup_class(cls): - codemod_id = ( - cls.codemod().id if isinstance(cls.codemod, type) else cls.codemod.id - ) - cls.codemod_instance = validate_codemod_registration(codemod_id) - - cls.output_path = tempfile.mkstemp()[1] - cls.code_dir = tempfile.mkdtemp() - - if not hasattr(cls, "code_filename"): - # Only a few codemods require the analyzed file to have a specific filename - # All others can just be `code.py` - cls.code_filename = "code.py" - - cls.code_path = os.path.join(cls.code_dir, cls.code_filename) - - if cls.code_filename == "settings.py" and "Django" in str(cls): - # manage.py must be in the directory above settings.py for this codemod to run - parent_dir = Path(cls.code_dir).parent - manage_py_path = parent_dir / "manage.py" - manage_py_path.touch() + super().setup_class() if cls.original_code is not NotImplementedError: # Some tests are easier to understand with the expected new code provided @@ -319,27 +324,7 @@ class BaseIntegrationTest(BaseIntegrationTestMixin, DependencyTestMixin): @classmethod def setup_class(cls): - codemod_id = ( - cls.codemod().id if isinstance(cls.codemod, type) else cls.codemod.id - ) - cls.codemod_instance = validate_codemod_registration(codemod_id) - - cls.output_path = tempfile.mkstemp()[1] - cls.code_dir = tempfile.mkdtemp() - - if not hasattr(cls, "code_filename"): - # Only a few codemods require the analyzed file to have a specific filename - # All others can just be `code.py` - cls.code_filename = "code.py" - - cls.code_path = os.path.join(cls.code_dir, cls.code_filename) - - if cls.code_filename == "settings.py" and "Django" in str(cls): - # manage.py must be in the directory above settings.py for this codemod to run - parent_dir = Path(cls.code_dir).parent - manage_py_path = parent_dir / "manage.py" - manage_py_path.touch() - + super().setup_class() if hasattr(cls, "expected_new_code"): # Some tests are easier to understand with the expected new 
code provided # instead of calculated From ae4b6b519c266200b5f9a8030da66a9a6a8a1a61 Mon Sep 17 00:00:00 2001 From: andrecs <12188364+andrecsilva@users.noreply.github.com> Date: Tue, 25 Mar 2025 09:09:41 -0300 Subject: [PATCH 19/27] Small refactoring --- src/codemodder/codemods/test/utils.py | 2 -- src/core_codemods/semgrep/semgrep_no_csrf_exempt.py | 13 ++++++------- 2 files changed, 6 insertions(+), 9 deletions(-) diff --git a/src/codemodder/codemods/test/utils.py b/src/codemodder/codemods/test/utils.py index 00ea1502..346a30d9 100644 --- a/src/codemodder/codemods/test/utils.py +++ b/src/codemodder/codemods/test/utils.py @@ -118,8 +118,6 @@ def assert_num_changes( assert len(changes[0].changes) == expected_num_changes actual_num = len(changes[0].changes) - # actual_num = len(changes) - if min_num_changes is not None: assert ( actual_num >= min_num_changes diff --git a/src/core_codemods/semgrep/semgrep_no_csrf_exempt.py b/src/core_codemods/semgrep/semgrep_no_csrf_exempt.py index fc39ef9c..cd494c06 100644 --- a/src/core_codemods/semgrep/semgrep_no_csrf_exempt.py +++ b/src/core_codemods/semgrep/semgrep_no_csrf_exempt.py @@ -27,13 +27,12 @@ def leave_Decorator( ): return updated_node # Due to semgrep's odd way of reporting the position for this (decorators + functiondef), we match by line only - if self.node_is_selected_by_line_only(original_node): - if ( - self.find_base_name(original_node.decorator) - == "django.views.decorators.csrf.csrf_exempt" - ): - self.report_change(original_node) - return cst.RemovalSentinel.REMOVE + if self.node_is_selected_by_line_only(original_node) and ( + self.find_base_name(original_node.decorator) + == "django.views.decorators.csrf.csrf_exempt" + ): + self.report_change(original_node) + return cst.RemovalSentinel.REMOVE return updated_node From 1bf27c64d1c5c117d8901aec280b75021d9b1602 Mon Sep 17 00:00:00 2001 From: andrecs <12188364+andrecsilva@users.noreply.github.com> Date: Fri, 28 Mar 2025 08:56:04 -0300 Subject: [PATCH 20/27] Reverted default behavior to hardening --- integration_tests/test_dependency_manager.py | 2 +- integration_tests/test_multiple_codemods.py | 2 +- pyproject.toml | 2 +- src/codemodder/codemodder.py | 24 +++++++++---------- src/codemodder/codemods/base_codemod.py | 12 +++++----- .../codemods/test/integration_utils.py | 8 +++---- src/codemodder/codemods/test/utils.py | 12 ++++++---- src/core_codemods/defectdojo/api.py | 4 ++-- tests/codemods/test_base_codemod.py | 2 +- 9 files changed, 36 insertions(+), 32 deletions(-) diff --git a/integration_tests/test_dependency_manager.py b/integration_tests/test_dependency_manager.py index 3429371d..2ebbf679 100644 --- a/integration_tests/test_dependency_manager.py +++ b/integration_tests/test_dependency_manager.py @@ -136,7 +136,7 @@ def test_fail_to_add(self, tmp_repo): os.chmod(tmp_repo / self.requirements_file, 0o400) command = [ - "codemodder_hardening", + "codemodder", tmp_repo, "--output", self.output_path, diff --git a/integration_tests/test_multiple_codemods.py b/integration_tests/test_multiple_codemods.py index 75c24892..e3f14dcf 100644 --- a/integration_tests/test_multiple_codemods.py +++ b/integration_tests/test_multiple_codemods.py @@ -25,7 +25,7 @@ def test_two_codemods(self, codemods, tmpdir): shutil.copy(pathlib.Path(SAMPLES_DIR) / source_file_name, directory) command = [ - "codemodder_hardening", + "codemodder", directory, "--output", str(codetf_path), diff --git a/pyproject.toml b/pyproject.toml index c33f95de..4a29336e 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -46,7 
+46,7 @@ Repository = "https://github.com/pixee/codemodder-python" [project.scripts] codemodder = "codemodder.codemodder:main" -codemodder_hardening = "codemodder.codemodder:harden" +codemodder-remediation = "codemodder.codemodder:remediate" generate-docs = 'codemodder.scripts.generate_docs:main' get-hashes = 'codemodder.scripts.get_hashes:main' diff --git a/src/codemodder/codemodder.py b/src/codemodder/codemodder.py index e901d8b2..54ae063b 100644 --- a/src/codemodder/codemodder.py +++ b/src/codemodder/codemodder.py @@ -73,7 +73,7 @@ def log_report(context, output, elapsed_ms, files_to_analyze, token_usage): def apply_codemods( context: CodemodExecutionContext, codemods_to_run: Sequence[BaseCodemod], - hardening: bool, + remediation: bool, ) -> TokenUsage: log_section("scanning") token_usage = TokenUsage() @@ -90,7 +90,7 @@ def apply_codemods( for codemod in codemods_to_run: # NOTE: this may be used as a progress indicator by upstream tools logger.info("running codemod %s", codemod.id) - if codemod_token_usage := codemod.apply(context, hardening): + if codemod_token_usage := codemod.apply(context, remediation): log_token_usage(f"Codemod {codemod.id}", codemod_token_usage) token_usage += codemod_token_usage @@ -136,7 +136,7 @@ def run( sast_only: bool = False, ai_client: bool = True, log_matched_files: bool = False, - hardening: bool = False, + remediation: bool = False, ) -> tuple[CodeTF | None, int, TokenUsage]: start = datetime.datetime.now() @@ -208,7 +208,7 @@ def run( context.find_and_fix_paths, ) - token_usage = apply_codemods(context, codemods_to_run, hardening) + token_usage = apply_codemods(context, codemods_to_run, remediation) elapsed = datetime.datetime.now() - start elapsed_ms = int(elapsed.total_seconds() * 1000) @@ -233,7 +233,7 @@ def run( return codetf, 0, token_usage -def _run_cli(original_args, hardening=False) -> int: +def _run_cli(original_args, remediation=False) -> int: codemod_registry = registry.load_registered_codemods() argv = parse_args(original_args, codemod_registry) if not os.path.exists(argv.directory): @@ -272,8 +272,8 @@ def _run_cli(original_args, hardening=False) -> int: _, status, _ = run( argv.directory, - # Force dry-run if not hardening - argv.dry_run if hardening else True, + # Force dry-run if remediation + True if remediation else argv.dry_run, argv.output, argv.output_format, argv.verbose, @@ -287,22 +287,22 @@ def _run_cli(original_args, hardening=False) -> int: codemod_registry=codemod_registry, sast_only=argv.sonar_issues_json or argv.sarif, log_matched_files=True, - hardening=hardening, + remediation=remediation, ) return status -def harden(): +def main(): """ Hardens a project. The application will write all the fixes into the files. """ sys_argv = sys.argv[1:] - sys.exit(_run_cli(sys_argv, True)) + sys.exit(_run_cli(sys_argv)) -def main(): +def remediate(): """ Remediates a project. The application will suggest fix for each separate issue found. No files will be written. 
""" sys_argv = sys.argv[1:] - sys.exit(_run_cli(sys_argv)) + sys.exit(_run_cli(sys_argv, True)) diff --git a/src/codemodder/codemods/base_codemod.py b/src/codemodder/codemods/base_codemod.py index 1c0c2e89..dce114a0 100644 --- a/src/codemodder/codemods/base_codemod.py +++ b/src/codemodder/codemods/base_codemod.py @@ -189,7 +189,7 @@ def _apply( self, context: CodemodExecutionContext, rules: list[str], - hardening: bool, + remediation: bool, ) -> None | TokenUsage: if self.provider and ( not (provider := context.providers.get_provider(self.provider)) @@ -228,7 +228,7 @@ def _apply( return None # Do each result independently and outputs the diffs - if not hardening: + if remediation: # gather positional arguments for the map resultset_arguments: list[ResultSet | None] = [] path_arguments = [] @@ -283,7 +283,7 @@ def _apply( return None def apply( - self, context: CodemodExecutionContext, hardening: bool = False + self, context: CodemodExecutionContext, remediation: bool = False ) -> None | TokenUsage: """ Apply the codemod with the given codemod execution context @@ -300,7 +300,7 @@ def apply( :param context: The codemod execution context """ - return self._apply(context, [self._internal_name], hardening) + return self._apply(context, [self._internal_name], remediation) def _process_file( self, @@ -399,9 +399,9 @@ def __init__( self.requested_rules.extend(requested_rules) def apply( - self, context: CodemodExecutionContext, hardening: bool = False + self, context: CodemodExecutionContext, remediation: bool = False ) -> None | TokenUsage: - return self._apply(context, self.requested_rules, hardening) + return self._apply(context, self.requested_rules, remediation) def get_files_to_analyze( self, diff --git a/src/codemodder/codemods/test/integration_utils.py b/src/codemodder/codemods/test/integration_utils.py index ee55681c..d1a4af6b 100644 --- a/src/codemodder/codemods/test/integration_utils.py +++ b/src/codemodder/codemods/test/integration_utils.py @@ -144,7 +144,7 @@ def setup_class(cls): def _assert_command_line(self, run, output_path): assert run[ "commandLine" - ] == f'codemodder {self.code_dir} --output {output_path} --codemod-include={self.codemod_instance.id} --path-include={self.code_filename} --path-exclude=""' + ( + ] == f'codemodder-remediation {self.code_dir} --output {output_path} --codemod-include={self.codemod_instance.id} --path-include={self.code_filename} --path-exclude=""' + ( f" --sonar-issues-json={self.sonar_issues_json}" if self.sonar_issues_json else "" @@ -184,7 +184,7 @@ def test_codetf_output(self, codetf_schema): """ command = [ - "codemodder", + "codemodder-remediation", self.code_dir, "--output", self.output_path, @@ -350,7 +350,7 @@ def teardown_class(cls): def _assert_command_line(self, run, output_path): assert run[ "commandLine" - ] == f'codemodder_hardening {self.code_dir} --output {output_path} --codemod-include={self.codemod_instance.id} --path-include={self.code_filename} --path-exclude=""' + ( + ] == f'codemodder {self.code_dir} --output {output_path} --codemod-include={self.codemod_instance.id} --path-include={self.code_filename} --path-exclude=""' + ( f" --sonar-issues-json={self.sonar_issues_json}" if self.sonar_issues_json else "" @@ -396,7 +396,7 @@ def test_file_rewritten(self, codetf_schema): output files """ command = [ - "codemodder_hardening", + "codemodder", self.code_dir, "--output", self.output_path, diff --git a/src/codemodder/codemods/test/utils.py b/src/codemodder/codemods/test/utils.py index 346a30d9..60f71206 100644 --- 
a/src/codemodder/codemods/test/utils.py +++ b/src/codemodder/codemods/test/utils.py @@ -73,7 +73,6 @@ def run_and_assert( path_exclude = [f"{tmp_file_path}:{line}" for line in lines_to_exclude or []] - print(expected_diff_per_change) self.execution_context = CodemodExecutionContext( directory=root, dry_run=True if expected_diff_per_change else False, @@ -85,7 +84,10 @@ def run_and_assert( path_exclude=path_exclude, ) - self.codemod.apply(self.execution_context) + self.codemod.apply( + self.execution_context, + remediation=True if expected_diff_per_change else False, + ) changes = self.execution_context.get_changesets(self.codemod.id) self.changeset = changes @@ -219,7 +221,6 @@ def run_and_assert( path_exclude = [f"{tmp_file_path}:{line}" for line in lines_to_exclude or []] - print(expected_diff_per_change) self.execution_context = CodemodExecutionContext( directory=root, dry_run=True if expected_diff_per_change else False, @@ -232,7 +233,10 @@ def run_and_assert( path_exclude=path_exclude, ) - self.codemod.apply(self.execution_context) + self.codemod.apply( + self.execution_context, + remediation=True if expected_diff_per_change else False, + ) changes = self.execution_context.get_changesets(self.codemod.id) if input_code == expected: diff --git a/src/core_codemods/defectdojo/api.py b/src/core_codemods/defectdojo/api.py index c024149c..d00d7ed9 100644 --- a/src/core_codemods/defectdojo/api.py +++ b/src/core_codemods/defectdojo/api.py @@ -76,11 +76,11 @@ def from_core_codemod( def apply( self, context: CodemodExecutionContext, - hardening: bool = False, + remediation: bool = False, ) -> None: self._apply( context, # We know this has a tool because we created it with `from_core_codemod` cast(ToolMetadata, self._metadata.tool).rule_ids, - hardening, + remediation, ) diff --git a/tests/codemods/test_base_codemod.py b/tests/codemods/test_base_codemod.py index fd998030..74373322 100644 --- a/tests/codemods/test_base_codemod.py +++ b/tests/codemods/test_base_codemod.py @@ -81,7 +81,7 @@ def test_core_codemod_filter_apply_by_extension(mocker, ext, call_count): Path("file2.py"), ] - codemod.apply(context, hardening=True) + codemod.apply(context) assert process_file.call_count == call_count From 2ab7c0bd4e7605e86ad4d872b3bb7f1c2f20f1be Mon Sep 17 00:00:00 2001 From: andrecs <12188364+andrecsilva@users.noreply.github.com> Date: Fri, 28 Mar 2025 09:37:26 -0300 Subject: [PATCH 21/27] Fixed pygoat test --- .github/workflows/codemod_pygoat.yml | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/.github/workflows/codemod_pygoat.yml b/.github/workflows/codemod_pygoat.yml index 848bb549..86e744d2 100644 --- a/.github/workflows/codemod_pygoat.yml +++ b/.github/workflows/codemod_pygoat.yml @@ -38,6 +38,6 @@ jobs: repository: pixee/pygoat path: pygoat - name: Run Codemodder - run: codemodder_hardening --dry-run --output output.codetf pygoat + run: codemodder --dry-run --output output.codetf pygoat - name: Check PyGoat Findings run: make pygoat-test From 04f5a99f13ce1e3b66f4c7d3ba6cb9d5f477c22c Mon Sep 17 00:00:00 2001 From: andrecs <12188364+andrecsilva@users.noreply.github.com> Date: Fri, 28 Mar 2025 10:24:16 -0300 Subject: [PATCH 22/27] Refactored hardening and remediation behavior --- src/codemodder/codemods/base_codemod.py | 161 ++++++++++++++---------- src/core_codemods/defectdojo/api.py | 12 +- 2 files changed, 104 insertions(+), 69 deletions(-) diff --git a/src/codemodder/codemods/base_codemod.py b/src/codemodder/codemods/base_codemod.py index dce114a0..a8e6c800 100644 --- 
a/src/codemodder/codemods/base_codemod.py
+++ b/src/codemodder/codemods/base_codemod.py
@@ -185,12 +185,98 @@ def get_files_to_analyze(
         """
         ...
 
-    def _apply(
+    def _apply_remediation(
         self,
         context: CodemodExecutionContext,
         rules: list[str],
-        remediation: bool,
     ) -> None | TokenUsage:
+        """
+        Applies remediation behavior to a codemod, that is, each changeset will only be associated with a single finding and no files will be written.
+        """
+        results: ResultSet | None = self._apply_detector(context)
+
+        if results is not None and not results:
+            logger.debug("No results for %s", self.id)
+            return None
+
+        if not (files_to_analyze := self.get_files_to_analyze(context, results)):
+            logger.debug("No files matched for %s", self.id)
+            return None
+
+        # Do each result independently and output the diffs
+        # gather positional arguments for the map
+        resultset_arguments: list[ResultSet | None] = []
+        path_arguments = []
+        if results:
+            for result in results.results_for_rules(rules):
+                # this needs to be the same type of ResultSet as results
+                singleton = results.__class__()
+                singleton.add_result(result)
+                result_locations = self.get_files_to_analyze(context, singleton)
+                # We do an execution for each location in the result
+                # So we duplicate the resultset argument for each location
+                for loc in result_locations:
+                    resultset_arguments.append(singleton)
+                    path_arguments.append(loc)
+        # An exception for find-and-fix codemods
+        else:
+            resultset_arguments = [None]
+            path_arguments = files_to_analyze
+
+        contexts: list = []
+        with ThreadPoolExecutor() as executor:
+            logger.debug("using executor with %s workers", context.max_workers)
+            contexts.extend(
+                executor.map(
+                    lambda path, resultset: self._process_file(
+                        path, context, resultset, rules
+                    ),
+                    path_arguments,
+                    resultset_arguments or [None],
+                )
+            )
+            executor.shutdown(wait=True)
+
+        context.process_results(self.id, contexts)
+        return None
+
+    def _apply_hardening(
+        self,
+        context: CodemodExecutionContext,
+        rules: list[str],
+    ) -> None | TokenUsage:
+        """
+        Applies hardening behavior to a codemod with the goal of integrating all fixes for each finding into the files.
+ """ + results: ResultSet | None = self._apply_detector(context) + + if results is not None and not results: + logger.debug("No results for %s", self.id) + return None + + if not (files_to_analyze := self.get_files_to_analyze(context, results)): + logger.debug("No files matched for %s", self.id) + return None + + # Hardens all findings per file at once and writes the fixed code into the file + process_file = functools.partial( + self._process_file, context=context, results=results, rules=rules + ) + + contexts = [] + if context.max_workers == 1: + logger.debug("processing files serially") + contexts.extend([process_file(file) for file in files_to_analyze]) + else: + with ThreadPoolExecutor() as executor: + logger.debug("using executor with %s workers", context.max_workers) + contexts.extend(executor.map(process_file, files_to_analyze)) + executor.shutdown(wait=True) + + context.process_results(self.id, contexts) + return None + + def _apply_detector(self, context: CodemodExecutionContext) -> ResultSet | None: if self.provider and ( not (provider := context.providers.get_provider(self.provider)) or not provider.is_available @@ -219,68 +305,7 @@ def _apply( else None ) - if results is not None and not results: - logger.debug("No results for %s", self.id) - return None - - if not (files_to_analyze := self.get_files_to_analyze(context, results)): - logger.debug("No files matched for %s", self.id) - return None - - # Do each result independently and outputs the diffs - if remediation: - # gather positional arguments for the map - resultset_arguments: list[ResultSet | None] = [] - path_arguments = [] - if results: - for result in results.results_for_rules(rules): - # this need to be the same type of ResultSet as results - singleton = results.__class__() - singleton.add_result(result) - result_locations = self.get_files_to_analyze(context, singleton) - # We do an execution for each location in the result - # So we duplicate the resultset argument for each location - for loc in result_locations: - resultset_arguments.append(singleton) - path_arguments.append(loc) - # An exception for find-and-fix codemods - else: - resultset_arguments = [None] - path_arguments = files_to_analyze - - contexts: list = [] - with ThreadPoolExecutor() as executor: - logger.debug("using executor with %s workers", context.max_workers) - contexts.extend( - executor.map( - lambda path, resultset: self._process_file( - path, context, resultset, rules - ), - path_arguments, - resultset_arguments or [None], - ) - ) - executor.shutdown(wait=True) - - context.process_results(self.id, contexts) - # Hardens all findings per file at once and writes the fixed code into the file - else: - process_file = functools.partial( - self._process_file, context=context, results=results, rules=rules - ) - - contexts = [] - if context.max_workers == 1: - logger.debug("processing files serially") - contexts.extend([process_file(file) for file in files_to_analyze]) - else: - with ThreadPoolExecutor() as executor: - logger.debug("using executor with %s workers", context.max_workers) - contexts.extend(executor.map(process_file, files_to_analyze)) - executor.shutdown(wait=True) - - context.process_results(self.id, contexts) - return None + return results def apply( self, context: CodemodExecutionContext, remediation: bool = False @@ -300,7 +325,9 @@ def apply( :param context: The codemod execution context """ - return self._apply(context, [self._internal_name], remediation) + if remediation: + return self._apply_remediation(context, 
[self._internal_name])
+        return self._apply_hardening(context, [self._internal_name])
 
     def _process_file(
         self,
@@ -401,7 +428,9 @@ def __init__(
         self.requested_rules.extend(requested_rules)
 
     def apply(
         self, context: CodemodExecutionContext, remediation: bool = False
     ) -> None | TokenUsage:
-        return self._apply(context, self.requested_rules, remediation)
+        if remediation:
+            return self._apply_remediation(context, self.requested_rules)
+        return self._apply_hardening(context, self.requested_rules)
 
     def get_files_to_analyze(
         self,
diff --git a/src/core_codemods/defectdojo/api.py b/src/core_codemods/defectdojo/api.py
index d00d7ed9..318993cc 100644
--- a/src/core_codemods/defectdojo/api.py
+++ b/src/core_codemods/defectdojo/api.py
@@ -8,6 +8,7 @@
 from codemodder.codemods.api import Metadata, Reference, ToolMetadata, ToolRule
 from codemodder.codemods.base_detector import BaseDetector
 from codemodder.context import CodemodExecutionContext
+from codemodder.llm import TokenUsage
 from codemodder.result import ResultSet
 from core_codemods.api import CoreCodemod, SASTCodemod
 
@@ -77,10 +78,15 @@ def apply(
         self,
         context: CodemodExecutionContext,
         remediation: bool = False,
-    ) -> None:
-        self._apply(
+    ) -> None | TokenUsage:
+        if remediation:
+            return self._apply_remediation(
+                context,
+                # We know this has a tool because we created it with `from_core_codemod`
+                cast(ToolMetadata, self._metadata.tool).rule_ids,
+            )
+        return self._apply_hardening(
             context,
             # We know this has a tool because we created it with `from_core_codemod`
             cast(ToolMetadata, self._metadata.tool).rule_ids,
-            remediation,
         )

From e994695dc4d3146250d7b750720e240a0c0dcdde Mon Sep 17 00:00:00 2001
From: andrecs <12188364+andrecsilva@users.noreply.github.com>
Date: Fri, 28 Mar 2025 11:35:08 -0300
Subject: [PATCH 23/27] Fixed skipping logic

---
 src/codemodder/codemods/base_codemod.py | 14 +++++++++++---
 1 file changed, 11 insertions(+), 3 deletions(-)

diff --git a/src/codemodder/codemods/base_codemod.py b/src/codemodder/codemods/base_codemod.py
index a8e6c800..1f64f23a 100644
--- a/src/codemodder/codemods/base_codemod.py
+++ b/src/codemodder/codemods/base_codemod.py
@@ -193,6 +193,8 @@ def _apply_remediation(
         """
         Applies remediation behavior to a codemod, that is, each changeset will only be associated with a single finding and no files will be written.
         """
+        if self._should_skip(context):
+            return None
         results: ResultSet | None = self._apply_detector(context)
 
         if results is not None and not results:
@@ -248,6 +250,8 @@ def _apply_hardening(
         """
         Applies hardening behavior to a codemod with the goal of integrating all fixes for each finding into the files.
""" + if self._should_skip(context): + return None results: ResultSet | None = self._apply_detector(context) if results is not None and not results: @@ -276,7 +280,7 @@ def _apply_hardening( context.process_results(self.id, contexts) return None - def _apply_detector(self, context: CodemodExecutionContext) -> ResultSet | None: + def _should_skip(self, context: CodemodExecutionContext): if self.provider and ( not (provider := context.providers.get_provider(self.provider)) or not provider.is_available @@ -284,7 +288,7 @@ def _apply_detector(self, context: CodemodExecutionContext) -> ResultSet | None: logger.warning( "provider %s is not available, skipping codemod", self.provider ) - return None + return True if isinstance(self.detector, SemgrepRuleDetector): if ( @@ -296,7 +300,10 @@ def _apply_detector(self, context: CodemodExecutionContext) -> ResultSet | None: "no results from semgrep for %s, skipping analysis", self.id, ) - return None + return True + return False + + def _apply_detector(self, context: CodemodExecutionContext) -> ResultSet | None: results: ResultSet | None = ( # It seems like semgrep doesn't like our fully-specified id format so pass in short name instead. @@ -429,6 +436,7 @@ def apply( self, context: CodemodExecutionContext, remediation: bool = False ) -> None | TokenUsage: if remediation: + print("0000000000000000000000000000000000000000000000000000000000") return self._apply_remediation(context, self.requested_rules) return self._apply_hardening(context, self.requested_rules) From 05821377fddf8e0f8b570bae9dda48048683f5c1 Mon Sep 17 00:00:00 2001 From: andrecs <12188364+andrecsilva@users.noreply.github.com> Date: Thu, 3 Apr 2025 09:28:58 -0300 Subject: [PATCH 24/27] Fixed asserts in integration tests with sonar issues --- src/codemodder/codemods/test/integration_utils.py | 5 +++-- 1 file changed, 3 insertions(+), 2 deletions(-) diff --git a/src/codemodder/codemods/test/integration_utils.py b/src/codemodder/codemods/test/integration_utils.py index d1a4af6b..917b2d0f 100644 --- a/src/codemodder/codemods/test/integration_utils.py +++ b/src/codemodder/codemods/test/integration_utils.py @@ -90,8 +90,9 @@ def _assert_results_fields(self, results, output_path): for ref in self.codemod_instance.references ] - assert ("detectionTool" in result) == bool(self.sonar_issues_json) - assert ("detectionTool" in result) == bool(self.sonar_hotspots_json) + assert ("detectionTool" in result) == bool(self.sonar_issues_json) or ( + "detectionTool" in result + ) == bool(self.sonar_hotspots_json) # TODO: if/when we add description for each url for reference in result["references"][ From 18cd5e79b0f8de238175c9b6481356a0b45cb933 Mon Sep 17 00:00:00 2001 From: andrecs <12188364+andrecsilva@users.noreply.github.com> Date: Thu, 3 Apr 2025 09:30:44 -0300 Subject: [PATCH 25/27] Removed debugging code --- src/codemodder/codemods/base_codemod.py | 1 - 1 file changed, 1 deletion(-) diff --git a/src/codemodder/codemods/base_codemod.py b/src/codemodder/codemods/base_codemod.py index 1f64f23a..59dceb0a 100644 --- a/src/codemodder/codemods/base_codemod.py +++ b/src/codemodder/codemods/base_codemod.py @@ -436,7 +436,6 @@ def apply( self, context: CodemodExecutionContext, remediation: bool = False ) -> None | TokenUsage: if remediation: - print("0000000000000000000000000000000000000000000000000000000000") return self._apply_remediation(context, self.requested_rules) return self._apply_hardening(context, self.requested_rules) From 63e302a857ea23e39a00c2fb9ea4829238d47c1c Mon Sep 17 00:00:00 2001 From: 
andrecs <12188364+andrecsilva@users.noreply.github.com>
Date: Wed, 9 Apr 2025 08:00:27 -0300
Subject: [PATCH 26/27] Downgraded pydantic version and bumped sarif-pydantic

---
 pyproject.toml | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/pyproject.toml b/pyproject.toml
index 4a29336e..e6db227b 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -16,7 +16,7 @@ dependencies = [
     "isort>=5.12,<6.1",
     "libcst>=1.7,<1.8",
     "packaging>=23.2,<25.0",
-    "pydantic~=2.11.1",
+    "pydantic~=2.10.6",
     "pylint>=3.3,<3.4",
     "python-json-logger~=3.3.0",
     "PyYAML~=6.0.0",
@@ -25,7 +25,7 @@ dependencies = [
     "tomlkit~=0.13.0",
     "wrapt~=1.17.0",
     "chardet~=5.2.0",
-    "sarif-pydantic~=0.5.0",
+    "sarif-pydantic~=0.5.1",
     "setuptools~=78.1",
 ]
 keywords = ["codemod", "codemods", "security", "fix", "fixes"]

From bb955153283d2fbb966237d3762873160c74e218 Mon Sep 17 00:00:00 2001
From: andrecs <12188364+andrecsilva@users.noreply.github.com>
Date: Mon, 14 Apr 2025 08:21:08 -0300
Subject: [PATCH 27/27] Added method to create ResultSets from the same type

---
 src/codemodder/codemods/base_codemod.py | 3 +--
 src/codemodder/result.py                | 9 +++++++++
 2 files changed, 10 insertions(+), 2 deletions(-)

diff --git a/src/codemodder/codemods/base_codemod.py b/src/codemodder/codemods/base_codemod.py
index 59dceb0a..bd36afb4 100644
--- a/src/codemodder/codemods/base_codemod.py
+++ b/src/codemodder/codemods/base_codemod.py
@@ -212,8 +212,7 @@ def _apply_remediation(
         if results:
             for result in results.results_for_rules(rules):
                 # this needs to be the same type of ResultSet as results
-                singleton = results.__class__()
-                singleton.add_result(result)
+                singleton = results.from_single_result(result)
                 result_locations = self.get_files_to_analyze(context, singleton)
                 # We do an execution for each location in the result
                 # So we duplicate the resultset argument for each location
diff --git a/src/codemodder/result.py b/src/codemodder/result.py
index e6b473de..f38a4af5 100644
--- a/src/codemodder/result.py
+++ b/src/codemodder/result.py
@@ -284,6 +284,15 @@ def files_for_rule(self, rule_id: str) -> list[Path]:
     def all_rule_ids(self) -> list[str]:
         return list(self.keys())
 
+    @classmethod
+    def from_single_result(cls, result: ResultType) -> Self:
+        """
+        Creates a new ResultSet of the same type with a given result.
+        """
+        new = cls()
+        new.add_result(result)
+        return new
+
     def __or__(self, other):
         result = self.__class__()
         for k in self.keys() | other.keys():