import time import unittest import shutil import os import threading from detection.utils import read_file_content from .final_tests_util import clone_repo, Path, inject_random_backdoor from detection.Regexdetection import find_dangerous_functions from detection.GPTdetection import detectGPT def GPTdetectFileList(fileList): results = [] threads = [] for file in fileList: content = read_file_content(str(file)) threads.append(threading.Thread(target=GPTThread(), args=(content, results))) for thread in threads: thread.start() time.sleep(0.5) for thread in threads: thread.join() return results def GPTThread(content, results): try: results.append(detectGPT(content)) except Exception as e: print(e) class TestFinalTests(unittest.TestCase): def setUp(self) -> None: self.path = "./tmp/repo/" shutil.rmtree(self.path, ignore_errors=True) if not os.path.exists("/tmp/Python/"): clone_repo("https://github.com/TheAlgorithms/Python.git", "/tmp/Python") shutil.copytree("/tmp/Python", self.path) sampleRate = 0.1 self.inject_result = inject_random_backdoor( self.path, sample_rate=sampleRate, pyc=True, pickle=True ) self.injectedNum = len(self.inject_result) print(self.injectedNum) project_path = Path(self.path) self.all_python_files = list(project_path.rglob("*.py")) self.py_filesNum = len(self.all_python_files) all_pickle_files = list(project_path.rglob("*.pickle")) self.pickle_filesNum = len(all_pickle_files) all_pyc_files = list(project_path.rglob("*.pyc")) self.pyc_filesNum = len(all_pyc_files) os.system( "python -m detection " + self.path + " -o " + self.path + "output.txt" ) def test_final_tests_pycode(self): # test backdoor code in python files detectedNum = 0 possibly_dangerous_file = [] for file in self.all_python_files: content = read_file_content(str(file)) results = find_dangerous_functions(content, ".py") if ( len(results["high"]) > 0 or len(results["medium"]) > 0 or len(results["low"]) > 0 ): detectedNum += 1 possibly_dangerous_file.append(file) print(detectedNum / self.py_filesNum) GPTdetectedNum = 0 for i in possibly_dangerous_file: content = read_file_content(str(i)) results = {} try: results = detectGPT(content) if ( len(results["high"]) > 0 or len(results["medium"]) > 0 or len(results["low"]) > 0 ): GPTdetectedNum += 1 print(GPTdetectedNum) except Exception as e: # print(e) pass # test injected code with open(self.path + "output.txt", "r") as f: lines = f.readlines() injected_detectedNum = 0 for line in lines: if "py:" in line: injected_detectedNum += 1 injected_accurency = injected_detectedNum / self.injectedNum print(f"injected files accurency: {injected_accurency}") GPTresult = GPTdetectFileList(possibly_dangerous_file) for result in GPTresult: if len(result) > 0: GPTdetectedNum += 1 print(GPTdetectedNum) self.assertGreaterEqual(GPTdetectedNum, detectedNum) # test pickle files with open(self.path + "output.txt", "r") as f: lines = f.readlines() pickle_detectedNum = 0 for line in lines: if "pickle" in line: pickle_detectedNum += 1 pickle_accurency = pickle_detectedNum / self.pickle_filesNum print(f"pickle files accurency: {pickle_accurency}") # test pyc files with open(self.path + "output.txt", "r") as f: lines = f.readlines() pyc_detectedNum = 0 for line in lines: if "pyc" in line: pyc_detectedNum += 1 pyc_accurency = pyc_detectedNum / self.pyc_filesNum print(f"pyc files accurency: {pyc_accurency}") if __name__ == "__main__": unittest.main()