This commit is contained in:
Jean-Marie Mineau 2025-05-21 17:30:26 +02:00
parent 0b5f6e4b25
commit 00582dddc4
Signed by: histausse
GPG key ID: B66AEEDA9B645AD2

View file

@ -0,0 +1,146 @@
from pathlib import Path
import argparse
import json
import androguard # type: ignore
from androguard.core.dex import DEX # type: ignore
from androguard.core.apk import APK # type: ignore
androguard.util.set_log("SUCCESS") # type: ignore
def check_app_result(path: Path, app_folder: Path, summary: dict):
if (path / "TIMEOUT").exists():
summary["nb_timeout"] += 1
return
if not (path / "data.json").exists():
return
with (path / "data.json").open() as fp:
data = json.load(fp)
if "error" in data:
summary["nb_failed"] += 1
return
nb_class_collision_at_invoke = 0
seen = {}
for invoke_data in data["invoke_data"]:
call_site = (
invoke_data["caller_method"],
invoke_data["caller_cl_id"],
invoke_data["addr"],
)
clazz = invoke_data["method"].split("->")[0]
id_ = (call_site, clazz)
cl = invoke_data["method_cl_id"]
if id_ not in seen:
seen[id_] = {cl} # first call
if cl not in seen[id_]:
nb_class_collision_at_invoke += 1
seen[id_].add(cl)
seen = {}
for invoke_data in data["class_new_inst_data"]:
call_site = (
invoke_data["caller_method"],
invoke_data["caller_cl_id"],
invoke_data["addr"],
)
clazz = invoke_data["constructor"].split("->")[0]
id_ = (call_site, clazz)
cl = invoke_data["constructor_cl_id"]
if id_ not in seen:
seen[id_] = {cl} # first call
if cl not in seen[id_]:
nb_class_collision_at_invoke += 1
seen[id_].add(cl)
seen = {}
for invoke_data in data["cnstr_new_inst_data"]:
call_site = (
invoke_data["caller_method"],
invoke_data["caller_cl_id"],
invoke_data["addr"],
)
clazz = invoke_data["constructor"].split("->")[0]
id_ = (call_site, clazz)
cl = invoke_data["constructor_cl_id"]
if id_ not in seen:
seen[id_] = {cl} # first call
if cl not in seen[id_]:
nb_class_collision_at_invoke += 1
seen[id_].add(cl)
classes_by_cl: dict[str, list[str]] = {}
dyn_load_classes = set()
for dyn_load in data["dyn_code_load"]:
dyn_load_classes.add(dyn_load["classloader_class"])
cl_id = dyn_load["classloader"]
if cl_id not in classes_by_cl:
classes_by_cl[cl_id] = []
for file in dyn_load["files"]:
with open(file, "rb") as fp:
dex_bin = fp.read()
dex = DEX(dex_bin)
classes_by_cl[cl_id].extend(dex.get_classes())
apk_name = f"{path.name}.apk"
apk = APK(str(app_folder / apk_name))
cl_id = data["apk_cl_id"]
if cl_id not in classes_by_cl:
classes_by_cl[cl_id] = []
for dex_bin in apk.get_all_dex():
dex = DEX(dex_bin)
classes_by_cl[cl_id].extend(dex.get_classes())
nb_class_collision = 0
already_found: set[str] = set()
for cls_l in classes_by_cl.values():
cls: set[str] = set(cls_l)
nb_class_collision += len(already_found.intersection(cls))
already_found.update(cls)
summary["apks"][path.name] = {
"nb_class_collision": nb_class_collision,
"nb_class_collision_at_invoke": nb_class_collision_at_invoke,
}
if nb_class_collision:
summary["nb_with_class_collision"] += 1
if nb_class_collision_at_invoke:
summary["nb_with_class_collision_at_invoke"] += 1
def run(folder: Path, app_folder: Path):
summary = {
"nb_timeout": 0,
"nb_failed": 0,
"nb_with_class_collision": 0,
"nb_with_class_collision_at_invoke": 0,
"apks": {},
}
for p in folder.iterdir():
if p.is_dir():
check_app_result(p, app_folder, summary)
print(json.dumps(summary, indent=" "))
def main():
parser = argparse.ArgumentParser(
prog="check_collision",
description="check the result of the dynamic analysis and look at class collision",
)
parser.add_argument(
"result_folder",
type=Path,
help="Folder containing the result of the experiment",
)
parser.add_argument(
"app_folder",
type=Path,
help="Folder containing the apks of the experiment",
)
args = parser.parse_args()
run(args.result_folder, args.app_folder)
if __name__ == "__main__":
main()