SMAC/SMAC_FlowDroid_1.py at main · L-Jubarah-upb/SMAC · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
"""
Aim: search for optimal configuration of cgalgo to minimize
    the difference between found-leaks and expected-leaks
    (this is the target function in train function)
cgalgo: Callgraph algorithm to use
    (AUTO, CHA, VTA, RTA, SPARK, GEOM)
use APK-file of DroidBench:
/Users/ljubarah/DroidBench-develop/apk/Aliasing/FlowSensitivity1.apk
contains one leak with:
<android.util.Log: int i(java.lang.String,java.lang.String)> -> _SINK_
<android.telephony.TelephonyManager: java.lang.String getDeviceId()> -> _SOURCE_

this file is based on the example of the SMAC3-website:
https://automl.github.io/SMAC3/v2.3.0/examples/1%20Basics/1_quadratic_function/
"""
from distributed.diagnostics.task_stream import prefix

"""
Configuration is a class of package ConfigSpace and contains only one configuration
ConfigurationSpace is also a class and contains multiple configurations,
i.e. configurations can be sampled from the ConfigurationSpace
Categorical creates a CategoricalHyperparameter
"""
import re
from ConfigSpace import Configuration, ConfigurationSpace, Categorical
import statistics
import time

# Wall-clock deadline in epoch seconds, computed once when this module is
# loaded: 60 seconds after import. train() compares time.time() against it.
# NOTE(review): the deadline is shared by every train() call of the process,
# it is not restarted per trial - confirm this is intended.
timeout = time.time() + 60 * 1  # 1 minute

# from matplotlib import pyplot as plt
# from smac.facade.algorithm_configuration_facade import AlgorithmConfigurationFacade as ACFacade
from smac.facade.hyperparameter_optimization_facade import HyperparameterOptimizationFacade as HPOFacade  # todo: change smac.facade?

"""
RunHistory: contains information of evaluated/running trials and calculates the cost
(SMAC automatically generates an output file -> have a look into that)
Scenario: contains variables of the environment: configuration space, number of trials, time limit etc.
"""
from smac import Scenario  # ,RunHistory

"""os to execute FlowDroid from this python-script"""
import os

import json
import re


class FlowDroid_configuration_SMAC:
    """
    SMAC model that tunes FlowDroid options on the DroidBench "Aliasing" apps.

    ``configspace`` describes the options that are searched and ``train`` is
    the target function: it runs FlowDroid with one configuration and returns
    a cost that is small when the reported leaks match the expected ones.
    """

    # Patterns for the XML-escaped statements in FlowDroid's result file.
    # findall() yields 4-tuples; element 1 (first <...> after the keyword) is
    # used as the source/sink statement and element 3 (the next <...>) as the
    # method it belongs to.
    _SOURCE_PATTERN = re.compile('Source Statement(.*?)&lt;(.*?)&gt;(.*?)&lt;(.*?)&gt;')
    _SINK_PATTERN = re.compile('Sink Statement(.*?)&lt;(.*?)&gt;(.*?)&lt;(.*?)&gt;')

    @property
    def configspace(self) -> "ConfigurationSpace":
        """
        Build the search space of FlowDroid options.

        A new ConfigurationSpace with seed=0 is created on every access and
        filled with three categorical hyperparameters:
        aliasalgo (-aa), layoutmode (-l) and callbackanalyzer (-ca).
        SMAC samples configurations from this space and train() evaluates them.

        :return: the ConfigurationSpace
        """
        cs = ConfigurationSpace(seed=0)
        cs.add([
            Categorical("aliasalgo", ["NONE", "FLOWSENSITIVE", "PTSBASED", "LAZY"]),  # -aa
            Categorical("layoutmode", ["NONE", "PWD", "ALL"]),  # -l
            Categorical("callbackanalyzer", ["DEFAULT", "FAST"]),  # -ca
        ])

        # Further FlowDroid options that are not tuned yet (kept for reference):
        #   cgalgo:                 AUTO, CHA, VTA, RTA, SPARK, GEOM (default CHA)
        #   pathreconstructionmode: NONE, FAST, PRECISE
        #   codeelimination:        NONE, PROPAGATECONSTS, REMOVECODE
        #   dataflowsolver:         CONTEXTFLOWSENSITIVE, FLOWINSENSITIVE
        #   implicit:               NONE, ARRAYONLY, ALL
        #   pathalgo:               CONTEXTSENSITIVE, CONTEXTINSENSITIVE, SOURCESONLY
        #   staticmode:             CONTEXTFLOWSENSITIVE, CONTEXTFLOWINSENSITIVE, NONE
        #   taintwrapper:           NONE, EASY, STUBDROID, MULTI
        #   callbacksourcemode:     NONE, ALL, SOURCELIST
        return cs

    @staticmethod
    def _expected_flows(expected_info):
        """
        Collect the expected flows from a parsed expected-info-flows.json.

        :param expected_info: dict with the list "expected-info-flows"
        :return: (sources, sinks), two sets of (method, statement) pairs;
                 entries without "Method" cannot be located and are ignored
        """
        sources, sinks = set(), set()
        for flow in expected_info["expected-info-flows"]:
            if "Method" not in flow:
                continue
            if "Source" in flow:
                sources.add((flow["Method"], flow["Source"]))
            if "Sink" in flow:
                sinks.add((flow["Method"], flow["Sink"]))
        return sources, sinks

    @classmethod
    def _found_flows(cls, flowdroid_xml):
        """
        Collect the flows FlowDroid reported from the text of its result file.

        :param flowdroid_xml: content of the output file as one string
        :return: (sources, sinks), two sets of (method, statement) pairs
        """
        sources = {(hit[3], hit[1]) for hit in cls._SOURCE_PATTERN.findall(flowdroid_xml)}
        sinks = {(hit[3], hit[1]) for hit in cls._SINK_PATTERN.findall(flowdroid_xml)}
        return sources, sinks

    @staticmethod
    def _f_score(expected_sources, found_sources, expected_sinks, found_sinks):
        """
        F-measure F = 2TP / (2TP + FP + FN) over sources and sinks together.

        :return: value in [0, 1]; 1.0 when nothing was expected and nothing found
        """
        true_positives = len(expected_sources & found_sources) + len(expected_sinks & found_sinks)
        false_negatives = len(expected_sources - found_sources) + len(expected_sinks - found_sinks)
        false_positives = len(found_sources - expected_sources) + len(found_sinks - expected_sinks)

        denominator = 2 * true_positives + false_positives + false_negatives
        if denominator == 0:  # all four sets are empty: perfect agreement
            return 1.0
        return 2 * true_positives / denominator

    def train(self, config: "Configuration", seed: int = 0) -> float:
        """
        Run FlowDroid with ``config`` on the Aliasing apps and return the cost.

        For every apk the leaks reported by FlowDroid are compared with the
        app's expected-info-flows.json and the F-measure
        F = 2TP / (2TP + FP + FN) is computed. F lies in [0, 1] and should be
        maximised, while SMAC minimises the returned value, so the cost is
        1 - mean(F) over all evaluated apks.

        All apks of one DroidBench subset are evaluated per configuration
        because algorithm configuration looks for the configuration with the
        lowest aggregated cost over a set of similar instances (Eggensperger
        et al. 2019, Pitfalls and Best Practices in Algorithm Configuration).
        Example with three instances i_1, i_2, i_3:
            c(conf_1, i_1..i_3) = 2, 5, 4   -> sum 11
            c(conf_2, i_1..i_3) = 20, 1, 1  -> sum 22
        conf_1 has the lower total cost and is therefore the better one.

        :param config: configuration providing "aliasalgo", "callbackanalyzer"
                       and "layoutmode"
        :param seed: not used; kept so the signature stays unchanged
        :return: 1 - mean F-measure, in [0, 1]; 1.0 if no apk was evaluated
        """
        aliasalgo = config["aliasalgo"]  # -aa
        callbackanalyzer = config["callbackanalyzer"]  # -ca
        layoutmode = config["layoutmode"]  # -l

        path_to_sdk = "/Users/ljubarah/Library/Android/sdk/platforms"  # sdk platform (always same)
        sources_and_sinks = "/Users/ljubarah/DroidBench-develop/SourcesAndSinks.txt"  # always same
        path = "/Users/ljubarah/DroidBench-develop"
        apk_dir = path + "/apk/Aliasing"

        # Only real apk files: other directory entries (e.g. .DS_Store) must
        # not be handed to FlowDroid. Sorted so every trial uses the same order.
        names = sorted(entry[:-4] for entry in os.listdir(apk_dir) if entry.endswith(".apk"))

        f_scores = []  # one F-measure per evaluated apk
        for name in names:
            # Checked before launching FlowDroid so that the result of a run
            # which already finished is never thrown away.
            if time.time() > timeout:
                break

            apk = apk_dir + "/" + name + ".apk"
            expected = path + "/eclipse-project/Aliasing/" + name + "/expected-info-flows.json"
            output = (path + "/eclipse-project/Aliasing/Output_15_04_2025/" + name
                      + f"/{callbackanalyzer}_{aliasalgo}_{layoutmode}.xml")
            # make sure the directory of the result file exists
            os.makedirs(os.path.dirname(output), exist_ok=True)

            app = ("java -jar /Users/ljubarah/FlowDroid-2.14.1/soot-infoflow-cmd-2.14.1-jar-with-dependencies.jar "
                   "-a {a} -p {p} -s {s} -o {o} "
                   "-ca {ca} -aa {aa} -l {l}").format(a=apk, p=path_to_sdk, s=sources_and_sinks, o=output,
                                                      ca=callbackanalyzer,
                                                      aa=aliasalgo, l=layoutmode)
            os.system(app)

            # DroidBench does not ship an expected file for every apk; a
            # missing file is treated as "no flow expected".
            expected_sources, expected_sinks = set(), set()
            if os.path.isfile(expected):
                with open(expected) as expected_file:
                    expected_sources, expected_sinks = self._expected_flows(json.load(expected_file))

            # FlowDroid does not always write an output file (e.g. when no
            # leak was found); a missing file is treated as "no flow found".
            found_sources, found_sinks = set(), set()
            if os.path.isfile(output):
                with open(output) as output_file:
                    found_sources, found_sinks = self._found_flows(output_file.read())

            f_scores.append(self._f_score(expected_sources, found_sources, expected_sinks, found_sinks))

        if not f_scores:
            # nothing could be evaluated (no apk or deadline passed): worst cost
            return 1.0
        return 1 - sum(f_scores) / len(f_scores)

    # def plot


if __name__ == "__main__":

    # the model bundles the search space (configspace) and the target function (train)
    model = FlowDroid_configuration_SMAC()

    # the scenario describes the environment of the optimisation run
    scenario = Scenario(model.configspace, deterministic=True, n_trials=18 * 6)

    # facade that runs model.train inside the scenario
    # todo: try others instead of HPOFacade
    smac = HPOFacade(scenario, model.train, overwrite=True)

    # search for the configuration with the lowest cost
    # todo: smac.optimize() (another things i can do with smac else than smac.optimize ?)
    incumbent = smac.optimize()

    # cost of the default configuration, as a baseline for the incumbent
    default = model.configspace.get_default_configuration()
    default_cost = smac.validate(model.configspace.get_default_configuration())
    print(f"Default configuration: {default}")
    print(f"Default cost: {default_cost}")

    # cost of the incumbent (best configuration found)
    incumbent_cost = smac.validate(incumbent)
    print(f"Incumbent configuration: {incumbent}")
    print(f"Optimal cost: {incumbent_cost}")

    print("")
    print("Runhistory:")

    # todo: plot the results over history
    # one record per evaluated trial: id, configuration and its cost
    for trial_key, trial_value in smac.runhistory.items():
        config_id = trial_key.config_id
        config = smac.runhistory.get_config(config_id)
        print("------------------------")
        print("configuration_id= {id}".format(id=config_id))
        print("configuration = {config}".format(config=config))
        print("cost = {cost}".format(cost=trial_value.cost))
        print("------------------------")

# todo: close the files (because i opened e.g. expected-flow-files
# todo: n_trials should be larger than cross product of all combinations