
Some code cleanup/restructuring; add a server-port offset and identify request/reply messages.
More cleanup and better documentation will follow.

dustin.born 7 years ago
commit be0471c882

+ 34 - 73
code/Attack/MembersMgmtCommAttack.py

@@ -1,7 +1,8 @@
 from enum import Enum
+
 class MessageType(Enum):
     """
-    Defines possible Message types
+    Defines possible botnet message types
     """
 
     TIMEOUT = 3
@@ -10,6 +11,19 @@ class MessageType(Enum):
     SALITY_HELLO = 103
     SALITY_HELLO_REPLY = 104
 
+class Message():
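+    """
+    Represents a single abstract botnet message, optionally referencing the message it replies to
+    via refer_msg_id.
+    """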
+    def __init__(self, msg_id: int, src: str, dst: str, type_: MessageType, time: float, refer_msg_id: int=-1):
+        self.msg_id = msg_id
+        self.src = src
+        self.dst = dst
+        self.type = type_
+        self.time = time
+        self.refer_msg_id = refer_msg_id
+
+    def __str__(self):
+        str_ = "{0}. at {1}: {2}-->{3}, {4}, refer:{5}".format(self.msg_id, self.time, self.src, self.dst, self.type, self.refer_msg_id)
+        return str_
+
 from random import randint, randrange, choice
 from collections import deque
 from scipy.stats import gamma
@@ -23,13 +37,10 @@ from ID2TLib import FileUtils, PaddingGenerator
 from ID2TLib.PacketGenerator import PacketGenerator
 from ID2TLib.IPGenerator import IPGenerator 
 from ID2TLib.PcapAddressOperations import PcapAddressOperations
-from ID2TLib.MapInputCSVToIDs import find_interval_with_most_comm, determine_id_roles
+from ID2TLib.CommunicationProcessor import CommunicationProcessor
 from ID2TLib.MacAddressGenerator import MacAddressGenerator
 from ID2TLib.PortGenerator import gen_random_server_port
 
-###### MOVE LOCAL, EXTERNAL IP DECISION INTO MAP CLASS ???? ######
-###### REQUEST/REPLY IDENTIFICATION: NEW DATASTRUCTURE THAT KEEPS REQ AND REPL AND ALL IMPORTANT INFOS (ADDR, ID, PORT). #######
-###### CREATE WHEN DETERMINING INITIATOR AND RESPONDER AND UPDATE LATER WITH ADDRESSES ... ########
 
 class MembersMgmtCommAttack(BaseAttack.BaseAttack):
     def __init__(self):
@@ -146,35 +157,25 @@ class MembersMgmtCommAttack(BaseAttack.BaseAttack):
             filepath_xml = FileUtils.parse_csv_to_xml(filepath_csv) 
 
         abstract_packets = FileUtils.parse_xml(filepath_xml)
-        
+
         # find a good communication mapping
         duration = self.get_param_value(Param.ATTACK_DURATION)
         number_bots = self.get_param_value(Param.NUMBER_BOTS)
-        comm_interval = find_interval_with_most_comm(abstract_packets, number_bots, duration)[0]
+        comm_proc = CommunicationProcessor(abstract_packets)
+        comm_interval = comm_proc.find_interval_with_most_comm(number_bots, duration)[0]
 
         if comm_interval is None:
             print("Error: There is no interval in the given CSV/XML that has enough communication")
             return 0, None
 
         mapped_ids, id_comms, packet_start_idx, packet_end_idx = comm_interval["IDs"], comm_interval["Comms"], comm_interval["Start"], comm_interval["End"]
-
+        # print(mapped_ids)
+        comm_proc.set_mapping(abstract_packets[packet_start_idx:packet_end_idx+1], mapped_ids, id_comms)
+        # print(mapped_ids)
         # print start and end time of mapped interval
         # print(abstract_packets[packet_start_idx]["Time"])
         # print(abstract_packets[packet_end_idx]["Time"])
 
-        # determine most common communicating IDs
-        # total_mentions = 0
-        # most_common_thres = self.MOST_COMMON_THRES
-        # most_common_ids = {}
-        # for id_ in mapped_ids:
-        #     total_mentions += mapped_ids[id_]
-
-        # for id_ in mapped_ids:
-        #     count = mapped_ids[id_]
-        #     mentions_percentage = count / total_mentions
-        #     if mentions_percentage >= most_common_thres:
-        #         most_common_ids[id_] = mentions_percentage
-
         # determine amount of reused IPs
         reuse_percent_total = self.get_param_value(Param.IP_REUSE_TOTAL)
         reuse_percent_external = self.get_param_value(Param.IP_REUSE_EXTERNAL)
@@ -189,63 +190,20 @@ class MembersMgmtCommAttack(BaseAttack.BaseAttack):
         pcapops = PcapAddressOperations(self.statistics)
         router_mac = pcapops.get_probable_router_mac()
         bot_configs = {}
-        external_ids = set()
-        local_ids = set()
-        id_comms = sorted(id_comms)
-        # print(self.get_param_value(Param.INJECT_AT_TIMESTAMP))
+        init_ids, respnd_ids, both_ids, messages = comm_proc.det_id_roles_and_msgs(self.msg_types)
+        local_ids, external_ids = comm_proc.det_ext_and_local_ids(comm_type, self.PROB_INIT_IS_LOCAL, self.PROB_RESPND_IS_LOCAL)
+        # print(external_ids)
 
-        if comm_type == "local":
-            local_ids = set(mapped_ids.keys())
-        else:
-            init_local_or_external = Lea.fromValFreqsDict({"local": self.PROB_INIT_IS_LOCAL*100, "external": (1-self.PROB_INIT_IS_LOCAL)*100})
-            mixed_respnd_is_local = Lea.fromValFreqsDict({"local": self.PROB_RESPND_IS_LOCAL*100, "external": (1-self.PROB_RESPND_IS_LOCAL)*100})
-            ids = set(mapped_ids.keys())
-            init_ids, respnd_ids, both_ids = determine_id_roles(abstract_packets[packet_start_idx:packet_end_idx+1], ids)
-
-            # assign IDs in 'both' local everytime for mixed? 
-            initiators = sorted(list(init_ids) + list(both_ids))
-            for id_ in initiators:
-                if id_ in local_ids or id_ in external_ids:
-                    continue
+        # for msg in messages:
+        #     print(msg)
 
-                pos = init_local_or_external.random()          
-                if pos == "local":
-                    local_ids.add(id_) 
-                    for id_comm in id_comms:
-                        ids = id_comm.split("-")
-                        other = ids[0] if id_ == ids[1] else ids[1] 
-                        
-                        # what if before other was external ...
-                        if other in local_ids or other in external_ids:
-                            continue 
-
-                        if comm_type == "mixed":
-                            other_pos = mixed_respnd_is_local.random()
-                            if other_pos == "local":
-                                local_ids.add(other)
-                            elif other_pos == "external":
-                                external_ids.add(other)
-                        elif comm_type == "external":
-                            if not other in initiators:
-                                external_ids.add(other)
-
-                elif pos == "external":
-                    external_ids.add(id_)
-                    for id_comm in id_comms:
-                        ids = id_comm.split("-")
-                        other = ids[0] if id_ == ids[1] else ids[1] 
-                        
-                        # what if before other was external ...
-                        if other in local_ids or other in external_ids:
-                            continue 
-                        if not other in initiators:
-                            local_ids.add(other)
-
-
-        # print(sorted(initiators))
+        # print(sorted(list(init_ids)+list(both_ids)))
         # print(sorted(local_ids))
         # print(sorted(external_ids))
 
+        #### Set realistic timestamps for messages ####
+        #### ... ####
+
         # IDs are always added to bot_configs in the same order under a given seed
         number_local_ids, number_external_ids = len(local_ids), len(external_ids)
         if number_local_ids > 0:
@@ -265,6 +223,7 @@ class MembersMgmtCommAttack(BaseAttack.BaseAttack):
         # create bot port configs
         for bot in bot_configs:
             bot_configs[bot]["Port"] = gen_random_server_port()    
+        # print(bot_configs)
 
         # create realistic ttl for every bot
         # Gamma distribution parameters derived from MAWI 13.8G dataset
@@ -310,6 +269,8 @@ class MembersMgmtCommAttack(BaseAttack.BaseAttack):
             ttl = bot_configs[id_src]["TTL"]
             type_src, type_dst = bot_configs[id_src]["Type"], bot_configs[id_dst]["Type"]
 
+            # print("{0} --> {1}, {2} - {3}".format(id_src, id_dst, type_src, type_dst))
+
             if type_src == "external" and type_dst == "external":
                 continue
             if comm_type == "external":
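
For illustration only (not part of the commit): the new request/reply identification pairs every request with its reply through the Message class, cross-referencing the two via refer_msg_id. A minimal sketch of the result, mirroring what CommunicationProcessor.det_id_roles_and_msgs() builds; the IDs, timestamps and import path are placeholder assumptions.

    # assumes the ID2T code tree is on the Python path
    from Attack.MembersMgmtCommAttack import Message, MessageType

    # a Sality hello (request) and its reply, linked in both directions
    request = Message(0, "1", "2", MessageType.SALITY_HELLO, 10.0)
    reply = Message(1, "2", "1", MessageType.SALITY_HELLO_REPLY, 10.1, refer_msg_id=0)
    request.refer_msg_id = reply.msg_id  # the back-reference is set once the reply is seen

    print(request)  # 0. at 10.0: 1-->2, MessageType.SALITY_HELLO, refer:1
    print(reply)    # 1. at 10.1: 2-->1, MessageType.SALITY_HELLO_REPLY, refer:0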

+ 333 - 0
code/ID2TLib/CommunicationProcessor.py

@@ -0,0 +1,333 @@
+from lea import Lea
+from Attack.MembersMgmtCommAttack import MessageType
+from Attack.MembersMgmtCommAttack import Message
+
+# needed because of machine imprecision, e.g. a time difference of 0.1s is stored as >0.1s
+EPS_TOLERANCE = 1e-13  # works for a difference of 0.1, no less
+
+class CommunicationProcessor():
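+    """
+    Bundles the processing of the abstract botnet communication: finding the interval with the most
+    communication, determining the role of each ID and its messages, and splitting the IDs into
+    local and external ones.
+    """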
+
+    def __init__(self, packets):
+        self.packets = packets
+
+    def set_mapping(self, packets, mapped_ids, id_comms):
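+        """
+        Set the mapping information for the chosen interval.
+
+        :param packets: the abstract packets of the chosen interval
+        :param mapped_ids: the chosen IDs together with their total message counts
+        :param id_comms: the communication entries ("ID-ID" strings) between the chosen IDs
+        """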
+        self.packets = packets
+        self.ids = mapped_ids.keys()
+        self.id_comms = id_comms
+        self.indv_id_counts = mapped_ids
+
+    def find_interval_with_most_comm(self, number_ids: int, max_int_time: float):
+        """
+        Finds the time intervals of at most the given length in which the given number of IDs
+        communicate among themselves the most.
+
+        :param number_ids: The number of IDs that are to be considered
+        :param max_int_time: The maximum duration of an interval in seconds
+        :return: A list of the intervals with the most communication; each entry is a dict with the picked
+                 IDs and their message counts ("IDs"), the communication entries ("Comms"), the total
+                 message count ("MsgSum"), and the start and end index into the packets ("Start", "End").
+        """
+        packets = self.packets
+
+        def get_nez_msg_counts(msg_counts: dict):
+            """
+            Filters out all msg_counts that have 0 as value
+            """
+            nez_msg_counts = dict()
+            for msg in msg_counts.keys():
+                count = msg_counts[msg]
+                if count > 0:
+                    nez_msg_counts[msg] = count
+            return nez_msg_counts
+
+        def greater_than(a: float, b: float):
+            """
+            A greater-than operator designed to handle slight machine imprecision up to EPS_TOLERANCE.
+            :return: True if a > b, otherwise False
+            """
+            return b - a < -EPS_TOLERANCE
+
+        def change_msg_counts(msg_counts: dict, idx: int, add=True):
+            """
+            Changes the message count of the communication occurring in the packet specified by the given index.
+            Adds 1 if add is True and subtracts 1 otherwise.
+            """
+            change = 1 if add else -1
+            id_src, id_dst = packets[idx]["Src"], packets[idx]["Dst"]
+            src_to_dst = "{0}-{1}".format(id_src, id_dst)
+            dst_to_src = "{0}-{1}".format(id_dst, id_src)
+
+            if src_to_dst in msg_counts.keys():
+                msg_counts[src_to_dst] += change
+            elif dst_to_src in msg_counts.keys():
+                msg_counts[dst_to_src] += change
+            elif add:
+                msg_counts[src_to_dst] = 1
+
+        def count_ids_in_msg_counts(msg_counts: dict):
+            """
+            Counts all ids that are involved in messages with a non-zero message count
+            """
+            ids = set()
+            for msg in msg_counts.keys():
+                src, dst = msg.split("-")
+                ids.add(dst)
+                ids.add(src)
+            return len(ids)
+
+        def get_msg_count_first_ids(msg_counts: list):
+            """
+            Finds the ids that communicate among themselves the most with respect to the given message counts.
+            :param msg_counts: a sorted list of message counts where each entry is a tuple of key and value
+            :return: The picked ids and their total message count as a tuple
+            """
+            # if order of most messages is important, use an additional list
+            picked_ids = set()
+            total_msg_count = 0
+
+            # iterate over every message count
+            for i, msg in enumerate(msg_counts):
+                count_picked_ids = len(picked_ids)
+                id_one, id_two = msg[0].split("-")
+
+                # if enough ids have been found, stop
+                if count_picked_ids >= number_ids:
+                    break
+
+                # if two ids can be added without exceeding the desired number of ids, add them
+                if count_picked_ids + 2 <= number_ids:
+                    picked_ids.add(id_one)
+                    picked_ids.add(id_two)
+                    total_msg_count += msg[1]
+
+                # if there is only room for one more id to be added, 
+                # find one that is already contained in the picked ids
+                else:
+                    for j, msg in enumerate(msg_counts[i:]):
+                        id_one, id_two = msg[0].split("-")
+                        if id_one in picked_ids:
+                            picked_ids.add(id_two)
+                            total_msg_count += msg[1]
+                            break
+                        elif id_two in picked_ids:
+                            picked_ids.add(id_one)
+                            total_msg_count += msg[1]
+                            break
+                    break
+
+            return picked_ids, total_msg_count
+
+        def get_indv_id_counts_and_comms(picked_ids: dict, msg_counts: dict):
+            """ 
+            Retrieves the total mentions of one ID in the communication pattern
+            and all communication entries that include only picked IDs.
+            """
+            indv_id_counts = {}
+            id_comms = set()
+            for msg in msg_counts:
+                ids = msg.split("-")
+                if ids[0] in picked_ids and ids[1] in picked_ids:
+                    msg_other_dir = "{}-{}".format(ids[1], ids[0])
+                    if (not msg in id_comms) and (not msg_other_dir in id_comms):
+                        id_comms.add(msg)
+
+                    for id_ in ids:
+                        if id_ in indv_id_counts:
+                            indv_id_counts[id_] += msg_counts[msg]
+                        else:
+                            indv_id_counts[id_] = msg_counts[msg]
+
+            return indv_id_counts, id_comms
+
+
+        # first find all possible intervals that contain enough IDs that communicate among themselves
+        idx_low, idx_high = 0, 0
+        msg_counts = dict()
+        possible_intervals = []
+
+        # Iterate over all packets from start to finish and process the info of each packet
+        # If time of packet within time interval, update the message count for this communication
+        # If time of packet exceeds time interval, subtract from the message count for this communication
+        while True:
+            if idx_high < len(packets):
+                cur_int_time = float(packets[idx_high]["Time"]) - float(packets[idx_low]["Time"])
+     
+            # if current interval time exceeds time interval, save the message counts if appropriate, or stop if no more packets
+            if greater_than(cur_int_time, max_int_time) or idx_high >= len(packets):
+                # get all message counts for communications that took place in the current interval
+                nez_msg_counts = get_nez_msg_counts(msg_counts)
+
+                # if we have enough ids as specified by the caller, mark as possible interval
+                if count_ids_in_msg_counts(nez_msg_counts) >= number_ids:
+                    # possible_intervals.append((nez_msg_counts, packets[idx_low]["Time"], packets[idx_high-1]["Time"]))
+                    possible_intervals.append((nez_msg_counts, idx_low, idx_high - 1))
+
+                if idx_high >= len(packets):
+                    break
+
+            # let idx_low "catch up" so that the current interval time fits into the interval time specified by the caller
+            while greater_than(cur_int_time, max_int_time):
+                change_msg_counts(msg_counts, idx_low, add=False)
+                idx_low += 1
+                cur_int_time = float(packets[idx_high]["Time"]) - float(packets[idx_low]["Time"])
+
+            # consume the new packet at idx_high and process its information
+            change_msg_counts(msg_counts, idx_high)
+            idx_high += 1
+
+
+        # now find the interval in which as many ids as specified communicate the most in the given time interval
+        summed_intervals = []
+        sum_intervals_idxs = []
+        cur_highest_sum = 0
+
+        # for every interval compute the sum of msg_counts of the first most communicative ids and eventually find
+        # the interval(s) with most communication and its ids
+        for j, interval in enumerate(possible_intervals):
+            msg_counts = interval[0].items()
+            sorted_msg_counts = sorted(msg_counts, key=lambda x: x[1], reverse=True)
+            picked_ids, msg_sum = get_msg_count_first_ids(sorted_msg_counts)
+
+            if msg_sum == cur_highest_sum:
+                summed_intervals.append({"IDs": picked_ids, "MsgSum": msg_sum, "Start": interval[1], "End": interval[2]})
+                sum_intervals_idxs.append(j)
+            elif msg_sum > cur_highest_sum:
+                summed_intervals = []
+                sum_intervals_idxs = [j]
+                summed_intervals.append({"IDs": picked_ids, "MsgSum": msg_sum, "Start": interval[1], "End": interval[2]})
+                cur_highest_sum = msg_sum
+
+        for j, interval in enumerate(summed_intervals):
+            idx = sum_intervals_idxs[j]
+            msg_counts_picked = possible_intervals[idx][0]
+            indv_id_counts, id_comms = get_indv_id_counts_and_comms(interval["IDs"], msg_counts_picked)
+            interval["IDs"] = indv_id_counts
+            interval["Comms"] = id_comms
+
+        return summed_intervals
+
+    def det_ext_and_local_ids(self, comm_type: str, prob_init_local: float, prob_rspnd_local: float):
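+        """
+        Decide for every mapped ID whether it is to be local or external, depending on the
+        communication type and the given probabilities.
+
+        :param comm_type: the type of communication ("local", "external" or "mixed")
+        :param prob_init_local: the probability that an initiating ID is local
+        :param prob_rspnd_local: the probability that a responding ID is local (used for mixed communication)
+        :return: a tuple of the local IDs and the external IDs
+        """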
+        init_ids, respnd_ids, both_ids = self.init_ids, self.respnd_ids, self.both_ids
+        id_comms = self.id_comms
+        external_ids = set()
+        local_ids = set()
+
+        def map_init_is_local(id_: int):
+            for id_comm in id_comms:
+                ids = id_comm.split("-")
+                other = ids[0] if id_ == ids[1] else ids[1] 
+                
+                # what if before other was external ...
+                if other in local_ids or other in external_ids:
+                    continue 
+
+                if comm_type == "mixed":
+                    other_pos = mixed_respnd_is_local.random()
+                    if other_pos == "local":
+                        local_ids.add(other)
+                    elif other_pos == "external":
+                        external_ids.add(other)
+                elif comm_type == "external":
+                    if not other in initiators:
+                        external_ids.add(other)
+
+        def map_init_is_external(id_: int):
+            for id_comm in id_comms:
+                ids = id_comm.split("-")
+                other = ids[0] if id_ == ids[1] else ids[1] 
+                
+                # what if before other was external ...
+                if other in local_ids or other in external_ids:
+                    continue 
+                if not other in initiators:
+                    local_ids.add(other)
+
+
+        if comm_type == "local":
+            local_ids = set(self.ids)
+        else:
+            init_local_or_external = Lea.fromValFreqsDict({"local": prob_init_local*100, "external": (1-prob_init_local)*100})
+            mixed_respnd_is_local = Lea.fromValFreqsDict({"local": prob_rspnd_local*100, "external": (1-prob_rspnd_local)*100})
+
+            # assign IDs in 'both' local every time for mixed?
+            initiators = sorted(list(init_ids) + list(both_ids))
+            initiators = sorted(initiators, key=lambda id_:self.indv_id_counts[id_], reverse=True)
+
+            for id_ in initiators:
+                pos = init_local_or_external.random()          
+                if pos == "local":
+                    if id_ in external_ids:
+                        map_init_is_external(id_)
+                    else:
+                        local_ids.add(id_)
+                        map_init_is_local(id_)
+                elif pos == "external":
+                    if id_ in local_ids:
+                        map_init_is_local(id_)
+                    else:
+                        external_ids.add(id_)
+                        map_init_is_external(id_)
+
+        self.local_ids, self.external_ids = local_ids, external_ids
+        return local_ids, external_ids
+
+    def det_id_roles_and_msgs(self, mtypes: dict):
+        """
+        Determine the role of every mapped ID (initiator, responder or both) and create a Message
+        object for every request and reply exchanged between mapped IDs.
+
+        :param mtypes: a dict mapping the numeric message type of an abstract packet to its MessageType value
+        :return: a tuple of the initiator IDs, the responder IDs, the IDs acting as both, and the list of messages
+        """
+        init_ids, respnd_ids, both_ids = set(), set(), set()
+        msgs, msg_id = [], 0
+        prev_reqs = {}
+        all_ids = self.ids
+        packets = self.packets
+
+        def process_initiator(id_: str):
+            if id_ in both_ids:
+                pass
+            elif not id_ in respnd_ids:
+                init_ids.add(id_)
+            elif id_ in respnd_ids:
+                respnd_ids.remove(id_)
+                both_ids.add(id_)
+
+        def process_responder(id_: str):
+            if id_ in both_ids:
+                pass
+            elif not id_ in init_ids:
+                respnd_ids.add(id_)
+            elif id_ in init_ids:
+                init_ids.remove(id_)
+                both_ids.add(id_)
+
+        for packet in packets:
+            id_src, id_dst, msg_type, time = packet["Src"], packet["Dst"], int(packet["Type"]), float(packet["Time"])
+            if (not id_src in all_ids) or (not id_dst in all_ids):
+                continue
+            msg_type = mtypes[msg_type]
+            if msg_type in {MessageType.SALITY_HELLO, MessageType.SALITY_NL_REQUEST}:
+                process_initiator(id_src)
+                process_responder(id_dst)
+                msg_str = "{0}-{1}".format(id_src, id_dst)
+                msg = Message(msg_id, id_src, id_dst, msg_type, time)
+                msgs.append(msg)
+                prev_reqs[msg_str] = msg_id
+
+            elif msg_type in {MessageType.SALITY_HELLO_REPLY, MessageType.SALITY_NL_REPLY}:
+                process_initiator(id_dst)
+                process_responder(id_src)
+                msg_str = "{0}-{1}".format(id_dst, id_src)
+                refer_idx = prev_reqs[msg_str]
+                msgs[refer_idx].refer_msg_id = msg_id
+                # print(msgs[refer_idx])
+                msg = Message(msg_id, id_src, id_dst, msg_type, time, refer_idx)
+                msgs.append(msg)
+                del(prev_reqs[msg_str])
+
+            if not msg_type == MessageType.TIMEOUT:
+                msg_id += 1
+
+        self.init_ids, self.respnd_ids, self.both_ids = init_ids, respnd_ids, both_ids
+        self.messages = msgs
+        return init_ids, respnd_ids, both_ids, msgs
+
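
A rough usage sketch of the new class (again, not part of the commit), assuming abstract packets in the dict format produced by FileUtils.parse_xml() and a message-type mapping like the attack's self.msg_types; all concrete values are placeholders.

    from Attack.MembersMgmtCommAttack import MessageType
    from ID2TLib.CommunicationProcessor import CommunicationProcessor

    # two abstract packets: a Sality hello (103) and its reply (104)
    abstract_packets = [
        {"Src": "1", "Dst": "2", "Type": "103", "Time": "1.0"},
        {"Src": "2", "Dst": "1", "Type": "104", "Time": "1.1"},
    ]
    msg_types = {mtype.value: mtype for mtype in MessageType}

    comm_proc = CommunicationProcessor(abstract_packets)

    # pick the interval in which the requested number of IDs communicate the most
    interval = comm_proc.find_interval_with_most_comm(number_ids=2, max_int_time=10.0)[0]
    mapped_ids, id_comms = interval["IDs"], interval["Comms"]
    start, end = interval["Start"], interval["End"]

    # restrict further processing to that interval
    comm_proc.set_mapping(abstract_packets[start:end + 1], mapped_ids, id_comms)

    # classify IDs as initiator/responder/both and build the request/reply Message objects
    init_ids, respnd_ids, both_ids, messages = comm_proc.det_id_roles_and_msgs(msg_types)

    # decide which IDs act as local and which as external hosts
    local_ids, external_ids = comm_proc.det_ext_and_local_ids("mixed", 0.5, 0.5)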

+ 0 - 232
code/ID2TLib/MapInputCSVToIDs.py

@@ -1,232 +0,0 @@
-from Attack.MembersMgmtCommAttack import MessageType
-
-# needed because of machine inprecision. E.g A time difference of 0.1s is stored as >0.1s
-EPS_TOLERANCE = 1e-13  # works for a difference of 0.1, no less
-
-def find_interval_with_most_comm(packets: list, number_ids: int, max_int_time: float):
-    """
-    Finds a time interval of the given seconds where the given number of ids communicate among themselves the most.
-    
-    :param packets: The packets containing the communication
-    :param number_ids: The number of ids that are to be considered
-    :param max_int_time: A short description of the attack.
-    :return: A triple consisting of the ids, as well as start and end idx with respect to the given packets. 
-    """
-    
-    def get_nez_msg_counts(msg_counts: dict):
-        """
-        Filters out all msg_counts that have 0 as value
-        """
-        nez_msg_counts = dict()
-        for msg in msg_counts.keys():
-            count = msg_counts[msg]
-            if count > 0:
-                nez_msg_counts[msg] = count
-        return nez_msg_counts
-
-    def greater_than(a: float, b: float):
-        """
-        A greater than operator desgined to handle slight machine inprecision up to EPS_TOLERANCE.
-        :return: True if a > b, otherwise False
-        """
-        return b - a < -EPS_TOLERANCE
-
-    def change_msg_counts(msg_counts: dict, idx: int, add=True):
-        """
-        Changes the value of the message count of the message occuring in the packet specified by the given index. 
-        Adds 1 if add is True and subtracts 1 otherwise.
-        """
-        change = 1 if add else -1
-        id_src, id_dst = packets[idx]["Src"], packets[idx]["Dst"]
-        src_to_dst = "{0}-{1}".format(id_src, id_dst)
-        dst_to_src = "{0}-{1}".format(id_dst, id_src)
-
-        if src_to_dst in msg_counts.keys():
-            msg_counts[src_to_dst] += change
-        elif dst_to_src in msg_counts.keys():
-            msg_counts[dst_to_src] += change
-        elif add:
-            msg_counts[src_to_dst] = 1
-
-    def count_ids_in_msg_counts(msg_counts: dict):
-        """
-        Counts all ids that are involved in messages with a non zero message count
-        """
-        ids = set()
-        for msg in msg_counts.keys():
-            src, dst = msg.split("-")
-            ids.add(dst)
-            ids.add(src)
-        return len(ids)
-
-    def get_msg_count_first_ids(msg_counts: list):
-        """
-        Finds the ids that communicate among themselves the most with respect to the given message counts.
-        :param msg_counts: a sorted list of message counts where each entry is a tuple of key and value
-        :return: The picked ids and their total message count as a tuple
-        """
-        # if order of most messages is important, use an additional list
-        picked_ids = set()
-        total_msg_count = 0
-
-        # iterate over every message count
-        for i, msg in enumerate(msg_counts):
-            count_picked_ids = len(picked_ids)
-            id_one, id_two = msg[0].split("-")
-
-            # if enough ids have been found, stop
-            if count_picked_ids >= number_ids:
-                break
-
-            # if two ids can be added without exceeding the desired number of ids, add them
-            if count_picked_ids - 2 <= number_ids:
-                picked_ids.add(id_one)
-                picked_ids.add(id_two)
-                total_msg_count += msg[1]
-
-            # if there is only room for one more id to be added, 
-            # find one that is already contained in the picked ids
-            else:
-                for j, msg in enumerate(msg_counts[i:]):
-                    id_one, id_two = msg[0].split("-")
-                    if id_one in picked_ids:
-                        picked_ids.add(id_two)
-                        total_msg_count += msg[1]
-                        break
-                    elif id_two in picked_ids:
-                        picked_ids.add(id_one)
-                        total_msg_count += msg[1]
-                        break
-                break
-
-        return picked_ids, total_msg_count
-
-    def get_indv_id_counts_and_comms(picked_ids: dict, msg_counts: dict):
-        """ 
-        Retrieves the total mentions of one ID in the communication pattern
-        and all communication entries that include only picked IDs.
-        """
-        indv_id_counts = {}
-        id_comms = set()
-        for msg in msg_counts:
-            ids = msg.split("-")
-            if ids[0] in picked_ids and ids[1] in picked_ids:
-                msg_other_dir = "{}-{}".format(ids[1], ids[0])
-                if (not msg in id_comms) and (not msg_other_dir in id_comms):
-                    id_comms.add(msg)
-
-                for id_ in ids:
-                    if id_ in indv_id_counts:
-                        indv_id_counts[id_] += msg_counts[msg]
-                    else:
-                        indv_id_counts[id_] = msg_counts[msg]
-
-        return indv_id_counts, id_comms
-
-
-    # first find all possible intervals that contain enough IDs that communicate among themselves
-    idx_low, idx_high = 0, 0
-    msg_counts = dict()
-    possible_intervals = []
-
-    # Iterate over all packets from start to finish and process the info of each packet
-    # If time of packet within time interval, update the message count for this communication
-    # If time of packet exceeds time interval, substract from the message count for this communication
-    while True:
-        if idx_high < len(packets):
-            cur_int_time = float(packets[idx_high]["Time"]) - float(packets[idx_low]["Time"])
- 
-        # if current interval time exceeds time interval, save the message counts if appropriate, or stop if no more packets
-        if greater_than(cur_int_time, max_int_time) or idx_high >= len(packets):
-            # get all message counts for communications that took place in the current intervall
-            nez_msg_counts = get_nez_msg_counts(msg_counts)
-
-            # if we have enough ids as specified by the caller, mark as possible interval
-            if count_ids_in_msg_counts(nez_msg_counts) >= number_ids:
-                # possible_intervals.append((nez_msg_counts, packets[idx_low]["Time"], packets[idx_high-1]["Time"]))
-                possible_intervals.append((nez_msg_counts, idx_low, idx_high - 1))
-
-            if idx_high >= len(packets):
-                break
-
-        # let idx_low "catch up" so that the current interval time fits into the interval time specified by the caller
-        while greater_than(cur_int_time, max_int_time):
-            change_msg_counts(msg_counts, idx_low, add=False)
-            idx_low += 1
-            cur_int_time = float(packets[idx_high]["Time"]) - float(packets[idx_low]["Time"])
-
-        # consume the new packet at idx_high and process its information
-        change_msg_counts(msg_counts, idx_high)
-        idx_high += 1
-
-
-    # now find the interval in which as many ids as specified communicate the most in the given time interval
-    summed_intervals = []
-    sum_intervals_idxs = []
-    cur_highest_sum = 0
-
-    # for every interval compute the sum of msg_counts of the first most communicative ids and eventually find
-    # the interval(s) with most communication and its ids
-    for j, interval in enumerate(possible_intervals):
-        msg_counts = interval[0].items()
-        sorted_msg_counts = sorted(msg_counts, key=lambda x: x[1], reverse=True)
-        picked_ids, msg_sum = get_msg_count_first_ids(sorted_msg_counts)
-
-        if msg_sum == cur_highest_sum:
-            summed_intervals.append({"IDs": picked_ids, "MsgSum": msg_sum, "Start": interval[1], "End": interval[2]})
-            sum_intervals_idxs.append(j)
-        elif msg_sum > cur_highest_sum:
-            summed_intervals = []
-            sum_intervals_idxs = [j]
-            summed_intervals.append({"IDs": picked_ids, "MsgSum": msg_sum, "Start": interval[1], "End": interval[2]})
-            cur_highest_sum = msg_sum
-
-    for j, interval in enumerate(summed_intervals):
-        idx = sum_intervals_idxs[j]
-        msg_counts_picked = possible_intervals[idx][0]
-        indv_id_counts, id_comms = get_indv_id_counts_and_comms(interval["IDs"], msg_counts_picked)
-        interval["IDs"] = indv_id_counts
-        interval["Comms"] = id_comms
-
-    return summed_intervals
-
-
-def determine_id_roles(packets: list, all_ids: set):
-    """
-    Determine the role of every mapped ID. The role can be initiator, responder or both.
-    :param packets: the mapped section of abstract packets
-    :param all_ids: all IDs that were mapped/chosen
-    :return: a dict that for every ID contains its role
-    """
-    init_ids, respnd_ids, both_ids = set(), set(), set()
-    def process_initiator(id_: str):
-        if id_ in both_ids:
-            pass
-        elif not id_ in respnd_ids:
-            init_ids.add(id_)
-        elif id_ in respnd_ids:
-            respnd_ids.remove(id_)
-            both_ids.add(id_)
-
-    def process_responder(id_: str):
-        if id_ in both_ids:
-            pass
-        elif not id_ in init_ids:
-            respnd_ids.add(id_)
-        elif id_ in init_ids:
-            init_ids.remove(id_)
-            both_ids.add(id_)
-
-    for packet in packets:
-        id_src, id_dst, msg_type = packet["Src"], packet["Dst"], packet["Type"]
-        if (not id_src in all_ids) or (not id_dst in all_ids):
-            continue
-        if int(msg_type) in {MessageType.SALITY_HELLO.value, MessageType.SALITY_NL_REQUEST.value}:
-            process_initiator(id_src)
-            process_responder(id_dst)
-        elif int(msg_type) in {MessageType.SALITY_HELLO_REPLY.value, MessageType.SALITY_NL_REPLY.value}:
-            process_initiator(id_dst)
-            process_responder(id_src)
-
-    return init_ids, respnd_ids, both_ids
-

+ 3 - 2
code/ID2TLib/PortGenerator.py

@@ -1,11 +1,12 @@
 import random
 import string
 
-def gen_random_server_port():
+def gen_random_server_port(offset: int=2199):
     """
     Generates a valid random first and last character for a bots hostname
     and computes a port from these two characters.
+    The default offset of 2199 is taken from a 2011 Sality implementation.
     """
     firstLetter = random.choice(string.ascii_letters);
     lastLetter = random.choice(string.ascii_letters + string.digits);
-    return (ord(firstLetter) * ord(lastLetter));
+    return (offset + ord(firstLetter) * ord(lastLetter));
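
As a quick sanity check (not part of the commit): with the default offset of 2199 the generated ports stay well inside the unprivileged range, since the character product is bounded by the ord() values of the letter/digit alphabets.

    import string

    offset = 2199
    first = [ord(c) for c in string.ascii_letters]                 # first hostname character
    last = [ord(c) for c in string.ascii_letters + string.digits]  # last hostname character
    print(offset + min(first) * min(last), offset + max(first) * max(last))  # 5319 17083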