123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417 |
- from enum import Enum
class MessageType(Enum):
    """
    Enumeration of the botnet message types known to this module.

    The numeric value of each member is the identifier used to look the
    member up (e.g. ``MessageType(101)``).
    """

    # generic
    TIMEOUT = 3

    # Sality neighbor-list (NL) exchange
    SALITY_NL_REQUEST = 101
    SALITY_NL_REPLY = 102

    # Sality hello exchange
    SALITY_HELLO = 103
    SALITY_HELLO_REPLY = 104
class Message:
    """
    Compact record that bundles all information describing a single message.
    """

    def __init__(self, msg_id: int, src, dst, type_: MessageType, time: float, refer_msg_id: int=-1):
        """
        Builds a message from the given values.

        :param msg_id: the ID of the message
        :param src: something identifying the source, e.g. an ID or a configuration
        :param dst: something identifying the destination, e.g. an ID or a configuration
        :param type_: the type of the message
        :param time: the timestamp of the message
        :param refer_msg_id: the ID of the message this one is a request for or a reply to;
                             -1 if there is no related message
        """
        # identity and relation to another message
        self.msg_id, self.refer_msg_id = msg_id, refer_msg_id
        # communication endpoints
        self.src, self.dst = src, dst
        # kind of message and when it was sent
        self.type, self.time = type_, time

    def __str__(self):
        """
        Returns a one-line, human-readable summary of the message.
        """
        fields = (self.msg_id, self.time, self.src, self.dst, self.type, self.refer_msg_id)
        return "{0}. at {1}: {2}-->{3}, {4}, refer:{5}".format(*fields)
- from random import randint, randrange, choice
- from collections import deque
- from scipy.stats import gamma
- from lea import Lea
- from Attack import BaseAttack
- from Attack.AttackParameters import Parameter as Param
- from Attack.AttackParameters import ParameterTypes
- from ID2TLib import FileUtils, PaddingGenerator
- from ID2TLib.PacketGenerator import PacketGenerator
- from ID2TLib.IPGenerator import IPGenerator
- from ID2TLib.PcapAddressOperations import PcapAddressOperations
- from ID2TLib.CommunicationProcessor import CommunicationProcessor
- from ID2TLib.MacAddressGenerator import MacAddressGenerator
- from ID2TLib.PortGenerator import gen_random_server_port
class MembersMgmtCommAttack(BaseAttack.BaseAttack):
    """
    Attack that injects botnet membership management communication.

    The communication is read from a CSV/XML input file, mapped onto bot
    configurations (IP, MAC, port, TTL) and written to a PCAP file as packets
    created by ``PacketGenerator.generate_mmcom_packet``.
    """

    def __init__(self):
        """
        Creates a new instance of the Membership Management Communication.
        """
        # Initialize communication
        super(MembersMgmtCommAttack, self).__init__(
            "Membership Management Communication Attack (MembersMgmtCommAttack)",
            "Injects Membership Management Communication", "Botnet communication")

        # Define allowed parameters and their type
        self.supported_params = {
            # parameters regarding attack
            Param.INJECT_AT_TIMESTAMP: ParameterTypes.TYPE_FLOAT,
            Param.INJECT_AFTER_PACKET: ParameterTypes.TYPE_PACKET_POSITION,
            Param.PACKETS_PER_SECOND: ParameterTypes.TYPE_FLOAT,
            Param.PACKETS_LIMIT: ParameterTypes.TYPE_INTEGER_POSITIVE,
            Param.ATTACK_DURATION: ParameterTypes.TYPE_INTEGER_POSITIVE,

            # use num_attackers to specify number of communicating devices?
            Param.NUMBER_BOTS: ParameterTypes.TYPE_INTEGER_POSITIVE,

            # input file containing botnet communication
            Param.FILE_CSV: ParameterTypes.TYPE_FILEPATH,
            Param.FILE_XML: ParameterTypes.TYPE_FILEPATH,

            # the scope of communications
            Param.COMM_TYPE: ParameterTypes.TYPE_COMM_TYPE,

            # the percentage of IP reuse (if total and other is specified, percentages are multiplied)
            Param.IP_REUSE_TOTAL: ParameterTypes.TYPE_PERCENTAGE,
            Param.IP_REUSE_LOCAL: ParameterTypes.TYPE_PERCENTAGE,
            Param.IP_REUSE_EXTERNAL: ParameterTypes.TYPE_PERCENTAGE,

            # the user-selected padding to add to every packet
            Param.PACKET_PADDING: ParameterTypes.TYPE_PADDING
        }

        # create dict with MessageType values for fast name lookup
        self.msg_types = {msg_type.value: msg_type for msg_type in MessageType}

    def init_params(self):
        """
        Initialize some parameters of this communication-attack with default values; values supplied
        by the user on the command line overwrite them.
        The remaining parameters are implicitly set in the provided data file. Note: the timestamps in the file
        have to be sorted in ascending order.

        Reads ``self.statistics`` to pick a random default injection position.
        """
        # set class constants
        self.DEFAULT_XML_PATH = "resources/MembersMgmtComm_example.xml"
        # threshold for ID to be recognized as rather common in communication
        self.MOST_COMMON_THRES = 0.08
        # probability for initiator ID to be local
        self.PROB_INIT_IS_LOCAL = 0.8
        # probability for responder ID to be local if comm_type is mixed
        self.PROB_RESPND_IS_LOCAL = 0.2

        # PARAMETERS: initialize with default values
        # (values are overwritten if user specifies them)
        self.add_param_value(Param.INJECT_AFTER_PACKET, randint(0, self.statistics.get_packet_count()))

        self.add_param_value(Param.PACKETS_PER_SECOND, 0)
        self.add_param_value(Param.FILE_XML, self.DEFAULT_XML_PATH)
        self.add_param_value(Param.ATTACK_DURATION, 100)
        self.add_param_value(Param.NUMBER_BOTS, 20)

        # default locality behavior
        self.add_param_value(Param.COMM_TYPE, "mixed")
        # TODO: change 1 to something better
        self.add_param_value(Param.IP_REUSE_TOTAL, 1)
        self.add_param_value(Param.IP_REUSE_LOCAL, 0.5)
        self.add_param_value(Param.IP_REUSE_EXTERNAL, 0.5)

        # add default additional padding
        self.add_param_value(Param.PACKET_PADDING, 0)

    def generate_attack_pcap(self):
        """
        Creates the attack packets for all messages and writes them to a PCAP file.

        Packets are buffered and written in chunks of ``BUFFER_SIZE``. Generation stops as soon as the
        packet limit (Param.PACKETS_LIMIT) or the attack duration (Param.ATTACK_DURATION) is reached.
        Sets ``self.attack_start_utime`` and ``self.attack_end_utime`` to the timestamps of the first
        and the last generated packet.

        :return: tuple (number of generated packets, path of the written PCAP file);
                 (0, None) if no messages could be created
        """
        def write_buffered(buffered, pcap_path):
            """
            Passes the buffered packets through PaddingGenerator.equal_length and writes them via
            write_attack_pcap; returns (last written packet, PCAP path).
            """
            buffered = list(buffered)
            PaddingGenerator.equal_length(buffered)
            # second argument True: presumably "append to an existing PCAP" -- confirm in BaseAttack
            return buffered[-1], self.write_attack_pcap(buffered, True, pcap_path)

        # create the final messages that have to be sent, including all bot configurations
        messages = self._create_messages()
        if not messages:
            # nothing to inject (e.g. no suitable interval in the input file)
            return 0, None

        # Setup (initial) parameters for packet creation loop
        BUFFER_SIZE = 1000
        pkt_gen = PacketGenerator()
        file_timestamp_prv = messages[0].time
        pcap_timestamp = self.get_param_value(Param.INJECT_AT_TIMESTAMP)
        padding = self.get_param_value(Param.PACKET_PADDING)
        packets = deque(maxlen=BUFFER_SIZE)
        total_pkts = 0
        limit_packetcount = self.get_param_value(Param.PACKETS_LIMIT)
        limit_duration = self.get_param_value(Param.ATTACK_DURATION)
        duration = 0
        path_attack_pcap = None
        last_packet = None

        # create packets to write to PCAP file
        for msg in messages:
            # retrieve the source and destination configurations
            ip_src, ip_dst = msg.src["IP"], msg.dst["IP"]
            mac_src, mac_dst = msg.src["MAC"], msg.dst["MAC"]
            port_src, port_dst = msg.src["Port"], msg.dst["Port"]
            ttl = msg.src["TTL"]

            # update timestamps and duration: the time deltas of the input file are
            # carried over to the timestamps in the PCAP
            file_time_delta = msg.time - file_timestamp_prv
            pcap_timestamp += file_time_delta
            duration += file_time_delta
            file_timestamp_prv = msg.time

            # if total number of packets has been sent or the attack duration has been exceeded, stop
            if ((limit_packetcount is not None and total_pkts >= limit_packetcount) or
                    (limit_duration is not None and duration >= limit_duration)):
                break

            # if the type of the message is a NL reply, determine the number of entries
            nl_size = 0
            if msg.type == MessageType.SALITY_NL_REPLY:
                nl_size = randint(1, 25)  # what is max NL entries?

            # create suitable IP/UDP packet and add to packets list
            packet = pkt_gen.generate_mmcom_packet(ip_src=ip_src, ip_dst=ip_dst, ttl=ttl,
                                                   mac_src=mac_src, mac_dst=mac_dst,
                                                   port_src=port_src, port_dst=port_dst,
                                                   message_type=msg.type, neighborlist_entries=nl_size)
            PaddingGenerator.add_padding(packet, padding)
            packet.time = pcap_timestamp
            packets.append(packet)
            total_pkts += 1

            if total_pkts == 1:
                # Store timestamp of first packet (for attack label)
                self.attack_start_utime = packet.time
            elif total_pkts % BUFFER_SIZE == 0:
                # every BUFFER_SIZE packets write them to the PCAP file (append)
                last_packet, path_attack_pcap = write_buffered(packets, path_attack_pcap)
                packets = deque(maxlen=BUFFER_SIZE)

        # if there are unwritten packets remaining, write them to the PCAP file
        if len(packets) > 0:
            last_packet, path_attack_pcap = write_buffered(packets, path_attack_pcap)

        # Store timestamp of last packet (only if at least one packet was generated)
        if last_packet is not None:
            self.attack_end_utime = last_packet.time

        # Return total number of packets (sent) and the path of the PCAP they were written to
        return total_pkts, path_attack_pcap

    def _create_messages(self):
        """
        Creates the messages that are to be injected, including the full bot configurations.

        Parses the CSV/XML input, selects a communication interval for the requested number of bots
        and duration, assigns locality, IP, MAC, port and TTL to every ID and drops messages whose
        locality combination is not wanted.

        :return: list of messages whose ``src`` and ``dst`` are configuration dicts with the keys
                 "Type", "IP", "MAC", "Port", "TTL" and "ID"; an empty list if the input contains no
                 suitable interval
        """
        def add_ids_to_config(ids_to_add: list, existing_ips: list, new_ips: list, bot_configs: dict,
                              idtype: str="local", router_mac: str=""):
            """
            Creates IP and MAC configurations for the given IDs and adds them to the existing configurations object.

            :param ids_to_add: all sorted IDs that have to be configured and added
            :param existing_ips: the existing IPs in the PCAP file that should be assigned to some, or all, IDs
            :param new_ips: the newly generated IPs that should be assigned to some, or all, IDs
            :param bot_configs: the existing configurations for the bots
            :param idtype: the locality type of the IDs ("local" or "external")
            :param router_mac: the MAC address of the router in the PCAP
            :raises ValueError: if idtype is neither "local" nor "external"
            """
            if idtype not in ("local", "external"):
                # without this check the MAC of a new IP would be undefined further down
                raise ValueError("idtype has to be 'local' or 'external', got %r" % (idtype,))

            ids = ids_to_add.copy()
            # macgen only needed, when IPs are new local IPs (therefore creating the object here suffices
            # for the current callers to not end up with the same MAC paired with different IPs)
            macgen = MacAddressGenerator()

            # assign existing IPs and the corresponding MAC addresses in the PCAP to the IDs
            for ip in existing_ips:
                random_id = choice(ids)
                mac = self.statistics.process_db_query("macAddress(IPAddress=%s)" % ip)
                bot_configs[random_id] = {"Type": idtype, "IP": ip, "MAC": mac}
                ids.remove(random_id)

            # assign new IPs and for local IPs new MACs or for external IPs the router MAC to the IDs
            for ip in new_ips:
                random_id = choice(ids)
                mac = macgen.random_mac() if idtype == "local" else router_mac
                bot_configs[random_id] = {"Type": idtype, "IP": ip, "MAC": mac}
                ids.remove(random_id)

        def assign_realistic_ttls2(bot_configs):
            """
            Alternative TTL assignment (currently not called): draws the TTL of every bot from a
            gamma distribution.

            :param bot_configs: the configurations of the bots; the key "TTL" is set for each of them
            """
            # Gamma distribution parameters derived from MAWI 13.8G dataset
            alpha, loc, beta = (2.3261710235, -0.188306914406, 44.4853123884)
            for bot in sorted(bot_configs.keys()):
                ttl = 0
                # redraw until the rounded sample is a valid TTL; cycling through a fixed batch of
                # samples would never terminate if none of them happened to be valid
                while not 0 < ttl < 256:
                    ttl = int(round(gamma.rvs(alpha, loc=loc, scale=beta)))
                bot_configs[bot]["TTL"] = ttl

        def assign_realistic_ttls(bot_configs):
            """
            Assigns a TTL to each bot in bot_configs, based on the statistics of the PCAP file.

            If the statistics hold a TTL distribution for the IP of the bot, the TTL is drawn from it;
            otherwise the result of the query "most_used(ttlValue)" is used.

            :param bot_configs: the configurations of the bots; the key "TTL" is set for each of them
            """
            for bot in sorted(bot_configs.keys()):
                # Set TTL based on TTL distribution of IP address
                bot_ttl_dist = self.statistics.get_ttl_distribution(bot_configs[bot]["IP"])
                if len(bot_ttl_dist) > 0:
                    source_ttl_prob_dict = Lea.fromValFreqsDict(bot_ttl_dist)
                    bot_configs[bot]["TTL"] = source_ttl_prob_dict.random()
                else:
                    bot_configs[bot]["TTL"] = self.statistics.process_db_query("most_used(ttlValue)")

        # parse input CSV or XML
        filepath_xml = self.get_param_value(Param.FILE_XML)
        filepath_csv = self.get_param_value(Param.FILE_CSV)

        # prefer XML input over CSV input (in case both are given):
        # the CSV is only used while the XML path still is the default one
        if filepath_csv and filepath_xml == self.DEFAULT_XML_PATH:
            filepath_xml = FileUtils.parse_csv_to_xml(filepath_csv)

        abstract_packets = FileUtils.parse_xml(filepath_xml)

        # find a good communication mapping in the input file that matches the users parameters
        duration = self.get_param_value(Param.ATTACK_DURATION)
        number_bots = self.get_param_value(Param.NUMBER_BOTS)
        comm_proc = CommunicationProcessor(abstract_packets)
        comm_interval = comm_proc.find_interval_with_most_comm(number_bots, duration)[0]

        if comm_interval is None:
            print("Error: There is no interval in the given CSV/XML that has enough communication")
            # no messages; the caller turns this into its own "nothing generated" result
            return []

        # retrieve the mapping information
        mapped_ids, id_comms = comm_interval["IDs"], comm_interval["Comms"]
        packet_start_idx, packet_end_idx = comm_interval["Start"], comm_interval["End"]
        # assign the communication processor this mapping for further processing
        comm_proc.set_mapping(abstract_packets[packet_start_idx:packet_end_idx+1], mapped_ids, id_comms)

        # the percentages of IP reuse (total is multiplied with the local/external percentage)
        reuse_percent_total = self.get_param_value(Param.IP_REUSE_TOTAL)
        reuse_percent_external = self.get_param_value(Param.IP_REUSE_EXTERNAL)
        reuse_percent_local = self.get_param_value(Param.IP_REUSE_LOCAL)

        # create locality, IP and MAC configurations for the IDs/Bots
        ipgen = IPGenerator()
        comm_type = self.get_param_value(Param.COMM_TYPE)
        pcapops = PcapAddressOperations(self.statistics)
        router_mac = pcapops.get_probable_router_mac()
        bot_configs = {}

        # determine the roles of the IDs in the mapping communication-{initiator, responder} or both;
        # only the resulting messages are needed here
        _, _, _, messages = comm_proc.det_id_roles_and_msgs(self.msg_types)
        # use these roles to determine which IDs are to be local and which external
        local_ids, external_ids = comm_proc.det_ext_and_local_ids(
            comm_type, self.PROB_INIT_IS_LOCAL, self.PROB_RESPND_IS_LOCAL)

        # retrieve and assign the IPs and MACs for the bots with respect to the given parameters
        # (IDs are always added to bot_configs in the same order under a given seed)
        number_local_ids, number_external_ids = len(local_ids), len(external_ids)

        # assign addresses for local IDs
        if number_local_ids > 0:
            reuse_count_local = int(reuse_percent_total * reuse_percent_local * number_local_ids)
            existing_local_ips = sorted(pcapops.get_existing_priv_ips(reuse_count_local))
            new_local_ips = sorted(pcapops.get_new_priv_ips(number_local_ids - len(existing_local_ips)))
            add_ids_to_config(sorted(local_ids), existing_local_ips, new_local_ips, bot_configs)

        # assign addresses for external IDs
        if number_external_ids > 0:
            reuse_count_external = int(reuse_percent_total * reuse_percent_external * number_external_ids)
            existing_external_ips = sorted(pcapops.get_existing_external_ips(reuse_count_external))
            remaining = number_external_ids - len(existing_external_ips)
            new_external_ips = sorted([ipgen.random_ip() for _ in range(remaining)])
            add_ids_to_config(sorted(external_ids), existing_external_ips, new_external_ips, bot_configs,
                              idtype="external", router_mac=router_mac)

        #### Set realistic timestamps for messages ####
        #### ... ####

        # create port configurations for the bots
        for config in bot_configs.values():
            config["Port"] = gen_random_server_port()

        # assign realistic TTL for every bot
        assign_realistic_ttls(bot_configs)

        # put together the final messages including the full sender and receiver
        # configurations (i.e. IP, MAC, port, ...) for easier later use
        final_messages = []
        new_id = 0
        for msg in messages:
            id_src, id_dst = msg.src, msg.dst
            type_src, type_dst = bot_configs[id_src]["Type"], bot_configs[id_dst]["Type"]

            # sort out messages that do not have a suitable locality setting
            if type_src == "external" and type_dst == "external":
                continue
            if comm_type == "external" and type_src == "local" and type_dst == "local":
                continue

            # replace the plain IDs by the full configurations and remember the IDs in them
            msg.src, msg.dst = bot_configs[id_src], bot_configs[id_dst]
            msg.src["ID"], msg.dst["ID"] = id_src, id_dst
            # renumber, since dropped messages leave gaps in the original IDs
            msg.msg_id = new_id
            new_id += 1
            ### Important here to update refers, i.e. needed later?
            final_messages.append(msg)

        return final_messages
|