BaseAttack.py 32 KB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824
  1. import abc
  2. import csv
  3. import hashlib
  4. import ipaddress
  5. import math
  6. import os
  7. import random
  8. import random as rnd
  9. import re
  10. import socket
  11. import sys
  12. import tempfile
  13. import time
  14. # TODO: double check this import
  15. # does it complain because libpcapreader is not a .py?
  16. import ID2TLib.libpcapreader as pr
  17. import lea
  18. import numpy as np
  19. import scapy.layers.inet as inet
  20. import scapy.utils
  21. import Attack.AttackParameters as atkParam
  22. import ID2TLib.Utility as Util
  class BaseAttack(metaclass=abc.ABCMeta):
      """
      Abstract base class for all attack classes. Provides basic functionalities, like parameter validation,
      timing helpers, pcap writing and random IP/MAC address generation.

      Concrete attacks have to implement 'init_params', 'generate_attack_packets' and 'generate_attack_pcap'.
      """

      def __init__(self, name, description, attack_type):
          """
          To be called within the individual attack class to initialize the required parameters.

          :param name: The name of the attack class.
          :param description: A short description of the attack.
          :param attack_type: The type the attack belongs to, like probing/scanning, malware.
          """
          # Reference to statistics class (must be set via set_statistics before parameters are added)
          self.statistics = None

          # Class fields
          self.attack_name = name
          self.attack_description = description
          self.attack_type = attack_type
          # Validated parameter values, keyed by atkParam.Parameter
          self.params = {}
          # Parameters the attack accepts, mapping atkParam.Parameter -> atkParam.ParameterTypes
          self.supported_params = {}
          self.attack_start_utime = 0
          self.attack_end_utime = 0
          # Wall-clock bounds of the packet generation (see set_start_time / set_finish_time)
          self.start_time = 0
          self.finish_time = 0
          self.packets = []
          self.path_attack_pcap = ""

      def set_statistics(self, statistics):
          """
          Specify the statistics object that will be used to calculate the parameters of this attack.
          The statistics are used to calculate default parameters and to process user supplied
          queries.

          :param statistics: Reference to a statistics object.
          """
          self.statistics = statistics

      @abc.abstractmethod
      def init_params(self):
          """
          Initialize all required parameters taking into account user supplied values. If no value is supplied,
          or if a user defined query is supplied, use a statistics object to do the calculations.
          A call to this function requires a call to 'set_statistics' first.
          """
          pass

      @abc.abstractmethod
      def generate_attack_packets(self):
          """
          Creates the attack packets.
          """
          pass

      @abc.abstractmethod
      def generate_attack_pcap(self):
          """
          Creates a pcap containing the attack packets.

          :return: The location of the generated pcap file.
          """
          pass

      ################################################
      # HELPER VALIDATION METHODS
      # Used to validate the given parameter values
      ################################################

      @staticmethod
      def _is_mac_address(mac_address: str):
          """
          Verifies if the given string (or every string of the given list) is a valid MAC address.
          Accepts the formats 00:80:41:ae:fd:7e and 00-80-41-ae-fd-7e.

          :param mac_address: The MAC address as string, or a list of such strings.
          :return: True if the MAC address(es) are valid, otherwise False.
          """
          pattern = re.compile(r'([0-9A-Fa-f]{2}[:-]){5}([0-9A-Fa-f]{2})')
          candidates = mac_address if isinstance(mac_address, list) else [mac_address]
          # fullmatch: the whole string has to be the address, trailing lines or characters are rejected
          return all(isinstance(mac, str) and pattern.fullmatch(mac) is not None for mac in candidates)

      @staticmethod
      def _is_ip_address(ip_address: str):
          """
          Verifies that the given string or list of IP addresses (strings) is a valid IPv4/IPv6 address.
          Accepts comma-separated lists of IP addresses, like "192.169.178.1, 192.168.178.2"; whitespace around
          the individual entries is ignored. Dash-separated ranges are expanded through Util.get_ip_range.

          :param ip_address: The IP address(es) as list of strings, comma-separated or dash-separated string.
          :return: True if all IP addresses are valid, otherwise False. And the IP address as string if exactly
                   one address was collected, otherwise the list of collected IP addresses.
          """

          def is_single_ip(candidate):
              """
              :param candidate: The value to be checked.
              :return: True if candidate parses as a single IPv4/IPv6 address, otherwise False.
              """
              try:
                  ipaddress.ip_address(candidate)
              except ValueError:
                  return False
              return True

          def append_ips(ip_address_input):
              """
              Recursive appending function to handle lists and ranges of IP addresses.

              :param ip_address_input: The IP address(es) as list of strings, entries may be dash-separated ranges.
              :return: Validity flag and the list of all IP addresses collected up to the first invalid entry.
              """
              ip_list = []
              for ip in ip_address_input:
                  if not isinstance(ip, str):
                      return False, ip_list
                  ip = ip.strip()
                  if '-' in ip:
                      bounds = [bound.strip() for bound in ip.split('-')]
                      # validate both range ends before handing them to the range helper
                      if len(bounds) != 2 or not all(is_single_ip(bound) for bound in bounds):
                          return False, ip_list
                      range_valid, range_ips = append_ips(Util.get_ip_range(bounds[0], bounds[1]))
                      ip_list.extend(range_ips)
                      # an invalid range must not be masked by later valid entries
                      if not range_valid:
                          return False, ip_list
                  elif is_single_ip(ip):
                      ip_list.append(ip)
                  else:
                      return False, ip_list
              return True, ip_list

          if ip_address is None:
              return False, []

          # a comma-separated list of IP addresses must be split first
          if isinstance(ip_address, str):
              ip_address = ip_address.split(',')

          result, ip_address_output = append_ips(ip_address)

          if len(ip_address_output) == 1:
              return result, ip_address_output[0]
          return result, ip_address_output

      @staticmethod
      def _is_port(ports_input: str):
          """
          Verifies if the given value is a valid port. Accepts port ranges, like 80-90, 80..99, 80...99.

          :param ports_input: The port number as int or string, a comma-separated string or a list of those.
          :return: A pair (is_valid, value). If the input is valid, value is a single int when exactly one port
                   was given, otherwise a list of int (ranges are resolved). If the input is invalid, the pair
                   is (False, ports_input), so callers can always unpack two values.
          """

          def _is_invalid_port(num):
              """
              Checks whether the port number is invalid.

              :param num: The port number as int.
              :return: True if the port number is invalid, otherwise False.
              """
              return num < 1 or num > 65535

          if ports_input is None:
              return False, ports_input

          if isinstance(ports_input, str):
              entries = ports_input.replace(' ', '').split(',')
          elif isinstance(ports_input, int):
              entries = [ports_input]
          else:
              try:
                  entries = list(ports_input)
              except TypeError:
                  return False, ports_input

          if not entries:
              return False, ports_input

          # allowed range formats: '1-49151', '1..49151', '1...49151'
          range_pattern = re.compile(r'([0-9]{1,5})(?:-|\.{2,3})([0-9]{1,5})')

          ports_output = []
          for port_entry in entries:
              if isinstance(port_entry, int):
                  port_start = port_end = port_entry
              elif isinstance(port_entry, str):
                  port_entry = port_entry.strip()
                  if port_entry.isdecimal():
                      # port_entry describes a single port
                      port_start = port_end = int(port_entry)
                  else:
                      # port_entry has to describe a port range, everything else is invalid
                      match = range_pattern.fullmatch(port_entry)
                      if match is None:
                          return False, ports_input
                      port_start, port_end = int(match.group(1)), int(match.group(2))
              else:
                  return False, ports_input

              if _is_invalid_port(port_start) or _is_invalid_port(port_end) or port_start > port_end:
                  return False, ports_input
              ports_output.extend(range(port_start, port_end + 1))

          if len(ports_output) == 1:
              return True, ports_output[0]
          return True, ports_output

      @staticmethod
      def _is_timestamp(timestamp: str):
          """
          Checks whether the given value starts with a valid timestamp. The accepted format is:
          YYYY-MM-DD h:m:s, whereas h, m, s may be one or two digits. Only the beginning of the string is
          matched, characters following the timestamp are not rejected.

          :param timestamp: The timestamp to be checked.
          :return: True if the timestamp is valid, otherwise False.
          """
          if not isinstance(timestamp, str):
              return False
          is_valid = re.match(r'[0-9]{4}(?:-[0-9]{1,2}){2} (?:[0-9]{1,2}:){2}[0-9]{1,2}', timestamp)
          return is_valid is not None

      @staticmethod
      def _is_boolean(value):
          """
          Checks whether the given value (string or bool) is a boolean. Strings are valid booleans if they are in:
          {y, yes, t, true, on, 1, n, no, f, false, off, 0} (case-insensitive).

          :param value: The value to be checked.
          :return: True if the value is a boolean, otherwise False. And the casted boolean (the unchanged value
                   if it is not a boolean).
          """
          # If value is already a boolean
          if isinstance(value, bool):
              return True, value

          # If value is a string; implemented locally because distutils (strtobool) is no longer part of the
          # standard library in recent Python versions
          if isinstance(value, str):
              normalized = value.lower()
              if normalized in ('y', 'yes', 't', 'true', 'on', '1'):
                  return True, True
              if normalized in ('n', 'no', 'f', 'false', 'off', '0'):
                  return True, False

          return False, value

      @staticmethod
      def _is_float(value):
          """
          Checks whether the given value is a float.

          :param value: The value to be checked.
          :return: True if the value is a float, otherwise False. And the casted float (the unchanged value if
                   the cast failed).
          """
          try:
              return True, float(value)
          except (TypeError, ValueError):
              # TypeError covers values like None or lists, ValueError covers unparsable strings
              return False, value

      @staticmethod
      def _is_domain(val: str):
          """
          Verifies that the given string is a valid URI.

          :param val: The URI as string.
          :return: True if URI is valid, otherwise False.
          """
          if not isinstance(val, str):
              return False
          domain = re.match(r'^(?:[a-zA-Z]|[0-9]|[$-_@.&+]|[!*\(\),]|(?:%[0-9a-fA-F][0-9a-fA-F]))+$', val)
          return domain is not None

      #########################################
      # HELPER METHODS
      #########################################

      @staticmethod
      def set_seed(seed):
          """
          Seeds the 'random' module and numpy's random generator. Integers and digit-only strings are used
          directly; any other string is hashed (SHA-1) into an integer. Other types leave the generators
          untouched.

          :param seed: The random seed to be set.
          """
          seed_final = None
          if isinstance(seed, int):
              seed_final = seed
          elif isinstance(seed, str):
              if seed.isdigit():
                  seed_final = int(seed)
              else:
                  hashed_seed = hashlib.sha1(seed.encode()).digest()
                  seed_final = int.from_bytes(hashed_seed, byteorder="little")

          # compare against None so that the valid seed 0 is not skipped
          if seed_final is not None:
              random.seed(seed_final)
              # the seed is masked to 32 bits before it is handed to numpy
              np.random.seed(seed_final & 0xFFFFFFFF)

      def set_start_time(self):
          """
          Set the current time as global starting time.
          """
          self.start_time = time.time()

      def set_finish_time(self):
          """
          Set the current time as global finishing time.
          """
          self.finish_time = time.time()

      def get_packet_generation_time(self):
          """
          :return: difference between starting and finishing time.
          """
          return self.finish_time - self.start_time

      def add_param_value(self, param, value):
          """
          Adds the pair param : value to the dictionary of attack parameters. Prints an error message and skips the
          parameter if the validation fails. Terminates the application if no statistics object was set.

          :param param: Name of the parameter that we wish to modify (atkParam.Parameter or its string identifier).
          :param value: The value we wish to assign to the specified parameter.
          :return: None.
          """
          # This function call is valid only if there is a statistics object available.
          if self.statistics is None:
              print('Error: Attack parameter added without setting a statistics object first.')
              sys.exit(1)

          # get AttackParameters instance associated with param
          # for default values assigned in attack classes, like Parameter.PORT_OPEN
          if isinstance(param, atkParam.Parameter):
              param_name = param
          # for values given by user input, like port.open
          else:
              try:
                  # Get Enum key of given string identifier
                  param_name = atkParam.Parameter(param)
              except ValueError:
                  # unknown identifier: skip the parameter instead of aborting with a traceback
                  print("ERROR: Parameter " + str(param) + " or parameter value " + str(value) +
                        " not valid. Skipping parameter.")
                  return

          # Get parameter type of attack's required_params
          param_type = self.supported_params.get(param_name)
          if param_type is None:
              print('Parameter ' + str(param_name) + ' not available for chosen attack. Skipping parameter.')
              return

          # by default no param is valid
          is_valid = False
          types = atkParam.ParameterTypes

          # If value is query -> get value from database
          if param_name != atkParam.Parameter.INTERVAL_SELECT_STRATEGY and self.statistics.is_query(value):
              value = self.statistics.process_db_query(value, False)
              if value is not None and value != "":
                  is_valid = True
              else:
                  print('Error in given parameter value: ' + str(value) + '. Data could not be retrieved.')
          # Validate parameter depending on parameter's type
          elif param_type == types.TYPE_IP_ADDRESS:
              is_valid, value = self._is_ip_address(value)
          elif param_type == types.TYPE_PORT:
              is_valid, value = self._is_port(value)
          elif param_type == types.TYPE_MAC_ADDRESS:
              is_valid = self._is_mac_address(value)
          elif param_type == types.TYPE_INTEGER_POSITIVE:
              if isinstance(value, int) and value >= 0:
                  is_valid = True
              elif isinstance(value, str) and value.isdecimal():
                  is_valid = True
                  value = int(value)
          elif param_type == types.TYPE_STRING:
              is_valid = isinstance(value, str)
          elif param_type == types.TYPE_FLOAT:
              is_valid, value = self._is_float(value)
              # this is required to avoid that the timestamp's microseconds of the first attack packet is '000000'
              # but microseconds are only chosen randomly if the given parameter does not already specify it
              # e.g. inject.at-timestamp=123456.987654 -> is not changed
              # e.g. inject.at-timestamp=123456 -> is changed to: 123456.[random digits]
              if param_name == atkParam.Parameter.INJECT_AT_TIMESTAMP and is_valid and value.is_integer():
                  value = value + random.uniform(0, 0.999999)
          elif param_type == types.TYPE_TIMESTAMP:
              is_valid = self._is_timestamp(value)
          elif param_type == types.TYPE_BOOLEAN:
              is_valid, value = self._is_boolean(value)
          elif param_type == types.TYPE_PACKET_POSITION:
              try:
                  position = int(value)
              except (TypeError, ValueError):
                  position = None
              # only look up the timestamp if the position lies inside the capture
              if position is not None and 0 <= position <= self.statistics.get_packet_count():
                  ts = pr.pcap_processor(self.statistics.pcap_filepath, "False").get_timestamp_mu_sec(position)
                  if ts >= 0:
                      is_valid = True
                      # the packet position is stored as the injection timestamp derived from it
                      param_name = atkParam.Parameter.INJECT_AT_TIMESTAMP
                      value = (ts / 1000000)  # convert microseconds from getTimestampMuSec into seconds
          elif param_type == types.TYPE_DOMAIN:
              is_valid = self._is_domain(value)
          elif param_type == types.TYPE_FILEPATH:
              is_valid = isinstance(value, (str, bytes, os.PathLike)) and os.path.isfile(value)
          elif param_type == types.TYPE_PERCENTAGE:
              is_valid_float, value = self._is_float(value)
              is_valid = is_valid_float and 0 <= value <= 1
          elif param_type == types.TYPE_PADDING:
              if isinstance(value, int):
                  is_valid = 0 <= value <= 100
              elif isinstance(value, str) and value.isdecimal():
                  value = int(value)
                  is_valid = 0 <= value <= 100
          elif param_type == types.TYPE_INTERVAL_SELECT_STRAT:
              is_valid = value in ("random", "optimal", "custom")

          # add value iff validation was successful
          if is_valid:
              self.params[param_name] = value
          else:
              print("ERROR: Parameter " + str(param) + " or parameter value " + str(value) +
                    " not valid. Skipping parameter.")

      def get_param_value(self, param: "atkParam.Parameter"):
          """
          Returns the parameter value for a given parameter.

          :param param: The parameter whose value is wanted.
          :return: The parameter's value, or None if no value is stored for the parameter.
          """
          return self.params.get(param)

      def check_parameters(self):
          """
          Checks whether all parameter values are defined. If a value is not defined, the application is terminated
          with a non-zero exit status. However, this should not happen as all attack should define default
          parameter values.
          """
          # parameters which do not require default values
          non_obligatory_params = [atkParam.Parameter.INJECT_AFTER_PACKET, atkParam.Parameter.NUMBER_ATTACKERS]
          for param in self.supported_params:
              # checks whether all params have assigned values, INJECT_AFTER_PACKET must not be considered because the
              # timestamp derived from it is set to Parameter.INJECT_AT_TIMESTAMP
              if param not in self.params and param not in non_obligatory_params:
                  print("\033[91mCRITICAL ERROR: Attack '" + self.attack_name + "' does not define the parameter '" +
                        str(param) + "'.\n The attack must define default values for all parameters."
                        + "\n Cannot continue attack generation.\033[0m")
                  # a critical error must not be reported as a successful run
                  sys.exit(1)

      def write_attack_pcap(self, packets: list, append_flag: bool = False, destination_path: str = None):
          """
          Writes the attack's packets into a PCAP file. If destination_path names an existing path it is used,
          otherwise a new temporary file with the suffix '.pcap' is created.

          :param packets: The packets to be written.
          :param append_flag: Passed to the pcap writer as its 'append' argument.
          :param destination_path: Optional path of an existing file to write to.
          :return: The path of the written PCAP file.
          """
          # Only check params initially when attack generation starts
          if append_flag is False and destination_path is None:
              # Check if all req. parameters are set
              self.check_parameters()

          # Determine destination path
          if destination_path is not None and os.path.exists(destination_path):
              destination = destination_path
          else:
              # only the name is needed; close the handle right away so it does not leak
              with tempfile.NamedTemporaryFile(delete=False, suffix='.pcap') as temp_file:
                  destination = temp_file.name

          # Write packets into pcap file and close the writer even if writing fails
          pktdump = scapy.utils.PcapWriter(destination, append=append_flag)
          try:
              pktdump.write(packets)
          finally:
              pktdump.close()

          return destination

      def get_reply_delay(self, ip_dst, default=2000):
          """
          Gets the minimum and the maximum reply delay for all the connections of a specific IP. If no delay is
          stored for the IP, the medians over (at most 500) conversations of the capture are used instead.

          :param ip_dst: The IP to retrieve its reply delay.
          :param default: The default value (in microseconds) to use if no delay could be found.
                          If < 0 raise an exception instead.
          :return: A pair (min_delay, max_delay), both in seconds.
          :raises ValueError: If no delay could be determined and default is negative.
          """
          avg_min = avg_max = None

          # ip_dst ends up inside the SQL text, so only syntactically valid IP addresses are queried;
          # anything else is treated like an address without stored conversations
          try:
              ipaddress.ip_address(ip_dst)
              is_ip = True
          except ValueError:
              is_ip = False

          if is_ip:
              result = self.statistics.process_db_query(
                  "SELECT AVG(minDelay), AVG(maxDelay) FROM conv_statistics WHERE ipAddressB='" + str(ip_dst) + "';")
              try:
                  avg_min, avg_max = result[0][0], result[0][1]
              except (IndexError, TypeError):
                  avg_min = avg_max = None

          if avg_min and avg_max:
              min_delay = avg_min
              max_delay = avg_max
          else:
              all_min_delays = self.statistics.process_db_query("SELECT minDelay FROM conv_statistics LIMIT 500;")
              min_delay = np.median(all_min_delays)
              all_max_delays = self.statistics.process_db_query("SELECT maxDelay FROM conv_statistics LIMIT 500;")
              max_delay = np.median(all_max_delays)

              # the median is nan if there is no data to build it from
              if math.isnan(min_delay) or math.isnan(max_delay):
                  if default < 0:
                      raise ValueError("Could not calculate min/max_delay")
                  min_delay = default
                  max_delay = default

          min_delay = int(min_delay) * 10 ** -6  # convert from micro to seconds
          max_delay = int(max_delay) * 10 ** -6
          return min_delay, max_delay

      @staticmethod
      def packets_to_convs(exploit_raw_packets):
          """
          Classifies a bunch of packets to conversations groups. A conversation is a set of packets go between host A
          (IP,port) to host B (IP,port)

          :param exploit_raw_packets: A set of packets contains several conversations; the first element of each
                                      packet is parsed as an Ethernet frame.
          :return: A pair (conversations, order_list_conversations). conversations maps a conversation id
                   (IP_A, port_A, IP_B, port_B) to the list of its packets; order_list_conversations contains the
                   conversation ids in the order they appeared in the original packets.
          """
          conversations = {}
          order_list_conversations = []
          for pkt in exploit_raw_packets:
              ip_pkt = inet.Ether(pkt[0]).payload
              ip_dst = ip_pkt.getfieldval("dst")
              ip_src = ip_pkt.getfieldval("src")

              tcp_pkt = ip_pkt.payload
              port_dst = tcp_pkt.getfieldval("dport")
              port_src = tcp_pkt.getfieldval("sport")

              conv_req = (ip_src, port_src, ip_dst, port_dst)
              conv_rep = (ip_dst, port_dst, ip_src, port_src)
              if conv_req in conversations:
                  conversations[conv_req].append(pkt)
              elif conv_rep in conversations:
                  # packet of the reverse direction belongs to the already known conversation
                  conversations[conv_rep].append(pkt)
              else:
                  conversations[conv_req] = [pkt]
                  # Order list of conv
                  order_list_conversations.append(conv_req)
          return conversations, order_list_conversations

      @staticmethod
      def is_valid_ip_address(addr):
          """
          Checks if the IP address family is supported, i.e. if socket.inet_aton accepts the address.

          :param addr: IP address to be checked.
          :return: Boolean
          """
          try:
              socket.inet_aton(addr)
              return True
          except (OSError, TypeError):
              # OSError (socket.error): not a valid address string; TypeError: not a string at all
              return False

      @staticmethod
      def ip_src_dst_equal_check(ip_source, ip_destination):
          """
          Checks if the source IP and destination IP are equal. If they are, an error message is printed and the
          application is terminated with a non-zero exit status.

          :param ip_source: source IP address, or a list of source IP addresses.
          :param ip_destination: destination IP address.
          """
          if isinstance(ip_source, list):
              equal = ip_destination in ip_source
          else:
              equal = ip_source == ip_destination

          if equal:
              print("\nERROR: Invalid IP addresses; source IP is the same as destination IP: " +
                    str(ip_destination) + ".")
              sys.exit(1)

      @staticmethod
      def get_inter_arrival_time(packets, distribution: bool = False):
          """
          Gets the inter-arrival times array and its distribution of a set of packets.

          :param packets: the packets to extract their inter-arrival time; pkt[2] is read as (seconds, microseconds).
          :param distribution: build distribution dictionary or not
          :return: The list of inter-arrival times (the first entry is 0). If distribution is True, a pair of that
                   list and the inter-arrival time distribution as a histogram {bin start as str: frequency}.
          """
          inter_arrival_times = []
          prvs_pkt_time = None
          for pkt in packets:
              timestamp = pkt[2][0] + pkt[2][1] / 10 ** 6
              inter_arrival_times.append(0 if prvs_pkt_time is None else timestamp - prvs_pkt_time)
              prvs_pkt_time = timestamp

          if not distribution:
              return inter_arrival_times

          # Build a distribution dictionary; zip drops the last bin edge, which has no frequency of its own
          freq, values = np.histogram(inter_arrival_times, bins=20)
          dist_dict = {str(val): count for val, count in zip(values, freq)}
          return inter_arrival_times, dist_dict

      @staticmethod
      def clean_white_spaces(str_param):
          """
          Delete extra backslash from white spaces. This function is used to process the payload of packets.

          :param str_param: the payload to be processed.
          :return: the payload with escaped newline, carriage return, tab and single quote sequences unescaped.
          """
          for escaped, plain in (("\\n", "\n"), ("\\r", "\r"), ("\\t", "\t"), ("\\\'", "\'")):
              str_param = str_param.replace(escaped, plain)
          return str_param

      def modify_http_header(self, str_tcp_seg, orig_target_uri, target_uri, orig_ip_dst, target_host):
          """
          Substitute the URI and HOST in a HTTP header with new values.

          :param str_tcp_seg: the payload to be processed.
          :param orig_target_uri: old URI
          :param target_uri: new URI
          :param orig_ip_dst: old host
          :param target_host: new host
          :return: the processed payload; an empty payload is returned unchanged.
          """
          if len(str_tcp_seg) > 0:
              # convert payload bytes to str => str = "b'..\\r\\n..'"
              # i.e. strip the leading "b'" and the trailing "'" of the bytes representation
              str_tcp_seg = str_tcp_seg[2:-1]
              str_tcp_seg = str_tcp_seg.replace(orig_target_uri, target_uri)
              str_tcp_seg = str_tcp_seg.replace(orig_ip_dst, target_host)
              str_tcp_seg = self.clean_white_spaces(str_tcp_seg)
          return str_tcp_seg

      def _pick_from_distribution(self, value_dist, fallback_query):
          """
          Draws a random value from the given value/frequency distribution, or falls back to a statistics query.

          :param value_dist: value -> frequency distribution of the property.
          :param fallback_query: statistics query used if the distribution is empty.
          :return: the chosen value.
          """
          if len(value_dist) > 0:
              return lea.Lea.fromValFreqsDict(value_dist).random()
          return Util.handle_most_used_outputs(self.statistics.process_db_query(fallback_query))

      def get_ip_data(self, ip_address: str):
          """
          :param ip_address: the ip of which (packet-)data shall be returned
          :return: MSS, TTL and Window Size values of the given IP
          """
          # Set MSS (Maximum Segment Size) based on MSS distribution of IP address
          mss_value = self._pick_from_distribution(self.statistics.get_mss_distribution(ip_address),
                                                   "most_used(mssValue)")
          # Set TTL based on TTL distribution of IP address
          ttl_value = self._pick_from_distribution(self.statistics.get_ttl_distribution(ip_address),
                                                   "most_used(ttlValue)")
          # Set Window Size based on Window Size distribution of IP address
          win_value = self._pick_from_distribution(self.statistics.get_win_distribution(ip_address),
                                                   "most_used(winSize)")
          return mss_value, ttl_value, win_value

      #########################################
      # RANDOM IP/MAC ADDRESS GENERATORS
      #########################################

      @staticmethod
      def generate_random_ipv4_address(ip_class, n: int = 1):
          """
          Generates n random IPv4 addresses. Multicast, unspecified, loopback, link-local, reserved and private
          addresses are never returned.

          :param ip_class: "Unknown" to draw from the whole IPv4 space, or a class letter "A", "B" or "C" to fix
                           the range of the first octet. Names containing "private" (like "A-private") are
                           reduced to their first character.
          :param n: The number of IP addresses to be generated
          :return: A single IP address, or if n != 1, a list of IP addresses
          :raises ValueError: For the classes "D" and "E", whose addresses are all multicast or reserved.
          """
          # inclusive bounds of the first octet per class
          ip_classes_byte1 = {"A": (1, 126), "B": (128, 191), "C": (192, 223), "D": (224, 239), "E": (240, 254)}

          def is_invalid(ip_address_param: ipaddress.IPv4Address):
              return ip_address_param.is_multicast or ip_address_param.is_unspecified or \
                  ip_address_param.is_loopback or ip_address_param.is_link_local or \
                  ip_address_param.is_reserved or ip_address_param.is_private

          # Generate a random IP from specific class
          def generate_address(ip_class_param):
              if ip_class_param == "Unknown":
                  return ipaddress.IPv4Address(random.randint(0, 2 ** 32 - 1))
              min_b1, max_b1 = ip_classes_byte1[ip_class_param]
              b1 = random.randint(min_b1, max_b1)
              b2 = random.randint(1, 255)
              b3 = random.randint(1, 255)
              b4 = random.randint(1, 255)
              return ipaddress.IPv4Address(str(b1) + "." + str(b2) + "." + str(b3) + "." + str(b4))

          # For DDoS attack, we do not generate private IPs
          if ip_class != "Unknown" and "private" in ip_class:
              ip_class = ip_class[0]  # convert A-private to A

          # every class D address is multicast and every class E address is reserved, so the rejection loop
          # below could never terminate for them
          if ip_class in ("D", "E"):
              raise ValueError("Cannot generate a valid random IPv4 address of class " + ip_class + ".")

          ip_addresses = []
          for _ in range(n):
              address = generate_address(ip_class)
              while is_invalid(address):
                  address = generate_address(ip_class)
              ip_addresses.append(str(address))

          if n == 1:
              return ip_addresses[0]
          return ip_addresses

      @staticmethod
      def generate_random_ipv6_address(n: int = 1):
          """
          Generates n random IPv6 addresses. Multicast, unspecified, loopback, link-local, private and reserved
          addresses are never returned.

          :param n: The number of IP addresses to be generated
          :return: A single IP address, or if n != 1, a list of IP addresses
          """

          def is_invalid(ip_address: ipaddress.IPv6Address):
              return ip_address.is_multicast or ip_address.is_unspecified or ip_address.is_loopback or \
                  ip_address.is_link_local or ip_address.is_private or ip_address.is_reserved

          def generate_address():
              return ipaddress.IPv6Address(random.randint(0, 2 ** 128 - 1))

          ip_addresses = []
          for _ in range(n):
              address = generate_address()
              while is_invalid(address):
                  address = generate_address()
              ip_addresses.append(str(address))

          if n == 1:
              return ip_addresses[0]
          return ip_addresses

      @staticmethod
      def generate_random_mac_address(n: int = 1):
          """
          Generates n random MAC addresses. Multicast and locally administered addresses are never returned.

          :param n: The number of MAC addresses to be generated.
          :return: A single MAC address, or if n != 1, a list of MAC addresses
          """

          def is_invalid(address_param: str):
              first_octet = int(address_param[0:2], 16)
              is_multicast_address = bool(first_octet & 0b01)
              is_locally_administered = bool(first_octet & 0b10)
              return is_multicast_address or is_locally_administered

          def generate_address():
              octets = [random.randint(0x00, 0xff) for _ in range(6)]
              return ':'.join("%02x" % octet for octet in octets)

          mac_addresses = []
          for _ in range(n):
              address = generate_address()
              while is_invalid(address):
                  address = generate_address()
              mac_addresses.append(address)

          if n == 1:
              return mac_addresses[0]
          return mac_addresses

      @staticmethod
      def get_ports_from_nmap_service_dst(ports_num):
          """
          Read the most ports_num frequently open ports from nmap-service-tcp file to be used in the port scan.

          :param ports_num: The number of ports to read.
          :return: Ports numbers (as read from the file, i.e. strings) to be used as default destination ports or
                   default open ports in the port scan. Fewer than ports_num entries are returned if the file
                   does not contain enough rows.
          """
          ports_dst = []
          with open(os.path.join(Util.RESOURCE_DIR, 'nmap-services-tcp.csv'), 'rt', newline='') as file:
              spamreader = csv.reader(file, delimiter=',')
              # escape first row (header) once; skipping inside the loop would drop every other port
              next(spamreader, None)
              for row in spamreader:
                  if len(ports_dst) >= ports_num:
                      break
                  # save ports numbers, ignoring empty rows
                  if row:
                      ports_dst.append(row[0])

          # rnd.shuffle ports numbers partially
          if ports_num == 1000:  # used for port.dst
              # shuffle each block of 100 ports on its own, so the blocks keep their order in the file
              port_dst_shuffled = []
              for count in range(0, 10):
                  block = ports_dst[count * 100:(count + 1) * 100]
                  rnd.shuffle(block)
                  port_dst_shuffled += block
          else:  # used for port.open
              rnd.shuffle(ports_dst)
              port_dst_shuffled = ports_dst
          return port_dst_shuffled