/*
 * Class providing containers and access methods for statistical data collection.
 */
- #ifndef CPP_PCAPREADER_STATISTICS_H
- #define CPP_PCAPREADER_STATISTICS_H
// Aidmar
#include <chrono>
#include <cstddef>
#include <functional>
#include <list>
#include <string>
#include <tuple>
#include <unordered_map>
#include <vector>

#include <tins/ip_address.h>
#include <tins/timestamp.h>
/*
 * Definition of structs used in unordered_map fields
 */
/*
 * Result record for the per-IP statistics query (statistics::getStatsForIP).
 * Plain aggregate; the members are not default-initialized.
 */
struct ip_stats {
    float bandwidthKBitsIn;     // incoming bandwidth in KBits
    float bandwidthKBitsOut;    // outgoing bandwidth in KBits
    float packetPerSecondIn;    // number of incoming packets per second
    float packetPerSecondOut;   // number of outgoing packets per second
    float AvgPacketSizeSent;    // average size of sent packets in kbytes
    float AvgPacketSizeRecv;    // average size of received packets in kbytes
    long AvgMaxSegmentSizeTCP;  // average value of TCP option Maximum Segment Size (MSS)
};
// Aidmar
/*
 * Identifies a conversation by its two endpoints:
 * - IP address A, port A
 * - IP address B, port B
 * Two values are equal only if all four fields match, so swapping
 * the endpoints yields a different value.
 */
struct conv {
    std::string ipAddressA;
    int portA;
    std::string ipAddressB;
    int portB;

    // Field-wise equality over both endpoints.
    bool operator==(const conv &other) const {
        return std::tie(ipAddressA, portA, ipAddressB, portB)
               == std::tie(other.ipAddressA, other.portA, other.ipAddressB, other.portB);
    }
};
// Aidmar
/*
 * Pairs an IP address (IPv4 or IPv6) with an MSS value.
 */
struct ipAddress_mss {
    std::string ipAddress;
    int mssValue;

    // Equal when both the address and the MSS value match.
    bool operator==(const ipAddress_mss &other) const {
        return std::tie(ipAddress, mssValue)
               == std::tie(other.ipAddress, other.mssValue);
    }
};
// Aidmar
/*
 * Pairs an IP address (IPv4 or IPv6) with a window size.
 */
struct ipAddress_win {
    std::string ipAddress;
    int winSize;

    // Equal when both the address and the window size match.
    bool operator==(const ipAddress_win &other) const {
        return std::tie(ipAddress, winSize)
               == std::tie(other.ipAddress, other.winSize);
    }
};
/*
 * Pairs an IP address (IPv4 or IPv6) with a TTL value.
 */
struct ipAddress_ttl {
    std::string ipAddress;
    int ttlValue;

    // Equal when both the address and the TTL value match.
    bool operator==(const ipAddress_ttl &other) const {
        return std::tie(ipAddress, ttlValue)
               == std::tie(other.ipAddress, other.ttlValue);
    }
};
/*
 * Pairs an IP address (IPv4 or IPv6) with a protocol name
 * (e.g. TCP, UDP, IPv4, IPv6).
 */
struct ipAddress_protocol {
    std::string ipAddress;
    std::string protocol;

    // Equal when both the address and the protocol name match.
    bool operator==(const ipAddress_protocol &other) const {
        return std::tie(ipAddress, protocol)
               == std::tie(other.ipAddress, other.protocol);
    }
};
/*
 * Per-IP statistics record:
 * - Number of received / sent packets
 * - Data received / sent in kbytes
 * - IP class, per-interval packet rates and their max / min
 * - Counters and scores for the Mahoney anomaly score
 * - Timestamps of the sent and received packets
 */
struct entry_ipStat {
    long pkts_received;
    long pkts_sent;
    float kbytes_received;
    float kbytes_sent;

    // Aidmar
    std::string ip_class;
    std::vector<float> interval_pkt_rate;
    float max_pkt_rate;
    float min_pkt_rate;

    // Aidmar - to calculate Mahoney anomaly score
    long firstAppearAsSenderPktCount;
    long firstAppearAsReceiverPktCount;
    long sourceAnomalyScore;
    long destinationAnomalyScore;

    // Aidmar - to collect statistics over time interval
    std::vector<std::chrono::microseconds> pktsSentTimestamp;
    std::vector<std::chrono::microseconds> pktsReceivedTimestamp;

    // Field-wise equality over every member of the record.
    bool operator==(const entry_ipStat &other) const {
        return std::tie(pkts_received, pkts_sent, kbytes_sent, kbytes_received,
                        interval_pkt_rate, max_pkt_rate, min_pkt_rate, ip_class,
                        firstAppearAsSenderPktCount, firstAppearAsReceiverPktCount,
                        sourceAnomalyScore, destinationAnomalyScore,
                        pktsSentTimestamp, pktsReceivedTimestamp)
               == std::tie(other.pkts_received, other.pkts_sent, other.kbytes_sent,
                           other.kbytes_received, other.interval_pkt_rate,
                           other.max_pkt_rate, other.min_pkt_rate, other.ip_class,
                           other.firstAppearAsSenderPktCount,
                           other.firstAppearAsReceiverPktCount,
                           other.sourceAnomalyScore, other.destinationAnomalyScore,
                           other.pktsSentTimestamp, other.pktsReceivedTimestamp);
    }
};
// Aidmar
/*
 * Statistics of one interval:
 * - Number of packets
 * - IP source entropy
 * - IP destination entropy
 */
struct entry_intervalStat {
    int pkts_count;
    float ip_src_entropy;
    float ip_dst_entropy;

    // Field-wise equality (the entropies are compared exactly).
    bool operator==(const entry_intervalStat &other) const {
        return std::tie(pkts_count, ip_src_entropy, ip_dst_entropy)
               == std::tie(other.pkts_count, other.ip_src_entropy, other.ip_dst_entropy);
    }
};
// Aidmar
/*
 * Statistics of one conversation:
 * - Number of packets from A to B
 * - Number of packets from B to A
 * - Timestamps of the packets in each direction
 * - Per-packet delays and their average
 *   (how the delays are computed is not visible in this header)
 */
struct entry_convStat {
    long pkts_A_B;
    long pkts_B_A;
    std::vector<std::chrono::microseconds> pkts_A_B_timestamp;
    std::vector<std::chrono::microseconds> pkts_B_A_timestamp;
    std::vector<std::chrono::microseconds> pkts_delay;
    //std::chrono::duration<double, std::micro> median_delay;
    std::chrono::microseconds avg_delay;

    // Field-wise equality over every member. pkts_B_A is included so that
    // entries differing only in the B->A packet count are not reported equal.
    bool operator==(const entry_convStat &other) const {
        return pkts_A_B == other.pkts_A_B
               && pkts_B_A == other.pkts_B_A
               && pkts_A_B_timestamp == other.pkts_A_B_timestamp
               && pkts_B_A_timestamp == other.pkts_B_A_timestamp
               && pkts_delay == other.pkts_delay
               && avg_delay == other.avg_delay;
    }
};
/*
 * Combines:
 * - IP address (IPv4 or IPv6)
 * - Traffic direction (out: outgoing connection, in: incoming connection)
 * - Port number
 */
struct ipAddress_inOut_port {
    std::string ipAddress;
    std::string trafficDirection;
    int portNumber;

    // Equal when address, direction and port number all match.
    bool operator==(const ipAddress_inOut_port &other) const {
        return std::tie(ipAddress, trafficDirection, portNumber)
               == std::tie(other.ipAddress, other.trafficDirection, other.portNumber);
    }
};
- /*
- * Definition of hash functions for structs used as key in unordered_map
- */
- namespace std {
- template<>
- struct hash<ipAddress_ttl> {
- std::size_t operator()(const ipAddress_ttl &k) const {
- using std::size_t;
- using std::hash;
- using std::string;
- return ((hash<string>()(k.ipAddress)
- ^ (hash<int>()(k.ttlValue) << 1)) >> 1);
- }
- };
- // Aidmar
- template<>
- struct hash<ipAddress_mss> {
- std::size_t operator()(const ipAddress_mss &k) const {
- using std::size_t;
- using std::hash;
- using std::string;
- return ((hash<string>()(k.ipAddress)
- ^ (hash<int>()(k.mssValue) << 1)) >> 1);
- }
- };
- // Aidmar
- template<>
- struct hash<ipAddress_win> {
- std::size_t operator()(const ipAddress_win &k) const {
- using std::size_t;
- using std::hash;
- using std::string;
- return ((hash<string>()(k.ipAddress)
- ^ (hash<int>()(k.winSize) << 1)) >> 1);
- }
- };
-
- // Aidmar: TO-DO:??
- template<>
- struct hash<conv> {
- std::size_t operator()(const conv &k) const {
- using std::size_t;
- using std::hash;
- using std::string;
- return ((hash<string>()(k.ipAddressA)
- ^ (hash<int>()(k.portA) << 1)) >> 1)
- ^ ((hash<string>()(k.ipAddressB)
- ^ (hash<int>()(k.portB) << 1)) >> 1);
- }
- };
-
- template<>
- struct hash<ipAddress_protocol> {
- std::size_t operator()(const ipAddress_protocol &k) const {
- using std::size_t;
- using std::hash;
- using std::string;
- return ((hash<string>()(k.ipAddress)
- ^ (hash<string>()(k.protocol) << 1)) >> 1);
- }
- };
- template<>
- struct hash<ipAddress_inOut_port> {
- std::size_t operator()(const ipAddress_inOut_port &k) const {
- using std::size_t;
- using std::hash;
- using std::string;
- return ((hash<string>()(k.ipAddress)
- ^ (hash<string>()(k.trafficDirection) << 1)) >> 1)
- ^ (hash<int>()(k.portNumber) << 1);
- }
- };
- }
- class statistics {
- public:
- /*
- * Constructor
- */
- statistics();
- /*
- * Methods
- */
- std::string getFormattedTimestamp(time_t seconds, suseconds_t microseconds) const;
- /*
- * Access methods for containers
- */
- void incrementPacketCount();
- // Adimar
- void incrementMSScount(std::string ipAddress, int mssValue);
- void incrementWinCount(std::string ipAddress, int winSize);
- void addIPEntropy(std::string filePath);
- void addFlowStat(std::string ipAddressSender,int sport,std::string ipAddressReceiver,int dport, std::chrono::microseconds timestamp);
- void calculateLastIntervalIPsEntropy(std::string filePath, std::chrono::microseconds intervalStartTimestamp);
- void calculateLastIntervalPacketRate(std::chrono::duration<int, std::micro> interval, std::chrono::microseconds intervalStartTimestamp);
- void addIntervalStat(std::chrono::duration<int, std::micro> interval, std::chrono::microseconds intervalStartTimestamp, std::chrono::microseconds lastPktTimestamp, int previousPacketCount);
- void incrementTTLcount(std::string ipAddress, int ttlValue);
- void incrementProtocolCount(std::string ipAddress, std::string protocol);
- void incrementPortCount(std::string ipAddressSender, int outgoingPort, std::string ipAddressReceiver,
- int incomingPort);
- int getProtocolCount(std::string ipAddress, std::string protocol);
- void setTimestampFirstPacket(Tins::Timestamp ts);
- void setTimestampLastPacket(Tins::Timestamp ts);
-
- // Aidmar
- Tins::Timestamp getTimestampFirstPacket();
- Tins::Timestamp getTimestampLastPacket();
- void assignMacAddress(std::string ipAddress, std::string macAddress);
-
- // Aidmar
- void addIpStat_packetSent(std::string filePath, std::string ipAddressSender, std::string ipAddressReceiver, long bytesSent, std::chrono::microseconds timestamp);
- int getPacketCount();
- void addMSS(std::string ipAddress, int MSSvalue);
- void writeToDatabase(std::string database_path);
- void addPacketSize(uint32_t packetSize);
- std::string getCaptureDurationTimestamp() const;
- float getCaptureDurationSeconds() const;
- float getAvgPacketSize() const;
- void printStats(std::string ipAddress);
- /*
- * IP Address-specific statistics
- */
- ip_stats getStatsForIP(std::string ipAddress);
- private:
- /*
- * Data fields
- */
- Tins::Timestamp timestamp_firstPacket;
- Tins::Timestamp timestamp_lastPacket;
- float sumPacketSize = 0;
- int packetCount = 0;
- /*
- * Data containers
- */
- // {IP Address, TTL value, count}
- std::unordered_map<ipAddress_ttl, int> ttl_distribution;
- // Aidmar
- // {IP Address, MSS value, count}
- std::unordered_map<ipAddress_mss, int> mss_distribution;
- // {IP Address, Win size, count}
- std::unordered_map<ipAddress_win, int> win_distribution;
- // {IP Address A, Port A, IP Address B, Port B, #packets_A_B, #packets_B_A}
- std::unordered_map<conv, entry_convStat> conv_statistics;
- std::unordered_map<std::string, entry_intervalStat> interval_statistics;
-
- // {IP Address, Protocol, count}
- std::unordered_map<ipAddress_protocol, int> protocol_distribution;
- // {IP Address, #received packets, #sent packets, Data received in kbytes, Data sent in kbytes}
- std::unordered_map<std::string, entry_ipStat> ip_statistics;
- // {IP Address, in_out, Port Number, count}
- std::unordered_map<ipAddress_inOut_port, int> ip_ports;
- // {IP Address, MAC Address}
- std::unordered_map<std::string, std::string> ip_mac_mapping;
- // {IP Address, avg MSS}
- std::unordered_map<std::string, int> ip_sumMss;
- };
- #endif //CPP_PCAPREADER_STATISTICS_H
|