123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931 |
- #include <iostream>
- #include <fstream>
- #include <vector>
- #include <math.h>
- #include "statistics.h"
- #include <sstream>
- #include <SQLiteCpp/SQLiteCpp.h>
- #include "statistics_db.h"
- #include "statistics.h"
- #include "utilities.h"
- using namespace Tins;
- /**
- * Checks if there is a payload and increments payloads counter.
- * @param pdu_l4 The packet that should be checked if it has a payload or not.
- */
- void statistics::checkPayload(const PDU *pdu_l4) {
- if(this->getDoExtraTests()) {
- // pdu_l4: Tarnsport layer 4
- int pktSize = pdu_l4->size();
- int headerSize = pdu_l4->header_size(); // TCP/UDP header
- int payloadSize = pktSize - headerSize;
- if (payloadSize > 0)
- payloadCount++;
- }
- }
- /**
- * Checks the correctness of TCP checksum and increments counter if the checksum was incorrect.
- * @param ipAddressSender The source IP.
- * @param ipAddressReceiver The destination IP.
- * @param tcpPkt The packet to get checked.
- */
- void statistics::checkTCPChecksum(const std::string &ipAddressSender, const std::string &ipAddressReceiver, TCP tcpPkt) {
- if(this->getDoExtraTests()) {
- if(check_tcpChecksum(ipAddressSender, ipAddressReceiver, tcpPkt))
- correctTCPChecksumCount++;
- else incorrectTCPChecksumCount++;
- }
- }
- /**
- * Calculates entropy of the source and destination IPs in a time interval.
- * @param intervalStartTimestamp The timstamp where the interval starts.
- * @return a vector: contains source IP entropy and destination IP entropy.
- */
- std::vector<double> statistics::calculateLastIntervalIPsEntropy(std::chrono::microseconds intervalStartTimestamp){
- if(this->getDoExtraTests()) {
- // TODO: change datastructures
- std::vector<long> IPsSrcPktsCounts;
- std::vector<long> IPsDstPktsCounts;
- std::vector<long> IPsSrcNovelPktsCounts;
- std::vector<long> IPsDstNovelPktsCounts;
- std::vector<double> IPsSrcProb;
- std::vector<double> IPsDstProb;
- std::vector<double> IPsSrcNovelProb;
- std::vector<double> IPsDstNovelProb;
- long pktsSent = 0, pktsReceived = 0, novelPktsSent = 0, novelPktsReceived = 0;
- for (auto i = ip_statistics.begin(); i != ip_statistics.end(); i++) {
- long IPsSrcPktsCount = 0;
- long IPsSrcNovelPktsCount = 0;
- if (intervalCumIPStats.count(i->first) == 0) {
- IPsSrcPktsCount = i->second.pkts_sent;
- IPsSrcNovelPktsCount = i->second.pkts_sent;
- IPsSrcNovelPktsCounts.push_back(IPsSrcNovelPktsCount);
- novelPktsSent += IPsSrcNovelPktsCount;
- } else {
- IPsSrcPktsCount = i->second.pkts_sent-intervalCumIPStats[i->first].pkts_sent;
- }
- if(IPsSrcPktsCount != 0) {
- IPsSrcPktsCounts.push_back(IPsSrcPktsCount);
- pktsSent += IPsSrcPktsCount;
- }
- long IPsDstPktsCount = 0;
- long IPsDstNovelPktsCount = 0;
- if (intervalCumIPStats.count(i->first) == 0) {
- IPsDstPktsCount = i->second.pkts_received;
- IPsDstNovelPktsCount = i->second.pkts_received;
- IPsDstNovelPktsCounts.push_back(IPsDstNovelPktsCount);
- novelPktsReceived += IPsDstNovelPktsCount;
- } else {
- IPsDstPktsCount = i->second.pkts_received-intervalCumIPStats[i->first].pkts_received;
- }
- if(IPsDstPktsCount != 0) {
- IPsDstPktsCounts.push_back(IPsDstPktsCount);
- pktsReceived += IPsDstPktsCount;
- }
- }
- for (auto i = IPsSrcPktsCounts.begin(); i != IPsSrcPktsCounts.end(); i++) {
- IPsSrcProb.push_back(static_cast<double>(*i) / static_cast<double>(pktsSent));
- }
- for (auto i = IPsDstPktsCounts.begin(); i != IPsDstPktsCounts.end(); i++) {
- IPsDstProb.push_back(static_cast<double>(*i) / static_cast<double>(pktsReceived));
- }
- for (auto i = IPsSrcNovelPktsCounts.begin(); i != IPsSrcNovelPktsCounts.end(); i++) {
- IPsSrcNovelProb.push_back(static_cast<double>(*i) / static_cast<double>(novelPktsSent));
- }
- for (auto i = IPsDstNovelPktsCounts.begin(); i != IPsDstNovelPktsCounts.end(); i++) {
- IPsDstNovelProb.push_back(static_cast<double>(*i) / static_cast<double>(novelPktsReceived));
- }
- // Calculate IP source entropy
- double IPsSrcEntropy = 0;
- for (unsigned i = 0; i < IPsSrcProb.size(); i++) {
- if (IPsSrcProb[i] > 0)
- IPsSrcEntropy += -IPsSrcProb[i] * log2(IPsSrcProb[i]);
- }
- // Calculate IP destination entropy
- double IPsDstEntropy = 0;
- for (unsigned i = 0; i < IPsDstProb.size(); i++) {
- if (IPsDstProb[i] > 0)
- IPsDstEntropy += -IPsDstProb[i] * log2(IPsDstProb[i]);
- }
- // Calculate IP source novel entropy
- double IPsSrcNovelEntropy = 0;
- for (unsigned i = 0; i < IPsSrcNovelProb.size(); i++) {
- if (IPsSrcNovelProb[i] > 0)
- IPsSrcNovelEntropy += -IPsSrcNovelProb[i] * log2(IPsSrcNovelProb[i]);
- }
- // Calculate IP destination novel entropy
- double IPsDstNovelEntropy = 0;
- for (unsigned i = 0; i < IPsDstNovelProb.size(); i++) {
- if (IPsDstNovelProb[i] > 0)
- IPsDstNovelEntropy += -IPsDstNovelProb[i] * log2(IPsDstNovelProb[i]);
- }
- this->ip_src_novel_count = IPsSrcNovelPktsCounts.size();
- this->ip_dst_novel_count = IPsDstNovelPktsCounts.size();
- double norm_src_entropy = 0;
- if (IPsSrcPktsCounts.size() > 0 && log2(IPsSrcPktsCounts.size()) > 0) {
- norm_src_entropy = IPsSrcEntropy / log2(IPsSrcPktsCounts.size());
- }
- double norm_dst_entropy = 0;
- if (IPsDstPktsCounts.size() > 0 && log2(IPsDstPktsCounts.size()) > 0) {
- norm_dst_entropy = IPsDstEntropy / log2(IPsDstPktsCounts.size());
- }
- double norm_novel_src_entropy = 0;
- if (IPsSrcNovelPktsCounts.size() > 0 && log2(IPsSrcNovelPktsCounts.size()) > 0) {
- norm_novel_src_entropy = IPsSrcNovelEntropy / log2(IPsSrcNovelPktsCounts.size());
- }
- double norm_novel_dst_entropy = 0;
- if (IPsDstNovelPktsCounts.size() > 0 && log2(IPsDstNovelPktsCounts.size()) > 0) {
- norm_novel_dst_entropy = IPsDstNovelEntropy / log2(IPsDstNovelPktsCounts.size());
- }
- std::vector<double> entropies = {IPsSrcEntropy, IPsDstEntropy, IPsSrcNovelEntropy, IPsDstNovelEntropy, norm_src_entropy, norm_dst_entropy, norm_novel_src_entropy, norm_novel_dst_entropy};
- return entropies;
- }
- else {
- return {-1, -1, -1, -1, -1, -1, -1, -1};
- }
- }
- /**
- * Calculates the cumulative entropy of the source and destination IPs, i.e., the entropy for packets from the beginning of the pcap file.
- * @return a vector: contains the cumulative entropies of source and destination IPs
- */
- std::vector<double> statistics::calculateIPsCumEntropy(){
- if(this->getDoExtraTests()) {
- std::vector <std::string> IPs;
- std::vector <double> IPsSrcProb;
- std::vector <double> IPsDstProb;
- for (auto i = ip_statistics.begin(); i != ip_statistics.end(); i++) {
- IPs.push_back(i->first);
- IPsSrcProb.push_back(static_cast<double>(i->second.pkts_sent)/static_cast<double>(packetCount));
- IPsDstProb.push_back(static_cast<double>(i->second.pkts_received)/static_cast<double>(packetCount));
- }
- // Calculate IP source entropy
- double IPsSrcEntropy = 0;
- for(unsigned i=0; i < IPsSrcProb.size();i++){
- if (IPsSrcProb[i] > 0)
- IPsSrcEntropy += - IPsSrcProb[i]*log2(IPsSrcProb[i]);
- }
- // Calculate IP destination entropy
- double IPsDstEntropy = 0;
- for(unsigned i=0; i < IPsDstProb.size();i++){
- if (IPsDstProb[i] > 0)
- IPsDstEntropy += - IPsDstProb[i]*log2(IPsDstProb[i]);
- }
- double norm_src_entropy = 0;
- if (IPsSrcProb.size() > 0 && log2(IPsDstProb.size()) > 0) {
- norm_src_entropy = IPsSrcEntropy / log2(IPsSrcProb.size());
- }
- double norm_dst_entropy = 0;
- if (IPsDstProb.size() > 0 && log2(IPsDstProb.size()) > 0) {
- norm_dst_entropy = IPsDstEntropy / log2(IPsDstProb.size());
- }
- std::vector<double> entropies = {IPsSrcEntropy, IPsDstEntropy, norm_src_entropy, norm_dst_entropy};
- return entropies;
- }
- else {
- return {-1, -1, -1, -1};
- }
- }
- /**
- * Calculates sending packet rate for each IP in a time interval. Finds min and max packet rate and adds them to ip_statistics map.
- * @param intervalStartTimestamp The timstamp where the interval starts.
- */
- void statistics::calculateIPIntervalPacketRate(std::chrono::duration<int, std::micro> interval, std::chrono::microseconds intervalStartTimestamp){
- for (auto i = ip_statistics.begin(); i != ip_statistics.end(); i++) {
- int IPsSrcPktsCount = 0;
- for (auto j = i->second.pkts_sent_timestamp.begin(); j != i->second.pkts_sent_timestamp.end(); j++) {
- if(*j >= intervalStartTimestamp)
- IPsSrcPktsCount++;
- }
- float interval_pkt_rate = (float) IPsSrcPktsCount * 1000000 / interval.count(); // used 10^6 because interval in microseconds
- i->second.interval_pkt_rate.push_back(interval_pkt_rate);
- if(interval_pkt_rate > i->second.max_interval_pkt_rate || i->second.max_interval_pkt_rate == 0)
- i->second.max_interval_pkt_rate = interval_pkt_rate;
- if(interval_pkt_rate < i->second.min_interval_pkt_rate || i->second.min_interval_pkt_rate == 0)
- i->second.min_interval_pkt_rate = interval_pkt_rate;
- }
- }
- /**
- * Calculates the entropies for the count of integer values.
- * @param current map containing the values with counts
- * @param an old map containing the values with counts (from last iteration)
- * @return a vector containing the calculated entropies: entropy of all updated values, entropy of all novel values, normalized entropy of all, normalized entropy of novel
- */
- std::vector<double> statistics::calculateEntropies(std::unordered_map<int, int> &map, std::unordered_map<int, int> &old) {
- std::vector<double> counts;
- int count_total = 0;
- double entropy = 0.0;
- std::vector<double> novel_counts;
- int novel_count_total = 0;
- double novel_entropy = 0.0;
- // iterate over all values
- for (auto iter: map) {
- if (old.count(iter.first) == 0) {
- // count novel values
- double novel_count = static_cast<double>(iter.second);
- counts.push_back(novel_count);
- count_total += novel_count;
- novel_counts.push_back(novel_count);
- novel_count_total += novel_count;
- } else if (iter.second != old[iter.first]) {
- // count all increased values
- double count = static_cast<double>(iter.second-old[iter.first]);
- if (count != 0.0) {
- counts.push_back(count);
- count_total += count;
- }
- }
- }
- // calculate entropy
- for (auto count: counts) {
- double prob = count / static_cast<double>(count_total);
- entropy += -1 * prob * log2(prob);
- }
- // calculate novelty entropy
- for (auto novel_count: novel_counts) {
- double novel_prob = novel_count / static_cast<double>(novel_count_total);
- novel_entropy += -1 * novel_prob * log2(novel_prob);
- }
- double norm_entropy = 0;
- if (counts.size() > 0 && log2(counts.size()) > 0) {
- norm_entropy = entropy / log2(counts.size());
- }
- double norm_novel_entropy = 0;
- if (novel_counts.size() > 0 && log2(novel_counts.size()) > 0) {
- norm_novel_entropy = novel_entropy / log2(novel_counts.size());
- }
- return {entropy, novel_entropy, norm_entropy, norm_novel_entropy};
- }
- /**
- * Registers statistical data for a time interval.
- * @param intervalStartTimestamp The timstamp where the interval starts.
- * @param intervalEndTimestamp The timstamp where the interval ends.
- * @param previousPacketCount The total number of packets in last interval.
- */
- void statistics::addIntervalStat(std::chrono::duration<int, std::micro> interval, std::chrono::microseconds intervalStartTimestamp, std::chrono::microseconds intervalEndTimestamp){
- // Add packet rate for each IP to ip_statistics map
- calculateIPIntervalPacketRate(interval, intervalStartTimestamp);
-
- std::vector<double> ipEntopies = calculateLastIntervalIPsEntropy(intervalStartTimestamp);
- std::vector<double> ipCumEntopies = calculateIPsCumEntropy();
- std::string lastPktTimestamp_s = std::to_string(intervalEndTimestamp.count());
- std::string intervalStartTimestamp_s = std::to_string(intervalStartTimestamp.count());
- // The intervalStartTimestamp_s is the previous interval lastPktTimestamp_s
- // TODO: check with carlos if first and last packet timestamps are alright
- interval_statistics[lastPktTimestamp_s].start = std::to_string(intervalStartTimestamp.count());
- interval_statistics[lastPktTimestamp_s].end = std::to_string(intervalEndTimestamp.count());
- interval_statistics[lastPktTimestamp_s].pkts_count = packetCount - intervalCumPktCount;
- interval_statistics[lastPktTimestamp_s].pkt_rate = static_cast<float>(interval_statistics[lastPktTimestamp_s].pkts_count) / (static_cast<double>(interval.count()) / 1000000);
- interval_statistics[lastPktTimestamp_s].kbytes = static_cast<float>(sumPacketSize - intervalCumSumPktSize) / 1024;
- interval_statistics[lastPktTimestamp_s].kbyte_rate = interval_statistics[lastPktTimestamp_s].kbytes / (static_cast<double>(interval.count()) / 1000000);
- interval_statistics[lastPktTimestamp_s].payload_count = payloadCount - intervalPayloadCount;
- interval_statistics[lastPktTimestamp_s].incorrect_tcp_checksum_count = incorrectTCPChecksumCount - intervalIncorrectTCPChecksumCount;
- interval_statistics[lastPktTimestamp_s].correct_tcp_checksum_count = correctTCPChecksumCount - intervalCorrectTCPChecksumCount;
- interval_statistics[lastPktTimestamp_s].novel_ip_src_count = this->ip_src_novel_count;
- interval_statistics[lastPktTimestamp_s].novel_ip_dst_count = this->ip_dst_novel_count;
- interval_statistics[lastPktTimestamp_s].novel_ttl_count = static_cast<int>(ttl_values.size()) - intervalCumNovelTTLCount;
- interval_statistics[lastPktTimestamp_s].novel_win_size_count = static_cast<int>(win_values.size()) - intervalCumNovelWinSizeCount;
- interval_statistics[lastPktTimestamp_s].novel_tos_count = static_cast<int>(tos_values.size()) - intervalCumNovelToSCount;
- interval_statistics[lastPktTimestamp_s].novel_mss_count = static_cast<int>(mss_values.size()) - intervalCumNovelMSSCount;
- interval_statistics[lastPktTimestamp_s].novel_port_count = static_cast<int>(port_values.size()) - intervalCumNovelPortCount;
- interval_statistics[lastPktTimestamp_s].ttl_entropies = calculateEntropies(ttl_values, intervalCumTTLValues);
- interval_statistics[lastPktTimestamp_s].win_size_entropies = calculateEntropies(win_values, intervalCumWinSizeValues);
- interval_statistics[lastPktTimestamp_s].tos_entropies = calculateEntropies(tos_values, intervalCumTosValues);
- interval_statistics[lastPktTimestamp_s].mss_entropies = calculateEntropies(mss_values, intervalCumMSSValues);
- interval_statistics[lastPktTimestamp_s].port_entropies = calculateEntropies(port_values, intervalCumPortValues);
- intervalPayloadCount = payloadCount;
- intervalIncorrectTCPChecksumCount = incorrectTCPChecksumCount;
- intervalCorrectTCPChecksumCount = correctTCPChecksumCount;
- intervalCumPktCount = packetCount;
- intervalCumSumPktSize = sumPacketSize;
- intervalCumNovelIPCount = static_cast<int>(ip_statistics.size());
- intervalCumNovelTTLCount = static_cast<int>(ttl_values.size());
- intervalCumNovelWinSizeCount = static_cast<int>(win_values.size());
- intervalCumNovelToSCount =static_cast<int>(tos_values.size());
- intervalCumNovelMSSCount = static_cast<int>(mss_values.size());
- intervalCumNovelPortCount = static_cast<int>(port_values.size());
- intervalCumIPStats = ip_statistics;
- intervalCumTTLValues = ttl_values;
- intervalCumWinSizeValues = win_values;
- intervalCumTosValues = tos_values;
- intervalCumMSSValues = mss_values;
- intervalCumPortValues = port_values;
- interval_statistics[lastPktTimestamp_s].ip_entropies = ipEntopies;
- interval_statistics[lastPktTimestamp_s].ip_cum_entropies = ipCumEntopies;
- }
- /**
- * Registers statistical data for a sent packet in a given conversation (two IPs, two ports).
- * Increments the counter packets_A_B or packets_B_A.
- * Adds the timestamp of the packet in pkts_A_B_timestamp or pkts_B_A_timestamp.
- * @param ipAddressSender The sender IP address.
- * @param sport The source port.
- * @param ipAddressReceiver The receiver IP address.
- * @param dport The destination port.
- * @param timestamp The timestamp of the packet.
- */
- void statistics::addConvStat(const std::string &ipAddressSender,int sport,const std::string &ipAddressReceiver,int dport, std::chrono::microseconds timestamp, small_uint<12> flags){
- conv f1 = {ipAddressReceiver, dport, ipAddressSender, sport};
- conv f2 = {ipAddressSender, sport, ipAddressReceiver, dport};
- // if already exist A(ipAddressReceiver, dport), B(ipAddressSender, sport) conversation
- if (conv_statistics.count(f1)>0){
- conv_statistics[f1].pkts_count++;
- if(conv_statistics[f1].pkts_count<=3)
- conv_statistics[f1].interarrival_time.push_back(std::chrono::duration_cast<std::chrono::microseconds> (timestamp - conv_statistics[f1].pkts_timestamp.back()));
- conv_statistics[f1].pkts_timestamp.push_back(timestamp);
- conv_statistics[f1].tcp_types.push_back(flags);
- }
- // Add new conversation A(ipAddressSender, sport), B(ipAddressReceiver, dport)
- else{
- conv_statistics[f2].pkts_count++;
- if(conv_statistics[f2].pkts_timestamp.size()>0 && conv_statistics[f2].pkts_count<=3 )
- conv_statistics[f2].interarrival_time.push_back(std::chrono::duration_cast<std::chrono::microseconds> (timestamp - conv_statistics[f2].pkts_timestamp.back()));
- conv_statistics[f2].pkts_timestamp.push_back(timestamp);
- conv_statistics[f2].tcp_types.push_back(flags);
- }
- }
- /**
- * Registers statistical data for a sent packet in a given extended conversation (two IPs, two ports, protocol).
- * Increments the counter packets_A_B or packets_B_A.
- * Adds the timestamp of the packet in pkts_A_B_timestamp or pkts_B_A_timestamp.
- * Updates all other statistics of conv_statistics_extended
- * @param ipAddressSender The sender IP address.
- * @param sport The source port.
- * @param ipAddressReceiver The receiver IP address.
- * @param dport The destination port.
- * @param protocol The used protocol.
- * @param timestamp The timestamp of the packet.
- */
- void statistics::addConvStatExt(const std::string &ipAddressSender,int sport,const std::string &ipAddressReceiver,int dport,const std::string &protocol, std::chrono::microseconds timestamp){
- if(this->getDoExtraTests()) {
- convWithProt f1 = {ipAddressReceiver, dport, ipAddressSender, sport, protocol};
- convWithProt f2 = {ipAddressSender, sport, ipAddressReceiver, dport, protocol};
- convWithProt f;
- // if there already exists a communication interval for the specified conversation
- if (conv_statistics_extended.count(f1) > 0 || conv_statistics_extended.count(f2) > 0){
- // find out which direction of conversation is contained in conv_statistics_extended
- if (conv_statistics_extended.count(f1) > 0)
- f = f1;
- else
- f = f2;
- // increase pkts count and check on delay
- conv_statistics_extended[f].pkts_count++;
- if (conv_statistics_extended[f].pkts_timestamp.size()>0 && conv_statistics_extended[f].pkts_count<=3)
- conv_statistics_extended[f].interarrival_time.push_back(std::chrono::duration_cast<std::chrono::microseconds> (timestamp - conv_statistics_extended[f].pkts_timestamp.back()));
- conv_statistics_extended[f].pkts_timestamp.push_back(timestamp);
- // if the time difference has exceeded the threshold, create a new interval with this message
- if (timestamp - conv_statistics_extended[f].comm_intervals.back().end > (std::chrono::microseconds) ((unsigned long) COMM_INTERVAL_THRESHOLD)) { // > or >= ?
- commInterval new_interval = {timestamp, timestamp, 1};
- conv_statistics_extended[f].comm_intervals.push_back(new_interval);
- }
- // otherwise, set the time of the last interval message to the current timestamp and increase interval packet count by 1
- else{
- conv_statistics_extended[f].comm_intervals.back().end = timestamp;
- conv_statistics_extended[f].comm_intervals.back().pkts_count++;
- }
- }
- // if there does not exist a communication interval for the specified conversation
- else{
- // add initial interval entry for this conversation
- commInterval initial_interval = {timestamp, timestamp, 1};
- entry_convStatExt entry;
- entry.comm_intervals.push_back(initial_interval);
- entry.pkts_count = 1;
- entry.pkts_timestamp.push_back(timestamp);
- conv_statistics_extended[f2] = entry;
- }
- }
- }
- /**
- * Aggregate the collected information about all communication intervals within conv_statistics_extended of every conversation.
- * Do this by computing the average packet rate per interval and the average time between intervals.
- * Also compute average interval duration and total communication duration (i.e. last_msg.time - first_msg.time)
- */
- void statistics::createCommIntervalStats(){
- // iterate over all <convWithProt, entry_convStatExt> pairs
- for (auto &cur_elem : conv_statistics_extended) {
- entry_convStatExt &entry = cur_elem.second;
- std::vector<commInterval> &intervals = entry.comm_intervals;
- // if there is only one interval, the time between intervals cannot be computed and is therefore set to 0
- if (intervals.size() == 1){
- double interval_duration = (double) (intervals[0].end - intervals[0].start).count() / (double) 1e6;
- entry.avg_int_pkts_count = (double) intervals[0].pkts_count;
- entry.avg_time_between_ints = (double) 0;
- entry.avg_interval_time = interval_duration;
- }
- // If there is more than one interval, compute the specified averages
- else if (intervals.size() > 1){
- long summed_pkts_count = intervals[0].pkts_count;
- std::chrono::microseconds time_between_ints_sum = (std::chrono::microseconds) 0;
- std::chrono::microseconds summed_int_duration = intervals[0].end - intervals[0].start;
- for (std::size_t i = 1; i < intervals.size(); i++) {
- summed_pkts_count += intervals[i].pkts_count;
- summed_int_duration += intervals[i].end - intervals[i].start;
- time_between_ints_sum += intervals[i].start - intervals[i - 1].end;
- }
- entry.avg_int_pkts_count = summed_pkts_count / ((double) intervals.size());
- entry.avg_time_between_ints = (time_between_ints_sum.count() / (double) (intervals.size() - 1)) / (double) 1e6;
- entry.avg_interval_time = (summed_int_duration.count() / (double) intervals.size()) / (double) 1e6;
- }
- entry.total_comm_duration = (double) (entry.pkts_timestamp.back() - entry.pkts_timestamp.front()).count() / (double) 1e6;
- }
- }
- /**
- * Increments the packet counter for the given IP address and MSS value.
- * @param ipAddress The IP address whose MSS packet counter should be incremented.
- * @param mssValue The MSS value of the packet.
- */
- void statistics::incrementMSScount(const std::string &ipAddress, int mssValue) {
- mss_values[mssValue]++;
- mss_distribution[{ipAddress, mssValue}]++;
- }
- /**
- * Increments the packet counter for the given IP address and window size.
- * @param ipAddress The IP address whose window size packet counter should be incremented.
- * @param winSize The window size of the packet.
- */
- void statistics::incrementWinCount(const std::string &ipAddress, int winSize) {
- win_values[winSize]++;
- win_distribution[{ipAddress, winSize}]++;
- }
- /**
- * Increments the packet counter for the given IP address and TTL value.
- * @param ipAddress The IP address whose TTL packet counter should be incremented.
- * @param ttlValue The TTL value of the packet.
- */
- void statistics::incrementTTLcount(const std::string &ipAddress, int ttlValue) {
- ttl_values[ttlValue]++;
- ttl_distribution[{ipAddress, ttlValue}]++;
- }
- /**
- * Increments the packet counter for the given IP address and ToS value.
- * @param ipAddress The IP address whose ToS packet counter should be incremented.
- * @param tosValue The ToS value of the packet.
- */
- void statistics::incrementToScount(const std::string &ipAddress, int tosValue) {
- tos_values[tosValue]++;
- tos_distribution[{ipAddress, tosValue}]++;
- }
- /**
- * Increments the protocol counter for the given IP address and protocol.
- * @param ipAddress The IP address whose protocol packet counter should be incremented.
- * @param protocol The protocol of the packet.
- */
- void statistics::incrementProtocolCount(const std::string &ipAddress, const std::string &protocol) {
- protocol_distribution[{ipAddress, protocol}].count++;
- }
- /**
- * Returns the number of packets seen for the given IP address and protocol.
- * @param ipAddress The IP address whose packet count is wanted.
- * @param protocol The protocol whose packet count is wanted.
- */
- int statistics::getProtocolCount(const std::string &ipAddress, const std::string &protocol) {
- return protocol_distribution[{ipAddress, protocol}].count;
- }
- /**
- * Increases the byte counter for the given IP address and protocol.
- * @param ipAddress The IP address whose protocol byte counter should be increased.
- * @param protocol The protocol of the packet.
- * @param byteSent The packet's size.
- */
- void statistics::increaseProtocolByteCount(const std::string &ipAddress, const std::string &protocol, long bytesSent) {
- protocol_distribution[{ipAddress, protocol}].byteCount += bytesSent;
- }
- /**
- * Returns the number of bytes seen for the given IP address and protocol.
- * @param ipAddress The IP address whose byte count is wanted.
- * @param protocol The protocol whose byte count is wanted.
- * @return a float: The number of bytes
- */
- float statistics::getProtocolByteCount(const std::string &ipAddress, const std::string &protocol) {
- return protocol_distribution[{ipAddress, protocol}].byteCount;
- }
- /**
- * Increments the packet counter for
- * - the given sender IP address with outgoing port and
- * - the given receiver IP address with incoming port.
- * @param ipAddressSender The IP address of the packet sender.
- * @param outgoingPort The port used by the sender.
- * @param ipAddressReceiver The IP address of the packet receiver.
- * @param incomingPort The port used by the receiver.
- */
- void statistics::incrementPortCount(const std::string &ipAddressSender, int outgoingPort, const std::string &ipAddressReceiver,
- int incomingPort, const std::string &protocol) {
- port_values[outgoingPort]++;
- port_values[incomingPort]++;
- ip_ports[{ipAddressSender, "out", outgoingPort, protocol}].count++;
- ip_ports[{ipAddressReceiver, "in", incomingPort, protocol}].count++;
- }
- /**
- * Increases the packet byte counter for
- * - the given sender IP address with outgoing port and
- * - the given receiver IP address with incoming port.
- * @param ipAddressSender The IP address of the packet sender.
- * @param outgoingPort The port used by the sender.
- * @param ipAddressReceiver The IP address of the packet receiver.
- * @param incomingPort The port used by the receiver.
- * @param byteSent The packet's size.
- */
- void statistics::increasePortByteCount(const std::string &ipAddressSender, int outgoingPort, const std::string &ipAddressReceiver,
- int incomingPort, long bytesSent, const std::string &protocol) {
- ip_ports[{ipAddressSender, "out", outgoingPort, protocol}].byteCount += bytesSent;
- ip_ports[{ipAddressReceiver, "in", incomingPort, protocol}].byteCount += bytesSent;
- }
- /**
- * Increments the packet counter for
- * - the given sender MAC address and
- * - the given receiver MAC address.
- * @param srcMac The MAC address of the packet sender.
- * @param dstMac The MAC address of the packet receiver.
- * @param typeNumber The payload type number of the packet.
- */
- void statistics::incrementUnrecognizedPDUCount(const std::string &srcMac, const std::string &dstMac, uint32_t typeNumber,
- const std::string ×tamp) {
- unrecognized_PDUs[{srcMac, dstMac, typeNumber}].count++;
- unrecognized_PDUs[{srcMac, dstMac, typeNumber}].timestamp_last_occurrence = timestamp;
- }
- /**
- * Creates a new statistics object.
- */
- statistics::statistics(std::string resourcePath) {;
- this->resourcePath = resourcePath;
- }
- /**
- * Stores the assignment IP address -> MAC address.
- * @param ipAddress The IP address belonging to the given MAC address.
- * @param macAddress The MAC address belonging to the given IP address.
- */
- void statistics::assignMacAddress(const std::string &ipAddress, const std::string &macAddress) {
- ip_mac_mapping[ipAddress] = macAddress;
- }
- /**
- * Registers statistical data for a sent packet. Increments the counter packets_sent for the sender and
- * packets_received for the receiver. Adds the bytes as kbytes_sent (sender) and kybtes_received (receiver).
- * @param ipAddressSender The IP address of the packet sender.
- * @param ipAddressReceiver The IP address of the packet receiver.
- * @param bytesSent The packet's size.
- */
- void statistics::addIpStat_packetSent(const std::string &ipAddressSender, const std::string &ipAddressReceiver, long bytesSent, std::chrono::microseconds timestamp) {
- // Adding IP as a sender for first time
- if(ip_statistics[ipAddressSender].pkts_sent==0){
- // Add the IP class
- ip_statistics[ipAddressSender].ip_class = getIPv4Class(ipAddressSender);
- }
-
- // Adding IP as a receiver for first time
- if(ip_statistics[ipAddressReceiver].pkts_received==0){
- // Add the IP class
- ip_statistics[ipAddressReceiver].ip_class = getIPv4Class(ipAddressReceiver);
- }
- // Update stats for packet sender
- ip_statistics[ipAddressSender].kbytes_sent += (float(bytesSent) / 1024);
- ip_statistics[ipAddressSender].pkts_sent++;
- ip_statistics[ipAddressSender].pkts_sent_timestamp.push_back(timestamp);
-
- // Update stats for packet receiver
- ip_statistics[ipAddressReceiver].kbytes_received += (float(bytesSent) / 1024);
- ip_statistics[ipAddressReceiver].pkts_received++;
- ip_statistics[ipAddressReceiver].pkts_received_timestamp.push_back(timestamp);
- if(this->getDoExtraTests()) {
- // Increment Degrees for sender and receiver, if Sender sends its first packet to this receiver
- std::unordered_set<std::string>::const_iterator found_receiver = contacted_ips[ipAddressSender].find(ipAddressReceiver);
- if(found_receiver == contacted_ips[ipAddressSender].end()){
- // Receiver is NOT contained in the List of IPs, that the Sender has contacted, therefore this is the first packet in this direction
- ip_statistics[ipAddressSender].out_degree++;
- ip_statistics[ipAddressReceiver].in_degree++;
- // Increment overall_degree only if this is the first packet for the connection (both directions)
- // Therefore check, whether Receiver has contacted Sender before
- std::unordered_set<std::string>::const_iterator sender_contacted = contacted_ips[ipAddressReceiver].find(ipAddressSender);
- if(sender_contacted == contacted_ips[ipAddressReceiver].end()){
- ip_statistics[ipAddressSender].overall_degree++;
- ip_statistics[ipAddressReceiver].overall_degree++;
- }
- contacted_ips[ipAddressSender].insert(ipAddressReceiver);
- }
- }
- }
- /**
- * Setter for the timestamp_firstPacket field.
- * @param ts The timestamp of the first packet in the PCAP file.
- */
- void statistics::setTimestampFirstPacket(Tins::Timestamp ts) {
- timestamp_firstPacket = ts;
- }
- /**
- * Setter for the timestamp_lastPacket field.
- * @param ts The timestamp of the last packet in the PCAP file.
- */
- void statistics::setTimestampLastPacket(Tins::Timestamp ts) {
- timestamp_lastPacket = ts;
- }
- /**
- * Getter for the timestamp_firstPacket field.
- */
- Tins::Timestamp statistics::getTimestampFirstPacket() {
- return timestamp_firstPacket;
- }
- /**
- * Getter for the timestamp_lastPacket field.
- */
- Tins::Timestamp statistics::getTimestampLastPacket() {
- return timestamp_lastPacket;
- }
- /**
- * Getter for the packetCount field.
- */
- int statistics::getPacketCount() {
- return packetCount;
- }
- /**
- * Getter for the sumPacketSize field.
- */
- int statistics::getSumPacketSize() {
- return sumPacketSize;
- }
- /**
- * Returns the average packet size.
- * @return a float indicating the average packet size in kbytes.
- */
- float statistics::getAvgPacketSize() const {
- // AvgPktSize = (Sum of all packet sizes / #Packets)
- return (sumPacketSize / packetCount) / 1024;
- }
- /**
- * Adds the size of a packet (to be used to calculate the avg. packet size).
- * @param packetSize The size of the current packet in bytes.
- */
- void statistics::addPacketSize(uint32_t packetSize) {
- sumPacketSize += ((float) packetSize);
- }
- /**
- * Setter for the doExtraTests field.
- */
- void statistics::setDoExtraTests(bool var) {
- doExtraTests = var;
- }
- /**
- * Getter for the doExtraTests field.
- */
- bool statistics::getDoExtraTests() {
- return doExtraTests;
- }
- /**
- * Calculates the capture duration.
- * @return a formatted string HH:MM:SS.mmmmmm with
- * HH: hour, MM: minute, SS: second, mmmmmm: microseconds
- */
- std::string statistics::getCaptureDurationTimestamp() const {
- // Calculate duration
- timeval fp, lp, d;
- fp.tv_sec = timestamp_firstPacket.seconds();
- fp.tv_usec = timestamp_firstPacket.microseconds();
- lp.tv_sec = timestamp_lastPacket.seconds();
- lp.tv_usec = timestamp_lastPacket.microseconds();
- timersub(&lp, &fp, &d);
- long int hour = d.tv_sec / 3600;
- long int remainder = (d.tv_sec - hour * 3600);
- long int minute = remainder / 60;
- long int second = (remainder - minute * 60) % 60;
- long int microseconds = d.tv_usec;
- // Build desired output format: YYYY-mm-dd hh:mm:ss
- char out[64];
- sprintf(out, "%02ld:%02ld:%02ld.%06ld ", hour, minute, second, microseconds);
- return std::string(out);
- }
- /**
- * Calculates the capture duration.
- * @return a formatted string SS.mmmmmm with
- * S: seconds (UNIX time), mmmmmm: microseconds
- */
- float statistics::getCaptureDurationSeconds() const {
- timeval fp, lp, d;
- fp.tv_sec = timestamp_firstPacket.seconds();
- fp.tv_usec = timestamp_firstPacket.microseconds();
- lp.tv_sec = timestamp_lastPacket.seconds();
- lp.tv_usec = timestamp_lastPacket.microseconds();
- timersub(&lp, &fp, &d);
- char buf[64];
- snprintf(buf, sizeof(buf), "%u.%06u", static_cast<uint>(d.tv_sec), static_cast<uint>(d.tv_usec));
- return std::stof(std::string(buf));
- }
- /**
- * Creates a timestamp based on a time_t seconds (UNIX time format) and microseconds.
- * @param seconds
- * @param microseconds
- * @return a formatted string Y-m-d H:M:S.m with
- * Y: year, m: month, d: day, H: hour, M: minute, S: second, m: microseconds
- */
- std::string statistics::getFormattedTimestamp(time_t seconds, suseconds_t microseconds) const {
- timeval tv;
- tv.tv_sec = seconds;
- tv.tv_usec = microseconds;
- char tmbuf[20], buf[64];
- auto nowtm = gmtime(&(tv.tv_sec));
- strftime(tmbuf, sizeof(tmbuf), "%Y-%m-%d %H:%M:%S", nowtm);
- snprintf(buf, sizeof(buf), "%s.%06u", tmbuf, static_cast<uint>(tv.tv_usec));
- return std::string(buf);
- }
- /**
- * Calculates the statistics for a given IP address.
- * @param ipAddress The IP address whose statistics should be calculated.
- * @return a ip_stats struct containing statistical data derived by the statistical data collected.
- */
- ip_stats statistics::getStatsForIP(const std::string &ipAddress) {
- float duration = getCaptureDurationSeconds();
- entry_ipStat ipStatEntry = ip_statistics[ipAddress];
- ip_stats s;
- s.bandwidthKBitsIn = (ipStatEntry.kbytes_received / duration) * 8;
- s.bandwidthKBitsOut = (ipStatEntry.kbytes_sent / duration) * 8;
- s.packetPerSecondIn = (ipStatEntry.pkts_received / duration);
- s.packetPerSecondOut = (ipStatEntry.pkts_sent / duration);
- s.AvgPacketSizeSent = (ipStatEntry.kbytes_sent / ipStatEntry.pkts_sent);
- s.AvgPacketSizeRecv = (ipStatEntry.kbytes_received / ipStatEntry.pkts_received);
- return s;
- }
- int statistics::getDefaultInterval() {
- return this->default_interval;
- }
- void statistics::setDefaultInterval(int interval) {
- this->default_interval = interval;
- }
- /**
- * Increments the packet counter.
- */
- void statistics::incrementPacketCount() {
- packetCount++;
- }
- /**
- * Prints the statistics of the PCAP and IP specific statistics for the given IP address.
- * @param ipAddress The IP address whose statistics should be printed. Can be empty "" to print only general file statistics.
- */
- void statistics::printStats(const std::string &ipAddress) {
- std::stringstream ss;
- ss << std::endl;
- ss << "Capture duration: " << getCaptureDurationSeconds() << " seconds" << std::endl;
- ss << "Capture duration (HH:MM:SS.mmmmmm): " << getCaptureDurationTimestamp() << std::endl;
- ss << "#Packets: " << packetCount << std::endl;
- ss << std::endl;
- // Print IP address specific statistics only if IP address was given
- if (ipAddress != "") {
- entry_ipStat e = ip_statistics[ipAddress];
- ss << "\n----- STATS FOR IP ADDRESS [" << ipAddress << "] -------" << std::endl;
- ss << std::endl << "KBytes sent: " << e.kbytes_sent << std::endl;
- ss << "KBytes received: " << e.kbytes_received << std::endl;
- ss << "Packets sent: " << e.pkts_sent << std::endl;
- ss << "Packets received: " << e.pkts_received << "\n\n";
- ip_stats is = getStatsForIP(ipAddress);
- ss << "Bandwidth IN: " << is.bandwidthKBitsIn << " kbit/s" << std::endl;
- ss << "Bandwidth OUT: " << is.bandwidthKBitsOut << " kbit/s" << std::endl;
- ss << "Packets per second IN: " << is.packetPerSecondIn << std::endl;
- ss << "Packets per second OUT: " << is.packetPerSecondOut << std::endl;
- ss << "Avg Packet Size Sent: " << is.AvgPacketSizeSent << " kbytes" << std::endl;
- ss << "Avg Packet Size Received: " << is.AvgPacketSizeRecv << " kbytes" << std::endl;
- }
- std::cout << ss.str();
- }
- /**
- * Derives general PCAP file statistics from the collected statistical data and
- * writes all data into a SQLite database, located at database_path.
- * @param database_path The path of the SQLite database file ending with .sqlite3.
- */
- void statistics::writeToDatabase(std::string database_path, std::vector<std::chrono::duration<int, std::micro>> timeIntervals, bool del) {
- // Generate general file statistics
- float duration = getCaptureDurationSeconds();
- long sumPacketsSent = 0, senderCountIP = 0;
- float sumBandwidthIn = 0.0, sumBandwidthOut = 0.0;
- for (auto i = ip_statistics.begin(); i != ip_statistics.end(); i++) {
- sumPacketsSent += i->second.pkts_sent;
- // Consumed bandwith (bytes) for sending packets
- sumBandwidthIn += (i->second.kbytes_received / duration);
- sumBandwidthOut += (i->second.kbytes_sent / duration);
- senderCountIP++;
- }
- float avgPacketRate = (packetCount / duration);
- long avgPacketSize = getAvgPacketSize();
- if(senderCountIP>0) {
- long avgPacketsSentPerHost = (sumPacketsSent / senderCountIP);
- float avgBandwidthInKBits = (sumBandwidthIn / senderCountIP) * 8;
- float avgBandwidthOutInKBits = (sumBandwidthOut / senderCountIP) * 8;
- // Create database and write information
- statistics_db db(database_path, resourcePath);
- db.writeStatisticsFile(packetCount, getCaptureDurationSeconds(),
- getFormattedTimestamp(timestamp_firstPacket.seconds(), timestamp_firstPacket.microseconds()),
- getFormattedTimestamp(timestamp_lastPacket.seconds(), timestamp_lastPacket.microseconds()),
- avgPacketRate, avgPacketSize, avgPacketsSentPerHost, avgBandwidthInKBits,
- avgBandwidthOutInKBits, doExtraTests);
- db.writeStatisticsIP(ip_statistics);
- db.writeStatisticsTTL(ttl_distribution);
- db.writeStatisticsIpMac(ip_mac_mapping);
- db.writeStatisticsDegree(ip_statistics);
- db.writeStatisticsPorts(ip_ports);
- db.writeStatisticsProtocols(protocol_distribution);
- db.writeStatisticsMSS(mss_distribution);
- db.writeStatisticsToS(tos_distribution);
- db.writeStatisticsWin(win_distribution);
- db.writeStatisticsConv(conv_statistics);
- db.writeStatisticsConvExt(conv_statistics_extended);
- db.writeStatisticsInterval(interval_statistics, timeIntervals, del, this->default_interval, this->getDoExtraTests());
- db.writeDbVersion();
- db.writeStatisticsUnrecognizedPDUs(unrecognized_PDUs);
- }
- else {
- // Tinslib failed to recognize the types of the packets in the input PCAP
- std::cerr<<"ERROR: Statistics could not be collected from the input PCAP!"<<"\n";
- return;
- }
- }
- void statistics::writeIntervalsToDatabase(std::string database_path, std::vector<std::chrono::duration<int, std::micro>> timeIntervals, bool del) {
- statistics_db db(database_path, resourcePath);
- db.writeStatisticsInterval(interval_statistics, timeIntervals, del, this->default_interval, this->getDoExtraTests());
- }
|