123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307 |
- import java.util.ArrayList;
- import java.util.HashMap;
- import java.util.Iterator;
- import java.util.LinkedList;
- import java.util.Map.Entry;
- import de.tu_darmstadt.tk.SmartHomeNetworkSim.core.Link;
- import de.tu_darmstadt.tk.SmartHomeNetworkSim.core.Packet;
- import de.tu_darmstadt.tk.SmartHomeNetworkSim.core.PacketSniffer;
- import weka.clusterers.SimpleKMeans;
- import weka.core.Attribute;
- import weka.core.DenseInstance;
- import weka.core.Instance;
- import weka.core.Instances;
- public class UnsupervisedAnomalyDetectionExample implements PacketSniffer {
-
- private SimpleKMeans clusterer;
-
-
- private boolean training = true;
-
-
- private ArrayList<Attribute> atts = new ArrayList<Attribute>();
-
-
- private Instances dataset;
-
-
- private HashMap<Link, LinkedList<Packet>> lastPackets = new HashMap<Link, LinkedList<Packet>>();
-
-
- private int NUMBER_OF_CLUSTERS = 2;
-
-
- private int NUMBER_OF_PACKETS = 30;
-
-
- private HashMap<String,Integer> link_mappings = new HashMap<String, Integer>();
- private HashMap<String,Integer> source_mappings = new HashMap<String, Integer>();
-
- private HashMap<String,Integer> destination_mappings = new HashMap<String, Integer>();
-
- private HashMap<String,Integer> protocol_mappings = new HashMap<String, Integer>();
-
- public UnsupervisedAnomalyDetectionExample() {
-
- link_mappings.put("unknown", 0);
- atts.add(new Attribute("Link-Name", false));
- source_mappings.put("unknown", 0);
- atts.add(new Attribute("Source-Device", false));
- atts.add(new Attribute("Source-Port-number", false));
- destination_mappings.put("unknown", 0);
- atts.add(new Attribute("Destination-Device", false));
- atts.add(new Attribute("Destination-Port-number", false));
- protocol_mappings.put("unknown", 0);
- atts.add(new Attribute("Protocol-name", false));
- atts.add(new Attribute("Packets-per-second", false));
-
- dataset = new Instances("Packets", atts, 100000);
-
- clusterer = new SimpleKMeans();
- clusterer.setSeed(42);
- try {
- clusterer.setNumClusters(NUMBER_OF_CLUSTERS);
- } catch (Exception e) {
- System.out.println("Error while building cluster");
- e.printStackTrace();
- }
- }
-
- @Override
- public void processPackets(HashMap<Link, LinkedList<Packet>> packets) {
- if(training)
- try {
- training(packets);
- } catch (Exception e) {
- e.printStackTrace();
- }
- else
- classify(packets);
- }
-
- private double getEstimatedPacketsPerSecond(Link link, Packet packet) {
-
- LinkedList<Packet> list = lastPackets.get(link);
- if(list == null) {
-
- list = new LinkedList<Packet>();
- lastPackets.put(link, list);
- }
- if(list.isEmpty()) {
- list.addLast(packet);
-
- return 1.0;
- }
- if(list.size() == NUMBER_OF_PACKETS){
- list.removeFirst();
- }
- list.addLast(packet);
-
- long elapsed_time = packet.getTimestamp()-list.getFirst().getTimestamp()/list.size();
- if(elapsed_time<=0)
- return Double.POSITIVE_INFINITY;
-
- return 1000.0/elapsed_time;
-
- }
-
-
- private Instance packet2Instance(Link link, Packet packet, Instances dataset) {
-
- DenseInstance instance = new DenseInstance(dataset.numAttributes());
- instance.setDataset(dataset);
-
-
- instance.setValue(0, link == null ? 0 : stringToNumber(link_mappings, link.getName()));
-
-
- if(packet.getSource()==null) {
- instance.setValue(1, 0);
- instance.setValue(2, Double.NEGATIVE_INFINITY);
- }else if(packet.getSource().getOwner()==null){
- instance.setValue(1, 0);
- instance.setValue(2, packet.getSource().getPortNumber());
- }else {
- instance.setValue(1, stringToNumber(source_mappings, packet.getSource().getOwner().getName()));
- instance.setValue(2, packet.getSource().getPortNumber());
- }
-
-
- if(packet.getDestination()==null) {
- instance.setValue(3, 0);
- instance.setValue(4, Double.NEGATIVE_INFINITY);
- }else if(packet.getDestination().getOwner()==null){
- instance.setValue(3, 0);
- instance.setValue(4, packet.getDestination().getPortNumber());
- }else {
- instance.setValue(3, stringToNumber(destination_mappings, packet.getDestination().getOwner().getName()));
- instance.setValue(4, packet.getDestination().getPortNumber());
- }
-
-
- instance.setValue(5, stringToNumber(protocol_mappings, packet.getProtocolName()));
-
-
- instance.setValue(6, getEstimatedPacketsPerSecond(link, packet));
-
- return instance;
- }
-
-
- double stringToNumber(HashMap<String, Integer> map, String s) {
- Integer i = map.get(s);
- if(i == null) {
- int size = map.size();
- map.put(s, size);
- return size;
- }else {
- return i;
- }
- }
-
- private void training(HashMap<Link, LinkedList<Packet>> packets) {
- for (Iterator<Entry<Link, LinkedList<Packet>>> it = packets.entrySet().iterator(); it.hasNext();) {
- Entry<Link, LinkedList<Packet>> entry = it.next();
-
- Link l = entry.getKey();
- for (Iterator<Packet> itPacket = entry.getValue().iterator(); itPacket.hasNext();) {
-
- Packet packet = (Packet) itPacket.next();
- dataset.add(packet2Instance(l, packet, dataset));
- }
- }
- }
-
-
- private void finishDataCollection() throws Exception{
-
- clusterer.buildClusterer(dataset);
- }
-
-
- private void classify(HashMap<Link, LinkedList<Packet>> packets) {
- for (Iterator<Entry<Link, LinkedList<Packet>>> it = packets.entrySet().iterator(); it.hasNext();) {
-
- Entry<Link, LinkedList<Packet>> entry = it.next();
-
- Link l = entry.getKey();
- for (Iterator<Packet> itPacket = entry.getValue().iterator(); itPacket.hasNext();) {
-
- Packet packet = (Packet) itPacket.next();
-
- Instance packet_instance = packet2Instance(l, packet, dataset);
- try {
-
- clusterer.clusterInstance(packet_instance);
- } catch (Exception e) {
-
- System.out.println("Anomaly: "+packet.getTextualRepresentation());
-
- }
- }
- }
- }
-
-
- @Override
- public void setMode(boolean testing) {
- training = !testing;
- if(testing) {
-
- try {
- finishDataCollection();
- } catch (Exception e) {
- System.out.println("Clustering failed");
- e.printStackTrace();
- }
- }
- }
-
- @Override
- public boolean getMode() {
- return !training;
- }
- }
|