package edu.uci.iotproject;
-import edu.uci.iotproject.analysis.PcapPacketPair;
+import static edu.uci.iotproject.analysis.UserAction.Type;
+
import edu.uci.iotproject.analysis.TcpConversationUtils;
+import edu.uci.iotproject.analysis.TrafficLabeler;
import edu.uci.iotproject.analysis.TriggerTrafficExtractor;
+import edu.uci.iotproject.analysis.UserAction;
import edu.uci.iotproject.io.TriggerTimesFileReader;
import org.pcap4j.core.*;
import org.pcap4j.packet.namednumber.DataLinkType;
import java.io.EOFException;
import java.net.UnknownHostException;
import java.time.Instant;
-import java.util.ArrayList;
-import java.util.Collections;
-import java.util.List;
+import java.util.*;
import java.util.concurrent.TimeoutException;
/**
public static void main(String[] args) throws PcapNativeException, NotOpenException, EOFException, TimeoutException, UnknownHostException {
// -------------------------------------------------------------------------------------------------------------
- // Example/debug code for searching for a pattern at the MAC layer.
-// String fileName = "./pcap/mac-tplink.local.pcapng";
-// PcapHandle handle;
-// try {
-// handle = Pcaps.openOffline(fileName, PcapHandle.TimestampPrecision.NANO);
-// } catch (PcapNativeException pne) {
-// handle = Pcaps.openOffline(fileName);
-// }
-// Arrays.asList(1590, 1590, 1590, 1001, 337, 197, 636, 1311, 177) // Full pattern (all non-zero payload packets).
-// MacLayerFlowPattern pattern = new MacLayerFlowPattern("TP_LINK_LOCAL_OFF_MAC", "50:c7:bf:33:1f:09", Arrays.asList(637, 1312));
-// MacLayerFlowPatternFinder finder = new MacLayerFlowPatternFinder(handle, pattern);
-// finder.findFlowPattern();
- // -------------------------------------------------------------------------------------------------------------
-//
-// //final String fileName = args.length > 0 ? args[0] : "/home/rtrimana/pcap_processing/smart_home_traffic/Code/Projects/SmartPlugDetector/pcap/wlan1.local.dns.pcap";
-// final String fileName = args.length > 0 ? args[0] : "/scratch/June-2018/TPLink/wlan1/tplink.wlan1.local.pcap";
-// //final String fileName = args.length > 0 ? args[0] : "/scratch/June-2018/DLink/wlan1/dlink.wlan1.local.pcap";
-// final String trainingFileName = "./pcap/TP_LINK_LOCAL_ON_SUBSET.pcap";
-//// final String trainingFileName = "./pcap/TP_LINK_LOCAL_ON.pcap";
-////
-//// // ====== Debug code ======
-// PcapHandle handle;
-// PcapHandle trainingPcap;
-// try {
-// handle = Pcaps.openOffline(fileName, PcapHandle.TimestampPrecision.NANO);
-// trainingPcap = Pcaps.openOffline(trainingFileName, PcapHandle.TimestampPrecision.NANO);
-// } catch (PcapNativeException pne) {
-// handle = Pcaps.openOffline(fileName);
-// trainingPcap = Pcaps.openOffline(trainingFileName);
-// }
-////
-//// // TODO: The followings are the way to extract multiple hostnames and their associated packet lengths lists
-//// //List<String> list = new ArrayList<>();
-//// //list.add("events.tplinkra.com");
-//// //FlowPattern fp = new FlowPattern("TP_LINK_LOCAL_ON", list, trainingPcap);
-//// //List<String> list2 = new ArrayList<>();
-//// //list2.add("devs.tplinkcloud.com");
-//// //list2.add("events.tplinkra.com");
-//// //FlowPattern fp3 = new FlowPattern("TP_LINK_REMOTE_ON", list2, trainingPcap);
-////
-// FlowPattern fp = new FlowPattern("TP_LINK_LOCAL_ON", "events.tplinkra.com", trainingPcap);
-// //FlowPattern fp = new FlowPattern("DLINK_LOCAL_ON", "rfe-us-west-1.dch.dlink.com", trainingPcap);
-// FlowPatternFinder fpf = new FlowPatternFinder(handle, fp);
-// fpf.start();
-////
-//// // ========================
-
- /*
- PcapReader pcapReader = new PcapReader(args[0]);
- PcapProcessingPipeline pipeline = new PcapProcessingPipeline(pcapReader);
- TcpReassembler tcpReassembler = new TcpReassembler();
- pipeline.addPcapPacketConsumer(tcpReassembler);
- pipeline.executePipeline();
- System.out.println("Pipeline terminated");
+ // ------------ # Code for extracting traffic generated by a device within x seconds of a trigger # ------------
+ // Paths to input and output files (consider supplying these as arguments instead) and IP of the device for
+ // which traffic is to be extracted:
+ String path = "/scratch/July-2018"; // Rahmadi
+ //String path = "/Users/varmarken/temp/UCI IoT Project/experiments"; // Janus
- List<List<PcapPacketPair>> pairs = new ArrayList<>();
- for (Conversation c : tcpReassembler.getTcpConversations()) {
- pairs.add(TcpConversationUtils.extractPacketPairs(c));
- }
- */
+ // D-Link July 26 experiment
+// final String inputPcapFile = path + "/2018-07/dlink/dlink.wlan1.local.pcap";
+// final String outputPcapFile = path + "/2018-07/dlink/dlink-processed.pcap";
+// final String triggerTimesFile = path + "/2018-07/dlink/dlink-july-26-2018.timestamps";
+// final String deviceIp = "192.168.1.246"; // .246 == phone; .199 == dlink plug?
- /*
- // -------- 07-17-2018 --------
- // Only consider packets to/from the TP-Link plug.
- PcapReader pcapReader = new PcapReader(args[0], "ip host 192.168.1.159");
- TcpReassembler tcpReassembler = new TcpReassembler();
- PcapPacket packet;
- while((packet = pcapReader.readNextPacket()) != null) {
- tcpReassembler.consumePacket(packet);
- }
- // Now we have a set of reassembled TCP conversations.
- List<Conversation> conversations = tcpReassembler.getTcpConversations();
- for(Conversation c : conversations) {
- List<PcapPacketPair> pairs = TcpConversationUtils.extractPacketPairs(c);
- for (PcapPacketPair pair : pairs) {
- // TODO ...
- // 1. discard packets that are not within X seconds after trigger time
- // 2. conversations may be (are) with different servers - so need to plot in different plots, one per hostname?
- }
- }
+ // TP-Link July 25 experiment
+ final String inputPcapFile = path + "/2018-07/tplink/tplink.wlan1.local.pcap";
+ final String outputPcapFile = path + "/2018-07/tplink/tplink-processed.pcap";
+ final String triggerTimesFile = path + "/2018-07/tplink/tplink-july-25-2018.timestamps";
+ final String deviceIp = "192.168.1.159";
+
+ // SmartThings Plug July 25 experiment
+// final String inputPcapFile = path + "/2018-07/stplug/stplug.wlan1.local.pcap";
+// final String outputPcapFile = path + "/2018-07/stplug/stplug-processed.pcap";
+// final String triggerTimesFile = path + "/2018-07/stplug/smartthings-july-25-2018.timestamps";
+// final String deviceIp = "192.168.1.246"; // .246 == phone; .142 == SmartThings Hub (note: use eth0 capture for this!)
+
+ // Wemo July 30 experiment
+// final String inputPcapFile = path + "/2018-07/wemo/wemo.wlan1.local.pcap";
+// final String outputPcapFile = path + "/2018-07/wemo/wemo-processed.pcap";
+// final String triggerTimesFile = path + "/2018-07/wemo/wemo-july-30-2018.timestamps";
+// final String deviceIp = "192.168.1.145";
+
+ // Wemo Insight July 31 experiment
+// final String inputPcapFile = path + "/2018-07/wemoinsight/wemoinsight.wlan1.local.pcap";
+// final String outputPcapFile = path + "/2018-07/wemoinsight/wemoinsight-processed.pcap";
+// final String triggerTimesFile = path + "/2018-07/wemoinsight/wemo-insight-july-31-2018.timestamps";
+// final String deviceIp = "192.168.1.135";
- // ----------------------------
- */
+ // TP-Link BULB August 1 experiment (NOTE: the trigger-times file below is named "aug-3"; confirm which date is correct)
+// final String inputPcapFile = path + "/2018-08/tplink-bulb/tplinkbulb.wlan1.local.pcap";
+// final String outputPcapFile = path + "/2018-08/tplink-bulb/tplinkbulb-processed.pcap";
+// final String triggerTimesFile = path + "/2018-08/tplink-bulb/tplink-bulb-aug-3-2018.timestamps";
+// final String deviceIp = "192.168.1.140";
- // -------- 07-19-2018 --------
TriggerTimesFileReader ttfr = new TriggerTimesFileReader();
- List<Instant> triggerTimes = ttfr.readTriggerTimes("/Users/varmarken/Downloads/tplink-feb-13-2018.timestamps", false);
-// triggerTimes.stream().forEach(i -> System.out.println(i.atZone(TriggerTimesFileReader.ZONE_ID_LOS_ANGELES).toString()));
- String pcapFile = "/Users/varmarken/Development/Repositories/UCI/NetworkingGroup/smart_home_traffic/Code/Projects/SmartPlugDetector/pcap/wlan1.local.dns.pcap";
- String tpLinkPlugIp = "192.168.1.159";
- TriggerTrafficExtractor tte = new TriggerTrafficExtractor(pcapFile, triggerTimes, tpLinkPlugIp);
- final PcapDumper outputter = Pcaps.openDead(DataLinkType.EN10MB, 65536).dumpOpen("/Users/varmarken/temp/traces/output/tplink-filtered.pcap");
+ List<Instant> triggerTimes = ttfr.readTriggerTimes(triggerTimesFile, false);
+ // Tag each trigger with "ON" or "OFF", assuming that the first trigger is an "ON" and that they alternate.
+ List<UserAction> userActions = new ArrayList<>();
+ for (int i = 0; i < triggerTimes.size(); i++) {
+ userActions.add(new UserAction(i % 2 == 0 ? Type.TOGGLE_ON : Type.TOGGLE_OFF, triggerTimes.get(i)));
+ }
+ TriggerTrafficExtractor tte = new TriggerTrafficExtractor(inputPcapFile, triggerTimes, deviceIp);
+ final PcapDumper outputter = Pcaps.openDead(DataLinkType.EN10MB, 65536).dumpOpen(outputPcapFile);
+ DnsMap dnsMap = new DnsMap();
TcpReassembler tcpReassembler = new TcpReassembler();
+ TrafficLabeler trafficLabeler = new TrafficLabeler(userActions);
tte.performExtraction(pkt -> {
try {
outputter.dump(pkt);
} catch (NotOpenException e) {
e.printStackTrace();
}
- }, tcpReassembler);
+ }, dnsMap, tcpReassembler, trafficLabeler);
outputter.flush();
outputter.close();
- int packets = 0;
- for (Conversation c : tcpReassembler.getTcpConversations()) {
- packets += c.getPackets().size();
- packets += c.getSynPackets().size();
- // only count the FIN packets, not the ACKs; every FinAckPair holds a FIN packet
- packets += c.getFinAckPairs().size();
- }
- // Produces 271 packets for the Feb 13 experiment
- // Applying filter: "(tcp and not tcp.len == 0 and not tcp.analysis.retransmission and not tcp.analysis.fast_retransmission) or (tcp.flags.syn == 1) or (tcp.flags.fin == 1)"
- // to the file gives 295 packets, but there are 24 TCP-Out-Of-Order SYN/SYNACKs which are filtered as retransmissions in Conversation, so the numbers seem to match.
- System.out.println("number of packets: " + packets);
-
- List<List<PcapPacketPair>> pairs = new ArrayList<>();
- for (Conversation c : tcpReassembler.getTcpConversations()) {
- pairs.add(TcpConversationUtils.extractPacketPairs(c));
+ if (tte.getPacketsIncludedCount() != trafficLabeler.getTotalPacketCount()) {
+ // Sanity/debug check
+ throw new AssertionError(String.format("mismatch between packet count in %s and %s",
+ TriggerTrafficExtractor.class.getSimpleName(), TrafficLabeler.class.getSimpleName()));
}
- // Sort pairs according to timestamp of first packet of conversation for (debugging) convenience.
- Collections.sort(pairs, (l1, l2) -> {
- if (l1.get(0).getFirst().getTimestamp().isBefore(l2.get(0).getFirst().getTimestamp())) return -1;
- else if (l2.get(0).getFirst().getTimestamp().isBefore(l1.get(0).getFirst().getTimestamp())) return 1;
- else return 0;
+
+ // Extract all conversations present in the filtered trace.
+ List<Conversation> allConversations = tcpReassembler.getTcpConversations();
+ // Group conversations by hostname.
+ Map<String, List<Conversation>> convsByHostname = TcpConversationUtils.groupConversationsByHostname(allConversations, dnsMap);
+ System.out.println("Grouped conversations by hostname.");
+ // For each hostname, count the frequencies of packet lengths exchanged with that hostname.
+ final Map<String, Map<Integer, Integer>> pktLenFreqsByHostname = new HashMap<>();
+ convsByHostname.forEach((host, convs) -> pktLenFreqsByHostname.put(host, TcpConversationUtils.countPacketLengthFrequencies(convs)));
+ System.out.println("Counted frequencies of packet lengths exchanged with each hostname.");
+ // For each hostname, count the frequencies of packet sequences (i.e., count how many conversations exchange a
+ // sequence of packets of some specific lengths).
+ final Map<String, Map<String, Integer>> pktSeqFreqsByHostname = new HashMap<>();
+ convsByHostname.forEach((host, convs) -> pktSeqFreqsByHostname.put(host, TcpConversationUtils.countPacketSequenceFrequencies(convs)));
+ System.out.println("Counted frequencies of packet sequences exchanged with each hostname.");
+ // For each hostname, count the frequencies of packet pairs exchanged with that hostname across all conversations.
+ final Map<String, Map<String, Integer>> pktPairFreqsByHostname =
+ TcpConversationUtils.countPacketPairFrequenciesByHostname(allConversations, dnsMap);
+ System.out.println("Counted frequencies of packet pairs per hostname");
+ // For each user action, reassemble the set of TCP connections occurring shortly after that action.
+ final Map<UserAction, List<Conversation>> userActionToConversations = trafficLabeler.getLabeledReassembledTcpTraffic();
+ final Map<UserAction, Map<String, List<Conversation>>> userActionsToConvsByHostname = trafficLabeler.getLabeledReassembledTcpTraffic(dnsMap);
+ System.out.println("Reassembled TCP conversations occurring shortly after each user event");
+
+
+
+ // Contains all ON events: hostname -> sequence identifier -> list of conversations with that sequence
+ Map<String, Map<String, List<Conversation>>> ons = new HashMap<>();
+ // Contains all OFF events: hostname -> sequence identifier -> list of conversations with that sequence
+ Map<String, Map<String, List<Conversation>>> offs = new HashMap<>();
+ userActionsToConvsByHostname.forEach((ua, hostnameToConvs) -> {
+ Map<String, Map<String, List<Conversation>>> outer = ua.getType() == Type.TOGGLE_ON ? ons : offs;
+ hostnameToConvs.forEach((host, convs) -> {
+ Map<String, List<Conversation>> seqsToConvs = TcpConversationUtils.
+ groupConversationsByPacketSequence(convs);
+ outer.merge(host, seqsToConvs, (oldMap, newMap) -> {
+ newMap.forEach((sequence, cs) -> oldMap.merge(sequence, cs, (list1, list2) -> {
+ list1.addAll(list2);
+ return list1;
+ }));
+ return oldMap;
+ });
+ });
});
- System.out.println("list of pairs produced");
- // ----------------------------
+
+ System.out.println("");
+
+ // -------------------------------------------------------------------------------------------------------------
+ // -------------------------------------------------------------------------------------------------------------
}
}
-// TP-Link MAC 50:c7:bf:33:1f:09 and usually IP 192.168.1.159 (remember to verify per file)
\ No newline at end of file
+// TP-Link MAC 50:c7:bf:33:1f:09 and usually IP 192.168.1.159 (remember to verify per file)
+// frame.len >= 556 && frame.len <= 558 && ip.addr == 192.168.1.159
\ No newline at end of file