-
Notifications
You must be signed in to change notification settings - Fork 6
Expand file tree
/
Copy pathpcap-to-ngrams.py
More file actions
51 lines (44 loc) · 1.85 KB
/
Copy pathpcap-to-ngrams.py
File metadata and controls
51 lines (44 loc) · 1.85 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
#!/usr/bin/env python
'''
A simple script to convert pcap files to encoded ngrams
NOTE: The label given to an ngram depends on the filaname, use the process.py script to update filenames
'''
from __future__ import print_function, division
from p2flib import *
from f2nlib import *
import os
def loop_folder(folder_name, time_out, no_words):
'''
Function to loop over a folder and convert each pcap file to ngrams
'''
import glob
pcap_inputs = []
for pcap_file_name in glob.glob( os.path.join(folder_name, '*.pcap') ):
print("--> start to process pcap_file_nam: [%s]"%(pcap_file_name))
pcap2words(pcap_file_name, pcap_file_name.rsplit('.pcap')[0] + ".words", time_out)
words2ngram(pcap_file_name.rsplit('.pcap')[0] + ".words",
pcap_file_name.rsplit('.pcap')[0] + "ngram.csv", int(no_words))
if __name__ == "__main__":
import sys
import argparse
'''
Parse the command line arguments
'''
parser = argparse.ArgumentParser(description='convert txt file to flows')
parser.add_argument('-p', '--pcap', default=None,
help='specify the pcap file you want to process')
parser.add_argument('-f', '--folder', default=None,
help='specify the folder you want to loop through')
parser.add_argument('-t', '--time_out', default=10, type=float,
help='time out time')
parser.add_argument('-n', '--no_words', default=3,
help='specify the number of words in a n-gram')
args = parser.parse_args()
if args.pcap:
pcap2words(args.pcap, args.pcap.rsplit('.pcap')[0] + '.words', args.time_out)
words2ngram(args.pcap.rsplit('.pcap')[0] + ".words",
args.pcap.rsplit('.pcap')[0] + "ngram.csv", int(args.no_words))
elif args.folder:
loop_folder(args.folder, args.time_out, args.no_words)
else:
parser.print_help()