netflow/netflow/v5.py

#!/usr/bin/env python3

"""
Netflow V5 collector and parser implementation in Python 3.
Created purely for fun. Not battled tested nor will it be.

Reference: https://www.cisco.com/c/en/us/td/docs/net_mgmt/netflow_collection_engine/3-6/user/guide/format.html
This script is specifically implemented in combination with softflowd. See https://github.com/djmdjm/softflowd
"""

import struct


class V5DataFlow:
    """Holds one v5 DataRecord
    """
    length = 48

    def __init__(self, data):
        self.data = {}
        self.data['IPV4_SRC_ADDR'] = struct.unpack('!I', data[:4])[0]
        self.data['IPV4_DST_ADDR'] = struct.unpack('!I', data[4:8])[0]
        self.data['NEXT_HOP'] = struct.unpack('!I', data[8:12])[0]
        self.data['INPUT'] = struct.unpack('!H', data[12:14])[0]
        self.data['OUTPUT'] = struct.unpack('!H', data[14:16])[0]
        self.data['IN_PACKETS'] = struct.unpack('!I', data[16:20])[0]
        self.data['IN_OCTETS'] = struct.unpack('!I', data[20:24])[0]
        self.data['FIRST_SWITCHED'] = struct.unpack('!I', data[24:28])[0]
        self.data['LAST_SWITCHED'] = struct.unpack('!I', data[28:32])[0]
        self.data['SRC_PORT'] = struct.unpack('!H', data[32:34])[0]
        self.data['DST_PORT'] = struct.unpack('!H', data[34:36])[0]
        # Byte 36 is used for padding
        self.data['TCP_FLAGS'] = struct.unpack('!B', data[37:38])[0]
        self.data['PROTO'] = struct.unpack('!B', data[38:39])[0]
        self.data['TOS'] = struct.unpack('!B', data[39:40])[0]
        self.data['SRC_AS'] = struct.unpack('!H', data[40:42])[0]
        self.data['DST_AS'] = struct.unpack('!H', data[42:44])[0]
        self.data['SRC_MASK'] = struct.unpack('!B', data[44:45])[0]
        self.data['DST_MASK'] = struct.unpack('!B', data[45:46])[0]
        # Word 46 is used for padding

    def __repr__(self):
        return "<DataRecord with data {}>".format(self.data)


class V5Header:
    """The header of the V5ExportPacket
    """
    length = 24

    def __init__(self, data):
        header = struct.unpack('!HHIIIIBBH', data[:self.length])
        self.version = header[0]
        self.count = header[1]
        self.uptime = header[2]
        self.timestamp = header[3]
        self.timestamp_nano = header[4]
        self.sequence = header[5]
        self.engine_type = header[6]
        self.engine_id = header[7]
        self.sampling_interval = header[8]


class V5ExportPacket:
    """The flow record holds the header and data flowsets.
    """
    def __init__(self, data):
        self.flows = []
        self.header = V5Header(data)

        offset = self.header.length
        for flow_count in range(0, self.header.count):
            flow = V5DataFlow(data[offset:])
            self.flows.append(flow)
            offset += flow.length

    def __repr__(self):
        return "<ExportPacket v{} with {} records>".format(
                self.header.version, self.header.count)
Add support for v1 and v5 NetFlow packets Thanks to @alieissa for the initial v1 and v5 code 2019-10-17 05:23:51 +02:00			`#!/usr/bin/env python3`

			`"""`
			`Netflow V5 collector and parser implementation in Python 3.`
			`Created purely for fun. Not battled tested nor will it be.`

			`Reference: https://www.cisco.com/c/en/us/td/docs/net_mgmt/netflow_collection_engine/3-6/user/guide/format.html`
Rename classes in v1, v5 and v9 according to version Until now, every NetFlow version file used similar names for their classes, e.g. "Header". These are now prefixed with their respective version, e.g. "V1Header", to avoid confusion in imports etc. 2020-03-29 19:49:57 +02:00			`This script is specifically implemented in combination with softflowd. See https://github.com/djmdjm/softflowd`
Add support for v1 and v5 NetFlow packets Thanks to @alieissa for the initial v1 and v5 code 2019-10-17 05:23:51 +02:00			`"""`

			`import struct`


Rename classes in v1, v5 and v9 according to version Until now, every NetFlow version file used similar names for their classes, e.g. "Header". These are now prefixed with their respective version, e.g. "V1Header", to avoid confusion in imports etc. 2020-03-29 19:49:57 +02:00			`class V5DataFlow:`
			`"""Holds one v5 DataRecord`
			`"""`
Add support for v1 and v5 NetFlow packets Thanks to @alieissa for the initial v1 and v5 code 2019-10-17 05:23:51 +02:00			`length = 48`

			`def __init__(self, data):`
			`self.data = {}`
			`self.data['IPV4_SRC_ADDR'] = struct.unpack('!I', data[:4])[0]`
			`self.data['IPV4_DST_ADDR'] = struct.unpack('!I', data[4:8])[0]`
			`self.data['NEXT_HOP'] = struct.unpack('!I', data[8:12])[0]`
			`self.data['INPUT'] = struct.unpack('!H', data[12:14])[0]`
			`self.data['OUTPUT'] = struct.unpack('!H', data[14:16])[0]`
			`self.data['IN_PACKETS'] = struct.unpack('!I', data[16:20])[0]`
			`self.data['IN_OCTETS'] = struct.unpack('!I', data[20:24])[0]`
			`self.data['FIRST_SWITCHED'] = struct.unpack('!I', data[24:28])[0]`
			`self.data['LAST_SWITCHED'] = struct.unpack('!I', data[28:32])[0]`
			`self.data['SRC_PORT'] = struct.unpack('!H', data[32:34])[0]`
			`self.data['DST_PORT'] = struct.unpack('!H', data[34:36])[0]`
			`# Byte 36 is used for padding`
			`self.data['TCP_FLAGS'] = struct.unpack('!B', data[37:38])[0]`
			`self.data['PROTO'] = struct.unpack('!B', data[38:39])[0]`
			`self.data['TOS'] = struct.unpack('!B', data[39:40])[0]`
			`self.data['SRC_AS'] = struct.unpack('!H', data[40:42])[0]`
			`self.data['DST_AS'] = struct.unpack('!H', data[42:44])[0]`
			`self.data['SRC_MASK'] = struct.unpack('!B', data[44:45])[0]`
			`self.data['DST_MASK'] = struct.unpack('!B', data[45:46])[0]`
			`# Word 46 is used for padding`

			`def __repr__(self):`
			`return "<DataRecord with data {}>".format(self.data)`


Rename classes in v1, v5 and v9 according to version Until now, every NetFlow version file used similar names for their classes, e.g. "Header". These are now prefixed with their respective version, e.g. "V1Header", to avoid confusion in imports etc. 2020-03-29 19:49:57 +02:00			`class V5Header:`
			`"""The header of the V5ExportPacket`
			`"""`
Add support for v1 and v5 NetFlow packets Thanks to @alieissa for the initial v1 and v5 code 2019-10-17 05:23:51 +02:00			`length = 24`

			`def __init__(self, data):`
			`header = struct.unpack('!HHIIIIBBH', data[:self.length])`
			`self.version = header[0]`
			`self.count = header[1]`
			`self.uptime = header[2]`
			`self.timestamp = header[3]`
			`self.timestamp_nano = header[4]`
			`self.sequence = header[5]`
			`self.engine_type = header[6]`
			`self.engine_id = header[7]`
			`self.sampling_interval = header[8]`


			`class V5ExportPacket:`
Rename classes in v1, v5 and v9 according to version Until now, every NetFlow version file used similar names for their classes, e.g. "Header". These are now prefixed with their respective version, e.g. "V1Header", to avoid confusion in imports etc. 2020-03-29 19:49:57 +02:00			`"""The flow record holds the header and data flowsets.`
			`"""`
Add support for v1 and v5 NetFlow packets Thanks to @alieissa for the initial v1 and v5 code 2019-10-17 05:23:51 +02:00			`def __init__(self, data):`
			`self.flows = []`
Rename classes in v1, v5 and v9 according to version Until now, every NetFlow version file used similar names for their classes, e.g. "Header". These are now prefixed with their respective version, e.g. "V1Header", to avoid confusion in imports etc. 2020-03-29 19:49:57 +02:00			`self.header = V5Header(data)`
Add support for v1 and v5 NetFlow packets Thanks to @alieissa for the initial v1 and v5 code 2019-10-17 05:23:51 +02:00
			`offset = self.header.length`
			`for flow_count in range(0, self.header.count):`
Rename classes in v1, v5 and v9 according to version Until now, every NetFlow version file used similar names for their classes, e.g. "Header". These are now prefixed with their respective version, e.g. "V1Header", to avoid confusion in imports etc. 2020-03-29 19:49:57 +02:00			`flow = V5DataFlow(data[offset:])`
Add support for v1 and v5 NetFlow packets Thanks to @alieissa for the initial v1 and v5 code 2019-10-17 05:23:51 +02:00			`self.flows.append(flow)`
			`offset += flow.length`

			`def __repr__(self):`
			`return "<ExportPacket v{} with {} records>".format(`
			`self.header.version, self.header.count)`