#!/usr/bin/python

##
## Copyright (c) 2020 Intel Corporation
##
## Licensed under the Apache License, Version 2.0 (the "License");
## you may not use this file except in compliance with the License.
## You may obtain a copy of the License at
##
##
##     http://www.apache.org/licenses/LICENSE-2.0
##
## Unless required by applicable law or agreed to in writing, software
## distributed under the License is distributed on an "AS IS" BASIS,
## WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
## See the License for the specific language governing permissions and
## limitations under the License.
##

import yaml
import requests
import time
import copy
from past.utils import old_div
from rapid_log import RapidLog
from rapid_log import bcolors
inf = float("inf")
from datetime import datetime as dt

class RapidTest(object):
    """
    Class to manage the testing
    """
    def __init__(self, test_param, runtime, testname, environment_file ):
        self.test = test_param
        self.test['runtime'] = runtime
        self.test['testname'] = testname
        self.test['environment_file'] = environment_file
        if 'maxr' not in self.test.keys():
            self.test['maxr'] = 1
        if 'maxz' not in self.test.keys():
            self.test['maxz'] = inf
        with open('format.yaml') as f:
            self.data_format = yaml.load(f, Loader=yaml.FullLoader)

    @staticmethod
    def get_percentageof10Gbps(pps_speed,size):
        # speed is given in pps, returning % of 10Gb/s
        # 12 bytes is the inter packet gap 
        # pre-amble is 7 bytes
        # SFD (start of frame delimiter) is 1 byte
        # Total of 20 bytes overhead per packet
        return (pps_speed / 1000000.0 * 0.08 * (size+20))

    @staticmethod
    def get_pps(speed,size):
        # speed is given in % of 10Gb/s, returning Mpps
        # 12 bytes is the inter packet gap 
        # pre-amble is 7 bytes
        # SFD (start of frame delimiter) is 1 byte
        # Total of 20 bytes overhead per packet
        return (speed * 100.0 / (8*(size+20)))

    @staticmethod
    def get_speed(packet_speed,size):
        # return speed in Gb/s
        # 12 bytes is the inter packet gap 
        # pre-amble is 7 bytes
        # SFD (start of frame delimiter) is 1 byte
        # Total of 20 bytes overhead per packet
        return (packet_speed / 1000.0 * (8*(size+20)))

    @staticmethod
    def set_background_flows(background_machines, number_of_flows):
        for machine in background_machines:
            _ = machine.set_flows(number_of_flows)

    @staticmethod
    def set_background_speed(background_machines, speed):
        for machine in background_machines:
            machine.set_generator_speed(speed)

    @staticmethod
    def set_background_size(background_machines, imix):
        # imixs is a list of packet sizes
        for machine in background_machines:
            machine.set_udp_packet_size(imix)

    @staticmethod
    def start_background_traffic(background_machines):
        for machine in background_machines:
            machine.start()

    @staticmethod
    def stop_background_traffic(background_machines):
        for machine in background_machines:
            machine.stop()

    @staticmethod
    def parse_data_format_dict(data_format, variables):
        for k, v in data_format.items():
            if type(v) is dict:
                RapidTest.parse_data_format_dict(v, variables)
            else:
                if v in variables.keys():
                    data_format[k] = variables[v]

    def record_start_time(self):
        self.start = dt.now().strftime('%Y-%m-%d %H:%M:%S')

    def record_stop_time(self):
        self.stop = dt.now().strftime('%Y-%m-%d %H:%M:%S')

    def post_data(self, test, variables):
        var = copy.deepcopy(self.data_format)
        self.parse_data_format_dict(var, variables)
        if 'URL' not in var.keys():
            return
        if test not in var.keys():
            return
        URL=''
        for value in var['URL'].values():
            URL = URL + value
        HEADERS = {'X-Requested-With': 'Python requests', 'Content-type': 'application/rapid'}
        if 'Format' in var.keys():
            if var['Format'] == 'PushGateway':
                data = "\n".join("{} {}".format(k, v) for k, v in var[test].items()) + "\n"
                response = requests.post(url=URL, data=data,headers=HEADERS)
            elif var['Format'] == 'Xtesting':
                data = var[test]
                response = requests.post(url=URL, json=data)
            else:
                return
        else:
            return
        if (response.status_code != 202) and (response.status_code != 200):
            RapidLog.info('Cannot send metrics to {}'.format(URL))
            RapidLog.info(data)


    @staticmethod
    def report_result(flow_number, size, speed, pps_req_tx, pps_tx, pps_sut_tx,
        pps_rx, lat_avg, lat_perc, lat_perc_max, lat_max, tx, rx, tot_drop,
        elapsed_time,speed_prefix='', lat_avg_prefix='', lat_perc_prefix='',
        lat_max_prefix='', abs_drop_rate_prefix='', drop_rate_prefix=''):
        if flow_number < 0:
            flow_number_str = '| ({:>4}) |'.format(abs(flow_number))
        else:
            flow_number_str = '|{:>7} |'.format(flow_number)
        if pps_req_tx is None:
            pps_req_tx_str = '{0: >14}'.format('   NA     |')
        else:
            pps_req_tx_str = '{:>7.3f} Mpps |'.format(pps_req_tx)
        if pps_tx is None:
            pps_tx_str = '{0: >14}'.format('   NA     |')
        else:
            pps_tx_str = '{:>7.3f} Mpps |'.format(pps_tx) 
        if pps_sut_tx is None:
            pps_sut_tx_str = '{0: >14}'.format('   NA     |')
        else:
            pps_sut_tx_str = '{:>7.3f} Mpps |'.format(pps_sut_tx)
        if pps_rx is None:
            pps_rx_str = '{0: >25}'.format('NA        |')
        else:
            pps_rx_str = bcolors.OKBLUE + '{:>4.1f} Gb/s |{:7.3f} Mpps {}|'.format(
                    RapidTest.get_speed(pps_rx,size),pps_rx,bcolors.ENDC)
        if tot_drop is None:
            tot_drop_str = ' |       NA  | '
        else:
            tot_drop_str = ' | {:>9.0f} | '.format(tot_drop)
        if lat_perc is None:
            lat_perc_str = ' |{:^10.10}|'.format('NA')
        elif lat_perc_max == True:
            lat_perc_str = '|>{}{:>5.0f} us{} |'.format(lat_perc_prefix,
                    float(lat_perc), bcolors.ENDC) 
        else:
            lat_perc_str = '| {}{:>5.0f} us{} |'.format(lat_perc_prefix,
                    float(lat_perc), bcolors.ENDC) 
        if elapsed_time is None:
            elapsed_time_str = ' NA |'
        else:
            elapsed_time_str = '{:>3.0f} |'.format(elapsed_time)
        return(flow_number_str + '{:>5.1f}'.format(speed) + '% ' + speed_prefix
                + '{:>6.3f}'.format(RapidTest.get_pps(speed,size)) + ' Mpps|' +
                pps_req_tx_str + pps_tx_str + bcolors.ENDC + pps_sut_tx_str +
                pps_rx_str + lat_avg_prefix + ' {:>6.0f}'.format(lat_avg) +
                ' us' + lat_perc_str +lat_max_prefix+'{:>6.0f}'.format(lat_max)
                + ' us | ' + '{:>9.0f}'.format(tx) + ' | {:>9.0f}'.format(rx) +
                ' | '+ abs_drop_rate_prefix+ '{:>9.0f}'.format(tx-rx) +
                tot_drop_str +drop_rate_prefix +
                '{:>5.2f}'.format(100*old_div(float(tx-rx),tx)) + bcolors.ENDC +
                ' |' + elapsed_time_str)
            
    def run_iteration(self, requested_duration, flow_number, size, speed):
        BUCKET_SIZE_EXP = self.gen_machine.bucket_size_exp
        LAT_PERCENTILE = self.test['lat_percentile']
        r = 0;
        sleep_time = 2
        while (r < self.test['maxr']):
            time.sleep(sleep_time)
            # Sleep_time is needed to be able to do accurate measurements to check for packet loss. We need to make this time large enough so that we do not take the first measurement while some packets from the previous tests migth still be in flight
            t1_rx, t1_non_dp_rx, t1_tx, t1_non_dp_tx, t1_drop, t1_tx_fail, t1_tsc, abs_tsc_hz = self.gen_machine.core_stats()
            t1_dp_rx = t1_rx - t1_non_dp_rx
            t1_dp_tx = t1_tx - t1_non_dp_tx
            self.gen_machine.set_generator_speed(0)
            self.gen_machine.start_gen_cores()
            if self.background_machines:
                self.set_background_speed(self.background_machines, 0)
                self.start_background_traffic(self.background_machines)
            if 'ramp_step' in self.test.keys():
                ramp_speed = self.test['ramp_step']
            else:
                ramp_speed = speed
            while ramp_speed < speed:
                self.gen_machine.set_generator_speed(ramp_speed)
                if self.background_machines:
                    self.set_background_speed(self.background_machines, ramp_speed)
                time.sleep(2)
                ramp_speed = ramp_speed + self.test['ramp_step']
            self.gen_machine.set_generator_speed(speed)
            if self.background_machines:
                self.set_background_speed(self.background_machines, speed)
            time.sleep(2) ## Needs to be 2 seconds since this 1 sec is the time that PROX uses to refresh the stats. Note that this can be changed in PROX!! Don't do it.
            start_bg_gen_stats = []
            for bg_gen_machine in self.background_machines:
                bg_rx, bg_non_dp_rx, bg_tx, bg_non_dp_tx, _, _, bg_tsc, _ = bg_gen_machine.core_stats()
                bg_gen_stat = {
                        "bg_dp_rx" : bg_rx - bg_non_dp_rx,
                        "bg_dp_tx" : bg_tx - bg_non_dp_tx,
                        "bg_tsc"   : bg_tsc
                        }
                start_bg_gen_stats.append(dict(bg_gen_stat))
            if self.sut_machine!= None:
                t2_sut_rx, t2_sut_non_dp_rx, t2_sut_tx, t2_sut_non_dp_tx, t2_sut_drop, t2_sut_tx_fail, t2_sut_tsc, sut_tsc_hz = self.sut_machine.core_stats()
            t2_rx, t2_non_dp_rx, t2_tx, t2_non_dp_tx, t2_drop, t2_tx_fail, t2_tsc, tsc_hz = self.gen_machine.core_stats()
            tx = t2_tx - t1_tx
            dp_tx =  tx - (t2_non_dp_tx - t1_non_dp_tx )
            dp_rx =  t2_rx - t1_rx - (t2_non_dp_rx - t1_non_dp_rx) 
            tot_dp_drop = dp_tx - dp_rx
            if tx == 0:
                RapidLog.critical("TX = 0. Test interrupted since no packet has been sent.")
            if dp_tx == 0:
                RapidLog.critical("Only non-dataplane packets (e.g. ARP) sent. Test interrupted since no packet has been sent.")
            # Ask PROX to calibrate the bucket size once we have a PROX function to do this.
            # Measure latency statistics per second
            lat_min, lat_max, lat_avg, used_avg, t2_lat_tsc, lat_hz, buckets = self.gen_machine.lat_stats()
            lat_samples = sum(buckets)
            sample_count = 0
            for sample_percentile, bucket in enumerate(buckets,start=1):
                sample_count += bucket
                if sample_count > (lat_samples * LAT_PERCENTILE):
                    break
            percentile_max = (sample_percentile == len(buckets))
            sample_percentile = sample_percentile *  float(2 ** BUCKET_SIZE_EXP) / (old_div(float(lat_hz),float(10**6)))
            if self.test['test'] == 'fixed_rate':
                RapidLog.info(self.report_result(flow_number,size,speed,None,None,None,None,lat_avg,sample_percentile,percentile_max,lat_max, dp_tx, dp_rx , None, None))
            tot_rx = tot_non_dp_rx = tot_tx = tot_non_dp_tx = tot_drop = 0
            lat_avg = used_avg = 0
            buckets_total = buckets
            tot_lat_samples = sum(buckets)
            tot_lat_measurement_duration = float(0)
            tot_core_measurement_duration = float(0)
            tot_sut_core_measurement_duration = float(0)
            tot_sut_rx = tot_sut_non_dp_rx = tot_sut_tx = tot_sut_non_dp_tx = tot_sut_drop = tot_sut_tx_fail = tot_sut_tsc = 0
            lat_avail = core_avail = sut_avail = False
            while (tot_core_measurement_duration - float(requested_duration) <= 0.1) or (tot_lat_measurement_duration - float(requested_duration) <= 0.1):
                time.sleep(0.5)
                lat_min_sample, lat_max_sample, lat_avg_sample, used_sample, t3_lat_tsc, lat_hz, buckets = self.gen_machine.lat_stats()
                # Get statistics after some execution time
                if t3_lat_tsc != t2_lat_tsc:
                    single_lat_measurement_duration = (t3_lat_tsc - t2_lat_tsc) * 1.0 / lat_hz  # time difference between the 2 measurements, expressed in seconds.
                    # A second has passed in between to lat_stats requests. Hence we need to process the results
                    tot_lat_measurement_duration = tot_lat_measurement_duration + single_lat_measurement_duration
                    if lat_min > lat_min_sample:
                        lat_min = lat_min_sample
                    if lat_max < lat_max_sample:
                        lat_max = lat_max_sample
                    lat_avg = lat_avg + lat_avg_sample * single_lat_measurement_duration # Sometimes, There is more than 1 second between 2 lat_stats. Hence we will take the latest measurement
                    used_avg = used_avg + used_sample * single_lat_measurement_duration  # and give it more weigth.
                    lat_samples = sum(buckets)
                    tot_lat_samples += lat_samples
                    sample_count = 0
                    for sample_percentile, bucket in enumerate(buckets,start=1):
                        sample_count += bucket
                        if sample_count > lat_samples * LAT_PERCENTILE:
                            break
                    percentile_max = (sample_percentile == len(buckets))
                    bucket_size = float(2 ** BUCKET_SIZE_EXP) / (old_div(float(lat_hz),float(10**6)))
                    sample_percentile = sample_percentile *  bucket_size
                    buckets_total = [buckets_total[i] + buckets[i] for i in range(len(buckets_total))]
                    t2_lat_tsc = t3_lat_tsc
                    lat_avail = True
                t3_rx, t3_non_dp_rx, t3_tx, t3_non_dp_tx, t3_drop, t3_tx_fail, t3_tsc, tsc_hz = self.gen_machine.core_stats()
                if t3_tsc != t2_tsc:
                    single_core_measurement_duration = (t3_tsc - t2_tsc) * 1.0 / tsc_hz  # time difference between the 2 measurements, expressed in seconds.
                    tot_core_measurement_duration = tot_core_measurement_duration + single_core_measurement_duration
                    delta_rx = t3_rx - t2_rx
                    tot_rx += delta_rx
                    delta_non_dp_rx = t3_non_dp_rx - t2_non_dp_rx
                    tot_non_dp_rx += delta_non_dp_rx
                    delta_tx = t3_tx - t2_tx
                    tot_tx += delta_tx
                    delta_non_dp_tx = t3_non_dp_tx - t2_non_dp_tx
                    tot_non_dp_tx += delta_non_dp_tx
                    delta_dp_tx = delta_tx -delta_non_dp_tx
                    delta_dp_rx = delta_rx -delta_non_dp_rx
                    delta_dp_drop = delta_dp_tx - delta_dp_rx
                    tot_dp_drop += delta_dp_drop
                    delta_drop = t3_drop - t2_drop
                    tot_drop += delta_drop
                    t2_rx, t2_non_dp_rx, t2_tx, t2_non_dp_tx, t2_drop, t2_tx_fail, t2_tsc = t3_rx, t3_non_dp_rx, t3_tx, t3_non_dp_tx, t3_drop, t3_tx_fail, t3_tsc
                    core_avail = True
                if self.sut_machine!=None:
                    t3_sut_rx, t3_sut_non_dp_rx, t3_sut_tx, t3_sut_non_dp_tx, t3_sut_drop, t3_sut_tx_fail, t3_sut_tsc, sut_tsc_hz = self.sut_machine.core_stats()
                    if t3_sut_tsc != t2_sut_tsc:
                        single_sut_core_measurement_duration = (t3_sut_tsc - t2_sut_tsc) * 1.0 / tsc_hz  # time difference between the 2 measurements, expressed in seconds.
                        tot_sut_core_measurement_duration = tot_sut_core_measurement_duration + single_sut_core_measurement_duration
                        tot_sut_rx += t3_sut_rx - t2_sut_rx
                        tot_sut_non_dp_rx += t3_sut_non_dp_rx - t2_sut_non_dp_rx
                        delta_sut_tx = t3_sut_tx - t2_sut_tx
                        tot_sut_tx += delta_sut_tx
                        delta_sut_non_dp_tx = t3_sut_non_dp_tx - t2_sut_non_dp_tx
                        tot_sut_non_dp_tx += delta_sut_non_dp_tx 
                        t2_sut_rx, t2_sut_non_dp_rx, t2_sut_tx, t2_sut_non_dp_tx, t2_sut_drop, t2_sut_tx_fail, t2_sut_tsc = t3_sut_rx, t3_sut_non_dp_rx, t3_sut_tx, t3_sut_non_dp_tx, t3_sut_drop, t3_sut_tx_fail, t3_sut_tsc
                        sut_avail = True
                if self.test['test'] == 'fixed_rate':
                    if lat_avail == core_avail == True:
                        lat_avail = core_avail = False
                        pps_req_tx = (delta_tx + delta_drop - delta_rx)/single_core_measurement_duration/1000000
                        pps_tx = delta_tx/single_core_measurement_duration/1000000
                        if self.sut_machine != None and sut_avail:
                            pps_sut_tx = delta_sut_tx/single_sut_core_measurement_duration/1000000
                            sut_avail = False
                        else:
                            pps_sut_tx = None
                        pps_rx = delta_rx/single_core_measurement_duration/1000000
                        RapidLog.info(self.report_result(flow_number, size,
                            speed, pps_req_tx, pps_tx, pps_sut_tx, pps_rx,
                            lat_avg_sample, sample_percentile, percentile_max,
                            lat_max_sample, delta_dp_tx, delta_dp_rx,
                            tot_dp_drop, single_core_measurement_duration))
                        variables = {
                                'Flows': flow_number,
                                'Size': size,
                                'RequestedSpeed': self.get_pps(speed,size),
                                'CoreGenerated': pps_req_tx,
                                'SentByNIC': pps_tx,
                                'FwdBySUT': pps_sut_tx,
                                'RevByCore': pps_rx,
                                'AvgLatency': lat_avg_sample,
                                'PCTLatency': sample_percentile,
                                'MaxLatency': lat_max_sample,
                                'PacketsSent': delta_dp_tx,
                                'PacketsReceived': delta_dp_rx,
                                'PacketsLost': tot_dp_drop,
                                'bucket_size': bucket_size,
                                'buckets': buckets}

                        self.post_data('rapid_flowsizetest', variables)
            end_bg_gen_stats = []
            for bg_gen_machine in self.background_machines:
                bg_rx, bg_non_dp_rx, bg_tx, bg_non_dp_tx, _, _, bg_tsc, bg_hz = bg_gen_machine.core_stats()
                bg_gen_stat = {"bg_dp_rx" : bg_rx - bg_non_dp_rx,
                        "bg_dp_tx" : bg_tx - bg_non_dp_tx,
                        "bg_tsc"   : bg_tsc,
                        "bg_hz"    : bg_hz
                        }
                end_bg_gen_stats.append(dict(bg_gen_stat))
            i = 0
            bg_rates =[]
            while i < len(end_bg_gen_stats):
                bg_rates.append(0.000001*(end_bg_gen_stats[i]['bg_dp_rx'] -
                    start_bg_gen_stats[i]['bg_dp_rx']) / ((end_bg_gen_stats[i]['bg_tsc'] -
                    start_bg_gen_stats[i]['bg_tsc']) * 1.0 / end_bg_gen_stats[i]['bg_hz']))
                i += 1
            if len(bg_rates):
                avg_bg_rate = sum(bg_rates) / len(bg_rates)
                RapidLog.debug('Average Background traffic rate: {:>7.3f} Mpps'.format(avg_bg_rate))
            else:
                avg_bg_rate = None
            #Stop generating
            self.gen_machine.stop_gen_cores()
            r += 1
            lat_avg = old_div(lat_avg, float(tot_lat_measurement_duration))
            used_avg = old_div(used_avg, float(tot_lat_measurement_duration))
            t4_tsc = t2_tsc
            while t4_tsc == t2_tsc:
                t4_rx, t4_non_dp_rx, t4_tx, t4_non_dp_tx, t4_drop, t4_tx_fail, t4_tsc, abs_tsc_hz = self.gen_machine.core_stats()
            if self.test['test'] == 'fixed_rate':
                t4_lat_tsc = t2_lat_tsc
                while t4_lat_tsc == t2_lat_tsc:
                    lat_min_sample, lat_max_sample, lat_avg_sample, used_sample, t4_lat_tsc, lat_hz, buckets = self.gen_machine.lat_stats()
                sample_count = 0
                lat_samples = sum(buckets)
                for percentile, bucket in enumerate(buckets,start=1):
                    sample_count += bucket
                    if sample_count > lat_samples * LAT_PERCENTILE:
                        break
                percentile_max = (percentile == len(buckets))
                percentile = percentile *  bucket_size
                lat_max = lat_max_sample
                lat_avg = lat_avg_sample
                delta_rx = t4_rx - t2_rx
                delta_non_dp_rx = t4_non_dp_rx - t2_non_dp_rx
                delta_tx = t4_tx - t2_tx
                delta_non_dp_tx = t4_non_dp_tx - t2_non_dp_tx
                delta_dp_tx = delta_tx -delta_non_dp_tx
                delta_dp_rx = delta_rx -delta_non_dp_rx
                dp_tx = delta_dp_tx
                dp_rx = delta_dp_rx
                tot_dp_drop += delta_dp_tx - delta_dp_rx
                pps_req_tx = None
                pps_tx = None
                pps_sut_tx = None
                pps_rx = None
                drop_rate = 100.0*(dp_tx-dp_rx)/dp_tx
                tot_core_measurement_duration = None
                break ## Not really needed since the while loop will stop when evaluating the value of r
            else:
                sample_count = 0
                buckets = buckets_total
                for percentile, bucket in enumerate(buckets_total,start=1):
                    sample_count += bucket
                    if sample_count > tot_lat_samples * LAT_PERCENTILE:
                        break
                percentile_max = (percentile == len(buckets_total))
                percentile = percentile *  bucket_size
                pps_req_tx = (tot_tx + tot_drop - tot_rx)/tot_core_measurement_duration/1000000.0 # tot_drop is all packets dropped by all tasks. This includes packets dropped at the generator task + packets dropped by the nop task. In steady state, this equals to the number of packets received by this VM
                pps_tx = tot_tx/tot_core_measurement_duration/1000000.0 # tot_tx is all generated packets actually accepted by the interface
                pps_rx = tot_rx/tot_core_measurement_duration/1000000.0 # tot_rx is all packets received by the nop task = all packets received in the gen VM
                if self.sut_machine != None and sut_avail:
                    pps_sut_tx = tot_sut_tx / tot_sut_core_measurement_duration / 1000000.0
                else:
                    pps_sut_tx = None
                dp_tx = (t4_tx - t1_tx) - (t4_non_dp_tx - t1_non_dp_tx)
                dp_rx = (t4_rx - t1_rx) - (t4_non_dp_rx - t1_non_dp_rx)
                tot_dp_drop = dp_tx - dp_rx
                drop_rate = 100.0*tot_dp_drop/dp_tx
                if ((drop_rate < self.test['drop_rate_threshold']) or (tot_dp_drop == self.test['drop_rate_threshold'] ==0) or (tot_dp_drop > self.test['maxz'])):
                    break
        return(pps_req_tx,pps_tx,pps_sut_tx,pps_rx,lat_avg,percentile,percentile_max,lat_max,dp_tx,dp_rx,tot_dp_drop,(t4_tx_fail - t1_tx_fail),drop_rate,lat_min,used_avg,r,tot_core_measurement_duration,avg_bg_rate,bucket_size,buckets)