/*****************************************************************************
 *                                McPAT/CACTI
 *                      SOFTWARE LICENSE AGREEMENT
 *            Copyright 2012 Hewlett-Packard Development Company, L.P.
 *            Copyright (c) 2010-2013 Advanced Micro Devices, Inc.
 *                          All Rights Reserved
 *
 * Redistribution and use in source and binary forms, with or without
 * modification, are permitted provided that the following conditions are
 * met: redistributions of source code must retain the above copyright
 * notice, this list of conditions and the following disclaimer;
 * redistributions in binary form must reproduce the above copyright
 * notice, this list of conditions and the following disclaimer in the
 * documentation and/or other materials provided with the distribution;
 * neither the name of the copyright holders nor the names of its
 * contributors may be used to endorse or promote products derived from
 * this software without specific prior written permission.

 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
 *
 ***************************************************************************/

#include <pthread.h>

#include <algorithm>
#include <cmath>
#include <ctime>
#include <iostream>

#include "Ucache.h"
#include "area.h"
#include "basic_circuit.h"
#include "cacti_interface.h"
#include "component.h"
#include "const.h"
#include "parameter.h"

using namespace std;


bool mem_array::lt(const mem_array * m1, const mem_array * m2) {
    if (m1->Nspd < m2->Nspd) return true;
    else if (m1->Nspd > m2->Nspd) return false;
    else if (m1->Ndwl < m2->Ndwl) return true;
    else if (m1->Ndwl > m2->Ndwl) return false;
    else if (m1->Ndbl < m2->Ndbl) return true;
    else if (m1->Ndbl > m2->Ndbl) return false;
    else if (m1->deg_bl_muxing < m2->deg_bl_muxing) return true;
    else if (m1->deg_bl_muxing > m2->deg_bl_muxing) return false;
    else if (m1->Ndsam_lev_1 < m2->Ndsam_lev_1) return true;
    else if (m1->Ndsam_lev_1 > m2->Ndsam_lev_1) return false;
    else if (m1->Ndsam_lev_2 < m2->Ndsam_lev_2) return true;
    else return false;
}



void uca_org_t::find_delay() {
    mem_array * data_arr = data_array2;
    mem_array * tag_arr  = tag_array2;

    // check whether it is a regular cache or scratch ram
    if (g_ip->pure_ram || g_ip->pure_cam || g_ip->fully_assoc) {
        access_time = data_arr->access_time;
    }
    // Both tag and data lookup happen in parallel
    // and the entire set is sent over the data array h-tree without
    // waiting for the way-select signal --TODO add the corresponding
    // power overhead Nav
    else if (g_ip->fast_access == true) {
        access_time = MAX(tag_arr->access_time, data_arr->access_time);
    }
    // Tag is accessed first. On a hit, way-select signal along with the
    // address is sent to read/write the appropriate block in the data
    // array
    else if (g_ip->is_seq_acc == true) {
        access_time = tag_arr->access_time + data_arr->access_time;
    }
    // Normal access: tag array access and data array access happen in parallel.
    // But, the data array will wait for the way-select and transfer only the
    // appropriate block over the h-tree.
    else {
        access_time = MAX(tag_arr->access_time + data_arr->delay_senseamp_mux_decoder,
                          data_arr->delay_before_subarray_output_driver) +
                      data_arr->delay_from_subarray_output_driver_to_output;
    }
}



void uca_org_t::find_energy() {
    if (!(g_ip->pure_ram || g_ip->pure_cam || g_ip->fully_assoc))
        power = data_array2->power + tag_array2->power;
    else
        power = data_array2->power;
}



void uca_org_t::find_area() {
    if (g_ip->pure_ram || g_ip->pure_cam || g_ip->fully_assoc) {
        cache_ht  = data_array2->height;
        cache_len = data_array2->width;
    } else {
        cache_ht  = MAX(tag_array2->height, data_array2->height);
        cache_len = tag_array2->width + data_array2->width;
    }
    area = cache_ht * cache_len;
}

void uca_org_t::adjust_area() {
    double area_adjust;
    if (g_ip->pure_ram || g_ip->pure_cam || g_ip->fully_assoc) {
        if (data_array2->area_efficiency / 100.0 < 0.2) {
            //area_adjust = sqrt(area/(area*(data_array2->area_efficiency/100.0)/0.2));
            area_adjust = sqrt(0.2 / (data_array2->area_efficiency / 100.0));
            cache_ht  = cache_ht / area_adjust;
            cache_len = cache_len / area_adjust;
        }
    }
    area = cache_ht * cache_len;
}

void uca_org_t::find_cyc() {
    if ((g_ip->pure_ram || g_ip->pure_cam || g_ip->fully_assoc)) {
        cycle_time = data_array2->cycle_time;
    } else {
        cycle_time = MAX(tag_array2->cycle_time,
                         data_array2->cycle_time);
    }
}

uca_org_t :: uca_org_t()
        : tag_array2(0),
        data_array2(0) {

}

void uca_org_t :: cleanup() {
    if (data_array2 != 0)
        delete data_array2;
    if (tag_array2 != 0)
        delete tag_array2;
}