Database: Added SM-6.0 profile [Contribution from Massimiliano Fatica]
This commit is contained in:
@@ -1,73 +1,74 @@
|
||||
/*
|
||||
* Copyright (c) 2015, PHILIPPE TILLET. All rights reserved.
|
||||
*
|
||||
* This file is part of ISAAC.
|
||||
*
|
||||
* ISAAC is free software; you can redistribute it and/or
|
||||
* modify it under the terms of the GNU Lesser General Public
|
||||
* License as published by the Free Software Foundation; either
|
||||
* version 2.1 of the License, or (at your option) any later version.
|
||||
*
|
||||
* This library is distributed in the hope that it will be useful,
|
||||
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
||||
* Lesser General Public License for more details.
|
||||
*
|
||||
* You should have received a copy of the GNU Lesser General Public
|
||||
* License along with this library; if not, write to the Free Software
|
||||
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
|
||||
* MA 02110-1301 USA
|
||||
*/
|
||||
|
||||
#include "isaac/driver/device.h"
|
||||
#include "isaac/runtime/profiles.h"
|
||||
|
||||
//Default
|
||||
#include "database/unknown/unknown.hpp"
|
||||
|
||||
//Intel
|
||||
#include "database/intel/broadwell.hpp"
|
||||
|
||||
//NVidia
|
||||
#include "database/nvidia/sm_3_0.hpp"
|
||||
#include "database/nvidia/sm_5_2.hpp"
|
||||
#include "database/nvidia/sm_6_1.hpp"
|
||||
|
||||
//AMD
|
||||
#include "database/amd/gcn_3.hpp"
|
||||
|
||||
namespace isaac
|
||||
{
|
||||
namespace runtime
|
||||
{
|
||||
|
||||
#define DATABASE_ENTRY(TYPE, VENDOR, ARCHITECTURE, STRING) \
|
||||
{std::make_tuple(driver::Device::Type::TYPE, driver::Device::Vendor::VENDOR, driver::Device::Architecture::ARCHITECTURE), STRING}
|
||||
|
||||
const profiles::presets_type profiles::presets_ =
|
||||
{
|
||||
//DEFAULT
|
||||
DATABASE_ENTRY(UNKNOWN, UNKNOWN, UNKNOWN, database::unknown::unknown),
|
||||
//INTEL
|
||||
DATABASE_ENTRY(GPU, INTEL, BROADWELL, database::intel::broadwell),
|
||||
//NVIDIA
|
||||
DATABASE_ENTRY(GPU, NVIDIA, SM_2_0, database::nvidia::sm_3_0),
|
||||
DATABASE_ENTRY(GPU, NVIDIA, SM_2_1, database::nvidia::sm_3_0),
|
||||
DATABASE_ENTRY(GPU, NVIDIA, SM_3_0, database::nvidia::sm_3_0),
|
||||
DATABASE_ENTRY(GPU, NVIDIA, SM_3_5, database::nvidia::sm_3_0),
|
||||
DATABASE_ENTRY(GPU, NVIDIA, SM_3_7, database::nvidia::sm_3_0),
|
||||
DATABASE_ENTRY(GPU, NVIDIA, SM_5_0, database::nvidia::sm_5_2),
|
||||
DATABASE_ENTRY(GPU, NVIDIA, SM_5_2, database::nvidia::sm_5_2),
|
||||
DATABASE_ENTRY(GPU, NVIDIA, SM_6_0, database::nvidia::sm_6_1),
|
||||
DATABASE_ENTRY(GPU, NVIDIA, SM_6_1, database::nvidia::sm_6_1),
|
||||
//AMD
|
||||
DATABASE_ENTRY(GPU, AMD, GCN_1, database::amd::gcn_3),
|
||||
DATABASE_ENTRY(GPU, AMD, GCN_2, database::amd::gcn_3),
|
||||
DATABASE_ENTRY(GPU, AMD, GCN_3, database::amd::gcn_3),
|
||||
DATABASE_ENTRY(GPU, AMD, GCN_4, database::amd::gcn_3)
|
||||
};
|
||||
|
||||
#undef DATABASE_ENTRY
|
||||
|
||||
}
|
||||
}
|
||||
/*
|
||||
* Copyright (c) 2015, PHILIPPE TILLET. All rights reserved.
|
||||
*
|
||||
* This file is part of ISAAC.
|
||||
*
|
||||
* ISAAC is free software; you can redistribute it and/or
|
||||
* modify it under the terms of the GNU Lesser General Public
|
||||
* License as published by the Free Software Foundation; either
|
||||
* version 2.1 of the License, or (at your option) any later version.
|
||||
*
|
||||
* This library is distributed in the hope that it will be useful,
|
||||
* but WITHOUT ANY WARRANTY; without even the implied warranty of
|
||||
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
||||
* Lesser General Public License for more details.
|
||||
*
|
||||
* You should have received a copy of the GNU Lesser General Public
|
||||
* License along with this library; if not, write to the Free Software
|
||||
* Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston,
|
||||
* MA 02110-1301 USA
|
||||
*/
|
||||
|
||||
#include "isaac/driver/device.h"
|
||||
#include "isaac/runtime/profiles.h"
|
||||
|
||||
//Default
|
||||
#include "database/unknown/unknown.hpp"
|
||||
|
||||
//Intel
|
||||
#include "database/intel/broadwell.hpp"
|
||||
|
||||
//NVidia
|
||||
#include "database/nvidia/sm_3_0.hpp"
|
||||
#include "database/nvidia/sm_5_2.hpp"
|
||||
#include "database/nvidia/sm_6_0.hpp"
|
||||
#include "database/nvidia/sm_6_1.hpp"
|
||||
|
||||
//AMD
|
||||
#include "database/amd/gcn_3.hpp"
|
||||
|
||||
namespace isaac
|
||||
{
|
||||
namespace runtime
|
||||
{
|
||||
|
||||
#define DATABASE_ENTRY(TYPE, VENDOR, ARCHITECTURE, STRING) \
|
||||
{std::make_tuple(driver::Device::Type::TYPE, driver::Device::Vendor::VENDOR, driver::Device::Architecture::ARCHITECTURE), STRING}
|
||||
|
||||
const profiles::presets_type profiles::presets_ =
|
||||
{
|
||||
//DEFAULT
|
||||
DATABASE_ENTRY(UNKNOWN, UNKNOWN, UNKNOWN, database::unknown::unknown),
|
||||
//INTEL
|
||||
DATABASE_ENTRY(GPU, INTEL, BROADWELL, database::intel::broadwell),
|
||||
//NVIDIA
|
||||
DATABASE_ENTRY(GPU, NVIDIA, SM_2_0, database::nvidia::sm_3_0),
|
||||
DATABASE_ENTRY(GPU, NVIDIA, SM_2_1, database::nvidia::sm_3_0),
|
||||
DATABASE_ENTRY(GPU, NVIDIA, SM_3_0, database::nvidia::sm_3_0),
|
||||
DATABASE_ENTRY(GPU, NVIDIA, SM_3_5, database::nvidia::sm_3_0),
|
||||
DATABASE_ENTRY(GPU, NVIDIA, SM_3_7, database::nvidia::sm_3_0),
|
||||
DATABASE_ENTRY(GPU, NVIDIA, SM_5_0, database::nvidia::sm_5_2),
|
||||
DATABASE_ENTRY(GPU, NVIDIA, SM_5_2, database::nvidia::sm_5_2),
|
||||
DATABASE_ENTRY(GPU, NVIDIA, SM_6_0, database::nvidia::sm_6_0),
|
||||
DATABASE_ENTRY(GPU, NVIDIA, SM_6_1, database::nvidia::sm_6_1),
|
||||
//AMD
|
||||
DATABASE_ENTRY(GPU, AMD, GCN_1, database::amd::gcn_3),
|
||||
DATABASE_ENTRY(GPU, AMD, GCN_2, database::amd::gcn_3),
|
||||
DATABASE_ENTRY(GPU, AMD, GCN_3, database::amd::gcn_3),
|
||||
DATABASE_ENTRY(GPU, AMD, GCN_4, database::amd::gcn_3)
|
||||
};
|
||||
|
||||
#undef DATABASE_ENTRY
|
||||
|
||||
}
|
||||
}
|
||||
|
1
lib/runtime/database/nvidia/json/sm_6_0.json
Normal file
1
lib/runtime/database/nvidia/json/sm_6_0.json
Normal file
File diff suppressed because one or more lines are too long
59278
lib/runtime/database/nvidia/sm_6_0.hpp
Normal file
59278
lib/runtime/database/nvidia/sm_6_0.hpp
Normal file
File diff suppressed because it is too large
Load Diff
@@ -73,7 +73,7 @@ def main():
|
||||
libraries += ['gnustl_shared']
|
||||
|
||||
#Source files
|
||||
src = 'src/lib/runtime/predictors/random_forest.cpp src/lib/runtime/profiles.cpp src/lib/runtime/database.cpp src/lib/runtime/execute.cpp src/lib/exception/driver.cpp src/lib/exception/api.cpp src/lib/random/rand.cpp src/lib/jit/generation/elementwise_1d.cpp src/lib/jit/generation/reduce_2d.cpp src/lib/jit/generation/reduce_1d.cpp src/lib/jit/generation/base.cpp src/lib/jit/generation/gemm.cpp src/lib/jit/generation/engine/keywords.cpp src/lib/jit/generation/engine/stream.cpp src/lib/jit/generation/elementwise_2d.cpp src/lib/jit/syntax/expression/expression.cpp src/lib/jit/syntax/expression/preset.cpp src/lib/jit/syntax/expression/operations.cpp src/lib/jit/syntax/engine/binder.cpp src/lib/jit/syntax/engine/macro.cpp src/lib/jit/syntax/engine/process.cpp src/lib/jit/syntax/engine/object.cpp src/lib/value_scalar.cpp src/lib/array.cpp src/lib/api/blas/cublas.cpp src/lib/api/blas/clBLAS.cpp src/lib/driver/dispatch.cpp src/lib/driver/kernel.cpp src/lib/driver/backend.cpp src/lib/driver/platform.cpp src/lib/driver/buffer.cpp src/lib/driver/event.cpp src/lib/driver/ndrange.cpp src/lib/driver/device.cpp src/lib/driver/program_cache.cpp src/lib/driver/check.cpp src/lib/driver/command_queue.cpp src/lib/driver/handle.cpp src/lib/driver/context.cpp src/lib/driver/program.cpp '.split() + [os.path.join('src', 'bind', sf) for sf in ['_isaac.cpp', 'core.cpp', 'driver.cpp', 'kernels.cpp', 'exceptions.cpp']]
|
||||
src = 'src/lib/exception/api.cpp src/lib/exception/driver.cpp src/lib/value_scalar.cpp src/lib/random/rand.cpp src/lib/driver/check.cpp src/lib/driver/ndrange.cpp src/lib/driver/platform.cpp src/lib/driver/backend.cpp src/lib/driver/program.cpp src/lib/driver/command_queue.cpp src/lib/driver/event.cpp src/lib/driver/kernel.cpp src/lib/driver/handle.cpp src/lib/driver/device.cpp src/lib/driver/program_cache.cpp src/lib/driver/buffer.cpp src/lib/driver/context.cpp src/lib/driver/dispatch.cpp src/lib/jit/generation/engine/stream.cpp src/lib/jit/generation/engine/keywords.cpp src/lib/jit/generation/reduce_1d.cpp src/lib/jit/generation/elementwise_1d.cpp src/lib/jit/generation/base.cpp src/lib/jit/generation/elementwise_2d.cpp src/lib/jit/generation/reduce_2d.cpp src/lib/jit/generation/gemm.cpp src/lib/jit/syntax/engine/object.cpp src/lib/jit/syntax/engine/macro.cpp src/lib/jit/syntax/engine/process.cpp src/lib/jit/syntax/engine/binder.cpp src/lib/jit/syntax/expression/operations.cpp src/lib/jit/syntax/expression/expression.cpp src/lib/jit/syntax/expression/preset.cpp src/lib/api/blas/clBLAS.cpp src/lib/api/blas/cublas.cpp src/lib/runtime/execute.cpp src/lib/runtime/predictors/random_forest.cpp src/lib/runtime/profiles.cpp src/lib/runtime/database.cpp src/lib/array.cpp '.split() + [os.path.join('src', 'bind', sf) for sf in ['_isaac.cpp', 'core.cpp', 'driver.cpp', 'kernels.cpp', 'exceptions.cpp']]
|
||||
boostsrc = 'external/boost/libs/'
|
||||
for s in ['numpy','python','smart_ptr','system','thread']:
|
||||
src = src + [x for x in recursive_glob('external/boost/libs/' + s + '/src/','.cpp') if 'win32' not in x and 'pthread' not in x]
|
||||
|
Reference in New Issue
Block a user