diff --git a/.gitattributes b/.gitattributes new file mode 100644 index 0000000..1ff0c42 --- /dev/null +++ b/.gitattributes @@ -0,0 +1,63 @@ +############################################################################### +# Set default behavior to automatically normalize line endings. +############################################################################### +* text=auto + +############################################################################### +# Set default behavior for command prompt diff. +# +# This is need for earlier builds of msysgit that does not have it on by +# default for csharp files. +# Note: This is only used by command line +############################################################################### +#*.cs diff=csharp + +############################################################################### +# Set the merge driver for project and solution files +# +# Merging from the command prompt will add diff markers to the files if there +# are conflicts (Merging from VS is not affected by the settings below, in VS +# the diff markers are never inserted). Diff markers may cause the following +# file extensions to fail to load in VS. An alternative would be to treat +# these files as binary and thus will always conflict and require user +# intervention with every merge. To do so, just uncomment the entries below +############################################################################### +#*.sln merge=binary +#*.csproj merge=binary +#*.vbproj merge=binary +#*.vcxproj merge=binary +#*.vcproj merge=binary +#*.dbproj merge=binary +#*.fsproj merge=binary +#*.lsproj merge=binary +#*.wixproj merge=binary +#*.modelproj merge=binary +#*.sqlproj merge=binary +#*.wwaproj merge=binary + +############################################################################### +# behavior for image files +# +# image files are treated as binary by default. 
+############################################################################### +#*.jpg binary +#*.png binary +#*.gif binary + +############################################################################### +# diff behavior for common document formats +# +# Convert binary document formats to text before diffing them. This feature +# is only available from the command line. Turn it on by uncommenting the +# entries below. +############################################################################### +#*.doc diff=astextplain +#*.DOC diff=astextplain +#*.docx diff=astextplain +#*.DOCX diff=astextplain +#*.dot diff=astextplain +#*.DOT diff=astextplain +#*.pdf diff=astextplain +#*.PDF diff=astextplain +#*.rtf diff=astextplain +#*.RTF diff=astextplain diff --git a/Proj2_Win/CPUversion/CPUSum.cpp b/Proj2_Win/CPUversion/CPUSum.cpp new file mode 100644 index 0000000..cc52263 --- /dev/null +++ b/Proj2_Win/CPUversion/CPUSum.cpp @@ -0,0 +1,78 @@ +#include "stdafx.h" +#include "CPUSum.h" +#include + +CPUSum::CPUSum() +{ +} + + +CPUSum::~CPUSum() +{ +} + +void CPUSum::scan_inclusive(const int *in, int *out, long n) +{ + out[0] = in[0]; + for (long i = 1; i < n; i++) + { + out[i] = out[i - 1] + in[i]; + } +} + +void CPUSum::scan_exclusive(const int *in, int *out, long n) +{ + out[0] = 0; + for (long i = 1; i < n; i++) + { + out[i] = out[i - 1] + in[i-1]; + } +} + +void CPUSum::print(const int *a, long n) +{ + for (long i = 0; i < n; i++) + { + std::cout << a[i] << " "; + } + std::cout << std::endl; +} + +void CPUSum::transform_bool(const int *in, int *out, long n) +{ + for (long i = 0; i < n; i++) + { + if (in[i] > 0) + out[i] = 1; + else + { + out[i] = 0; + } + } +} + +void CPUSum::scatter(const int *in, int *out, const long len, long &newLength) +{ + int *temp = new int[len]; + int *temp2 = new int[len]; + transform_bool(in, temp, len); + scan_inclusive(temp, temp2, len); + newLength = temp2[len - 1]; + //out = new int[newLength]; + int pos = 0; + if (in[0] > 0) + { + 
out[pos++] = in[0]; + } + for (long i = 1; i < len; i++) + { + if (temp2[i] > temp2[i - 1]) + { + out[pos++] = in[i]; + } + } + delete[] temp; + delete[] temp2; + //print(out, newLength); + //delete[] out; +} \ No newline at end of file diff --git a/Proj2_Win/CPUversion/CPUSum.h b/Proj2_Win/CPUversion/CPUSum.h new file mode 100644 index 0000000..e531b2d --- /dev/null +++ b/Proj2_Win/CPUversion/CPUSum.h @@ -0,0 +1,13 @@ +#pragma once +class CPUSum +{ +public: + void scan_inclusive(const int *in, int *out,long n); + void scan_exclusive(const int*in, int *out, long n); + void transform_bool(const int *in, int *out, long n); + void print(const int *a, long n); + void scatter(const int *in, int *out, const long len, long &newLength); + CPUSum(); + ~CPUSum(); +}; + diff --git a/Proj2_Win/CPUversion/CPUversion.cpp b/Proj2_Win/CPUversion/CPUversion.cpp new file mode 100644 index 0000000..c6818a2 --- /dev/null +++ b/Proj2_Win/CPUversion/CPUversion.cpp @@ -0,0 +1,73 @@ +// CPUversion.cpp : Defines the entry point for the console application. 
+// + +#include "stdafx.h" +#include "CPUSum.h" +#include +#define TEST_TIMES 100 +#define LENGTH 100000 +void test(const int *in, int *out,int len){ + CPUSum CPUapp; + long newLen = len; + CPUapp.scatter(in, out, len, newLen); +} +void warmup() +{ + clock_t start, finish; + double duration; + const int len = 1000; + int newLen = len; + int *in = new int[len]; + int *out = new int[len]; + int *out1 = new int[len]; + //int in[] = { 0, 0, 3, 4, 0, 6, 6, 7, 0, 7, 1, 3, 3, 2, 0, 1 }; + for (size_t i = 0; i < len; i++) + { + in[i] = i + 1; + } + int count = 10000; + start = clock(); + while (count--) + { + test(in, out, len); + } + finish = clock(); + duration = finish - start; + //CPUapp.print(out1, newLen); + printf("warmup in %f ms\n", duration); + + delete[] out; + delete[] out1; +} +int _tmain(int argc, _TCHAR* argv[]) +{ + warmup(); + clock_t start, finish; + double duration; + const long len = LENGTH; + int newLen = len; + int *in = new int[len]; + int *out = new int[len]; + int *out1 = new int[len]; + //int in[] = { 0, 0, 3, 4, 0, 6, 6, 7, 0, 7, 1, 3, 3, 2, 0, 1 }; + for (long i = 0; i < len; i++) + { + in[i] = i + 1; + } + int count = TEST_TIMES; + start = clock(); + while (count--) + { + test(in, out, len); + } + finish = clock(); + duration = finish - start; + duration = duration / TEST_TIMES; + //CPUapp.print(out1, newLen); + printf("CPU Scattering finished in %f ms\n", duration); + + delete[] out; + delete[] out1; + return 0; +} + diff --git a/Proj2_Win/CPUversion/CPUversion.vcxproj b/Proj2_Win/CPUversion/CPUversion.vcxproj new file mode 100644 index 0000000..3a3e682 --- /dev/null +++ b/Proj2_Win/CPUversion/CPUversion.vcxproj @@ -0,0 +1,97 @@ + + + + + Debug + Win32 + + + Release + Win32 + + + + {5B128216-B420-4BD4-9765-C5A0040A3C05} + Win32Proj + CPUversion + + + + Application + true + v120 + Unicode + + + Application + false + v120 + true + Unicode + + + + + + + + + + + + + true + + + false + + + + Use + Level3 + Disabled + 
WIN32;_DEBUG;_CONSOLE;_LIB;%(PreprocessorDefinitions) + true + + + Console + true + + + + + Level3 + Use + MaxSpeed + true + true + WIN32;NDEBUG;_CONSOLE;_LIB;%(PreprocessorDefinitions) + true + + + Console + true + true + true + + + + + + + + + + + + + + + Create + Create + + + + + + \ No newline at end of file diff --git a/Proj2_Win/CPUversion/CPUversion.vcxproj.filters b/Proj2_Win/CPUversion/CPUversion.vcxproj.filters new file mode 100644 index 0000000..878b1f2 --- /dev/null +++ b/Proj2_Win/CPUversion/CPUversion.vcxproj.filters @@ -0,0 +1,42 @@ + + + + + {4FC737F1-C7A5-4376-A066-2A32D752A2FF} + cpp;c;cc;cxx;def;odl;idl;hpj;bat;asm;asmx + + + {93995380-89BD-4b04-88EB-625FBE52EBFB} + h;hh;hpp;hxx;hm;inl;inc;xsd + + + {67DA6AB6-F800-4c08-8B7A-83BB121AAD01} + rc;ico;cur;bmp;dlg;rc2;rct;bin;rgs;gif;jpg;jpeg;jpe;resx;tiff;tif;png;wav;mfcribbon-ms + + + + + + + + Header Files + + + Header Files + + + Header Files + + + + + Source Files + + + Source Files + + + Source Files + + + \ No newline at end of file diff --git a/Proj2_Win/CPUversion/Debug/CPUversion.Build.CppClean.log b/Proj2_Win/CPUversion/Debug/CPUversion.Build.CppClean.log new file mode 100644 index 0000000..ef16106 --- /dev/null +++ b/Proj2_Win/CPUversion/Debug/CPUversion.Build.CppClean.log @@ -0,0 +1,15 @@ +h:\documents\gpu programming\project2-streamcompaction\proj2_win\cpuversion\debug\cpuversion.pch +h:\documents\gpu programming\project2-streamcompaction\proj2_win\cpuversion\debug\vc120.pdb +h:\documents\gpu programming\project2-streamcompaction\proj2_win\cpuversion\debug\vc120.idb +h:\documents\gpu programming\project2-streamcompaction\proj2_win\cpuversion\debug\stdafx.obj +h:\documents\gpu programming\project2-streamcompaction\proj2_win\cpuversion\debug\cpusum.obj +h:\documents\gpu programming\project2-streamcompaction\proj2_win\cpuversion\debug\cpuversion.obj +h:\documents\gpu programming\project2-streamcompaction\proj2_win\debug\cpuversion.ilk +h:\documents\gpu 
programming\project2-streamcompaction\proj2_win\debug\cpuversion.exe +h:\documents\gpu programming\project2-streamcompaction\proj2_win\debug\cpuversion.pdb +h:\documents\gpu programming\project2-streamcompaction\proj2_win\cpuversion\debug\cpuversion.tlog\cl.command.1.tlog +h:\documents\gpu programming\project2-streamcompaction\proj2_win\cpuversion\debug\cpuversion.tlog\cl.read.1.tlog +h:\documents\gpu programming\project2-streamcompaction\proj2_win\cpuversion\debug\cpuversion.tlog\cl.write.1.tlog +h:\documents\gpu programming\project2-streamcompaction\proj2_win\cpuversion\debug\cpuversion.tlog\link.command.1.tlog +h:\documents\gpu programming\project2-streamcompaction\proj2_win\cpuversion\debug\cpuversion.tlog\link.read.1.tlog +h:\documents\gpu programming\project2-streamcompaction\proj2_win\cpuversion\debug\cpuversion.tlog\link.write.1.tlog diff --git a/Proj2_Win/CPUversion/Debug/CPUversion.log b/Proj2_Win/CPUversion/Debug/CPUversion.log new file mode 100644 index 0000000..ac44ea0 --- /dev/null +++ b/Proj2_Win/CPUversion/Debug/CPUversion.log @@ -0,0 +1,15 @@ +Build started 10/3/2014 10:53:44 PM. + 1>Project "H:\Documents\GPU Programming\Project2-StreamCompaction\Proj2_Win\CPUversion\CPUversion.vcxproj" on node 2 (Build target(s)). 
+ 1>ClCompile: + C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\bin\CL.exe /c /ZI /nologo /W3 /WX- /sdl /Od /Oy- /D WIN32 /D _DEBUG /D _CONSOLE /D _LIB /D _UNICODE /D UNICODE /Gm /EHsc /RTC1 /MDd /GS /fp:precise /Zc:wchar_t /Zc:forScope /Yu"stdafx.h" /Fp"Debug\CPUversion.pch" /Fo"Debug\\" /Fd"Debug\vc120.pdb" /Gd /TP /analyze- /errorReport:prompt CPUversion.cpp + CPUversion.cpp + Link: + C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\bin\link.exe /ERRORREPORT:PROMPT /OUT:"H:\Documents\GPU Programming\Project2-StreamCompaction\Proj2_Win\Debug\CPUversion.exe" /INCREMENTAL /NOLOGO kernel32.lib user32.lib gdi32.lib winspool.lib comdlg32.lib advapi32.lib shell32.lib ole32.lib oleaut32.lib uuid.lib odbc32.lib odbccp32.lib /MANIFEST /MANIFESTUAC:"level='asInvoker' uiAccess='false'" /manifest:embed /DEBUG /PDB:"H:\Documents\GPU Programming\Project2-StreamCompaction\Proj2_Win\Debug\CPUversion.pdb" /SUBSYSTEM:CONSOLE /TLBID:1 /DYNAMICBASE /NXCOMPAT /IMPLIB:"H:\Documents\GPU Programming\Project2-StreamCompaction\Proj2_Win\Debug\CPUversion.lib" /MACHINE:X86 Debug\CPUSum.obj + Debug\CPUversion.obj + Debug\stdafx.obj + CPUversion.vcxproj -> H:\Documents\GPU Programming\Project2-StreamCompaction\Proj2_Win\Debug\CPUversion.exe + 1>Done Building Project "H:\Documents\GPU Programming\Project2-StreamCompaction\Proj2_Win\CPUversion\CPUversion.vcxproj" (Build target(s)). + +Build succeeded. 
+ +Time Elapsed 00:00:00.24 diff --git a/Proj2_Win/CPUversion/Debug/CPUversion.tlog/CL.read.1.tlog b/Proj2_Win/CPUversion/Debug/CPUversion.tlog/CL.read.1.tlog new file mode 100644 index 0000000..e433463 Binary files /dev/null and b/Proj2_Win/CPUversion/Debug/CPUversion.tlog/CL.read.1.tlog differ diff --git a/Proj2_Win/CPUversion/Debug/CPUversion.tlog/CL.write.1.tlog b/Proj2_Win/CPUversion/Debug/CPUversion.tlog/CL.write.1.tlog new file mode 100644 index 0000000..b695643 Binary files /dev/null and b/Proj2_Win/CPUversion/Debug/CPUversion.tlog/CL.write.1.tlog differ diff --git a/Proj2_Win/CPUversion/Debug/CPUversion.tlog/CPUversion.lastbuildstate b/Proj2_Win/CPUversion/Debug/CPUversion.tlog/CPUversion.lastbuildstate new file mode 100644 index 0000000..1da190d --- /dev/null +++ b/Proj2_Win/CPUversion/Debug/CPUversion.tlog/CPUversion.lastbuildstate @@ -0,0 +1,2 @@ +#TargetFrameworkVersion=v4.0:PlatformToolSet=v120:EnableManagedIncrementalBuild=false:VCToolArchitecture=Native32Bit +Debug|Win32|H:\Documents\GPU Programming\Project2-StreamCompaction\Proj2_Win\| diff --git a/Proj2_Win/CPUversion/Debug/CPUversion.tlog/cl.command.1.tlog b/Proj2_Win/CPUversion/Debug/CPUversion.tlog/cl.command.1.tlog new file mode 100644 index 0000000..5888ee4 Binary files /dev/null and b/Proj2_Win/CPUversion/Debug/CPUversion.tlog/cl.command.1.tlog differ diff --git a/Proj2_Win/CPUversion/Debug/CPUversion.tlog/link.command.1.tlog b/Proj2_Win/CPUversion/Debug/CPUversion.tlog/link.command.1.tlog new file mode 100644 index 0000000..44d06b3 Binary files /dev/null and b/Proj2_Win/CPUversion/Debug/CPUversion.tlog/link.command.1.tlog differ diff --git a/Proj2_Win/CPUversion/Debug/CPUversion.tlog/link.read.1.tlog b/Proj2_Win/CPUversion/Debug/CPUversion.tlog/link.read.1.tlog new file mode 100644 index 0000000..f552a92 Binary files /dev/null and b/Proj2_Win/CPUversion/Debug/CPUversion.tlog/link.read.1.tlog differ diff --git a/Proj2_Win/CPUversion/Debug/CPUversion.tlog/link.write.1.tlog 
b/Proj2_Win/CPUversion/Debug/CPUversion.tlog/link.write.1.tlog new file mode 100644 index 0000000..9c35b3c Binary files /dev/null and b/Proj2_Win/CPUversion/Debug/CPUversion.tlog/link.write.1.tlog differ diff --git a/Proj2_Win/CPUversion/Debug/vc120.idb b/Proj2_Win/CPUversion/Debug/vc120.idb new file mode 100644 index 0000000..a7c681d Binary files /dev/null and b/Proj2_Win/CPUversion/Debug/vc120.idb differ diff --git a/Proj2_Win/CPUversion/Debug/vc120.pdb b/Proj2_Win/CPUversion/Debug/vc120.pdb new file mode 100644 index 0000000..63e056e Binary files /dev/null and b/Proj2_Win/CPUversion/Debug/vc120.pdb differ diff --git a/Proj2_Win/CPUversion/ReadMe.txt b/Proj2_Win/CPUversion/ReadMe.txt new file mode 100644 index 0000000..aa96268 --- /dev/null +++ b/Proj2_Win/CPUversion/ReadMe.txt @@ -0,0 +1,40 @@ +======================================================================== + CONSOLE APPLICATION : CPUversion Project Overview +======================================================================== + +AppWizard has created this CPUversion application for you. + +This file contains a summary of what you will find in each of the files that +make up your CPUversion application. + + +CPUversion.vcxproj + This is the main project file for VC++ projects generated using an Application Wizard. + It contains information about the version of Visual C++ that generated the file, and + information about the platforms, configurations, and project features selected with the + Application Wizard. + +CPUversion.vcxproj.filters + This is the filters file for VC++ projects generated using an Application Wizard. + It contains information about the association between the files in your project + and the filters. This association is used in the IDE to show grouping of files with + similar extensions under a specific node (for e.g. ".cpp" files are associated with the + "Source Files" filter). + +CPUversion.cpp + This is the main application source file. 
+ +///////////////////////////////////////////////////////////////////////////// +Other standard files: + +StdAfx.h, StdAfx.cpp + These files are used to build a precompiled header (PCH) file + named CPUversion.pch and a precompiled types file named StdAfx.obj. + +///////////////////////////////////////////////////////////////////////////// +Other notes: + +AppWizard uses "TODO:" comments to indicate parts of the source code you +should add to or customize. + +///////////////////////////////////////////////////////////////////////////// diff --git a/Proj2_Win/CPUversion/stdafx.cpp b/Proj2_Win/CPUversion/stdafx.cpp new file mode 100644 index 0000000..e2a4d41 --- /dev/null +++ b/Proj2_Win/CPUversion/stdafx.cpp @@ -0,0 +1,8 @@ +// stdafx.cpp : source file that includes just the standard includes +// CPUversion.pch will be the pre-compiled header +// stdafx.obj will contain the pre-compiled type information + +#include "stdafx.h" + +// TODO: reference any additional headers you need in STDAFX.H +// and not in this file diff --git a/Proj2_Win/CPUversion/stdafx.h b/Proj2_Win/CPUversion/stdafx.h new file mode 100644 index 0000000..b005a83 --- /dev/null +++ b/Proj2_Win/CPUversion/stdafx.h @@ -0,0 +1,15 @@ +// stdafx.h : include file for standard system include files, +// or project specific include files that are used frequently, but +// are changed infrequently +// + +#pragma once + +#include "targetver.h" + +#include +#include + + + +// TODO: reference additional headers your program requires here diff --git a/Proj2_Win/CPUversion/targetver.h b/Proj2_Win/CPUversion/targetver.h new file mode 100644 index 0000000..87c0086 --- /dev/null +++ b/Proj2_Win/CPUversion/targetver.h @@ -0,0 +1,8 @@ +#pragma once + +// Including SDKDDKVer.h defines the highest available Windows platform. + +// If you wish to build your application for a previous Windows platform, include WinSDKVer.h and +// set the _WIN32_WINNT macro to the platform you wish to support before including SDKDDKVer.h. 
+ +#include diff --git a/Proj2_Win/Debug/CPUversion.ilk b/Proj2_Win/Debug/CPUversion.ilk new file mode 100644 index 0000000..eec5f66 Binary files /dev/null and b/Proj2_Win/Debug/CPUversion.ilk differ diff --git a/Proj2_Win/Debug/CPUversion.pdb b/Proj2_Win/Debug/CPUversion.pdb new file mode 100644 index 0000000..663f92f Binary files /dev/null and b/Proj2_Win/Debug/CPUversion.pdb differ diff --git a/Proj2_Win/Debug/Proj2_Win.ilk b/Proj2_Win/Debug/Proj2_Win.ilk new file mode 100644 index 0000000..c3d5aaf Binary files /dev/null and b/Proj2_Win/Debug/Proj2_Win.ilk differ diff --git a/Proj2_Win/Debug/Proj2_Win.pdb b/Proj2_Win/Debug/Proj2_Win.pdb new file mode 100644 index 0000000..e577bf4 Binary files /dev/null and b/Proj2_Win/Debug/Proj2_Win.pdb differ diff --git a/Proj2_Win/Proj2_Win.sdf b/Proj2_Win/Proj2_Win.sdf new file mode 100644 index 0000000..f3c2314 Binary files /dev/null and b/Proj2_Win/Proj2_Win.sdf differ diff --git a/Proj2_Win/Proj2_Win.sln b/Proj2_Win/Proj2_Win.sln new file mode 100644 index 0000000..a146c9f --- /dev/null +++ b/Proj2_Win/Proj2_Win.sln @@ -0,0 +1,36 @@ + +Microsoft Visual Studio Solution File, Format Version 12.00 +# Visual Studio 2013 +VisualStudioVersion = 12.0.21005.1 +MinimumVisualStudioVersion = 10.0.40219.1 +Project("{8BC9CEB8-8B4A-11D0-8D11-00A0C91BC942}") = "Proj2_Win", "Proj2_Win\Proj2_Win.vcxproj", "{C5E799E7-3C2C-4831-9903-5EFB81FE7E23}" +EndProject +Project("{8BC9CEB8-8B4A-11D0-8D11-00A0C91BC942}") = "CPUversion", "CPUversion\CPUversion.vcxproj", "{5B128216-B420-4BD4-9765-C5A0040A3C05}" +EndProject +Global + GlobalSection(SolutionConfigurationPlatforms) = preSolution + Debug|Win32 = Debug|Win32 + Debug|x64 = Debug|x64 + Release|Win32 = Release|Win32 + Release|x64 = Release|x64 + EndGlobalSection + GlobalSection(ProjectConfigurationPlatforms) = postSolution + {C5E799E7-3C2C-4831-9903-5EFB81FE7E23}.Debug|Win32.ActiveCfg = Debug|Win32 + {C5E799E7-3C2C-4831-9903-5EFB81FE7E23}.Debug|Win32.Build.0 = Debug|Win32 + 
{C5E799E7-3C2C-4831-9903-5EFB81FE7E23}.Debug|x64.ActiveCfg = Debug|x64 + {C5E799E7-3C2C-4831-9903-5EFB81FE7E23}.Debug|x64.Build.0 = Debug|x64 + {C5E799E7-3C2C-4831-9903-5EFB81FE7E23}.Release|Win32.ActiveCfg = Release|Win32 + {C5E799E7-3C2C-4831-9903-5EFB81FE7E23}.Release|Win32.Build.0 = Release|Win32 + {C5E799E7-3C2C-4831-9903-5EFB81FE7E23}.Release|x64.ActiveCfg = Release|x64 + {C5E799E7-3C2C-4831-9903-5EFB81FE7E23}.Release|x64.Build.0 = Release|x64 + {5B128216-B420-4BD4-9765-C5A0040A3C05}.Debug|Win32.ActiveCfg = Debug|Win32 + {5B128216-B420-4BD4-9765-C5A0040A3C05}.Debug|Win32.Build.0 = Debug|Win32 + {5B128216-B420-4BD4-9765-C5A0040A3C05}.Debug|x64.ActiveCfg = Debug|Win32 + {5B128216-B420-4BD4-9765-C5A0040A3C05}.Release|Win32.ActiveCfg = Release|Win32 + {5B128216-B420-4BD4-9765-C5A0040A3C05}.Release|Win32.Build.0 = Release|Win32 + {5B128216-B420-4BD4-9765-C5A0040A3C05}.Release|x64.ActiveCfg = Release|Win32 + EndGlobalSection + GlobalSection(SolutionProperties) = preSolution + HideSolutionNode = FALSE + EndGlobalSection +EndGlobal diff --git a/Proj2_Win/Proj2_Win.v12.suo b/Proj2_Win/Proj2_Win.v12.suo new file mode 100644 index 0000000..acc05c4 Binary files /dev/null and b/Proj2_Win/Proj2_Win.v12.suo differ diff --git a/Proj2_Win/Proj2_Win/Debug/Proj2_Win.Build.CppClean.log b/Proj2_Win/Proj2_Win/Debug/Proj2_Win.Build.CppClean.log new file mode 100644 index 0000000..2388172 --- /dev/null +++ b/Proj2_Win/Proj2_Win/Debug/Proj2_Win.Build.CppClean.log @@ -0,0 +1,8 @@ +h:\documents\gpu programming\project2-streamcompaction\proj2_win\debug\proj2_win.ilk +h:\documents\gpu programming\project2-streamcompaction\proj2_win\debug\proj2_win.exe +h:\documents\gpu programming\project2-streamcompaction\proj2_win\debug\proj2_win.pdb +h:\documents\gpu programming\project2-streamcompaction\proj2_win\proj2_win\debug\kernel.cu.cache +h:\documents\gpu programming\project2-streamcompaction\proj2_win\proj2_win\debug\kernel.cu.obj +h:\documents\gpu 
programming\project2-streamcompaction\proj2_win\proj2_win\debug\proj2_win.tlog\link.command.1.tlog +h:\documents\gpu programming\project2-streamcompaction\proj2_win\proj2_win\debug\proj2_win.tlog\link.read.1.tlog +h:\documents\gpu programming\project2-streamcompaction\proj2_win\proj2_win\debug\proj2_win.tlog\link.write.1.tlog diff --git a/Proj2_Win/Proj2_Win/Debug/Proj2_Win.log b/Proj2_Win/Proj2_Win/Debug/Proj2_Win.log new file mode 100644 index 0000000..ced1f2c --- /dev/null +++ b/Proj2_Win/Proj2_Win/Debug/Proj2_Win.log @@ -0,0 +1,116 @@ +Build started 10/4/2014 5:17:53 AM. + 1>Project "H:\Documents\GPU Programming\Project2-StreamCompaction\Proj2_Win\Proj2_Win\Proj2_Win.vcxproj" on node 2 (Build target(s)). + 1>AddCudaCompileDeps: + C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\bin\cl.exe /E /nologo /showIncludes /TP /D__CUDACC__ /DWIN32 /D_DEBUG /D_CONSOLE /D_MBCS /I"C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include" /I"C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\bin" /I"C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include" /I. /FIcuda_runtime.h /c "H:\Documents\GPU Programming\Project2-StreamCompaction\Proj2_Win\Proj2_Win\kernel.cu" + CudaBuild: + Compiling CUDA source file kernel.cu... 
+ cmd.exe /C "C:\Users\Yehua\AppData\Local\Temp\tmpce73148b35cd40ce810de0267b12d355.cmd" + "C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\bin\nvcc.exe" -gencode=arch=compute_20,code=\"sm_20,compute_20\" --use-local-env --cl-version 2013 -ccbin "C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\bin" -I"C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include" -I"C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include" -G --keep-dir Debug -maxrregcount=0 --machine 32 --compile -cudart static -g -DWIN32 -D_DEBUG -D_CONSOLE -D_MBCS -Xcompiler "/EHsc /W3 /nologo /Od /Zi /RTC1 /MDd " -o Debug\kernel.cu.obj "H:\Documents\GPU Programming\Project2-StreamCompaction\Proj2_Win\Proj2_Win\kernel.cu" + + H:\Documents\GPU Programming\Project2-StreamCompaction\Proj2_Win\Proj2_Win>"C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\bin\nvcc.exe" -gencode=arch=compute_20,code=\"sm_20,compute_20\" --use-local-env --cl-version 2013 -ccbin "C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\bin" -I"C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include" -I"C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include" -G --keep-dir Debug -maxrregcount=0 --machine 32 --compile -cudart static -g -DWIN32 -D_DEBUG -D_CONSOLE -D_MBCS -Xcompiler "/EHsc /W3 /nologo /Od /Zi /RTC1 /MDd " -o Debug\kernel.cu.obj "H:\Documents\GPU Programming\Project2-StreamCompaction\Proj2_Win\Proj2_Win\kernel.cu" + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h : warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(853): warning C4819: The file contains a character that cannot be represented in the current code page (936). 
Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(1820): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(2700): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(3633): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(4541): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(5447): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(6341): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(7191): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_functions.h : warning C4819: The file contains a character that cannot be represented in the current code page (936). 
Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_functions.h(783): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_functions.h(1659): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\sm_13_double_functions.h : warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>H:/Documents/GPU Programming/Project2-StreamCompaction/Proj2_Win/Proj2_Win/kernel.cu(92): warning : variable "gthid" was declared but never referenced + 1>H:/Documents/GPU Programming/Project2-StreamCompaction/Proj2_Win/Proj2_Win/kernel.cu(247): warning : variable "cudaStatus" was set but never used + 1>H:/Documents/GPU Programming/Project2-StreamCompaction/Proj2_Win/Proj2_Win/kernel.cu(268): warning : variable "cudaStatus" was set but never used + 1>H:/Documents/GPU Programming/Project2-StreamCompaction/Proj2_Win/Proj2_Win/kernel.cu(315): warning : variable "length" was declared but never referenced + 1>H:/Documents/GPU Programming/Project2-StreamCompaction/Proj2_Win/Proj2_Win/kernel.cu(317): warning : variable "cudaStatus" was set but never used + 1>H:/Documents/GPU Programming/Project2-StreamCompaction/Proj2_Win/Proj2_Win/kernel.cu(374): warning : variable "cudaStatus" was set but never used + 1>H:/Documents/GPU Programming/Project2-StreamCompaction/Proj2_Win/Proj2_Win/kernel.cu(408): warning : variable "cudaStatus" was set but never used + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h : warning C4819: The file contains a character 
that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(853): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(1820): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(2700): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(3633): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(4541): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(5447): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(6341): warning C4819: The file contains a character that cannot be represented in the current code page (936). 
Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(7191): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h : warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(853): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(1820): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(2700): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(3633): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(4541): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(5447): warning C4819: The file contains a character that cannot be represented in the current code page (936). 
Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(6341): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(7191): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_functions_decls.h : warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_functions_decls.h(948): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_functions_decls.h(1984): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_functions_decls.h(2932): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_functions_decls.h(3882): warning C4819: The file contains a character that cannot be represented in the current code page (936). 
Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_functions_decls.h(4853): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_functions_decls.h(5899): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_functions_decls.h(6842): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_functions_decls.h(7786): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_functions_decls.h(8712): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_functions_decls.h(9705): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_functions_decls.h(10766): warning C4819: The file contains a character that cannot be represented in the current code page (936). 
Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_functions.h : warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_functions.h(783): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_functions.h(1659): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\sm_13_double_functions.h : warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h : warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(853): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(1820): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(2700): warning C4819: The file contains a character that cannot be represented in the current code page (936). 
Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(3633): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(4541): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(5447): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(6341): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(7191): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_functions.h : warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_functions.h(783): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_functions.h(1659): warning C4819: The file contains a character that cannot be represented in the current code page (936). 
Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\sm_13_double_functions.h : warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>H:/Documents/GPU Programming/Project2-StreamCompaction/Proj2_Win/Proj2_Win/kernel.cu(92): warning : variable "gthid" was declared but never referenced + 1>H:/Documents/GPU Programming/Project2-StreamCompaction/Proj2_Win/Proj2_Win/kernel.cu(247): warning : variable "cudaStatus" was set but never used + 1>H:/Documents/GPU Programming/Project2-StreamCompaction/Proj2_Win/Proj2_Win/kernel.cu(268): warning : variable "cudaStatus" was set but never used + 1>H:/Documents/GPU Programming/Project2-StreamCompaction/Proj2_Win/Proj2_Win/kernel.cu(315): warning : variable "length" was declared but never referenced + 1>H:/Documents/GPU Programming/Project2-StreamCompaction/Proj2_Win/Proj2_Win/kernel.cu(317): warning : variable "cudaStatus" was set but never used + 1>H:/Documents/GPU Programming/Project2-StreamCompaction/Proj2_Win/Proj2_Win/kernel.cu(374): warning : variable "cudaStatus" was set but never used + 1>H:/Documents/GPU Programming/Project2-StreamCompaction/Proj2_Win/Proj2_Win/kernel.cu(408): warning : variable "cudaStatus" was set but never used + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h : warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(853): warning C4819: The file contains a character that cannot be represented in the current code page (936). 
Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(1820): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(2700): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(3633): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(4541): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(5447): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(6341): warning C4819: The file contains a character that cannot be represented in the current code page (936). Save the file in Unicode format to prevent data loss + 1>c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\math_functions.h(7191): warning C4819: The file contains a character that cannot be represented in the current code page (936). 
Save the file in Unicode format to prevent data loss + kernel.cu + 1>H:/Documents/GPU Programming/Project2-StreamCompaction/Proj2_Win/Proj2_Win/kernel.cu(20): warning C4018: '<' : signed/unsigned mismatch + 1>H:/Documents/GPU Programming/Project2-StreamCompaction/Proj2_Win/Proj2_Win/kernel.cu(28): warning C4018: '<' : signed/unsigned mismatch + 1>H:/Documents/GPU Programming/Project2-StreamCompaction/Proj2_Win/Proj2_Win/kernel.cu(287): warning C4244: 'initializing' : conversion from 'float' to 'int', possible loss of data + 1>H:/Documents/GPU Programming/Project2-StreamCompaction/Proj2_Win/Proj2_Win/kernel.cu(314): warning C4244: 'initializing' : conversion from 'float' to 'int', possible loss of data + 1>H:/Documents/GPU Programming/Project2-StreamCompaction/Proj2_Win/Proj2_Win/kernel.cu(384): warning C4244: 'initializing' : conversion from 'float' to 'int', possible loss of data + 1>H:/Documents/GPU Programming/Project2-StreamCompaction/Proj2_Win/Proj2_Win/kernel.cu(418): warning C4244: 'initializing' : conversion from 'float' to 'int', possible loss of data + Link: + C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\bin\link.exe /ERRORREPORT:PROMPT /OUT:"H:\Documents\GPU Programming\Project2-StreamCompaction\Proj2_Win\Debug\Proj2_Win.exe" /INCREMENTAL /NOLOGO /LIBPATH:"C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\lib\Win32" cudart.lib kernel32.lib user32.lib gdi32.lib winspool.lib comdlg32.lib advapi32.lib shell32.lib ole32.lib oleaut32.lib uuid.lib odbc32.lib odbccp32.lib kernel32.lib user32.lib gdi32.lib winspool.lib comdlg32.lib advapi32.lib shell32.lib ole32.lib oleaut32.lib uuid.lib odbc32.lib odbccp32.lib /MANIFEST /MANIFESTUAC:"level='asInvoker' uiAccess='false'" /manifest:embed /DEBUG /PDB:"H:\Documents\GPU Programming\Project2-StreamCompaction\Proj2_Win\Debug\Proj2_Win.pdb" /SUBSYSTEM:CONSOLE /TLBID:1 /DYNAMICBASE /NXCOMPAT /IMPLIB:"H:\Documents\GPU Programming\Project2-StreamCompaction\Proj2_Win\Debug\Proj2_Win.lib" /MACHINE:X86 
Debug\kernel.cu.obj + Proj2_Win.vcxproj -> H:\Documents\GPU Programming\Project2-StreamCompaction\Proj2_Win\Debug\Proj2_Win.exe + PostBuildEvent: + echo copy "C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\bin\cudart*.dll" "H:\Documents\GPU Programming\Project2-StreamCompaction\Proj2_Win\Debug\" + copy "C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\bin\cudart*.dll" "H:\Documents\GPU Programming\Project2-StreamCompaction\Proj2_Win\Debug\" + :VCEnd + copy "C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\bin\cudart*.dll" "H:\Documents\GPU Programming\Project2-StreamCompaction\Proj2_Win\Debug\" + C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\bin\cudart32_65.dll + C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\bin\cudart64_65.dll + 2 file(s) copied. + 1>Done Building Project "H:\Documents\GPU Programming\Project2-StreamCompaction\Proj2_Win\Proj2_Win\Proj2_Win.vcxproj" (Build target(s)). + +Build succeeded. + +Time Elapsed 00:00:05.67 diff --git a/Proj2_Win/Proj2_Win/Debug/Proj2_Win.tlog/Proj2_Win.lastbuildstate b/Proj2_Win/Proj2_Win/Debug/Proj2_Win.tlog/Proj2_Win.lastbuildstate new file mode 100644 index 0000000..1da190d --- /dev/null +++ b/Proj2_Win/Proj2_Win/Debug/Proj2_Win.tlog/Proj2_Win.lastbuildstate @@ -0,0 +1,2 @@ +#TargetFrameworkVersion=v4.0:PlatformToolSet=v120:EnableManagedIncrementalBuild=false:VCToolArchitecture=Native32Bit +Debug|Win32|H:\Documents\GPU Programming\Project2-StreamCompaction\Proj2_Win\| diff --git a/Proj2_Win/Proj2_Win/Debug/Proj2_Win.tlog/link.command.1.tlog b/Proj2_Win/Proj2_Win/Debug/Proj2_Win.tlog/link.command.1.tlog new file mode 100644 index 0000000..72b12b6 Binary files /dev/null and b/Proj2_Win/Proj2_Win/Debug/Proj2_Win.tlog/link.command.1.tlog differ diff --git a/Proj2_Win/Proj2_Win/Debug/Proj2_Win.tlog/link.read.1.tlog b/Proj2_Win/Proj2_Win/Debug/Proj2_Win.tlog/link.read.1.tlog new file mode 100644 index 0000000..e02af38 Binary files /dev/null and 
b/Proj2_Win/Proj2_Win/Debug/Proj2_Win.tlog/link.read.1.tlog differ diff --git a/Proj2_Win/Proj2_Win/Debug/Proj2_Win.tlog/link.write.1.tlog b/Proj2_Win/Proj2_Win/Debug/Proj2_Win.tlog/link.write.1.tlog new file mode 100644 index 0000000..4f61d69 Binary files /dev/null and b/Proj2_Win/Proj2_Win/Debug/Proj2_Win.tlog/link.write.1.tlog differ diff --git a/Proj2_Win/Proj2_Win/Debug/kernel.cu.cache b/Proj2_Win/Proj2_Win/Debug/kernel.cu.cache new file mode 100644 index 0000000..956fa4d --- /dev/null +++ b/Proj2_Win/Proj2_Win/Debug/kernel.cu.cache @@ -0,0 +1,49 @@ +Identity=kernel.cu +AdditionalCompilerOptions= +AdditionalCompilerOptions= +AdditionalDependencies= +AdditionalDeps= +AdditionalLibraryDirectories= +AdditionalOptions= +AdditionalOptions= +CInterleavedPTX=false +CodeGeneration=compute_20,sm_20 +CodeGeneration=compute_20,sm_20 +CompileOut=Debug\kernel.cu.obj +CudaRuntime=Static +CudaToolkitCustomDir= +Defines=;WIN32;_DEBUG;_CONSOLE;_MBCS; +Emulation=false +FastMath=false +GenerateLineInfo=false +GenerateRelocatableDeviceCode=false +GPUDebugInfo=true +GPUDebugInfo=true +HostDebugInfo=true +Include=;;C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include +Inputs= +Keep=false +KeepDir=Debug +LinkOut= +MaxRegCount=0 +NvccCompilation=compile +NvccPath= +Optimization=Od +Optimization=Od +PerformDeviceLink= +PtxAsOptionV=false +RequiredIncludes= +Runtime=MDd +Runtime=MDd +RuntimeChecks=RTC1 +RuntimeChecks=RTC1 +TargetMachinePlatform=32 +TargetMachinePlatform=32 +TypeInfo= +TypeInfo= +UseHostDefines=true +UseHostInclude=true +UseHostLibraryDependencies= +UseHostLibraryDirectories= +Warning=W3 +Warning=W3 diff --git a/Proj2_Win/Proj2_Win/Debug/kernel.cu.deps b/Proj2_Win/Proj2_Win/Debug/kernel.cu.deps new file mode 100644 index 0000000..fcc0a59 --- /dev/null +++ b/Proj2_Win/Proj2_Win/Debug/kernel.cu.deps @@ -0,0 +1,596 @@ +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\cuda_runtime.h +c:\program files\nvidia gpu computing 
toolkit\cuda\v6.5\include\host_config.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\crtdefs.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\sal.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\ConcurrencySal.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\vadefs.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\builtin_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\host_defines.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\driver_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\host_defines.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\limits.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\crtdefs.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\stddef.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\crtdefs.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\surface_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\driver_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\texture_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\driver_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\builtin_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\driver_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\surface_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\texture_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\host_defines.h 
+c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\channel_descriptor.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\driver_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\cuda_runtime_api.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\host_defines.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\builtin_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\driver_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\surface_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\texture_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\cuda_device_runtime_api.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\driver_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\host_defines.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\host_defines.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\cuda_runtime_api.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\driver_functions.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\builtin_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\driver_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\surface_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\texture_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\host_defines.h +c:\program files\nvidia gpu computing 
toolkit\cuda\v6.5\include\driver_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\host_defines.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_functions.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\builtin_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\driver_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\surface_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\texture_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\host_defines.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\common_functions.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\builtin_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\driver_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\surface_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\texture_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\host_defines.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\string.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\crtdefs.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\time.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\crtdefs.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\wtime.inl +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\time.inl +c:\program files\nvidia gpu computing 
toolkit\cuda\v6.5\include\math_functions.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\builtin_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\driver_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\surface_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\texture_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\host_defines.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\math.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\crtdefs.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\stdlib.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\crtdefs.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\cmath +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\yvals.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\xkeycheck.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\crtdefs.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\use_ansi.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\math.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\xtgmath.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\xtr1common +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\cstdlib +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\cuda_surface_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\builtin_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\driver_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\surface_types.h +c:\program files\nvidia gpu 
computing toolkit\cuda\v6.5\include\texture_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\channel_descriptor.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\driver_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\host_defines.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\surface_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\cuda_texture_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\builtin_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\driver_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\surface_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\texture_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\channel_descriptor.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\driver_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\host_defines.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\texture_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_functions.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\builtin_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\driver_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\surface_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\texture_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_types.h +c:\program files\nvidia gpu computing 
toolkit\cuda\v6.5\include\device_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\host_defines.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\sm_11_atomic_functions.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\builtin_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\driver_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\surface_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\texture_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\host_defines.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\sm_12_atomic_functions.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\builtin_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\driver_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\surface_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\texture_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\host_defines.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\sm_13_double_functions.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\builtin_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\driver_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\surface_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\texture_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_types.h 
+c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\host_defines.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\sm_20_atomic_functions.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\builtin_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\driver_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\surface_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\texture_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\host_defines.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\sm_32_atomic_functions.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\builtin_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\driver_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\surface_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\texture_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\host_defines.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\sm_35_atomic_functions.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\sm_32_atomic_functions.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\sm_20_intrinsics.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\builtin_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\driver_types.h +c:\program files\nvidia gpu 
computing toolkit\cuda\v6.5\include\surface_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\texture_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\host_defines.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\sm_30_intrinsics.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\builtin_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\driver_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\surface_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\texture_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\host_defines.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\sm_32_intrinsics.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\builtin_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\driver_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\surface_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\texture_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\host_defines.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\sm_35_intrinsics.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\sm_32_intrinsics.h 
+c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\surface_functions.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\builtin_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\driver_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\surface_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\texture_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\cuda_surface_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\host_defines.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\surface_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_functions.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\texture_fetch_functions.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\builtin_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\driver_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\surface_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\texture_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\cuda_texture_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\host_defines.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\texture_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_functions.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_types.h +c:\program files\nvidia gpu 
computing toolkit\cuda\v6.5\include\texture_indirect_functions.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\builtin_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\driver_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\surface_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\texture_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\host_defines.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_functions.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\surface_indirect_functions.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\builtin_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\driver_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\surface_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\texture_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_types.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\host_defines.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_functions.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\device_launch_parameters.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\vector_types.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\cuda_runtime.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\device_launch_parameters.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\stdio.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\crtdefs.h +C:\Program Files (x86)\Microsoft Visual Studio 
12.0\VC\include\swprintf.inl +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\iostream +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\istream +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\ostream +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\ios +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\xlocnum +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\climits +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\cstdio +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\streambuf +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\xiosbase +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\xlocale +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\cstring +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\stdexcept +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\exception +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\xstddef +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\cstddef +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\initializer_list +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\eh.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\crtdefs.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\malloc.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\crtdefs.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\xstring +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\xmemory0 +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\limits +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\ymath.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\cfloat +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\float.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\crtdefs.h +C:\Program 
Files (x86)\Microsoft Visual Studio 12.0\VC\include\crtwrn.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\crtdefs.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\cwchar +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\wchar.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\crtdefs.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\new +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\xutility +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\utility +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\iosfwd +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\crtdbg.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\crtdefs.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\type_traits +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\xrefwrap +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\xatomic0.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\intrin.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\crtdefs.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\setjmp.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\crtdefs.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\immintrin.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\wmmintrin.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\nmmintrin.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\smmintrin.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\tmmintrin.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\pmmintrin.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\emmintrin.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\xmmintrin.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\mmintrin.h +C:\Program 
Files (x86)\Microsoft Visual Studio 12.0\VC\include\crtdefs.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\ammintrin.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\mm3dnow.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\crtdefs.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\typeinfo +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\xlocinfo +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\xlocinfo.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\ctype.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\crtdefs.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\locale.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\crtdefs.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\xdebug +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\xmemory +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\xfacet +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\system_error +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\cerrno +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\errno.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\crtdefs.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\share.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/scan.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/config.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/config/config.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/config/simple_defines.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/config/compiler.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\cuda.h +C:\Program Files\NVIDIA GPU Computing 
Toolkit\CUDA\v6.5\include\thrust/detail/config/host_system.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/config/device_system.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/config/host_device.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\host_defines.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/config/debug.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/config/compiler_fence.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/config/forceinline.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/config/hd_warning_disable.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/config/global_workarounds.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/execution_policy.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/scan.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/iterator/iterator_traits.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\iterator +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/iterator/detail/iterator_traversal_tags.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/iterator/detail/host_system_tag.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cpp/detail/execution_policy.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/iterator/detail/device_system_tag.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/execution_policy.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/iterator/detail/any_system_tag.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/iterator/detail/iterator_traits.inl +C:\Program Files\NVIDIA 
GPU Computing Toolkit\CUDA\v6.5\include\thrust/iterator/iterator_categories.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/iterator/detail/universal_categories.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/iterator/detail/iterator_category_to_traversal.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/iterator/detail/iterator_category_to_system.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/type_traits.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/type_traits/has_trivial_assign.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/generic/select_system.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/type_traits/is_metafunction_defined.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/type_traits/has_nested_type.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/iterator/detail/minimum_system.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/type_traits/minimum_type.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/generic/type_traits.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/generic/scan.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/generic/tag.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/generic/scan.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/static_assert.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/type_traits/iterator/is_output_iterator.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/iterator/detail/any_assign.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/functional.h 
+C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\functional +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\xfunctional +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\tuple +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/functional/placeholder.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/functional/actor.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/tuple.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/tuple.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/swap.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/pair.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/pair.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/functional/value.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/functional/composite.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/functional/operators/assignment_operator.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/functional/operators/operator_adaptors.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/type_traits/result_of.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/type_traits/function_traits.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/functional/actor.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/functional/argument.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/functional.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/functional/operators.h +C:\Program Files\NVIDIA GPU Computing 
Toolkit\CUDA\v6.5\include\thrust/detail/functional/operators/arithmetic_operators.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/functional/operators/relational_operators.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/functional/operators/logical_operators.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/functional/operators/bitwise_operators.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/functional/operators/compound_assignment_operators.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/generic/scan_by_key.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/generic/scan_by_key.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/transform.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/transform.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/generic/transform.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/generic/transform.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/for_each.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/for_each.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/generic/for_each.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/adl/for_each.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cpp/detail/for_each.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/internal/scalar/for_each.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/function.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/raw_reference_cast.h +C:\Program Files\NVIDIA 
GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/raw_pointer_cast.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/type_traits/pointer_traits.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/iterator/detail/tuple_of_iterator_references.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/reference_forward_declaration.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/use_default.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/raw_reference_cast.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/tuple_transform.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/tuple_meta_transform.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/for_each.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/for_each.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/minmax.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/distance.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/distance.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/advance.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/advance.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/generic/advance.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/generic/advance.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/generic/distance.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/generic/distance.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/detail/launch_closure.h +C:\Program 
Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/cuda_launch_config.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/detail/launch_closure.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/temporary_array.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/iterator/detail/tagged_iterator.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/iterator/iterator_adaptor.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/iterator/iterator_facade.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/iterator/detail/iterator_facade_category.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/iterator/detail/is_iterator_category.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/iterator/detail/distance_from_result.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/iterator/detail/iterator_adaptor_base.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/contiguous_storage.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/iterator/detail/normal_iterator.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/iterator/detail/is_trivial_iterator.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/allocator/allocator_traits.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/allocator/allocator_traits.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/type_traits/has_member_function.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/type_traits/is_call_possible.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/contiguous_storage.inl +C:\Program Files\NVIDIA GPU Computing 
Toolkit\CUDA\v6.5\include\thrust/detail/allocator/copy_construct_range.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/allocator/copy_construct_range.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/copy.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/copy.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/generic/copy.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/generic/copy.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/internal_functional.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\memory +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\stdint.h +C:\Program Files (x86)\Microsoft Visual Studio 12.0\VC\include\crtdefs.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/iterator/zip_iterator.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/iterator/detail/zip_iterator_base.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/iterator/detail/minimum_category.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/iterator/detail/zip_iterator.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/adl/copy.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cpp/detail/copy.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/internal/scalar/copy.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/internal/scalar/copy.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/dispatch/is_trivial_copy.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/internal/scalar/general_copy.h +C:\Program Files\NVIDIA GPU Computing 
Toolkit\CUDA\v6.5\include\thrust/system/detail/internal/scalar/trivial_copy.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/copy.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/copy.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/copy_device_to_device.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/copy_device_to_device.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/copy_cross_system.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/copy_cross_system.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/trivial_copy.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/trivial_copy.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/trivial_copy.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/guarded_cuda_runtime_api.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\cuda_runtime_api.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system_error.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/error_code.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/errno.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/error_category.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/error_code.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/error_condition.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/system_error.h +C:\Program Files (x86)\Microsoft Visual Studio 
12.0\VC\include\string +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/system_error.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/error.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\driver_types.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/error.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/trivial_copy.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/allocator/default_construct_range.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/allocator/default_construct_range.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/uninitialized_fill.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/uninitialized_fill.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/generic/uninitialized_fill.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/generic/uninitialized_fill.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/fill.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/fill.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/generic/fill.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/generate.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/generate.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/generic/generate.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/generic/generate.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/adl/generate.h +C:\Program Files\NVIDIA GPU Computing 
Toolkit\CUDA\v6.5\include\thrust/system/cpp/detail/generate.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/generate.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/adl/fill.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cpp/detail/fill.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/fill.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/fill.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/util/align.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/cstdint.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/runtime_introspection.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/runtime_introspection.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/util/blocking.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/adl/uninitialized_fill.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cpp/detail/uninitialized_fill.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/uninitialized_fill.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/allocator/destroy_range.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/allocator/destroy_range.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/allocator/fill_construct_range.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/allocator/fill_construct_range.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/allocator/temporary_allocator.h +C:\Program Files\NVIDIA GPU Computing 
Toolkit\CUDA\v6.5\include\thrust/detail/allocator/tagged_allocator.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/allocator/tagged_allocator.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/memory.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/pointer.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/pointer.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/reference.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/reference.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/generic/memory.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/generic/memory.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/adl/malloc_and_free.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cpp/detail/malloc_and_free.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/malloc_and_free.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/bad_alloc.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/malloc_and_free.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/adl/get_value.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cpp/detail/get_value.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/get_value.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/assign_value.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/adl/assign_value.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cpp/detail/assign_value.h +C:\Program Files\NVIDIA 
GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/adl/iter_swap.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cpp/detail/iter_swap.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/iter_swap.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/swap.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/swap.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/swap_ranges.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/generic/swap_ranges.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/generic/swap_ranges.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/adl/swap_ranges.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cpp/detail/swap_ranges.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/swap_ranges.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/temporary_buffer.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/generic/temporary_buffer.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/generic/temporary_buffer.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/adl/temporary_buffer.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cpp/detail/temporary_buffer.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/temporary_buffer.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/allocator/temporary_allocator.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/allocator/no_throw_allocator.h +C:\Program Files\NVIDIA GPU Computing 
Toolkit\CUDA\v6.5\include\thrust/detail/temporary_array.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/synchronize.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/synchronize.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/detail/launch_calculator.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/detail/launch_calculator.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/adl/transform.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cpp/detail/transform.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/transform.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/replace.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/detail/replace.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/generic/replace.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/generic/replace.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/adl/replace.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cpp/detail/replace.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/replace.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/adl/scan.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cpp/detail/scan.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/internal/scalar/scan.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/scan.h +C:\Program Files\NVIDIA GPU Computing 
Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/scan.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/detail/fast_scan.h +c:\program files\nvidia gpu computing toolkit\cuda\v6.5\include\thrust\system\cuda\detail\detail\fast_scan.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/reduce_intervals.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/reduce_intervals.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/internal/decompose.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/extern_shared_ptr.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/block/reduce.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/default_decomposition.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/default_decomposition.inl +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/detail/uninitialized.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/detail/alignment.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/adl/scan_by_key.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cpp/detail/scan_by_key.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/detail/internal/scalar/scan_by_key.h +C:\Program Files\NVIDIA GPU Computing Toolkit\CUDA\v6.5\include\thrust/system/cuda/detail/scan_by_key.h diff --git a/Proj2_Win/Proj2_Win/Proj2_Win.vcxproj b/Proj2_Win/Proj2_Win/Proj2_Win.vcxproj new file mode 100644 index 0000000..719fd5c --- /dev/null +++ b/Proj2_Win/Proj2_Win/Proj2_Win.vcxproj @@ -0,0 +1,160 @@ + + + + + Debug + Win32 + + + Debug + x64 + + + Release + Win32 + + + 
Release + x64 + + + + {C5E799E7-3C2C-4831-9903-5EFB81FE7E23} + Proj2_Win + + + + Application + true + MultiByte + v120 + + + Application + true + MultiByte + v120 + + + Application + false + true + MultiByte + v120 + + + Application + false + true + MultiByte + v120 + + + + + + + + + + + + + + + + + + + + true + + + true + + + + Level3 + Disabled + WIN32;_DEBUG;_CONSOLE;%(PreprocessorDefinitions) + + + true + Console + cudart.lib;kernel32.lib;user32.lib;gdi32.lib;winspool.lib;comdlg32.lib;advapi32.lib;shell32.lib;ole32.lib;oleaut32.lib;uuid.lib;odbc32.lib;odbccp32.lib;%(AdditionalDependencies) + + + echo copy "$(CudaToolkitBinDir)\cudart*.dll" "$(OutDir)" +copy "$(CudaToolkitBinDir)\cudart*.dll" "$(OutDir)" + + + + + Level3 + Disabled + WIN32;WIN64;_DEBUG;_CONSOLE;%(PreprocessorDefinitions) + + + true + Console + cudart.lib;kernel32.lib;user32.lib;gdi32.lib;winspool.lib;comdlg32.lib;advapi32.lib;shell32.lib;ole32.lib;oleaut32.lib;uuid.lib;odbc32.lib;odbccp32.lib;%(AdditionalDependencies) + + + echo copy "$(CudaToolkitBinDir)\cudart*.dll" "$(OutDir)" +copy "$(CudaToolkitBinDir)\cudart*.dll" "$(OutDir)" + + + 64 + + + + + Level3 + MaxSpeed + true + true + WIN32;NDEBUG;_CONSOLE;%(PreprocessorDefinitions) + + + true + true + true + Console + cudart.lib;kernel32.lib;user32.lib;gdi32.lib;winspool.lib;comdlg32.lib;advapi32.lib;shell32.lib;ole32.lib;oleaut32.lib;uuid.lib;odbc32.lib;odbccp32.lib;%(AdditionalDependencies) + + + echo copy "$(CudaToolkitBinDir)\cudart*.dll" "$(OutDir)" +copy "$(CudaToolkitBinDir)\cudart*.dll" "$(OutDir)" + + + + + Level3 + MaxSpeed + true + true + WIN32;WIN64;NDEBUG;_CONSOLE;%(PreprocessorDefinitions) + + + true + true + true + Console + cudart.lib;kernel32.lib;user32.lib;gdi32.lib;winspool.lib;comdlg32.lib;advapi32.lib;shell32.lib;ole32.lib;oleaut32.lib;uuid.lib;odbc32.lib;odbccp32.lib;%(AdditionalDependencies) + + + echo copy "$(CudaToolkitBinDir)\cudart*.dll" "$(OutDir)" +copy "$(CudaToolkitBinDir)\cudart*.dll" "$(OutDir)" + + + 64 + + + + 
+ + + + + + \ No newline at end of file diff --git a/Proj2_Win/Proj2_Win/kernel.cu b/Proj2_Win/Proj2_Win/kernel.cu new file mode 100644 index 0000000..94e43c9 --- /dev/null +++ b/Proj2_Win/Proj2_Win/kernel.cu @@ -0,0 +1,438 @@ + +#include "cuda_runtime.h" +#include "device_launch_parameters.h" +/* NOTE(review): the four header names below were blank in this dump; they are restored from the symbols this file uses (printf, clock, std::cout, thrust::inclusive_scan) - confirm against the original commit. */ +#include <cstdio> +#include <ctime> +#include <iostream> +#include <thrust/scan.h> + +#define BLOCK_SIZE 512 +#define TEST_TIMES 1 +#define LENGTH 10000000 + +void scanNaive(const int *in, int *out, int len); +void scanSharedMem_singleblock(const int *in, int *out, int len); +void scanSharedMem_multiblock(const int *in, int *out, int len); +void scatter(int *in, int *out, int len); +void scatter_thrust(int *in, int *out, int len); +/* Prints the first len elements of out on one line, space separated. */ +void printArray(const int *out, const int len) +{ + /* int index: comparing a size_t index with a negative len would convert len to a huge unsigned bound */ + for (int i = 0; i < len; i++) + { + std::cout << out[i] << " "; + } + std::cout << std::endl; +} +/* Sets the first len elements of out to zero. */ +void clearArray(int *out, const int len) +{ + for (int i = 0; i < len; i++) + { + out[i] = 0; + } +} +/* Inclusive prefix sum of in into out, computed in place on out. Indexes by threadIdx.x only, so it covers the threads of a single block. */ +__global__ void scanKernel(const int *in, int *out, int len) +{ + int thid = threadIdx.x; + //out[thid] = (thid > 0) ? in[thid - 1] : 0; + out[thid] = in[thid]; + __syncthreads(); + for (size_t offset = 1; offset < len; offset *= 2) + { + /* Read the partner element first and only then write: updating out[] in place while other threads still read it is a race. */ + const int addend = (thid >= offset) ? out[thid - offset] : 0; + __syncthreads(); + out[thid] += addend; + __syncthreads(); + } +} +__global__ void scanKernel_shared_singleblock(const int *in, int *out, int len) +{ + extern __shared__ int temp[]; + int thid = threadIdx.x; + int pin = 0, pout = 1; + temp[pin * len + thid] = in[thid]; + //temp[pout*len + thid] = (thid > 0) ?
temp[pin * len + thid -1]: 0; + temp[pout*len + thid] = temp[pin*len + thid]; + __syncthreads(); + for (size_t offset = 1; offset < len; offset *= 2) + { + /* Read the partner element before any thread writes in this step; the in-place += raced with those reads. */ + const int addend = (thid >= offset) ? temp[pout * len + thid - offset] : 0; + __syncthreads(); + temp[pout * len + thid] += addend; + __syncthreads(); + } + out[thid] = temp[pout * len + thid]; +} + +/* Inclusive scan of one block's slice of in into the matching slice of out, using temp as scratch. temp is indexed up to 2 * blockSize - 1, so it must hold at least 2 * blockSize ints. */ +__device__ void scanKernel_singleblock(int *in, int *out,int *temp, const int blockSize) +{ + + int thid = threadIdx.x; + int gthid = blockIdx.x * blockDim.x + threadIdx.x; + int blockLen = blockSize; + int pin = 0, pout = 1; + temp[pin * blockLen + thid] = in[gthid]; + //temp[pout*len + thid] = (thid > 0) ? temp[pin * len + thid -1]: 0; + temp[pout*blockLen + thid] = temp[pin*blockLen + thid]; + __syncthreads(); + for (size_t offset = 1; offset < blockLen; offset *= 2) + { + /* Stage the read so every thread reads before any thread writes in this step. */ + const int addend = (thid >= offset) ? temp[pout * blockLen + thid - offset] : 0; + __syncthreads(); + temp[pout * blockLen + thid] += addend; + __syncthreads(); + } + if (thid < blockLen) + { + out[gthid] = temp[pout * blockLen + thid]; + } + __syncthreads(); +} + +/* Scans each block's slice with scanKernel_singleblock and stores the last scanned element of the block in aux[blockIdx.x]. NOTE(review): in[gthid] and the out[] read for aux are not checked against the array length, so the last block reads past the end unless the length is a multiple of blockSize - confirm callers pad or guard. */ +__global__ void scanKernel_multiblock(int *in, int *out, int *aux, const int blockSize) +{ + extern __shared__ int temp[]; + int gridID = blockIdx.x; + int gthid = blockIdx.x * blockDim.x + threadIdx.x; + scanKernel_singleblock(in, out, temp, blockSize); + aux[gridID] = out[(gridID) * blockDim.x + blockSize - 1]; + /* + __syncthreads(); + scanKernel_singleblock(aux, aux,temp, blockSize); + __syncthreads(); + if (gridID > 0) + { + out[gthid] += aux[gridID-1]; + } + */ +} +/* For every block after the first, adds aux[blockIdx.x - 1] to the element of input owned by each thread. */ +__global__ void prefix_add(int *aux, int *input) +{ + int gthid = blockIdx.x * blockDim.x + threadIdx.x; + if (blockIdx.x > 0) + { + input[gthid] += aux[blockIdx.x - 1]; + } + +} + +int main() +{ + const int len = LENGTH; + //int in[] = { 0, 0, 3, 4, 0, 6, 6, 7, 0, 7,1,3,3,2,0,1 }; + int *out = new int[len]; + int *scatterResult = new int[len]; + int *in = (int*) malloc(len*sizeof(int)); + for (size_t i = 0; i < len; i++) + { + in[i] = i+1; + } + //**************warm up************** + clock_t start, finish; +
double duration; + int i = TEST_TIMES; + clearArray(out, len); + //printArray(in, len); + + //naive method + start = clock(); + while (i--) + { + scanNaive(in, out, len); + } + finish = clock(); + /* clock() counts ticks, not milliseconds: scale by CLOCKS_PER_SEC so the "ms" labels below hold on every platform */ + duration = 1000.0 * (finish - start) / CLOCKS_PER_SEC; + printf("warming up in %f ms\n", duration); + //*******************timing********************** + i = TEST_TIMES; + clearArray(out, len); + //printArray(in, len); + + //naive method + start = clock(); + while (i--) + { + scanNaive(in, out, len); + } + finish = clock(); + duration = 1000.0 * (finish - start) / CLOCKS_PER_SEC; + duration = duration / TEST_TIMES; + //printArray(in, len); + //printArray(out, len); + printf("Naive method finished in %f ms\n", duration); + //shared memory + i = TEST_TIMES; + clearArray(out, len); + start = clock(); + while (i--) + { + scanSharedMem_singleblock(in, out, len); + } + finish = clock(); + duration = 1000.0 * (finish - start) / CLOCKS_PER_SEC; + duration = duration / TEST_TIMES; + //printArray(in, len); + //printArray(out, len); + printf("Shared memory finished in %f ms\n", duration); + //generalizing + i = TEST_TIMES; + clearArray(out, len); + start = clock(); + while (i--) + { + scanSharedMem_multiblock(in, out, len); + } + finish = clock(); + duration = 1000.0 * (finish - start) / CLOCKS_PER_SEC; + duration = duration / TEST_TIMES; + //printArray(in, len); + //printArray(out, len); + printf("Gerneralized method finished in %f ms\n", duration); + + //***************** + //scattering + i = TEST_TIMES; + clearArray(out, len); + start = clock(); + while (i--) + { + scatter(in, scatterResult, len); + } + finish = clock(); + duration = 1000.0 * (finish - start) / CLOCKS_PER_SEC; + duration = duration / TEST_TIMES; + //printArray(in, len); + //printArray(scatterResult, len); + printf("Scattering finished in %f ms\n", duration); + + /////////thrust + i = TEST_TIMES; + clearArray(scatterResult, len); + start = clock(); + while (i--) + { + scatter_thrust(in, scatterResult, len); + } + finish = clock(); + duration = 1000.0 * (finish - start) / CLOCKS_PER_SEC; + duration = duration / TEST_TIMES; + printf("thrust scattering finished in %f ms\n",
duration); + //*********************************************** + + /*clearArray(out, len); + printArray(in, len); + + clearArray(out, len); + scanNaive(in, out, len); + printArray(out, len); + + clearArray(out, len); + scanSharedMem_singleblock(in, out, len); + printArray(out, len); + + clearArray(out, len); + scanSharedMem_multiblock(in, out, len); + printArray(out, len); + + scatter(in, scatterResult, len); + printArray(scatterResult, len);*/ + + + delete[] scatterResult; + delete[] out; + free(in); /* in came from malloc and was never released */ + return 0; +} + +/* Host wrapper: copies in to the device, runs scanKernel in a single block of len threads, and copies the result back into out. NOTE(review): the launch status is never checked, and CUDA limits the number of threads per block, so a large len will not run - confirm the intended maximum. */ +void scanNaive(const int *in, int *out, int len) +{ + int *dev_in = 0; + int *dev_out = 0; + cudaError_t cudaStatus; + cudaStatus = cudaSetDevice(0); + + cudaStatus = cudaMalloc((void**)&dev_in, len * sizeof(int)); + + cudaStatus = cudaMalloc((void**)&dev_out, len* sizeof(int)); + + cudaStatus = cudaMemcpy(dev_in, in, len * sizeof(int), cudaMemcpyHostToDevice); + + cudaStatus = cudaMemcpy(dev_out, out, len * sizeof(int), cudaMemcpyHostToDevice); + + scanKernel << <1, len >> >(dev_in, dev_out, len); + + cudaStatus = cudaMemcpy(out, dev_out, len * sizeof(int), cudaMemcpyDeviceToHost); + + /* release the device buffers; they were leaked on every call */ + cudaFree(dev_in); + cudaFree(dev_out); +} + +/* Host wrapper: same as scanNaive but runs scanKernel_shared_singleblock with 2 * len ints of dynamic shared memory. NOTE(review): the same single-block thread limit applies, and the shared-memory request grows with len - confirm the intended maximum. */ +void scanSharedMem_singleblock(const int *in, int *out, int len) +{ + int *dev_in = 0; + int *dev_out = 0; + cudaError_t cudaStatus; + cudaStatus = cudaSetDevice(0); + + cudaStatus = cudaMalloc((void**)&dev_in, len * sizeof(int)); + + cudaStatus = cudaMalloc((void**)&dev_out, len* sizeof(int)); + + cudaStatus = cudaMemcpy(dev_in, in, len * sizeof(int), cudaMemcpyHostToDevice); + + cudaStatus = cudaMemcpy(dev_out, out, len * sizeof(int), cudaMemcpyHostToDevice); + + scanKernel_shared_singleblock << <1, len, len * 2 * sizeof(int) >> >(dev_in, dev_out, len); + + cudaStatus = cudaMemcpy(out, dev_out, len * sizeof(int), cudaMemcpyDeviceToHost); + + /* release the device buffers; they were leaked on every call */ + cudaFree(dev_in); + cudaFree(dev_out); +} +void scan_recursive(int *dev_in, int *dev_out, int len) +{ + int blockSize = BLOCK_SIZE; + /* integer ceiling division: the float division loses precision once len exceeds what a float represents exactly */ + int gridSize = (len + blockSize - 1) / blockSize; + int *current_out = 0; + int
*current_aux = 0; + cudaMalloc((void**)&current_aux, gridSize * sizeof(int)); + cudaMalloc((void**)&current_out, gridSize * sizeof(int)); + + /* NOTE(review): the launch configurations in this function were empty in this dump; gridSize/blockSize and a shared buffer of 2 * blockSize ints (the range scanKernel_singleblock indexes) are restored - confirm against the original commit. */ + if (gridSize <= 1) + { + scanKernel_multiblock << <gridSize, blockSize, blockSize * 2 * sizeof(int) >> >(dev_in, dev_out, current_aux, blockSize); + } + else + { + scanKernel_multiblock << <gridSize, blockSize, blockSize * 2 * sizeof(int) >> >(dev_in, dev_out, current_aux, blockSize); + scan_recursive(current_aux, current_aux, gridSize); + prefix_add << <gridSize, blockSize >> >(current_aux, dev_out); + } + cudaFree(current_aux); + cudaFree(current_out); +} +/* Host wrapper: uploads in, runs scan_recursive on the device, and downloads the result into out. */ +void scanSharedMem_multiblock(const int *in, int *out, int len) +{ + int *dev_in = 0; + int *dev_out = 0; + + cudaError_t cudaStatus; + cudaStatus = cudaMalloc((void**)&dev_in, len * sizeof(int)); + cudaStatus = cudaMalloc((void**)&dev_out, len* sizeof(int)); + cudaStatus = cudaMemcpy(dev_in, in, len * sizeof(int), cudaMemcpyHostToDevice); + cudaStatus = cudaMemcpy(dev_out, out, len * sizeof(int), cudaMemcpyHostToDevice); + + scan_recursive(dev_in, dev_out, len); + cudaStatus = cudaMemcpy(out, dev_out, len * sizeof(int), cudaMemcpyDeviceToHost); + + cudaFree(dev_in); + cudaFree(dev_out); +} + +/* Writes 1 to out[i] when in[i] > 0 and 0 otherwise, for every i < len. */ +__global__ void toFlagKernel(int *in, int *out, int len) +{ + int thid = blockIdx.x * blockDim.x + threadIdx.x; + if (thid < len) + { + if (in[thid] > 0) + out[thid] = 1; + else + out[thid] = 0; + } +} +/* Compacts in into out. flag holds the inclusive scan of the keep-flags, so flag[len - 1] is the number of kept elements (stored in *actualLen) and an element is kept where flag increases. Slots past the kept count are zeroed. */ +__global__ void getScatter(int *in,int *flag, int *out, int len, int *actualLen) +{ + int thid = blockIdx.x * blockDim.x + threadIdx.x; + /* bounds check first: threads past the end previously wrote out[thid] out of range */ + if (thid >= len) + return; + const int kept = flag[len - 1]; + if (thid == 0) + *actualLen = kept; + /* zero only the slots no scatter write targets; zeroing every slot raced with the scatter writes of other threads */ + if (thid >= kept) + out[thid] = 0; + if (thid == 0) + { + if (in[0] > 0) + out[0] = in[0]; + } + else if (flag[thid] > flag[thid - 1]) + { + out[flag[thid] - 1] = in[thid]; + } +} + +void scatter(int *in, int *out, int len) +{ + int *dev_in = 0; + int
*dev_out = 0; + int *dev_flag = 0; + int *dev_result = 0; + int *actualLen = 0; + + cudaMalloc((void**)&actualLen, sizeof(int)); + cudaError_t cudaStatus; + cudaStatus = cudaMalloc((void**)&dev_in, len * sizeof(int)); + cudaStatus = cudaMalloc((void**)&dev_out, len* sizeof(int)); + cudaStatus = cudaMalloc((void**)&dev_flag, len* sizeof(int)); + cudaStatus = cudaMalloc((void**)&dev_result, len * sizeof(int)); + + cudaStatus = cudaMemcpy(dev_in, in, len * sizeof(int), cudaMemcpyHostToDevice); + cudaStatus = cudaMemcpy(dev_out, out, len * sizeof(int), cudaMemcpyHostToDevice); + + int blockSize = BLOCK_SIZE; + /* integer ceiling division instead of float division, which loses precision for large len */ + int gridSize = (len + blockSize - 1) / blockSize; + /* NOTE(review): the launch configurations below were empty in this dump; gridSize/blockSize is restored - confirm against the original commit. */ + toFlagKernel << <gridSize, blockSize >> >(dev_in, dev_flag, len); + scan_recursive(dev_flag, dev_out, len); + + getScatter << <gridSize, blockSize >> >(dev_in, dev_out, dev_result, len, actualLen); + + cudaStatus = cudaMemcpy(out, dev_result, len * sizeof(int), cudaMemcpyDeviceToHost); + + cudaFree(dev_in); + cudaFree(dev_out); + cudaFree(dev_flag); + cudaFree(dev_result); + cudaFree(actualLen); +} + +/* Same compaction as scatter, but the flag array is copied to the host, scanned there with thrust::inclusive_scan, and copied back before getScatter runs. */ +void scatter_thrust(int *in, int *out, int len) +{ + int *dev_in = 0; + int *dev_out = 0; + int *dev_flag = 0; + int *dev_result = 0; + int *actualLen = 0; + + cudaMalloc((void**)&actualLen, sizeof(int)); + cudaError_t cudaStatus; + cudaStatus = cudaMalloc((void**)&dev_in, len * sizeof(int)); + cudaStatus = cudaMalloc((void**)&dev_out, len* sizeof(int)); + cudaStatus = cudaMalloc((void**)&dev_flag, len* sizeof(int)); + cudaStatus = cudaMalloc((void**)&dev_result, len * sizeof(int)); + + cudaStatus = cudaMemcpy(dev_in, in, len * sizeof(int), cudaMemcpyHostToDevice); + cudaStatus = cudaMemcpy(dev_out, out, len * sizeof(int), cudaMemcpyHostToDevice); + + int blockSize = BLOCK_SIZE; + int gridSize = (len + blockSize - 1) / blockSize; + /* NOTE(review): launch configuration restored as gridSize/blockSize (it was empty in this dump) - confirm. */ + toFlagKernel << <gridSize, blockSize >> >(dev_in, dev_flag, len); + + int *hos_flag = new int[len]; + cudaMemcpy(hos_flag, dev_flag, len * sizeof(int), cudaMemcpyDeviceToHost); + + //scan_recursive(dev_flag, dev_out, len); +
thrust::inclusive_scan(hos_flag,hos_flag+len,hos_flag); + cudaMemcpy(dev_flag, hos_flag, len * sizeof(int), cudaMemcpyHostToDevice); + + /* NOTE(review): launch configuration restored as gridSize/blockSize (it was empty in this dump) - confirm against the original commit. */ + getScatter << <gridSize, blockSize >> >(dev_in, dev_flag, dev_result, len, actualLen); + + cudaStatus = cudaMemcpy(out, dev_result, len * sizeof(int), cudaMemcpyDeviceToHost); + + delete[] hos_flag; + cudaFree(dev_in); + cudaFree(dev_out); + cudaFree(dev_flag); + cudaFree(dev_result); + cudaFree(actualLen); +} \ No newline at end of file diff --git a/Proj2_Win/Proj2_Win/vc120.pdb b/Proj2_Win/Proj2_Win/vc120.pdb new file mode 100644 index 0000000..20fdc67 Binary files /dev/null and b/Proj2_Win/Proj2_Win/vc120.pdb differ diff --git a/Proj2_Win/ipch/cpuversion-3af2f0cb/cpuversion-108c937a.ipch b/Proj2_Win/ipch/cpuversion-3af2f0cb/cpuversion-108c937a.ipch new file mode 100644 index 0000000..58bd873 Binary files /dev/null and b/Proj2_Win/ipch/cpuversion-3af2f0cb/cpuversion-108c937a.ipch differ diff --git a/Proj2_Win/ipch/cpuversion-f3683bca/cpuversion-108c937a.ipch b/Proj2_Win/ipch/cpuversion-f3683bca/cpuversion-108c937a.ipch new file mode 100644 index 0000000..efb59e9 Binary files /dev/null and b/Proj2_Win/ipch/cpuversion-f3683bca/cpuversion-108c937a.ipch differ diff --git a/README.md b/README.md index 6e02afa..b50b406 100644 --- a/README.md +++ b/README.md @@ -88,6 +88,26 @@ you are NOT allowed to use shared memory. include a table of how the runtimes compare on different lengths of arrays. * Plot a graph of the comparison and write a short explanation of the phenomenon you see here. +Array Length CPU +10 0.0007 +100 0.0014 +1000 0.007 +10000 0.07 +100000 0.87 +1000000 9.4 +10000000 95 +100000000 950 + +Array Length GPU +10 0.38 +100 0.27 +1000 0.73 +10000 0.87 +100000 3.73 +1000000 6.9 +10000000 32 +100000000 238 +CPU has a almost linear runtime increase because it's a completely serial program. GPU program runs slower when array size is low due to low clocking and low single core performance compared to CPU.
However, when the array size grows large, the advantage of parallel programming stands out. Once the threads are fully occupied, the GPU program's runtime also starts to increase linearly. # PART 3 : OPTIMIZING PREFIX SUM In the previous section we did not take into account shared memory. In the @@ -106,6 +126,9 @@ to arbitrary length arrays, this includes arrays that will not fit on one block. * Compare this version to the parallel prefix sum using global memory. * Plot a graph of the comparison and write a short explanation of the phenomenon you see here. + +If the array size is small, global memory is faster than shared memory. This may be because the data has to be copied from global memory into shared memory at the beginning and back again at the end. Bank conflicts may also contribute to the problem. + # PART 4 : ADDING SCATTER First create a serial version of scatter by expanding the serial version of @@ -117,6 +140,8 @@ array for you. Finally, write a version using thrust. * Compare your version of stream compact to your version using thrust. How do they compare? How might you optimize yours more, or how might thrust's stream compact be optimized. + My version of scattering is faster than the one using thrust, but my scan is slower than the one in thrust. +This is because the thrust version uses host memory, which results in many more memory copies between the device and the host. To optimize the thrust code, device memory should be used instead of host memory. # EXTRA CREDIT (+10) For extra credit, please optimize your prefix sum for work parallelism and to diff --git a/test result.xlsx b/test result.xlsx new file mode 100644 index 0000000..ffb08f5 Binary files /dev/null and b/test result.xlsx differ