add osx support, add test generator

This commit is contained in:
Christien Rioux 2015-12-12 00:44:11 -08:00
parent 7fbd70a2bb
commit 7806e2d50d
5 changed files with 137 additions and 60 deletions

7
CMakeLists.txt Normal file
View File

@ -0,0 +1,7 @@
cmake_minimum_required(VERSION 3.3.0)
project (linecount)
add_library (linecount SHARED linecount.cpp linecount.h)
add_library (linecount_static STATIC linecount.cpp linecount.h)
add_executable (lc main.cpp)
target_link_libraries (lc linecount_static)

5
create_testfiles.sh Executable file
View File

@ -0,0 +1,5 @@
#!/bin/bash
dd if=/dev/urandom of=test1.txt bs=1000000 count=10
dd if=/dev/urandom of=test2.txt bs=1000000 count=100
dd if=/dev/urandom of=test3.txt bs=1000000 count=1000

View File

@ -8,7 +8,9 @@
#define LCCLOSEFILE(handle) CloseHandle(handle) #define LCCLOSEFILE(handle) CloseHandle(handle)
#define LCINVALIDHANDLE INVALID_HANDLE_VALUE #define LCINVALIDHANDLE INVALID_HANDLE_VALUE
#define LCSETREALLASTERROR(err, errstr) { setLastError((err), (errstr)); } #define LCSETREALLASTERROR(err, errstr) { setLastError((err), (errstr)); }
#define MAP_FAILED NULL;
typedef long long LCFILEOFFSET; typedef long long LCFILEOFFSET;
#elif defined (__unix__) || (defined (__APPLE__) && defined (__MACH__)) #elif defined (__unix__) || (defined (__APPLE__) && defined (__MACH__))
// POSIX // POSIX
@ -16,23 +18,28 @@ typedef long long LCFILEOFFSET;
#include<sys/stat.h> #include<sys/stat.h>
#include<sys/fcntl.h> #include<sys/fcntl.h>
#include<sys/mman.h> #include<sys/mman.h>
#include<pthread.h> #if (defined (__APPLE__) && defined (__MACH__))
#if (defined (__APPLE__) && defined (__MACH__)
#include <sys/sysctl.h> #include <sys/sysctl.h>
typedef off_t LCFILEOFFSET; typedef off_t LCFILEOFFSET;
#define MMAP mmap #define MMAP ::mmap
#define FSTAT ::fstat
#define STAT ::stat
#elif defined(__linux__) #elif defined(__linux__)
typedef off64_t LCFILEOFFSET; typedef off64_t LCFILEOFFSET;
#define MMAP mmap64 #define MMAP ::mmap64
#define FSTAT ::fstat64
#define STAT ::stat64
#else #else
typedef off_t LCFILEOFFSET; typedef off_t LCFILEOFFSET;
#define MMAP mmap #define MMAP ::mmap
#define FSTAT ::fstat
#define STAT ::stat
#endif #endif
#define LCOPENFILE(name) open(name, O_RDONLY) #define LCOPENFILE(name) ::open(name, O_RDONLY)
#define LCCLOSEFILE(handle) (close(handle) != -1) #define LCCLOSEFILE(handle) (::close(handle) != -1)
#define LCINVALIDHANDLE -1 #define LCINVALIDHANDLE -1
#define LCSETREALLASTERROR(err, errstr) { int __err = errno; setLastError(__err, strerror(__err)); } #define LCSETREALLASTERROR(err, errstr) { int __err = errno; setLastError(__err, ::strerror(__err)); }
#endif #endif
@ -51,37 +58,36 @@ CLineCount::CLineCount(PARAMETERS *parameters)
// Set line count parameter defaults // Set line count parameter defaults
int cpucount; int cpucount;
int allocationgranularity;
#ifdef _WIN32 #ifdef _WIN32
SYSTEM_INFO sysinfo; SYSTEM_INFO sysinfo;
GetSystemInfo(&sysinfo); GetSystemInfo(&sysinfo);
cpucount = sysinfo.dwNumberOfProcessors; cpucount = sysinfo.dwNumberOfProcessors;
#elif defined(__linux__) allocationgranularity = sysinfo.dwAllocationGranularity;
cpucount = sysconf(_SC_NPROCESSORS_ONLN); //#elif defined(__linux__)
#elif (defined (__APPLE__) && defined (__MACH__))
intsize_t count_len = sizeof(cpucount);
sysctlbyname("hw.logicalcpu", &cpucount, &count_len, NULL, 0);
#else #else
cpucount = 1; cpucount = sysconf(_SC_NPROCESSORS_ONLN);
allocationgranularity = sysconf(_SC_PAGESIZE);
//#elif (defined (__APPLE__) && defined (__MACH__))
// mmsize_t count_len = sizeof(cpucount);
// sysctlbyname("hw.logicalcpu", &cpucount, &count_len, NULL, 0);
//#else
// cpucount = 1;
#endif #endif
m_parameters.workercount = cpucount; m_parameters.threadcount = cpucount;
m_parameters.windowsize = (1024 * 1024 * 8) / cpucount; m_parameters.buffersize = (1024 * 1024);
// Override defaults if specified // Override defaults if specified
if (parameters) if (parameters)
{ {
if (parameters->windowsize != -1) if (parameters->buffersize != -1)
{ {
m_parameters.windowsize = parameters->windowsize; m_parameters.buffersize = parameters->buffersize;
#ifdef _WIN32 m_parameters.buffersize += (allocationgranularity - (m_parameters.buffersize % allocationgranularity)) % allocationgranularity;
// Window size must be multiple of allocation granularity. Round up.
SYSTEM_INFO si;
GetSystemInfo(&si);
m_parameters.windowsize += (si.dwAllocationGranularity - (m_parameters.windowsize % si.dwAllocationGranularity)) % si.dwAllocationGranularity;
#endif
} }
if (parameters->workercount != -1) if (parameters->threadcount != -1)
{ {
m_parameters.workercount = parameters->workercount; m_parameters.threadcount = parameters->threadcount;
} }
} }
@ -197,14 +203,15 @@ void *threadProc(void *ctx)
#endif #endif
{ {
LCTHREADCONTEXT *lctctx = (LCTHREADCONTEXT*)ctx; LCTHREADCONTEXT *lctctx = (LCTHREADCONTEXT*)ctx;
return lctctx->m_this->countThread(lctctx->thread_number); lctctx->m_this->countThread(lctctx->thread_number);
return NULL;
} }
unsigned int CLineCount::countThread(int thread_number) unsigned int CLineCount::countThread(int thread_number)
{ {
LCFILEOFFSET windowsize = (LCFILEOFFSET)m_parameters.windowsize; LCFILEOFFSET buffersize = (LCFILEOFFSET)m_parameters.buffersize;
LCFILEOFFSET startoffset = windowsize * (LCFILEOFFSET)thread_number; LCFILEOFFSET startoffset = buffersize * (LCFILEOFFSET)thread_number;
LCFILEOFFSET stride = windowsize * m_actual_thread_count; LCFILEOFFSET stride = buffersize * m_actual_thread_count;
LCFILEOFFSET curoffset = startoffset; LCFILEOFFSET curoffset = startoffset;
LCFILEOFFSET lastmapsize = 0; LCFILEOFFSET lastmapsize = 0;
LCLINECOUNT count = 0; LCLINECOUNT count = 0;
@ -214,11 +221,12 @@ unsigned int CLineCount::countThread(int thread_number)
{ {
if (m_thread_fail) if (m_thread_fail)
{ {
return -1; return -1;
} }
// Get best file mapping window size // Get best file mapping window size
size_t mapsize = (size_t)min((m_filesize - curoffset), windowsize); size_t mapsize = (size_t)std::min((m_filesize - curoffset), buffersize);
// Map view of file // Map view of file
#ifdef _WIN32 #ifdef _WIN32
@ -235,16 +243,17 @@ unsigned int CLineCount::countThread(int thread_number)
#else #else
if (mem) if (mem)
{ {
if(munmap(mem)!=0) if(munmap(mem, lastmapsize) !=0)
{ {
LCSETREALLASTERROR(EINVAL, _T("memory unmap failed")); LCSETREALLASTERROR(EINVAL, _T("memory unmap failed"));
m_thread_fail = true; m_thread_fail = true;
return -1; return -1;
} }
} }
mem = MMAP(NULL, mapsize, PROT_READ, MAP_FILE | MAP_SHARED, m_fd, curoffset); mem = MMAP(NULL, mapsize, PROT_READ, MAP_FILE | MAP_SHARED, m_fh, curoffset);
// printf("%p %lld %lld\n",mem, mapsize, curoffset);
#endif #endif
if (mem == NULL) if (mem == MAP_FAILED)
{ {
LCSETREALLASTERROR(EINVAL, _T("memory map failed")); LCSETREALLASTERROR(EINVAL, _T("memory map failed"));
m_thread_fail = true; m_thread_fail = true;
@ -299,7 +308,7 @@ unsigned int CLineCount::countThread(int thread_number)
#else #else
if (mem) if (mem)
{ {
if (munmap(mem) != 0) if (munmap(mem, lastmapsize) != 0)
{ {
LCSETREALLASTERROR(EINVAL, _T("memory unmap failed")); LCSETREALLASTERROR(EINVAL, _T("memory unmap failed"));
m_thread_fail = true; m_thread_fail = true;
@ -349,8 +358,8 @@ bool CLineCount::countLines(LCLINECOUNT & linecount)
} }
m_filesize = li.QuadPart; m_filesize = li.QuadPart;
#else #else
struct stat64 statbuf; struct STAT statbuf;
if(fstat64(m_fh,&statbuf)!=0) if(FSTAT(m_fh,&statbuf)!=0)
{ {
LCSETREALLASTERROR(EBADF, _T("unable to get file size")); LCSETREALLASTERROR(EBADF, _T("unable to get file size"));
return false; return false;
@ -366,16 +375,18 @@ bool CLineCount::countLines(LCLINECOUNT & linecount)
} }
// Figure out actual thread count // Figure out actual thread count
LCFILEOFFSET windowcount = (m_filesize + (m_parameters.windowsize - 1)) / m_parameters.windowsize; LCFILEOFFSET windowcount = (m_filesize + (m_parameters.buffersize - 1)) / m_parameters.buffersize;
if (windowcount < (LCFILEOFFSET) m_parameters.workercount) if (windowcount < (LCFILEOFFSET) m_parameters.threadcount)
{ {
m_actual_thread_count = (int)windowcount; m_actual_thread_count = (int)windowcount;
} }
else else
{ {
m_actual_thread_count = m_parameters.workercount; m_actual_thread_count = m_parameters.threadcount;
} }
// printf("act: %d\n",m_actual_thread_count);
#ifdef _WIN32 #ifdef _WIN32
// Prepare file mapping // Prepare file mapping
m_filemapping = CreateFileMapping(m_fh, NULL, PAGE_READONLY, 0, 0, NULL); m_filemapping = CreateFileMapping(m_fh, NULL, PAGE_READONLY, 0, 0, NULL);
@ -405,7 +416,7 @@ bool CLineCount::countLines(LCLINECOUNT & linecount)
#ifdef _WIN32 #ifdef _WIN32
success = (WaitForSingleObject(m_threads[i], INFINITE) == WAIT_OBJECT_0); success = (WaitForSingleObject(m_threads[i], INFINITE) == WAIT_OBJECT_0);
#else #else
success = pthread_join(m_threads[i]) == 0; success = pthread_join(m_threads[i], NULL) == 0;
#endif #endif
} }
@ -429,7 +440,7 @@ bool CLineCount::countLines(LCLINECOUNT & linecount)
return false; return false;
} }
if (complete != m_parameters.workercount) if (complete != m_actual_thread_count)
{ {
setLastError(ECHILD, _T("thread join failed")); setLastError(ECHILD, _T("thread join failed"));
return false; return false;

View File

@ -1,6 +1,9 @@
#ifndef __INC_LINECOUNT_H #ifndef __INC_LINECOUNT_H
#define __INC_LINECOUNT_H #define __INC_LINECOUNT_H
#define LINECOUNT_VERSION_MAJOR 1
#define LINECOUNT_VERSION_MINOR 0
///////////////////////////////////////////// Headers ///////////////////////////////////////////// Headers
////////////// Platform independent ////////////// Platform independent
@ -18,6 +21,7 @@
#include<tchar.h> #include<tchar.h>
#elif defined (__unix__) || (defined (__APPLE__) && defined (__MACH__)) // POSIX #elif defined (__unix__) || (defined (__APPLE__) && defined (__MACH__)) // POSIX
#include<unistd.h> #include<unistd.h>
#include<pthread.h>
#define _T(x) x #define _T(x) x
#define TCHAR char #define TCHAR char
#endif #endif
@ -45,7 +49,7 @@ BEGIN_LINECOUNT_NAMESPACE;
typedef std::string LCSTRING; typedef std::string LCSTRING;
typedef int LCFILEHANDLE; typedef int LCFILEHANDLE;
typedef errno_t LCERROR; typedef errno_t LCERROR;
#if (defined (__APPLE__) && defined (__MACH__) #if (defined (__APPLE__) && defined (__MACH__))
typedef off_t LCFILEOFFSET; typedef off_t LCFILEOFFSET;
#define LCLINECOUNTFMT "%lld" #define LCLINECOUNTFMT "%lld"
#elif defined(__linux__) #elif defined(__linux__)
@ -66,8 +70,8 @@ public:
struct PARAMETERS struct PARAMETERS
{ {
size_t windowsize; size_t buffersize;
int workercount; int threadcount;
}; };
private: private:

View File

@ -1,17 +1,46 @@
#include"linecount.h" #include"linecount.h"
#ifdef _WIN32 #ifdef _WIN32
#include<tchar.h> #include<tchar.h>
#else #else
#include<stdlib.h>
#define _tprintf printf #define _tprintf printf
#define _ftprintf fprintf #define _ftprintf fprintf
#define _tcscmp strcmp #define _tcscmp strcmp
#define _tcslen strlen
#define _ttoi atoi #define _ttoi atoi
#define _tcstoui64 strtoull #define _tcstoui64 strtoull
#define _T(x) x #define _T(x) x
#define TCHAR char
#endif #endif
using namespace LineCount; using namespace LineCount;
//////////////////////////////////////////////////////
void help(const TCHAR *argv0)
{
_ftprintf(stderr, _T("usage: %s [options] <file>\n"), argv0);
_ftprintf(stderr, _T(" -h --help print this usage and exit\n"));
_ftprintf(stderr, _T(" -b --buffersize <BUFFERSIZE> size of buffer per-thread to use when reading (default is 1MB)\n"));
_ftprintf(stderr, _T(" -t --threadcount <THREADCOUNT> number of threads to use (defaults to number of cpu cores)\n"));
_ftprintf(stderr, _T(" -v --version print version information and exit\n"));
}
void version(void)
{
_tprintf(_T("lc (linecount) %d.%2.2d\nCopyright (c) 2015 Christien Rioux\n"), LINECOUNT_VERSION_MAJOR, LINECOUNT_VERSION_MINOR);
}
//////////////////////////////////////////////////////
#if defined(WIN32) && defined(_UNICODE) #if defined(WIN32) && defined(_UNICODE)
int wmain(int argc, TCHAR **argv) int wmain(int argc, TCHAR **argv)
#else #else
@ -23,27 +52,43 @@ int main(int argc, char **argv)
int posparam = 0; int posparam = 0;
CLineCount::PARAMETERS params; CLineCount::PARAMETERS params;
params.windowsize = -1; params.buffersize = -1;
params.workercount = -1; params.threadcount = -1;
TCHAR *filename = NULL; TCHAR *filename = NULL;
if(argc==1)
{
help(argv[0]);
exit(0);
}
while (arg < argc) while (arg < argc)
{ {
if (_tcscmp(argv[arg], _T("--windowsize")) == 0) if (_tcscmp(argv[arg], _T("-h")) == 0 || _tcscmp(argv[arg], _T("--help")) == 0)
{
help(argv[0]);
exit(0);
}
else if (_tcscmp(argv[arg], _T("-v")) == 0 || _tcscmp(argv[arg], _T("--version")) == 0)
{
version();
exit(0);
}
else if (_tcscmp(argv[arg], _T("-b")) == 0 || _tcscmp(argv[arg], _T("--buffersize")) == 0)
{ {
arg++; arg++;
if (arg == argc) if (arg == argc)
{ {
_ftprintf(stderr, _T("missing argument to --windowsize")); _ftprintf(stderr, _T("%s: missing argument to %s\n"), argv[0], argv[arg-1]);
return 1; return 1;
} }
_TCHAR *wsstr = argv[arg]; TCHAR *wsstr = argv[arg];
// Check for size multipliers // Check for size multipliers
size_t multiplier = 1; size_t multiplier = 1;
_TCHAR *lastchar = wsstr + (_tcslen(wsstr) - 1); TCHAR *lastchar = wsstr + (_tcslen(wsstr) - 1);
if (*lastchar == _T('k') || *lastchar == _T('K')) if (*lastchar == _T('k') || *lastchar == _T('K'))
{ {
multiplier = 1024; multiplier = 1024;
@ -60,20 +105,25 @@ int main(int argc, char **argv)
lastchar = 0; lastchar = 0;
} }
_TCHAR *endptr; TCHAR *endptr;
params.windowsize = ((size_t)_tcstoui64(argv[arg], &endptr, 10)) * multiplier; params.buffersize = ((size_t)_tcstoui64(argv[arg], &endptr, 10)) * multiplier;
} }
else if (_tcscmp(argv[arg], _T("--workercount")) == 0) else if (_tcscmp(argv[arg], _T("-t")) == 0 || _tcscmp(argv[arg], _T("--threadcount")) == 0)
{ {
arg++; arg++;
if (arg == argc) if (arg == argc)
{ {
_ftprintf(stderr, _T("missing argument to --workercount")); _ftprintf(stderr, _T("%s: Missing argument to %s\n"), argv[0], argv[arg-1]);
return 1; return 1;
} }
params.workercount = _ttoi(argv[arg]); params.threadcount = _ttoi(argv[arg]);
if(params.threadcount<=0)
{
_ftprintf(stderr, _T("%s: Invalid thread count\n"), argv[0]);
return 1;
}
} }
else else
{ {
@ -83,7 +133,7 @@ int main(int argc, char **argv)
} }
else else
{ {
_ftprintf(stderr, _T("too many arguments")); _ftprintf(stderr, _T("%s: Too many arguments\n"), argv[0]);
return 1; return 1;
} }
posparam++; posparam++;
@ -94,7 +144,7 @@ int main(int argc, char **argv)
if (posparam != 1) if (posparam != 1)
{ {
_ftprintf(stderr, _T("missing required argument")); _ftprintf(stderr, _T("%s: Missing required argument\n"), argv[0]);
return 1; return 1;
} }
@ -106,7 +156,7 @@ int main(int argc, char **argv)
LCERROR err = lc.lastError(); LCERROR err = lc.lastError();
LCSTRING errstr = lc.lastErrorString(); LCSTRING errstr = lc.lastErrorString();
_ftprintf(stderr, _T("error (%d): %s\n"), err, errstr.c_str()); _ftprintf(stderr, _T("%s: Error %d (%s)\n"), argv[0], err, errstr.c_str());
return err; return err;
} }
@ -117,7 +167,7 @@ int main(int argc, char **argv)
LCERROR err = lc.lastError(); LCERROR err = lc.lastError();
LCSTRING errstr = lc.lastErrorString(); LCSTRING errstr = lc.lastErrorString();
_ftprintf(stderr, _T("error (%d): %s\n"), err, errstr.c_str()); _ftprintf(stderr, _T("%s: Error %d: (%s)\n"), argv[0], err, errstr.c_str());
return err; return err;
} }