/*
 *  Copyright (c) 2010 The WebM project authors. All Rights Reserved.
 *
 *  Use of this source code is governed by a BSD-style license
 *  that can be found in the LICENSE file in the root of the source
 *  tree. An additional intellectual property rights grant can be found
 *  in the file PATENTS.  All contributing project authors may
 *  be found in the AUTHORS file in the root of the source tree.
 */
|
|
|
|
|
|
|
|
|
2011-09-15 15:34:12 +03:00
|
|
|
#include "vpx_config.h"
|
/*
 * New RTCD implementation
 *
 * This is a proof of concept RTCD implementation to replace the current
 * system of nested includes, prototypes, INVOKE macros, etc. Currently
 * only the decoder specific functions are implemented in the new system.
 * Additional functions will be added in subsequent commits.
 *
 * Overview:
 *   RTCD "functions" are implemented as either a global function pointer
 *   or a macro (when only one eligible specialization is available).
 *   Functions which have RTCD specializations are listed using a simple
 *   DSL identifying the function's base name, its prototype, and the
 *   architecture extensions that specializations are available for.
 *
 * Advantages over the old system:
 *   - No INVOKE macros. A call to an RTCD function looks like an ordinary
 *     function call.
 *   - No need to pass vtables around.
 *   - If there is only one eligible function to call, the function is
 *     called directly, rather than indirecting through a function pointer.
 *   - Supports the notion of "required" extensions, so in combination with
 *     the above, on x86_64 if the best function available is sse2 or lower
 *     it will be called directly, since all x86_64 platforms implement
 *     sse2.
 *   - Elides all references to functions which will never be called, which
 *     could reduce binary size. For example if sse2 is required and there
 *     are both mmx and sse2 implementations of a certain function, the
 *     code will have no link time references to the mmx code.
 *   - Significantly easier to add a new function, just one file to edit.
 *
 * Disadvantages:
 *   - Requires global writable data (though this is not a new requirement)
 *   - 1 new generated source file.
 *
 * Change-Id: Iae6edab65315f79c168485c96872641c5aa09d55
 */
2011-08-19 14:06:00 -04:00
|
|
|
#include "vpx_rtcd.h"
|
2012-01-12 16:55:44 -08:00
|
|
|
#if ARCH_ARM
|
|
|
|
#include "vpx_ports/arm.h"
|
|
|
|
#elif ARCH_X86 || ARCH_X86_64
|
|
|
|
#include "vpx_ports/x86.h"
|
|
|
|
#endif
|
2011-02-10 14:41:38 -05:00
|
|
|
#include "vp8/common/onyxc_int.h"
|
2010-05-18 11:58:33 -04:00
|
|
|
|
2011-03-25 12:53:03 +02:00
|
|
|
#if CONFIG_MULTITHREAD
|
2012-02-03 13:31:11 +09:00
|
|
|
#if HAVE_UNISTD_H && !defined(__OS2__)
|
2011-03-25 12:53:03 +02:00
|
|
|
#include <unistd.h>
|
|
|
|
#elif defined(_WIN32)
|
|
|
|
#include <windows.h>
|
|
|
|
typedef void (WINAPI *PGNSI)(LPSYSTEM_INFO);
|
2012-02-03 13:31:11 +09:00
|
|
|
#elif defined(__OS2__)
|
|
|
|
#define INCL_DOS
|
|
|
|
#define INCL_DOSSPINLOCK
|
|
|
|
#include <os2.h>
|
2011-03-25 12:53:03 +02:00
|
|
|
#endif
|
|
|
|
#endif
|
|
|
|
|
|
|
|
#if CONFIG_MULTITHREAD
|
|
|
|
/*
 * Returns the number of processors to assume when sizing thread pools.
 *
 * The value is obtained from sysconf() on platforms with <unistd.h>,
 * from GetNativeSystemInfo()/GetSystemInfo() on Windows, and by polling
 * DosGetProcessorStatus() on OS/2. If none of those branches is compiled
 * in (or no suitable sysconf name is defined) the initial default of 16
 * is kept. The returned value is never less than 1.
 */
static int get_cpu_count(void)
{
    int core_count = 16;

#if HAVE_UNISTD_H && !defined(__OS2__)
#if defined(_SC_NPROCESSORS_ONLN)
    core_count = (int)sysconf(_SC_NPROCESSORS_ONLN);
#elif defined(_SC_NPROC_ONLN)
    core_count = (int)sysconf(_SC_NPROC_ONLN);
#endif
#elif defined(_WIN32)
    {
        PGNSI pGNSI;
        SYSTEM_INFO sysinfo;

        /* Call GetNativeSystemInfo if supported or
         * GetSystemInfo otherwise. The entry point is looked up at run
         * time so there is no link-time dependency on it. */
        pGNSI = (PGNSI) GetProcAddress(
                    GetModuleHandle(TEXT("kernel32.dll")), "GetNativeSystemInfo");

        if (pGNSI != NULL)
        {
            pGNSI(&sysinfo);
        }
        else
        {
            GetSystemInfo(&sysinfo);
        }

        core_count = (int)sysinfo.dwNumberOfProcessors;
    }
#elif defined(__OS2__)
    {
        ULONG proc_id;
        ULONG status;

        core_count = 0;

        /* Probe processor ids starting at 1 and stop at the first id for
         * which DosGetProcessorStatus() returns non-zero; only processors
         * reported as PROC_ONLINE are counted. */
        for (proc_id = 1; ; proc_id++)
        {
            if (DosGetProcessorStatus(proc_id, &status))
            {
                break;
            }

            if (status == PROC_ONLINE)
            {
                core_count++;
            }
        }
    }
#else
    /* other platforms: keep the default */
#endif

    /* A zero or negative result from the detection above is reported
     * as a single processor. */
    return core_count > 0 ? core_count : 1;
}
|
|
|
|
#endif
|
|
|
|
|
2012-04-18 16:03:40 -07:00
|
|
|
|
|
|
|
#if HAVE_PTHREAD_H
|
|
|
|
#include <pthread.h>
|
|
|
|
/*
 * Runs func through pthread_once().
 *
 * The control object is a single function-local static, so it is shared
 * by every caller of once(): after the first call has run its func,
 * later calls do nothing, whichever func they pass.
 */
static void once(void (*func)(void))
{
    static pthread_once_t lock = PTHREAD_ONCE_INIT;

    /* The return value is deliberately ignored, as in the other
     * once() variants, which have no way to report failure either. */
    (void)pthread_once(&lock, func);
}
|
|
|
|
|
|
|
|
|
|
|
|
#elif defined(_WIN32)
|
|
|
|
static void once(void (*func)(void))
|
|
|
|
{
|
|
|
|
/* Using a static initializer here rather than InitializeCriticalSection()
|
|
|
|
* since there's no race-free context in which to execute it. Protecting
|
|
|
|
* it with an atomic op like InterlockedCompareExchangePointer introduces
|
|
|
|
* an x86 dependency, and InitOnceExecuteOnce requires Vista.
|
|
|
|
*/
|
|
|
|
static CRITICAL_SECTION lock = {(void *)-1, -1, 0, 0, 0, 0};
|
|
|
|
static int done;
|
|
|
|
|
|
|
|
EnterCriticalSection(&lock);
|
|
|
|
|
|
|
|
if (!done)
|
|
|
|
{
|
|
|
|
func();
|
|
|
|
done = 1;
|
|
|
|
}
|
|
|
|
|
|
|
|
LeaveCriticalSection(&lock);
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
#else
|
|
|
|
/* Fallback version that performs no synchronization: it calls func the
 * first time it is invoked and returns immediately afterwards.
 *
 * vpx_rtcd() is idempotent, so as long as your platform provides atomic
 * loads/stores of pointers no synchronization is strictly necessary.
 */
static void once(void (*func)(void))
{
    static int done;

    if (done)
    {
        return;
    }

    func();
    /* Set only after func() has returned. */
    done = 1;
}
|
|
|
|
#endif
|
|
|
|
|
|
|
|
|
2010-05-18 11:58:33 -04:00
|
|
|
/*
 * Fills in the machine-dependent fields of ctx and runs the RTCD setup.
 *
 *  - With CONFIG_MULTITHREAD, ctx->processor_core_count is set from
 *    get_cpu_count().
 *  - On ARM, ctx->cpu_caps is set from arm_cpu_caps(); on x86/x86_64 it
 *    is set from x86_simd_caps(). On other architectures it is left
 *    untouched.
 *  - vpx_rtcd() is invoked through once(), so repeated calls to this
 *    function do not run it again.
 */
void vp8_machine_specific_config(VP8_COMMON *ctx)
{
    /* Keeps ctx referenced when threading is disabled and the target is
     * neither ARM nor x86, where no statement below uses it. */
    (void)ctx;

#if CONFIG_MULTITHREAD
    ctx->processor_core_count = get_cpu_count();
#endif /* CONFIG_MULTITHREAD */

#if ARCH_ARM
    ctx->cpu_caps = arm_cpu_caps();
#elif ARCH_X86 || ARCH_X86_64
    ctx->cpu_caps = x86_simd_caps();
#endif

    once(vpx_rtcd);
}
|