virtualx-engine/thirdparty/oidn/common/thread.h

// ======================================================================== //
// Copyright 2009-2019 Intel Corporation                                    //
//                                                                          //
// Licensed under the Apache License, Version 2.0 (the "License");          //
// you may not use this file except in compliance with the License.         //
// You may obtain a copy of the License at                                  //
//                                                                          //
//     http://www.apache.org/licenses/LICENSE-2.0                           //
//                                                                          //
// Unless required by applicable law or agreed to in writing, software      //
// distributed under the License is distributed on an "AS IS" BASIS,        //
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. //
// See the License for the specific language governing permissions and      //
// limitations under the License.                                           //
// ======================================================================== //

#pragma once

#include "platform.h"

#if !defined(_WIN32)
  #include <pthread.h>
  #include <sched.h>
  #if defined(__APPLE__)
    #include <mach/thread_policy.h>
  #endif
#endif

#include <vector>
#include <mutex>

namespace oidn {

  // --------------------------------------------------------------------------
  // ThreadLocal
  // --------------------------------------------------------------------------

  // Wrapper which makes any variable thread-local
  template<typename T>
  class ThreadLocal : public Verbose
  {
  private:
  #if defined(_WIN32)
    DWORD key;
  #else
    pthread_key_t key;
  #endif

    std::vector<T*> instances;
    std::mutex mutex;

  public:
    ThreadLocal(int verbose = 0)
      : Verbose(verbose)
    {
    #if defined(_WIN32)
      key = TlsAlloc();
      if (key == TLS_OUT_OF_INDEXES)
        OIDN_FATAL("TlsAlloc failed");
    #else
      if (pthread_key_create(&key, nullptr) != 0)
        OIDN_FATAL("pthread_key_create failed");
    #endif
    }

    ~ThreadLocal()
    {
      std::lock_guard<std::mutex> lock(mutex);
      for (T* ptr : instances)
        delete ptr;

    #if defined(_WIN32)
      if (!TlsFree(key))
        OIDN_WARNING("TlsFree failed");
    #else
      if (pthread_key_delete(key) != 0)
        OIDN_WARNING("pthread_key_delete failed");
    #endif
    }

    T& get()
    {
    #if defined(_WIN32)
      T* ptr = (T*)TlsGetValue(key);
    #else
      T* ptr = (T*)pthread_getspecific(key);
    #endif

      if (ptr)
        return *ptr;

      ptr = new T;
      std::lock_guard<std::mutex> lock(mutex);
      instances.push_back(ptr);

    #if defined(_WIN32)
      if (!TlsSetValue(key, ptr))
        OIDN_FATAL("TlsSetValue failed");
    #else
      if (pthread_setspecific(key, ptr) != 0)
        OIDN_FATAL("pthread_setspecific failed");
    #endif

      return *ptr;
    }
  };

#if defined(_WIN32)

  // --------------------------------------------------------------------------
  // ThreadAffinity - Windows
  // --------------------------------------------------------------------------

  class ThreadAffinity : public Verbose
  {
  private:
    typedef BOOL (WINAPI *GetLogicalProcessorInformationExFunc)(LOGICAL_PROCESSOR_RELATIONSHIP,
                                                                PSYSTEM_LOGICAL_PROCESSOR_INFORMATION_EX,
                                                                PDWORD);

    typedef BOOL (WINAPI *SetThreadGroupAffinityFunc)(HANDLE,
                                                      CONST GROUP_AFFINITY*,
                                                      PGROUP_AFFINITY);

    GetLogicalProcessorInformationExFunc pGetLogicalProcessorInformationEx = nullptr;
    SetThreadGroupAffinityFunc pSetThreadGroupAffinity = nullptr;

    std::vector<GROUP_AFFINITY> affinities;    // thread affinities
    std::vector<GROUP_AFFINITY> oldAffinities; // original thread affinities

  public:
    ThreadAffinity(int numThreadsPerCore = INT_MAX, int verbose = 0);

    int getNumThreads() const
    {
      return (int)affinities.size();
    }

    // Sets the affinity (0..numThreads-1) of the thread after saving the current affinity
    void set(int threadIndex);

    // Restores the affinity of the thread
    void restore(int threadIndex);
  };

#elif defined(__linux__)

  // --------------------------------------------------------------------------
  // ThreadAffinity - Linux
  // --------------------------------------------------------------------------

  class ThreadAffinity : public Verbose
  {
  private:
    std::vector<cpu_set_t> affinities;    // thread affinities
    std::vector<cpu_set_t> oldAffinities; // original thread affinities

  public:
    ThreadAffinity(int numThreadsPerCore = INT_MAX, int verbose = 0);

    int getNumThreads() const
    {
      return (int)affinities.size();
    }

    // Sets the affinity (0..numThreads-1) of the thread after saving the current affinity
    void set(int threadIndex);

    // Restores the affinity of the thread
    void restore(int threadIndex);
  };

#elif defined(__APPLE__)

  // --------------------------------------------------------------------------
  // ThreadAffinity - macOS
  // --------------------------------------------------------------------------

  class ThreadAffinity : public Verbose
  {
  private:
    std::vector<thread_affinity_policy> affinities;    // thread affinities
    std::vector<thread_affinity_policy> oldAffinities; // original thread affinities

  public:
    ThreadAffinity(int numThreadsPerCore = INT_MAX, int verbose = 0);

    int getNumThreads() const
    {
      return (int)affinities.size();
    }

    // Sets the affinity (0..numThreads-1) of the thread after saving the current affinity
    void set(int threadIndex);

    // Restores the affinity of the thread
    void restore(int threadIndex);
  };

#endif

} // namespace oidn
New lightmapper -Added LocalVector (needed it) -Added stb_rect_pack (It's pretty cool, we could probably use it for other stuff too) -Fixes and changes all around the place -Added library for 128 bits fixed point (required for Delaunay3D) 2020-05-01 14:34:23 +02:00			`// ======================================================================== //`
			`// Copyright 2009-2019 Intel Corporation //`
			`// //`
			`// Licensed under the Apache License, Version 2.0 (the "License"); //`
			`// you may not use this file except in compliance with the License. //`
			`// You may obtain a copy of the License at //`
			`// //`
			`// http://www.apache.org/licenses/LICENSE-2.0 //`
			`// //`
			`// Unless required by applicable law or agreed to in writing, software //`
			`// distributed under the License is distributed on an "AS IS" BASIS, //`
			`// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. //`
			`// See the License for the specific language governing permissions and //`
			`// limitations under the License. //`
			`// ======================================================================== //`

			`#pragma once`

			`#include "platform.h"`

			`#if !defined(_WIN32)`
			`#include <pthread.h>`
			`#include <sched.h>`
			`#if defined(__APPLE__)`
			`#include <mach/thread_policy.h>`
			`#endif`
			`#endif`

			`#include <vector>`
			`#include <mutex>`

			`namespace oidn {`

			`// --------------------------------------------------------------------------`
			`// ThreadLocal`
			`// --------------------------------------------------------------------------`

			`// Wrapper which makes any variable thread-local`
			`template<typename T>`
			`class ThreadLocal : public Verbose`
			`{`
			`private:`
			`#if defined(_WIN32)`
			`DWORD key;`
			`#else`
			`pthread_key_t key;`
			`#endif`

			`std::vector<T*> instances;`
			`std::mutex mutex;`

			`public:`
			`ThreadLocal(int verbose = 0)`
			`: Verbose(verbose)`
			`{`
			`#if defined(_WIN32)`
			`key = TlsAlloc();`
			`if (key == TLS_OUT_OF_INDEXES)`
			`OIDN_FATAL("TlsAlloc failed");`
			`#else`
			`if (pthread_key_create(&key, nullptr) != 0)`
			`OIDN_FATAL("pthread_key_create failed");`
			`#endif`
			`}`

			`~ThreadLocal()`
			`{`
			`std::lock_guard<std::mutex> lock(mutex);`
			`for (T* ptr : instances)`
			`delete ptr;`

			`#if defined(_WIN32)`
			`if (!TlsFree(key))`
			`OIDN_WARNING("TlsFree failed");`
			`#else`
			`if (pthread_key_delete(key) != 0)`
			`OIDN_WARNING("pthread_key_delete failed");`
			`#endif`
			`}`

			`T& get()`
			`{`
			`#if defined(_WIN32)`
			`T* ptr = (T*)TlsGetValue(key);`
			`#else`
			`T* ptr = (T*)pthread_getspecific(key);`
			`#endif`

			`if (ptr)`
			`return *ptr;`

			`ptr = new T;`
			`std::lock_guard<std::mutex> lock(mutex);`
			`instances.push_back(ptr);`

			`#if defined(_WIN32)`
			`if (!TlsSetValue(key, ptr))`
			`OIDN_FATAL("TlsSetValue failed");`
			`#else`
			`if (pthread_setspecific(key, ptr) != 0)`
			`OIDN_FATAL("pthread_setspecific failed");`
			`#endif`

			`return *ptr;`
			`}`
			`};`

			`#if defined(_WIN32)`

			`// --------------------------------------------------------------------------`
			`// ThreadAffinity - Windows`
			`// --------------------------------------------------------------------------`

			`class ThreadAffinity : public Verbose`
			`{`
			`private:`
			`typedef BOOL (WINAPI *GetLogicalProcessorInformationExFunc)(LOGICAL_PROCESSOR_RELATIONSHIP,`
			`PSYSTEM_LOGICAL_PROCESSOR_INFORMATION_EX,`
			`PDWORD);`

			`typedef BOOL (WINAPI *SetThreadGroupAffinityFunc)(HANDLE,`
			`CONST GROUP_AFFINITY*,`
			`PGROUP_AFFINITY);`

			`GetLogicalProcessorInformationExFunc pGetLogicalProcessorInformationEx = nullptr;`
			`SetThreadGroupAffinityFunc pSetThreadGroupAffinity = nullptr;`

			`std::vector<GROUP_AFFINITY> affinities; // thread affinities`
			`std::vector<GROUP_AFFINITY> oldAffinities; // original thread affinities`

			`public:`
			`ThreadAffinity(int numThreadsPerCore = INT_MAX, int verbose = 0);`

			`int getNumThreads() const`
			`{`
			`return (int)affinities.size();`
			`}`

			`// Sets the affinity (0..numThreads-1) of the thread after saving the current affinity`
			`void set(int threadIndex);`

			`// Restores the affinity of the thread`
			`void restore(int threadIndex);`
			`};`

			`#elif defined(__linux__)`

			`// --------------------------------------------------------------------------`
			`// ThreadAffinity - Linux`
			`// --------------------------------------------------------------------------`

			`class ThreadAffinity : public Verbose`
			`{`
			`private:`
			`std::vector<cpu_set_t> affinities; // thread affinities`
			`std::vector<cpu_set_t> oldAffinities; // original thread affinities`

			`public:`
			`ThreadAffinity(int numThreadsPerCore = INT_MAX, int verbose = 0);`

			`int getNumThreads() const`
			`{`
			`return (int)affinities.size();`
			`}`

			`// Sets the affinity (0..numThreads-1) of the thread after saving the current affinity`
			`void set(int threadIndex);`

			`// Restores the affinity of the thread`
			`void restore(int threadIndex);`
			`};`

			`#elif defined(__APPLE__)`

			`// --------------------------------------------------------------------------`
			`// ThreadAffinity - macOS`
			`// --------------------------------------------------------------------------`

			`class ThreadAffinity : public Verbose`
			`{`
			`private:`
			`std::vector<thread_affinity_policy> affinities; // thread affinities`
			`std::vector<thread_affinity_policy> oldAffinities; // original thread affinities`

			`public:`
			`ThreadAffinity(int numThreadsPerCore = INT_MAX, int verbose = 0);`

			`int getNumThreads() const`
			`{`
			`return (int)affinities.size();`
			`}`

			`// Sets the affinity (0..numThreads-1) of the thread after saving the current affinity`
			`void set(int threadIndex);`

			`// Restores the affinity of the thread`
			`void restore(int threadIndex);`
			`};`

			`#endif`

			`} // namespace oidn`